diff --git a/mlc-chat-config.json b/mlc-chat-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..1005a5caa596ebbf3dcc916b97d3284e19ad6678
--- /dev/null
+++ b/mlc-chat-config.json
@@ -0,0 +1,76 @@
+{
+ "version": "0.1.0",
+ "model_type": "qwen2",
+ "quantization": "q4f32_1",
+ "model_config": {
+ "hidden_act": "silu",
+ "hidden_size": 5120,
+ "intermediate_size": 13824,
+ "num_attention_heads": 40,
+ "num_hidden_layers": 48,
+ "num_key_value_heads": 8,
+ "rms_norm_eps": 1e-05,
+ "rope_theta": 1000000.0,
+ "vocab_size": 152064,
+ "tie_word_embeddings": false,
+ "context_window_size": 131072,
+ "prefill_chunk_size": 8192,
+ "tensor_parallel_shards": 1,
+ "head_dim": 128,
+ "dtype": "float32",
+ "max_batch_size": 128
+ },
+ "vocab_size": 152064,
+ "context_window_size": 131072,
+ "sliding_window_size": -1,
+ "prefill_chunk_size": 8192,
+ "attention_sink_size": -1,
+ "tensor_parallel_shards": 1,
+ "pipeline_parallel_stages": 1,
+ "temperature": 1.0,
+ "presence_penalty": 0.0,
+ "frequency_penalty": 0.0,
+ "repetition_penalty": 1.0,
+ "top_p": 1.0,
+ "tokenizer_files": [
+ "tokenizer.json",
+ "tokenizer_config.json"
+ ],
+ "tokenizer_info": {
+ "token_postproc_method": "byte_level",
+ "prepend_space_in_encode": false,
+ "strip_space_in_decode": false
+ },
+ "conv_template": {
+ "name": "deepseek_v3",
+ "system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
+ "system_message": "You are a helpful assistant.",
+ "system_prefix_token_ids": null,
+ "add_role_after_system_message": true,
+ "roles": {
+ "user": "<\uff5cUser\uff5c>",
+ "assistant": "<\uff5cAssistant\uff5c>"
+ },
+ "role_templates": {
+ "user": "{user_message}",
+ "assistant": "{assistant_message}",
+ "tool": "{tool_message}"
+ },
+ "messages": [],
+ "seps": [
+ "",
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
+ ],
+ "role_content_sep": "",
+ "role_empty_sep": "",
+ "stop_str": [],
+ "stop_token_ids": [
+ 151643
+ ],
+ "function_string": "",
+ "use_function_calling": false
+ },
+ "pad_token_id": 0,
+ "bos_token_id": 151643,
+ "eos_token_id": 151643
+}
\ No newline at end of file
diff --git a/ndarray-cache-b16.json b/ndarray-cache-b16.json
new file mode 100644
index 0000000000000000000000000000000000000000..dcc934791ab75abc6f1232e118956ca84d548cd9
--- /dev/null
+++ b/ndarray-cache-b16.json
@@ -0,0 +1,7295 @@
+{
+ "metadata": {
+ "ParamSize": 533,
+ "ParamBytes": 9234108416.0,
+ "BitsPerParam": 5.001536828453907
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 389283840,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_weight",
+ "shape": [
+ 152064,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 389283840,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7932312201ae2761485f7d412eb0dbfe"
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 48660480,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_scale",
+ "shape": [
+ 152064,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 48660480,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e8920c096ece303715da29d808f834ba"
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 20658176,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 14336
+ },
+ {
+ "name": "model.layers.0.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 18364416
+ }
+ ],
+ "md5sum": "0b571f3cb6e619d96c6d40630c3be1ff"
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0873eb6ddb15076ff9e499315425a609"
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "538a9140fd4d851564a8e5686c890abd"
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b459ee0e7734cf867044df5858581b06"
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.0.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.0.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.0.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.1.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.1.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "1a9657c43d2bea8e04a216f3be1b8e0f"
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1cee758ccca6cbe36975f5901632cb6a"
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "23967261fbec14b496b7fab724ada7c6"
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4747ff8880b109fc7cdac257c72e0909"
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.1.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.1.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.1.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.2.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.2.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a03c85f259f400f3ad626ed448f8de06"
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5d1502cee18ca38bf9569a4f2900d035"
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7e822acd73e2feb8ca61f8aacdcc9f25"
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c172f544d6b820912a5d1279126b07e3"
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.2.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.2.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.2.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.3.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.3.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "ea7119633580bd91b68e726d11ce41bf"
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "edc4493565017e3614f855e31a8b9cea"
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e70639e61c5a6f828e70f53c956c7a5b"
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "54cce2674637e5a9a9b724d8abd43d5b"
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.3.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.3.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.3.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.4.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.4.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "62990000ac40d33b5e13e80a6794e67d"
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9cb8aa1c245fb018feb6cbc935dbfe40"
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "87ecc2cdf173992e37c6e22b776da3c1"
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8e353bc00035e776d9db63e7d5196bb4"
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.4.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.4.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.4.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.5.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.5.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "70bcb66e8cf3b0af54f269770cb4a75f"
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "25d76912d6a3c86237e5cbc316967078"
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "49d47a73555153bb2507b20d9bd04774"
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cbdf427b1e0acda5b18d6dcdb636460f"
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.5.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.5.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.5.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.6.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.6.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "e44ccd97c2fcb8364ca54290494bff5f"
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ced8e045499bec3933817d6953afe681"
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "817fa4fc575c020e227a82065a0c0ebb"
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c5087115c379bdb08e441defb3c6884c"
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.6.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.6.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.6.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.7.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.7.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "8626b889867fe49ec7f6423d10fbea38"
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "08f7521d12af06f4dc3005b63467301e"
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9083a533bca8129b86a454936dd3be31"
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "05e0fb5fa6e0a151dbbd29826d43d1a2"
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.7.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.7.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.7.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.8.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.8.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "79999b6e37dfb6ff24960a6ff5eae8f5"
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "80e4fc34fb71582c2691088376138e7b"
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b95bfd81c4a8d8176d170b1e6034ca7c"
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "95f356828a6135b35c54fa222f55c305"
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.8.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.8.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.8.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.9.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.9.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "52842279650a298ddeba0d927e2ffbca"
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ed6f01edc94144612c873b5c04b7ed3e"
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d488cc2a2c313f52f333c0dc99274ee4"
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d16baa55d9af207a1cbfb9976386735d"
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.9.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.9.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.9.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.10.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.10.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "89e8cc5017ea54b8dfcb39190473b7b7"
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "99a3e961945d71a0cec35bd853b33453"
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9c2be96534fae38bc36c210fa1c79ea9"
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2fe138d29ead13a985595e1bc8feb62e"
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.10.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.10.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.10.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.11.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.11.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "3d3a7cb57e3525893704ef5b90577cf6"
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "aa05a36c803f9c3f170792e037edbdb7"
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "30273495e93ff39265054d6e5dea870f"
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e74089f716018d9bf10283b8d3ece561"
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.11.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.11.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.11.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.12.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.12.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "16e47105dc1c0e85f0e994ebf39e953b"
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8eb1ec86ab7eeb2a709f75a0bba77ee0"
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c0ec0c74c648b0f53a9097b90e280ae4"
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "64aa5be14a58a85ed8a1bbe4489274c0"
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.12.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.12.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.12.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.13.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.13.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "20f4b8fa85b48dd5d408c9006ea39730"
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "763857f90cc3eab1994051b5d512edde"
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b7894130f44658e78d760cd5dc55703d"
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0831947aac962e67314d37cb09ddec32"
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.13.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.13.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.13.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.14.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.14.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a82e7b0dbb93f2eec513d953d6d64cc3"
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f5065c02abe656e842bb387bbf34e03d"
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "05e657b42e97ae7ef1bb1fb6e34bf234"
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51f7126252aa56c433965174f6ae8eb1"
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.14.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.14.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.14.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.15.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.15.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a99dc9d0a4f83c597d39f355d211261c"
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "467aaf4204905861b799c59e892214c3"
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7b8d903b91bbd9922e546bdb5d793b3c"
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "af905a61d3e62e1c40d17e9fab5bd16b"
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.15.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.15.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.15.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.16.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.16.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a94f062339b6a79734db0550f046531d"
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "12c180ae705fcce191cbaff8f3cfbe4d"
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f4e950d83deff4a32cba546438d5929a"
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "82674b200d22e463869c3c43a39b665e"
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.16.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.16.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.16.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.17.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.17.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "73699ef754e40aa5b8873257abce71bc"
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "985b5840b8ce0e375de207b3a5f8c0de"
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1745418f4676400a521012ed8ee6f076"
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "33800e5c32e92342b639417acd4dcfb1"
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.17.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.17.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.17.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.18.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.18.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "d8eff008543147da2e0b50398c898e0f"
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4be508de3d9252438aba4f647de6264b"
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a0da1461b1c30b225d718ba3f0b7af80"
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f7d5d7e457dfd1682b881bc8680c3ad6"
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.18.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.18.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.18.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.19.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.19.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "1d817f83be19dca2dd0aa5fb9005e0e7"
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0fa9918f677c5a00f073d2e86ec8d7b3"
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "80c2fad6fa1a0ba5d6066a9e259881f4"
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0c6cd38a76fd67e2d7abc5d9b6d2f4cd"
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.19.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.19.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.19.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.20.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.20.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "943bfdca7c057b2f1a7d2686821ad174"
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f9a846261b8fc87f398ab0a1cc8fb787"
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d618f1cae13906bee204a4da7da60711"
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6529c3c0446cb21b0526e3843b4fd948"
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.20.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.20.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.20.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.21.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.21.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "15dbda57f274cf542618cd7d8f2642dd"
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "84150ee0028376bdd451fc25900b4185"
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c8b8cea6013b424828512d64b2909012"
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b74ca5b23f0fa5238378a71c52495bcb"
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.21.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.21.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.21.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.22.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.22.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "8b428d8a7ed1dbbb3bd9f41a7781a026"
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "08e69d08505661f7551a8c57d4316820"
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "70b07c919d27e7fc5595380be4b158b6"
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51cd251c279e163f9a8b7f64b287ff37"
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.22.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.22.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.22.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.23.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.23.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "bdd83cdfcc8c25d5df7d211b9abd1295"
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a4642756149f1b308b86fdd97419214"
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d95ba4f66725445a62546074ea53818d"
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ff4b728677086705e97e96bdf9b6c29f"
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.23.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.23.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.23.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.24.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.24.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "3d92c34837d04ac9473cd614178dbe9b"
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ac4877752dfc1a86cbfe31f28bc6fdec"
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5788e8512001ff0cd3563119964fe040"
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8cd209791b3fe3f4c7fb7c2a9f5bcffe"
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.24.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.24.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.24.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.25.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.25.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "1cc83de03adc4be34a9f101d8458bed7"
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fd1bbffefbaf25795ef7f378c0ebe4f9"
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8b48d937058816c233df2b2cb7e21371"
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7cc7456591121088da5eee758d724977"
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.25.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.25.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.25.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.26.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.26.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "fbe3172066f94391ec218094d47effe0"
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9118afaa62dcbdcb41c31eadce88a92f"
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bf5757fbe6013d4e2b483c6d9d2042cd"
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "23a0b2af24c9ce6480e89d7c4fdc3420"
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.26.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.26.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.26.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.27.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.27.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "7cf3d78301737f206aefa5b477ff8fc3"
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "61daafc8f43b59c6d308e2633a0895a6"
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2c26d21b1c63f596add98bb5143492c6"
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "15ea8d0201aab14cc89e5cb37785f977"
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.27.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.27.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.27.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.28.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.28.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "06cbe75a6c667f5efab284447f13a0e6"
+ },
+ {
+ "dataPath": "params_shard_115.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d80b98733c25d4f79cdf2be5f080a042"
+ },
+ {
+ "dataPath": "params_shard_116.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "abb4e1d206b66220eed4d8bdc889b08c"
+ },
+ {
+ "dataPath": "params_shard_117.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8c8b216208b08dcaf88b2146c28bdb7d"
+ },
+ {
+ "dataPath": "params_shard_118.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.28.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.28.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.28.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.29.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.29.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "6dbe8312f9b5e1f0982e8b892756f968"
+ },
+ {
+ "dataPath": "params_shard_119.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "901d320d6c86427c0edf144d3d2a0b5c"
+ },
+ {
+ "dataPath": "params_shard_120.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2a24bc0e1dd267b68c7a1fe177d25d53"
+ },
+ {
+ "dataPath": "params_shard_121.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3977a531dafa2b60aee26c7b7f5dd9ff"
+ },
+ {
+ "dataPath": "params_shard_122.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.29.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.29.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.29.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.30.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.30.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "9d861f7c2991350e657600955ee7a929"
+ },
+ {
+ "dataPath": "params_shard_123.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f79c4877efac93448bbce943e63e14a0"
+ },
+ {
+ "dataPath": "params_shard_124.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "507be0ec8d8672267c475fbc32deef1c"
+ },
+ {
+ "dataPath": "params_shard_125.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "605496ad25e251edbc9462e980b474a8"
+ },
+ {
+ "dataPath": "params_shard_126.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.30.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.30.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.30.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.31.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.31.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "4a6c3e38d3efc654ab663dd5756ab24c"
+ },
+ {
+ "dataPath": "params_shard_127.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3a3dcfa6f5882671de2bcf6ef7713d15"
+ },
+ {
+ "dataPath": "params_shard_128.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5eee66ca8e0477316ed1c5f2d0514ad4"
+ },
+ {
+ "dataPath": "params_shard_129.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ce5ec5b9485fff8f11f13600b17c2fdb"
+ },
+ {
+ "dataPath": "params_shard_130.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.31.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.31.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.31.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.32.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.32.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "da8a6a861570c85ebd946ecb484c31cf"
+ },
+ {
+ "dataPath": "params_shard_131.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b9478d35558d6401767c99879841eb01"
+ },
+ {
+ "dataPath": "params_shard_132.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3664490b9465d3195ff797bf2a9cd057"
+ },
+ {
+ "dataPath": "params_shard_133.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d8d5493dbbd4f93991a39712e830a5f1"
+ },
+ {
+ "dataPath": "params_shard_134.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.32.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.32.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.32.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.33.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.33.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "ec855fb0d071f621cd9a8cb25a548508"
+ },
+ {
+ "dataPath": "params_shard_135.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b8cbdd03ec81e73ebdcade755d835348"
+ },
+ {
+ "dataPath": "params_shard_136.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "def6a9c5e8f6dda0a4bee7f77c2a17c3"
+ },
+ {
+ "dataPath": "params_shard_137.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "71b3d1f9f01f374a24e8addc59c1e02f"
+ },
+ {
+ "dataPath": "params_shard_138.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.33.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.33.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.33.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.34.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.34.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "7b9fee89096d9c8dd9db27bbf8b9506e"
+ },
+ {
+ "dataPath": "params_shard_139.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "df7bb42db4210ca3d9728960aed736b4"
+ },
+ {
+ "dataPath": "params_shard_140.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cf98ffea17c329afdf228eece5813470"
+ },
+ {
+ "dataPath": "params_shard_141.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "962959737c5f9b032aa38df86940f7a4"
+ },
+ {
+ "dataPath": "params_shard_142.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.34.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.34.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.34.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.35.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.35.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "d876828df99073e204111cbccccf1817"
+ },
+ {
+ "dataPath": "params_shard_143.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e0f66ff197c46575e6ceed2562dac7f4"
+ },
+ {
+ "dataPath": "params_shard_144.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2e17099e223959ed75ecfed3e4a20833"
+ },
+ {
+ "dataPath": "params_shard_145.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8ac3e43c814a1338d7aae590b2133039"
+ },
+ {
+ "dataPath": "params_shard_146.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.35.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.35.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.35.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.36.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.36.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a706c2e4e9360bf828d25e5215d0f8c6"
+ },
+ {
+ "dataPath": "params_shard_147.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ed6dde365aea49fd12a58526df50e537"
+ },
+ {
+ "dataPath": "params_shard_148.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "12046d09e74cf4be566b5ce91f8267d1"
+ },
+ {
+ "dataPath": "params_shard_149.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "78ba5b4f37352c7e7367add8a4e04486"
+ },
+ {
+ "dataPath": "params_shard_150.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.36.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.36.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.36.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.37.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.37.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "1a64525c20202bde63132e15e2bad4d1"
+ },
+ {
+ "dataPath": "params_shard_151.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "aea9c0bd272b054b31b300d9a1cd80c6"
+ },
+ {
+ "dataPath": "params_shard_152.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a7b7b3bc7accdc806222461d7931365"
+ },
+ {
+ "dataPath": "params_shard_153.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "485e616559fe9c2c444f7cbbe2e66e1c"
+ },
+ {
+ "dataPath": "params_shard_154.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.37.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.37.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.37.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.38.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.38.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "920dfd9b5496e048ea6fd82ce2b8750a"
+ },
+ {
+ "dataPath": "params_shard_155.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c595d4e3df3def50b47418cfdff16e26"
+ },
+ {
+ "dataPath": "params_shard_156.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "436a74975377a0e16e0efc983cde09de"
+ },
+ {
+ "dataPath": "params_shard_157.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0bd1df8b32b7f3ddd019cb2aae21128c"
+ },
+ {
+ "dataPath": "params_shard_158.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.38.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.38.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.38.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.39.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.39.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "15d886d86562b7fe39046afdeabbcd32"
+ },
+ {
+ "dataPath": "params_shard_159.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ad01b50c27ca63ffe7f5f3df9bf8290d"
+ },
+ {
+ "dataPath": "params_shard_160.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "edf503612f59edf7d6355eca975b6141"
+ },
+ {
+ "dataPath": "params_shard_161.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f5bc34da4a881064e2aff08a2ac7c1f9"
+ },
+ {
+ "dataPath": "params_shard_162.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.39.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.39.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.39.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.40.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.40.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "eaa533f9ce5908ecf60ccd7dc80881d0"
+ },
+ {
+ "dataPath": "params_shard_163.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f0fe216d86609c630df4af6de5aa0b6a"
+ },
+ {
+ "dataPath": "params_shard_164.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a8682b6da6ae4bb1b3df5ff71e63c39b"
+ },
+ {
+ "dataPath": "params_shard_165.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f8b230bc58165f171686c2c219e2b827"
+ },
+ {
+ "dataPath": "params_shard_166.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.40.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.40.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.40.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.41.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.41.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "23e05cbb42f9b1c85aff4ff74c929800"
+ },
+ {
+ "dataPath": "params_shard_167.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c17b864491ea836dc561700086748c81"
+ },
+ {
+ "dataPath": "params_shard_168.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d99c2609a8e53e906b98dd4fdf4e0c31"
+ },
+ {
+ "dataPath": "params_shard_169.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "19ab27129ee5a4329c92d614262339b9"
+ },
+ {
+ "dataPath": "params_shard_170.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.41.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.41.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.41.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.42.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.42.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "965a5e9cf3b3dcf5aac6688a8dcbb28b"
+ },
+ {
+ "dataPath": "params_shard_171.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9adaca8fa50e876723892fb3601b8b3c"
+ },
+ {
+ "dataPath": "params_shard_172.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f379aa793cb2c8da4b4f674767a64b53"
+ },
+ {
+ "dataPath": "params_shard_173.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0cc2e3704a25930074bf3c4146daf587"
+ },
+ {
+ "dataPath": "params_shard_174.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.42.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.42.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.42.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.43.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.43.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "ceeb7fa446b82f5519611fb75bcb1e73"
+ },
+ {
+ "dataPath": "params_shard_175.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "791b43015f4f501314ab722e388b6225"
+ },
+ {
+ "dataPath": "params_shard_176.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2cde58856c9af9c8ec0106197b148850"
+ },
+ {
+ "dataPath": "params_shard_177.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "98190f3a4f88dede59f598ddb91b2b94"
+ },
+ {
+ "dataPath": "params_shard_178.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.43.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.43.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.43.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.44.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.44.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "8e56f2a4be6b75ccf50158f14dd76acb"
+ },
+ {
+ "dataPath": "params_shard_179.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2318d5f199693812f581fac9f1b04e6b"
+ },
+ {
+ "dataPath": "params_shard_180.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b19ab81c417bff65aeee25784e74f8a2"
+ },
+ {
+ "dataPath": "params_shard_181.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1346a74cb2b723f7dae8738092fc9e27"
+ },
+ {
+ "dataPath": "params_shard_182.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.44.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.44.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.44.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.45.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.45.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "c4718063906715e3004929d9116bd783"
+ },
+ {
+ "dataPath": "params_shard_183.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0cfd8b0f322d50ef664a345575f0b9b9"
+ },
+ {
+ "dataPath": "params_shard_184.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "55510bc907509fa6c26b09d8d66e8879"
+ },
+ {
+ "dataPath": "params_shard_185.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "32deb7b195fcaabff18a174d9bbed193"
+ },
+ {
+ "dataPath": "params_shard_186.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.45.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.45.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.45.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.46.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.46.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "76cb6e7164301dd19bf705aff1f26e5d"
+ },
+ {
+ "dataPath": "params_shard_187.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "736efad18492120448e43c776b7e9a25"
+ },
+ {
+ "dataPath": "params_shard_188.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fb3c5f9e9c7663b8d13882f22a0f2aa4"
+ },
+ {
+ "dataPath": "params_shard_189.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c287e0602a073d45d28d3d3f1dfd9dd0"
+ },
+ {
+ "dataPath": "params_shard_190.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.46.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.46.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.46.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.47.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.47.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "934be68f81995621154452adad6676fd"
+ },
+ {
+ "dataPath": "params_shard_191.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f14e9a08a484031adf3a07f050e6ff24"
+ },
+ {
+ "dataPath": "params_shard_192.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7939af8318c6096f44610ae6f411f696"
+ },
+ {
+ "dataPath": "params_shard_193.bin",
+ "format": "raw-shard",
+ "nbytes": 389283840,
+ "records": [
+ {
+ "name": "lm_head.q_weight",
+ "shape": [
+ 152064,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 389283840,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63a4219bd8f0d5088b95588bd567597a"
+ },
+ {
+ "dataPath": "params_shard_194.bin",
+ "format": "raw-shard",
+ "nbytes": 48660480,
+ "records": [
+ {
+ "name": "lm_head.q_scale",
+ "shape": [
+ 152064,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 48660480,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f082397dddce00dec18bdcdf0448c1f2"
+ },
+ {
+ "dataPath": "params_shard_195.bin",
+ "format": "raw-shard",
+ "nbytes": 28047360,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.47.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.47.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.47.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.norm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "bfloat16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 28037120
+ }
+ ],
+ "md5sum": "97c68ec5e6f50b02655cd803ec64874c"
+ }
+ ]
+}
\ No newline at end of file
diff --git a/ndarray-cache.json b/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..3a847dcbebdffce8ad0f5120f5b4847b3560399c
--- /dev/null
+++ b/ndarray-cache.json
@@ -0,0 +1,7295 @@
+{
+ "metadata": {
+ "ParamSize": 533,
+ "ParamBytes": 9234108416.0,
+ "BitsPerParam": 5.001536828453907
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 389283840,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_weight",
+ "shape": [
+ 152064,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 389283840,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7932312201ae2761485f7d412eb0dbfe"
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 48660480,
+ "records": [
+ {
+ "name": "model.embed_tokens.q_scale",
+ "shape": [
+ 152064,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 48660480,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e8920c096ece303715da29d808f834ba"
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 20658176,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 14336
+ },
+ {
+ "name": "model.layers.0.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 18364416
+ }
+ ],
+ "md5sum": "0b571f3cb6e619d96c6d40630c3be1ff"
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0873eb6ddb15076ff9e499315425a609"
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.0.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "538a9140fd4d851564a8e5686c890abd"
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b459ee0e7734cf867044df5858581b06"
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.0.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.0.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.0.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.0.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.0.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.1.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.1.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "1a9657c43d2bea8e04a216f3be1b8e0f"
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1cee758ccca6cbe36975f5901632cb6a"
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.1.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "23967261fbec14b496b7fab724ada7c6"
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4747ff8880b109fc7cdac257c72e0909"
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.1.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.1.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.1.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.1.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.1.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.2.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.2.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a03c85f259f400f3ad626ed448f8de06"
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5d1502cee18ca38bf9569a4f2900d035"
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.2.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7e822acd73e2feb8ca61f8aacdcc9f25"
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c172f544d6b820912a5d1279126b07e3"
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.2.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.2.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.2.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.2.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.2.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.3.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.3.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "ea7119633580bd91b68e726d11ce41bf"
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "edc4493565017e3614f855e31a8b9cea"
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.3.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e70639e61c5a6f828e70f53c956c7a5b"
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "54cce2674637e5a9a9b724d8abd43d5b"
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.3.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.3.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.3.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.3.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.3.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.4.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.4.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "62990000ac40d33b5e13e80a6794e67d"
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9cb8aa1c245fb018feb6cbc935dbfe40"
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.4.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "87ecc2cdf173992e37c6e22b776da3c1"
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8e353bc00035e776d9db63e7d5196bb4"
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.4.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.4.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.4.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.4.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.4.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.5.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.5.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "70bcb66e8cf3b0af54f269770cb4a75f"
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "25d76912d6a3c86237e5cbc316967078"
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.5.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "49d47a73555153bb2507b20d9bd04774"
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cbdf427b1e0acda5b18d6dcdb636460f"
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.5.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.5.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.5.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.5.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.5.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.6.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.6.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "e44ccd97c2fcb8364ca54290494bff5f"
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ced8e045499bec3933817d6953afe681"
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.6.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "817fa4fc575c020e227a82065a0c0ebb"
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c5087115c379bdb08e441defb3c6884c"
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.6.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.6.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.6.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.6.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.6.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.7.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.7.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "8626b889867fe49ec7f6423d10fbea38"
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "08f7521d12af06f4dc3005b63467301e"
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.7.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9083a533bca8129b86a454936dd3be31"
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "05e0fb5fa6e0a151dbbd29826d43d1a2"
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.7.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.7.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.7.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.7.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.7.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.8.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.8.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "79999b6e37dfb6ff24960a6ff5eae8f5"
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "80e4fc34fb71582c2691088376138e7b"
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.8.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b95bfd81c4a8d8176d170b1e6034ca7c"
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "95f356828a6135b35c54fa222f55c305"
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.8.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.8.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.8.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.8.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.8.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.9.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.9.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "52842279650a298ddeba0d927e2ffbca"
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ed6f01edc94144612c873b5c04b7ed3e"
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.9.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d488cc2a2c313f52f333c0dc99274ee4"
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d16baa55d9af207a1cbfb9976386735d"
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.9.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.9.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.9.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.9.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.9.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.10.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.10.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "89e8cc5017ea54b8dfcb39190473b7b7"
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "99a3e961945d71a0cec35bd853b33453"
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.10.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9c2be96534fae38bc36c210fa1c79ea9"
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2fe138d29ead13a985595e1bc8feb62e"
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.10.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.10.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.10.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.10.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.10.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.11.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.11.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "3d3a7cb57e3525893704ef5b90577cf6"
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "aa05a36c803f9c3f170792e037edbdb7"
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.11.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "30273495e93ff39265054d6e5dea870f"
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e74089f716018d9bf10283b8d3ece561"
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.11.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.11.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.11.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.11.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.11.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.12.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.12.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "16e47105dc1c0e85f0e994ebf39e953b"
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8eb1ec86ab7eeb2a709f75a0bba77ee0"
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.12.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c0ec0c74c648b0f53a9097b90e280ae4"
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "64aa5be14a58a85ed8a1bbe4489274c0"
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.12.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.12.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.12.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.12.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.12.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.13.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.13.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "20f4b8fa85b48dd5d408c9006ea39730"
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "763857f90cc3eab1994051b5d512edde"
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.13.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b7894130f44658e78d760cd5dc55703d"
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0831947aac962e67314d37cb09ddec32"
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.13.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.13.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.13.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.13.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.13.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.14.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.14.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a82e7b0dbb93f2eec513d953d6d64cc3"
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f5065c02abe656e842bb387bbf34e03d"
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.14.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "05e657b42e97ae7ef1bb1fb6e34bf234"
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51f7126252aa56c433965174f6ae8eb1"
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.14.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.14.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.14.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.14.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.14.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.15.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.15.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a99dc9d0a4f83c597d39f355d211261c"
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "467aaf4204905861b799c59e892214c3"
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.15.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7b8d903b91bbd9922e546bdb5d793b3c"
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "af905a61d3e62e1c40d17e9fab5bd16b"
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.15.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.15.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.15.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.15.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.15.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.16.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.16.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a94f062339b6a79734db0550f046531d"
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "12c180ae705fcce191cbaff8f3cfbe4d"
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.16.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f4e950d83deff4a32cba546438d5929a"
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "82674b200d22e463869c3c43a39b665e"
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.16.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.16.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.16.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.16.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.16.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.17.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.17.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "73699ef754e40aa5b8873257abce71bc"
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "985b5840b8ce0e375de207b3a5f8c0de"
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.17.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1745418f4676400a521012ed8ee6f076"
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "33800e5c32e92342b639417acd4dcfb1"
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.17.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.17.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.17.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.17.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.17.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.18.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.18.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "d8eff008543147da2e0b50398c898e0f"
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "4be508de3d9252438aba4f647de6264b"
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.18.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a0da1461b1c30b225d718ba3f0b7af80"
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f7d5d7e457dfd1682b881bc8680c3ad6"
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.18.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.18.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.18.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.18.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.18.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.19.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.19.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "1d817f83be19dca2dd0aa5fb9005e0e7"
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0fa9918f677c5a00f073d2e86ec8d7b3"
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.19.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "80c2fad6fa1a0ba5d6066a9e259881f4"
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0c6cd38a76fd67e2d7abc5d9b6d2f4cd"
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.19.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.19.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.19.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.19.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.19.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.20.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.20.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "943bfdca7c057b2f1a7d2686821ad174"
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f9a846261b8fc87f398ab0a1cc8fb787"
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.20.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d618f1cae13906bee204a4da7da60711"
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "6529c3c0446cb21b0526e3843b4fd948"
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.20.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.20.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.20.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.20.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.20.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.21.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.21.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "15dbda57f274cf542618cd7d8f2642dd"
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "84150ee0028376bdd451fc25900b4185"
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.21.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c8b8cea6013b424828512d64b2909012"
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b74ca5b23f0fa5238378a71c52495bcb"
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.21.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.21.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.21.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.21.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.21.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.22.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.22.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "8b428d8a7ed1dbbb3bd9f41a7781a026"
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "08e69d08505661f7551a8c57d4316820"
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.22.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "70b07c919d27e7fc5595380be4b158b6"
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "51cd251c279e163f9a8b7f64b287ff37"
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.22.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.22.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.22.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.22.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.22.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.23.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.23.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "bdd83cdfcc8c25d5df7d211b9abd1295"
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a4642756149f1b308b86fdd97419214"
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.23.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d95ba4f66725445a62546074ea53818d"
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ff4b728677086705e97e96bdf9b6c29f"
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.23.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.23.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.23.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.23.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.23.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.24.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.24.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "3d92c34837d04ac9473cd614178dbe9b"
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ac4877752dfc1a86cbfe31f28bc6fdec"
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.24.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5788e8512001ff0cd3563119964fe040"
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8cd209791b3fe3f4c7fb7c2a9f5bcffe"
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.24.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.24.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.24.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.24.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.24.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.25.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.25.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "1cc83de03adc4be34a9f101d8458bed7"
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fd1bbffefbaf25795ef7f378c0ebe4f9"
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.25.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8b48d937058816c233df2b2cb7e21371"
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7cc7456591121088da5eee758d724977"
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.25.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.25.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.25.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.25.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.25.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.26.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.26.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "fbe3172066f94391ec218094d47effe0"
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9118afaa62dcbdcb41c31eadce88a92f"
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.26.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "bf5757fbe6013d4e2b483c6d9d2042cd"
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "23a0b2af24c9ce6480e89d7c4fdc3420"
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.26.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.26.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.26.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.26.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.26.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.27.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.27.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "7cf3d78301737f206aefa5b477ff8fc3"
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "61daafc8f43b59c6d308e2633a0895a6"
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.27.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2c26d21b1c63f596add98bb5143492c6"
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "15ea8d0201aab14cc89e5cb37785f977"
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.27.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.27.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.27.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.27.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.27.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.28.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.28.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "06cbe75a6c667f5efab284447f13a0e6"
+ },
+ {
+ "dataPath": "params_shard_115.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d80b98733c25d4f79cdf2be5f080a042"
+ },
+ {
+ "dataPath": "params_shard_116.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.28.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "abb4e1d206b66220eed4d8bdc889b08c"
+ },
+ {
+ "dataPath": "params_shard_117.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8c8b216208b08dcaf88b2146c28bdb7d"
+ },
+ {
+ "dataPath": "params_shard_118.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.28.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.28.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.28.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.28.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.28.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.29.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.29.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "6dbe8312f9b5e1f0982e8b892756f968"
+ },
+ {
+ "dataPath": "params_shard_119.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "901d320d6c86427c0edf144d3d2a0b5c"
+ },
+ {
+ "dataPath": "params_shard_120.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.29.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2a24bc0e1dd267b68c7a1fe177d25d53"
+ },
+ {
+ "dataPath": "params_shard_121.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3977a531dafa2b60aee26c7b7f5dd9ff"
+ },
+ {
+ "dataPath": "params_shard_122.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.29.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.29.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.29.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.29.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.29.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.30.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.30.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "9d861f7c2991350e657600955ee7a929"
+ },
+ {
+ "dataPath": "params_shard_123.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f79c4877efac93448bbce943e63e14a0"
+ },
+ {
+ "dataPath": "params_shard_124.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.30.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "507be0ec8d8672267c475fbc32deef1c"
+ },
+ {
+ "dataPath": "params_shard_125.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "605496ad25e251edbc9462e980b474a8"
+ },
+ {
+ "dataPath": "params_shard_126.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.30.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.30.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.30.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.30.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.30.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.31.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.31.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "4a6c3e38d3efc654ab663dd5756ab24c"
+ },
+ {
+ "dataPath": "params_shard_127.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3a3dcfa6f5882671de2bcf6ef7713d15"
+ },
+ {
+ "dataPath": "params_shard_128.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.31.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "5eee66ca8e0477316ed1c5f2d0514ad4"
+ },
+ {
+ "dataPath": "params_shard_129.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ce5ec5b9485fff8f11f13600b17c2fdb"
+ },
+ {
+ "dataPath": "params_shard_130.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.31.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.31.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.31.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.31.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.31.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.32.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.32.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "da8a6a861570c85ebd946ecb484c31cf"
+ },
+ {
+ "dataPath": "params_shard_131.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b9478d35558d6401767c99879841eb01"
+ },
+ {
+ "dataPath": "params_shard_132.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.32.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3664490b9465d3195ff797bf2a9cd057"
+ },
+ {
+ "dataPath": "params_shard_133.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d8d5493dbbd4f93991a39712e830a5f1"
+ },
+ {
+ "dataPath": "params_shard_134.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.32.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.32.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.32.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.32.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.32.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.33.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.33.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "ec855fb0d071f621cd9a8cb25a548508"
+ },
+ {
+ "dataPath": "params_shard_135.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b8cbdd03ec81e73ebdcade755d835348"
+ },
+ {
+ "dataPath": "params_shard_136.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.33.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "def6a9c5e8f6dda0a4bee7f77c2a17c3"
+ },
+ {
+ "dataPath": "params_shard_137.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "71b3d1f9f01f374a24e8addc59c1e02f"
+ },
+ {
+ "dataPath": "params_shard_138.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.33.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.33.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.33.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.33.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.33.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.34.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.34.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "7b9fee89096d9c8dd9db27bbf8b9506e"
+ },
+ {
+ "dataPath": "params_shard_139.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "df7bb42db4210ca3d9728960aed736b4"
+ },
+ {
+ "dataPath": "params_shard_140.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.34.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "cf98ffea17c329afdf228eece5813470"
+ },
+ {
+ "dataPath": "params_shard_141.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "962959737c5f9b032aa38df86940f7a4"
+ },
+ {
+ "dataPath": "params_shard_142.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.34.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.34.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.34.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.34.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.34.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.35.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.35.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "d876828df99073e204111cbccccf1817"
+ },
+ {
+ "dataPath": "params_shard_143.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "e0f66ff197c46575e6ceed2562dac7f4"
+ },
+ {
+ "dataPath": "params_shard_144.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.35.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2e17099e223959ed75ecfed3e4a20833"
+ },
+ {
+ "dataPath": "params_shard_145.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8ac3e43c814a1338d7aae590b2133039"
+ },
+ {
+ "dataPath": "params_shard_146.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.35.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.35.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.35.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.35.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.35.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.36.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.36.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "a706c2e4e9360bf828d25e5215d0f8c6"
+ },
+ {
+ "dataPath": "params_shard_147.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ed6dde365aea49fd12a58526df50e537"
+ },
+ {
+ "dataPath": "params_shard_148.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.36.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "12046d09e74cf4be566b5ce91f8267d1"
+ },
+ {
+ "dataPath": "params_shard_149.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "78ba5b4f37352c7e7367add8a4e04486"
+ },
+ {
+ "dataPath": "params_shard_150.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.36.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.36.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.36.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.36.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.36.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.37.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.37.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "1a64525c20202bde63132e15e2bad4d1"
+ },
+ {
+ "dataPath": "params_shard_151.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "aea9c0bd272b054b31b300d9a1cd80c6"
+ },
+ {
+ "dataPath": "params_shard_152.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.37.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "8a7b7b3bc7accdc806222461d7931365"
+ },
+ {
+ "dataPath": "params_shard_153.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "485e616559fe9c2c444f7cbbe2e66e1c"
+ },
+ {
+ "dataPath": "params_shard_154.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.37.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.37.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.37.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.37.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.37.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.38.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.38.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "920dfd9b5496e048ea6fd82ce2b8750a"
+ },
+ {
+ "dataPath": "params_shard_155.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c595d4e3df3def50b47418cfdff16e26"
+ },
+ {
+ "dataPath": "params_shard_156.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.38.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "436a74975377a0e16e0efc983cde09de"
+ },
+ {
+ "dataPath": "params_shard_157.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0bd1df8b32b7f3ddd019cb2aae21128c"
+ },
+ {
+ "dataPath": "params_shard_158.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.38.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.38.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.38.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.38.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.38.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.39.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.39.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "15d886d86562b7fe39046afdeabbcd32"
+ },
+ {
+ "dataPath": "params_shard_159.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ad01b50c27ca63ffe7f5f3df9bf8290d"
+ },
+ {
+ "dataPath": "params_shard_160.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.39.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "edf503612f59edf7d6355eca975b6141"
+ },
+ {
+ "dataPath": "params_shard_161.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f5bc34da4a881064e2aff08a2ac7c1f9"
+ },
+ {
+ "dataPath": "params_shard_162.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.39.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.39.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.39.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.39.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.39.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.40.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.40.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "eaa533f9ce5908ecf60ccd7dc80881d0"
+ },
+ {
+ "dataPath": "params_shard_163.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f0fe216d86609c630df4af6de5aa0b6a"
+ },
+ {
+ "dataPath": "params_shard_164.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.40.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "a8682b6da6ae4bb1b3df5ff71e63c39b"
+ },
+ {
+ "dataPath": "params_shard_165.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f8b230bc58165f171686c2c219e2b827"
+ },
+ {
+ "dataPath": "params_shard_166.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.40.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.40.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.40.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.40.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.40.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.41.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.41.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "23e05cbb42f9b1c85aff4ff74c929800"
+ },
+ {
+ "dataPath": "params_shard_167.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c17b864491ea836dc561700086748c81"
+ },
+ {
+ "dataPath": "params_shard_168.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.41.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "d99c2609a8e53e906b98dd4fdf4e0c31"
+ },
+ {
+ "dataPath": "params_shard_169.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "19ab27129ee5a4329c92d614262339b9"
+ },
+ {
+ "dataPath": "params_shard_170.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.41.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.41.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.41.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.41.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.41.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.42.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.42.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "965a5e9cf3b3dcf5aac6688a8dcbb28b"
+ },
+ {
+ "dataPath": "params_shard_171.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9adaca8fa50e876723892fb3601b8b3c"
+ },
+ {
+ "dataPath": "params_shard_172.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.42.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f379aa793cb2c8da4b4f674767a64b53"
+ },
+ {
+ "dataPath": "params_shard_173.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0cc2e3704a25930074bf3c4146daf587"
+ },
+ {
+ "dataPath": "params_shard_174.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.42.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.42.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.42.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.42.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.42.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.43.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.43.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "ceeb7fa446b82f5519611fb75bcb1e73"
+ },
+ {
+ "dataPath": "params_shard_175.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "791b43015f4f501314ab722e388b6225"
+ },
+ {
+ "dataPath": "params_shard_176.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.43.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2cde58856c9af9c8ec0106197b148850"
+ },
+ {
+ "dataPath": "params_shard_177.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "98190f3a4f88dede59f598ddb91b2b94"
+ },
+ {
+ "dataPath": "params_shard_178.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.43.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.43.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.43.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.43.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.43.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.44.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.44.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "8e56f2a4be6b75ccf50158f14dd76acb"
+ },
+ {
+ "dataPath": "params_shard_179.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "2318d5f199693812f581fac9f1b04e6b"
+ },
+ {
+ "dataPath": "params_shard_180.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.44.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "b19ab81c417bff65aeee25784e74f8a2"
+ },
+ {
+ "dataPath": "params_shard_181.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "1346a74cb2b723f7dae8738092fc9e27"
+ },
+ {
+ "dataPath": "params_shard_182.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.44.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.44.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.44.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.44.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.44.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.45.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.45.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "c4718063906715e3004929d9116bd783"
+ },
+ {
+ "dataPath": "params_shard_183.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "0cfd8b0f322d50ef664a345575f0b9b9"
+ },
+ {
+ "dataPath": "params_shard_184.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.45.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "55510bc907509fa6c26b09d8d66e8879"
+ },
+ {
+ "dataPath": "params_shard_185.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "32deb7b195fcaabff18a174d9bbed193"
+ },
+ {
+ "dataPath": "params_shard_186.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.45.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.45.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.45.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.45.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.45.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.46.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.46.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "76cb6e7164301dd19bf705aff1f26e5d"
+ },
+ {
+ "dataPath": "params_shard_187.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "736efad18492120448e43c776b7e9a25"
+ },
+ {
+ "dataPath": "params_shard_188.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.46.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "fb3c5f9e9c7663b8d13882f22a0f2aa4"
+ },
+ {
+ "dataPath": "params_shard_189.bin",
+ "format": "raw-shard",
+ "nbytes": 18350080,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.c_attn.q_weight",
+ "shape": [
+ 7168,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 18350080,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "c287e0602a073d45d28d3d3f1dfd9dd0"
+ },
+ {
+ "dataPath": "params_shard_190.bin",
+ "format": "raw-shard",
+ "nbytes": 30345216,
+ "records": [
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.46.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.46.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.46.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.46.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.46.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.layers.47.self_attn.c_attn.bias",
+ "shape": [
+ 7168
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 14336,
+ "byteOffset": 28037120
+ },
+ {
+ "name": "model.layers.47.self_attn.c_attn.q_scale",
+ "shape": [
+ 7168,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 2293760,
+ "byteOffset": 28051456
+ }
+ ],
+ "md5sum": "934be68f81995621154452adad6676fd"
+ },
+ {
+ "dataPath": "params_shard_191.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_weight",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f14e9a08a484031adf3a07f050e6ff24"
+ },
+ {
+ "dataPath": "params_shard_192.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "model.layers.47.mlp.down_proj.q_weight",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "7939af8318c6096f44610ae6f411f696"
+ },
+ {
+ "dataPath": "params_shard_193.bin",
+ "format": "raw-shard",
+ "nbytes": 389283840,
+ "records": [
+ {
+ "name": "lm_head.q_weight",
+ "shape": [
+ 152064,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 389283840,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "63a4219bd8f0d5088b95588bd567597a"
+ },
+ {
+ "dataPath": "params_shard_194.bin",
+ "format": "raw-shard",
+ "nbytes": 48660480,
+ "records": [
+ {
+ "name": "lm_head.q_scale",
+ "shape": [
+ 152064,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 48660480,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "f082397dddce00dec18bdcdf0448c1f2"
+ },
+ {
+ "dataPath": "params_shard_195.bin",
+ "format": "raw-shard",
+ "nbytes": 28047360,
+ "records": [
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_weight",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "f32-to-bf16",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "model.layers.47.self_attn.o_proj.q_scale",
+ "shape": [
+ 5120,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 1638400,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "model.layers.47.mlp.gate_up_proj.q_scale",
+ "shape": [
+ 27648,
+ 160
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 8847360,
+ "byteOffset": 14745600
+ },
+ {
+ "name": "model.layers.47.mlp.down_proj.q_scale",
+ "shape": [
+ 5120,
+ 432
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 4423680,
+ "byteOffset": 23592960
+ },
+ {
+ "name": "model.layers.47.input_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28016640
+ },
+ {
+ "name": "model.layers.47.post_attention_layernorm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28026880
+ },
+ {
+ "name": "model.norm.weight",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float32",
+ "format": "f32-to-bf16",
+ "nbytes": 10240,
+ "byteOffset": 28037120
+ }
+ ],
+ "md5sum": "97c68ec5e6f50b02655cd803ec64874c"
+ }
+ ]
+}
\ No newline at end of file
diff --git a/params_shard_0.bin b/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ca14c9a438f9d75b195d956b7f29556ef8a6b391
--- /dev/null
+++ b/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:139509596b7b0a732218c5ed325d61dd04e61f55aed3f64ebc758258232b50d6
+size 389283840
diff --git a/params_shard_1.bin b/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ca33209ba53ce03cae565b401fe11646abab0161
--- /dev/null
+++ b/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:132ecb8871a7ab26ce1234724f6f354f83b40e577f0cf4ee83977f1653b2d0bf
+size 48660480
diff --git a/params_shard_10.bin b/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..57f74ccd60c450e441af8b9c13cec5cf6b5c6a5b
--- /dev/null
+++ b/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37f561284fae1ef3a2640b3859b2ce3529948a13d793d17302a32a5a3dd6df2e
+size 30345216
diff --git a/params_shard_100.bin b/params_shard_100.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d961e3e070cebd043a0709c0564c1e95b73a7bcf
--- /dev/null
+++ b/params_shard_100.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a193ccfadb3dfb228301accd74fd2b137f32e03c2b8e26d56c49012a38637042
+size 35389440
diff --git a/params_shard_101.bin b/params_shard_101.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d7039e28a79b7627f97602d196b316ff2875ba49
--- /dev/null
+++ b/params_shard_101.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ed7847f761d06cf39db433b34ca99c2c3841b7f7fca18519daa63b87c746ea0f
+size 18350080
diff --git a/params_shard_102.bin b/params_shard_102.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2f615ad1359f94e2838054c3d21d9892d550cacb
--- /dev/null
+++ b/params_shard_102.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1330e98b2d84d0a17b125a4af2b434a1666d50103f1c8bdd646af77e97be9070
+size 30345216
diff --git a/params_shard_103.bin b/params_shard_103.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4edd58b9ad7408cccaf5fac789a686632eddc95f
--- /dev/null
+++ b/params_shard_103.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df8dce457f7543eefc9cde3ee196a230b9ff48e56fe08ba2806ec295d4b82d01
+size 70778880
diff --git a/params_shard_104.bin b/params_shard_104.bin
new file mode 100644
index 0000000000000000000000000000000000000000..28dba49058628eb9b48c504932f4be460f72bc32
--- /dev/null
+++ b/params_shard_104.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4629204593e9be2d209874d61e4f0d03354dc19526fb4fcfef8fffa93b33d52
+size 35389440
diff --git a/params_shard_105.bin b/params_shard_105.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6543d81a16e6013665b7fbaaba567599dfc2bde4
--- /dev/null
+++ b/params_shard_105.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:236372ccf608e8b2da75a9f0be8468ca5ad4d84325bab516cd22dbdb03513c37
+size 18350080
diff --git a/params_shard_106.bin b/params_shard_106.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c457c605f2235d99d2daecf00c9c66875ed4e8b0
--- /dev/null
+++ b/params_shard_106.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:030b16f63db66bdede0d01b1c16005b615854cab0f620a159c655157c47da0a3
+size 30345216
diff --git a/params_shard_107.bin b/params_shard_107.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1d40f82ea16057c81927bc02e6737551fad212f2
--- /dev/null
+++ b/params_shard_107.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b7ceb83b37812a1503eede839d89818d09481cf914deeacfe0fb28ce6b9750f9
+size 70778880
diff --git a/params_shard_108.bin b/params_shard_108.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8d372d2ecc5c0c5c54b80de4f8740f6892691ca3
--- /dev/null
+++ b/params_shard_108.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c7be15420ca4f4b5f997059bc162943d64cae6375efdf9b80e53120b1b8be58b
+size 35389440
diff --git a/params_shard_109.bin b/params_shard_109.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dbfa216793cf7543c5f4354f4051bc30c9bd1798
--- /dev/null
+++ b/params_shard_109.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3405c2c88fac19415b228f36c7d298d9c0a4980a3eb5006ad6977a1ce78d7202
+size 18350080
diff --git a/params_shard_11.bin b/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a827330aa8f36a2672c19fd48f107c8dea1a748c
--- /dev/null
+++ b/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c8bbe1198d8f32d7af9b06dd6983ff72669ab011bc13dab5aa4870107e875d8e
+size 70778880
diff --git a/params_shard_110.bin b/params_shard_110.bin
new file mode 100644
index 0000000000000000000000000000000000000000..db8f5bff67a7f7aad461f978f9a18c67a8c60b3a
--- /dev/null
+++ b/params_shard_110.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:12d96fa8a92c306b842a5c80ddc7fc414e9dbbac4a57fb7b5301db1e521246de
+size 30345216
diff --git a/params_shard_111.bin b/params_shard_111.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4dbcf4a6917f32d1fe41cf7f26ae43bf459b10ca
--- /dev/null
+++ b/params_shard_111.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d15269a5aab2b901d367ae8e5eebaf7a29c2d598406dcc7c7b83ded66998aa66
+size 70778880
diff --git a/params_shard_112.bin b/params_shard_112.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c0bc6219b637147227cf1a799e93e176dc33672e
--- /dev/null
+++ b/params_shard_112.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:780e3ff23b8ad093874c1b7671e49423ff5794aa76bdad9a32fb78ca33a75c67
+size 35389440
diff --git a/params_shard_113.bin b/params_shard_113.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fb3d09c36841a4a30262b8df400a856c798d1d16
--- /dev/null
+++ b/params_shard_113.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ac58393ecfd854e08a8467984c52052f50de550cf9eaebfdd4051c12a9b6f791
+size 18350080
diff --git a/params_shard_114.bin b/params_shard_114.bin
new file mode 100644
index 0000000000000000000000000000000000000000..aa1a04154e7f62e631ee44ee9b6525b333dcdf21
--- /dev/null
+++ b/params_shard_114.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:224907cd64bc4e539b5672199bbf5024e55ab62582c295b1e71cd126a7d5411d
+size 30345216
diff --git a/params_shard_115.bin b/params_shard_115.bin
new file mode 100644
index 0000000000000000000000000000000000000000..313fb4336351d10a4d5da36ac7e8346420377a11
--- /dev/null
+++ b/params_shard_115.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec74c0a53e39600df22fd13208aafe615a0909a272f7595745a08b5cd405d3e1
+size 70778880
diff --git a/params_shard_116.bin b/params_shard_116.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7724b95049d24026d92538fec258f6240c2a32be
--- /dev/null
+++ b/params_shard_116.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:aeec1aab325feb69a9db5a615015b3a9aea68937f1adb6dda43956109a3dd0ff
+size 35389440
diff --git a/params_shard_117.bin b/params_shard_117.bin
new file mode 100644
index 0000000000000000000000000000000000000000..51704a6b8d4dbfe0e01aa4621ec5c80d94f4a179
--- /dev/null
+++ b/params_shard_117.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:024af7954f6410d7a3044a02698e86e641cbcff5782e4adba040644e3fbc7d71
+size 18350080
diff --git a/params_shard_118.bin b/params_shard_118.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0811ae3b25b74d8ba88f485de1bd6c109df5302f
--- /dev/null
+++ b/params_shard_118.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b4dd082923f213caa06eec0ea11c7234a28fe27a4aa5e64afcca7c6b31c01123
+size 30345216
diff --git a/params_shard_119.bin b/params_shard_119.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a7a8f278264b0786aa9b045b7825029c7c686160
--- /dev/null
+++ b/params_shard_119.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c98e6d1e3cf0a270f1e422e8bd5904e975c435abdf66d229f0922537810f0310
+size 70778880
diff --git a/params_shard_12.bin b/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d69938743d2fa6143f967070ab00e1af9f42e693
--- /dev/null
+++ b/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2493be4de5486e2e85174ddb0d320a3c32b25681d3019d761f5ed358cc85a3aa
+size 35389440
diff --git a/params_shard_120.bin b/params_shard_120.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8fb916614b453bbc13be269db37c3b698bc467b8
--- /dev/null
+++ b/params_shard_120.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d504072a88f6e6e3697bb2f12786c05a11a2a43351e1a6dcee3f54e6cbf2f1bb
+size 35389440
diff --git a/params_shard_121.bin b/params_shard_121.bin
new file mode 100644
index 0000000000000000000000000000000000000000..58cd17177643dda01747e227201e67731b64e385
--- /dev/null
+++ b/params_shard_121.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62d772405ecd823c6b0f88aec8031f36ea9f6f8038450d54d2e935d0a477db13
+size 18350080
diff --git a/params_shard_122.bin b/params_shard_122.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0771abb3e1344ca0a9644640cf863c089d202587
--- /dev/null
+++ b/params_shard_122.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:75b042203b70e50d41d255c7d6e32709f2c93d8e90476e614f40efd7b2b1d64e
+size 30345216
diff --git a/params_shard_123.bin b/params_shard_123.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2d2e2e5d4c62493988d3d20d41220ec120f1772d
--- /dev/null
+++ b/params_shard_123.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da4b55ee33f22795dff3917a33c437fd2028cf32fed288f2058c70a3596de04c
+size 70778880
diff --git a/params_shard_124.bin b/params_shard_124.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3d8b5913dd49d4650f5d59918fb51ba10212b2db
--- /dev/null
+++ b/params_shard_124.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:473a20daff75ee819328f32a178fcbdfd6b397416c7a100f63447b8cd93044c1
+size 35389440
diff --git a/params_shard_125.bin b/params_shard_125.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9f1855731d04a3d38ff548618910cd1a16f2a6f3
--- /dev/null
+++ b/params_shard_125.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6f01077d5814cb68505746ffeef794588de20fe79b483f6cbbcbc8b9476a608d
+size 18350080
diff --git a/params_shard_126.bin b/params_shard_126.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d697ebd49b48e166af6fa15c41f33bdc4ae57193
--- /dev/null
+++ b/params_shard_126.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d7b301fa51953308b0d1c7ac7c7ac23571e4e21d9e7f4c9c9ebdab4fcc3150c
+size 30345216
diff --git a/params_shard_127.bin b/params_shard_127.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0a3c7bd2cace522b20f6bb031a8b7f212a1bc1fa
--- /dev/null
+++ b/params_shard_127.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be4f3ef496bab960e912e6052123ea2ffaf156db1e963b84a3a78ce64af997db
+size 70778880
diff --git a/params_shard_128.bin b/params_shard_128.bin
new file mode 100644
index 0000000000000000000000000000000000000000..619e39a8177ee8b4c51eb1fb0d1fae8ce4e14456
--- /dev/null
+++ b/params_shard_128.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:838ac75b3d175cf1b2587813f380d3f0f91ad0ffad512ab85486e81aeab59606
+size 35389440
diff --git a/params_shard_129.bin b/params_shard_129.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3d17ec350c9fae7368e8c993393a25625567ecc3
--- /dev/null
+++ b/params_shard_129.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:501fa602f874d34d8a8925f1800c42573862e6e7355868c3cc252e759602555d
+size 18350080
diff --git a/params_shard_13.bin b/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..905aeba6b307f5abdf990f51c4abde1aec4d2fa6
--- /dev/null
+++ b/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ceab39a078fde83222073d92230dede67fcafcedd0109664978b7c1e92e252a
+size 18350080
diff --git a/params_shard_130.bin b/params_shard_130.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cc3edf8df6063fc8d1c3ccaf2c5fc7068a0a577a
--- /dev/null
+++ b/params_shard_130.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:50e8435d7324bae8ff488db5ba87f071403664f4fe6ab906e51f8f07841d81e8
+size 30345216
diff --git a/params_shard_131.bin b/params_shard_131.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8852cd71164c86e983dced23d10e17836b7bd19f
--- /dev/null
+++ b/params_shard_131.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dbd809773e6e50c1df0d575e95292ea60bf1cc95de0220c4c44b3706638c2695
+size 70778880
diff --git a/params_shard_132.bin b/params_shard_132.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b30652e706df0a642658fb49317f5b23af7c7aae
--- /dev/null
+++ b/params_shard_132.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:82238a383bb6f2f3470de720a673b5a160657b8fec27b899a7d6aeb0e2ad3533
+size 35389440
diff --git a/params_shard_133.bin b/params_shard_133.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8af7043be455eb89f40e699236d6bb5cae71e6c1
--- /dev/null
+++ b/params_shard_133.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7370febf4e9da8d85c43d034ad84db1714ad474ca7b5b621232362790aa69ea5
+size 18350080
diff --git a/params_shard_134.bin b/params_shard_134.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6ab016b744b45def81967a5630de87c0a2dd9b28
--- /dev/null
+++ b/params_shard_134.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:faf6a6cabac28cb95bf7bf7af8e655d3b26120520509fd24428ee61f767a0e23
+size 30345216
diff --git a/params_shard_135.bin b/params_shard_135.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eb652840e5e07c451f3f5e7b386abef10f9de95e
--- /dev/null
+++ b/params_shard_135.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f64fe3995fc34aef0567349e1a303e99eb7c491e2cbb093d84d705f88b6761f4
+size 70778880
diff --git a/params_shard_136.bin b/params_shard_136.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2990c34e14b179385876dea1962eec644f3acdba
--- /dev/null
+++ b/params_shard_136.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1e28937cccf08e7064201fe1becb76c58dc3e7ab9753c3de7197e6176568cd4d
+size 35389440
diff --git a/params_shard_137.bin b/params_shard_137.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a5cb00f44a639e8cf2e453fa3e6328e061cea180
--- /dev/null
+++ b/params_shard_137.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c7e27f5b5eece0ee174baf83bd4a39609abf270ff0e2f17bea8c75c97fd1ddb
+size 18350080
diff --git a/params_shard_138.bin b/params_shard_138.bin
new file mode 100644
index 0000000000000000000000000000000000000000..217c025f1d11616cad60a71b4e56e3c47542ffa3
--- /dev/null
+++ b/params_shard_138.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9eb6c18365bc6157ed7019279afc1ab97aae49faf35b1b25e6efaa777bde2b37
+size 30345216
diff --git a/params_shard_139.bin b/params_shard_139.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6a72ba47a0ed4664c8b20fd4d02444ec1981ab27
--- /dev/null
+++ b/params_shard_139.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:40b5a84128fdc9bef66f36eed0b794499e371631879f3593d07fc37949eb6262
+size 70778880
diff --git a/params_shard_14.bin b/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..083e37544827601235562a80107d2dcab6a34fd3
--- /dev/null
+++ b/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8023f11ec6dcf25f01cc4acb447e4d18b8c1b54f97f5c875e11bff09c5a0751d
+size 30345216
diff --git a/params_shard_140.bin b/params_shard_140.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fabaf60683e338f6a2551b6142d917ee2cd6c60d
--- /dev/null
+++ b/params_shard_140.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8fb10b31037c236d30802e25fd02d05b16c52309b26b0235022ab8b9392f55e3
+size 35389440
diff --git a/params_shard_141.bin b/params_shard_141.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8f9249317c3859d5b763180c26c104e1bbda8427
--- /dev/null
+++ b/params_shard_141.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb805c2ca01ad2650c2635ffdf250b569a5fcabf74b9d21786fea0e441859727
+size 18350080
diff --git a/params_shard_142.bin b/params_shard_142.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06d46f0fa6c442e6d43b173cea10bd348f5b7526
--- /dev/null
+++ b/params_shard_142.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:56dbcb5c07d5fcf7e647234f98dfb0e857c84d5c5368fe4ff0593609c18069b1
+size 30345216
diff --git a/params_shard_143.bin b/params_shard_143.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0154b416904364a925e2628cf088e16799990eed
--- /dev/null
+++ b/params_shard_143.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:497e67d638640703f32c9baa63f825956a3a6ac8d384420dde2cbce44e072de9
+size 70778880
diff --git a/params_shard_144.bin b/params_shard_144.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a6c34d7e67a405ca5f8ecc6c4260dc0d6c6f46f9
--- /dev/null
+++ b/params_shard_144.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a416985bf9a79aca5e9555b6fe9a3d12a36be8748f7a17efc88ce67f306ba26b
+size 35389440
diff --git a/params_shard_145.bin b/params_shard_145.bin
new file mode 100644
index 0000000000000000000000000000000000000000..63045812c2a887824dc18f862279f1c2765b9634
--- /dev/null
+++ b/params_shard_145.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:278ba2637db0d4c56261141d9198b107063609621421e4db98c46df5f5d33643
+size 18350080
diff --git a/params_shard_146.bin b/params_shard_146.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ed758dfadacc6d42431c6606ed42d69785efae80
--- /dev/null
+++ b/params_shard_146.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d1261d25ec2cd7a08e534010028dc07b491a56be28a5f6bbcf9962962ae5b6cc
+size 30345216
diff --git a/params_shard_147.bin b/params_shard_147.bin
new file mode 100644
index 0000000000000000000000000000000000000000..45e0d7390875701acc3afb6ff12c0b8a3f788ea2
--- /dev/null
+++ b/params_shard_147.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:546b5983a94a1186b351eb880fa0d80c424f049a1f100374cc9eea9000148021
+size 70778880
diff --git a/params_shard_148.bin b/params_shard_148.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a0381d6ebde0c7db471e3591195795a729d9e838
--- /dev/null
+++ b/params_shard_148.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:609118744ece5026e544494bb9b112ffc220863075849e4e5a9bece98b4dd41d
+size 35389440
diff --git a/params_shard_149.bin b/params_shard_149.bin
new file mode 100644
index 0000000000000000000000000000000000000000..186f5514eee0ec83c55f9a1f0378aaceeb62da74
--- /dev/null
+++ b/params_shard_149.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7af10bf833e5c258280a71d0e171c087505435bd907a6584edbde0d97414049f
+size 18350080
diff --git a/params_shard_15.bin b/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..44e0f7acec43f33b9f63da4f1556e48e8aa7afca
--- /dev/null
+++ b/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab8ca4b83228260392ba25f7e777bbec407e6c8957d5480763aa6e2d68fc5941
+size 70778880
diff --git a/params_shard_150.bin b/params_shard_150.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36563f76860a5f057221f093fa25cd7874e9d302
--- /dev/null
+++ b/params_shard_150.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9dc419079066a8b27a5f2c28754a267d890c8ef928a68a02fb038ba12b6731a4
+size 30345216
diff --git a/params_shard_151.bin b/params_shard_151.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cbc66412f7e606f698ff94fc5a9392631157e103
--- /dev/null
+++ b/params_shard_151.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d8872118c12c803d8139d61631951e5fc01186e762eec25e5570352ab4c77da0
+size 70778880
diff --git a/params_shard_152.bin b/params_shard_152.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f3d4e40b14acefd24663a01b66d405ef96d2660d
--- /dev/null
+++ b/params_shard_152.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69bd7dd3f24cb6f1e34cdda13547c99e337dc13217da645e8ee0446005b0cbbf
+size 35389440
diff --git a/params_shard_153.bin b/params_shard_153.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ae0183f42ed94b52afef09986142f11a331cefbb
--- /dev/null
+++ b/params_shard_153.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d2185edc9258130e26d29fe586affb6f2ad033e15620718bb622f9a707320a70
+size 18350080
diff --git a/params_shard_154.bin b/params_shard_154.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9094024ebe023e965e7822fe7e59fedcea86dc40
--- /dev/null
+++ b/params_shard_154.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ed28fa7d9766ced31e11348e0b0e47679d314adeb39c3e6cadf2a5459eed1535
+size 30345216
diff --git a/params_shard_155.bin b/params_shard_155.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c1ae76ea4c8a21276a1aa5c60a7b05d7059ad114
--- /dev/null
+++ b/params_shard_155.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7c4fdef930cc762c3547145889d53373eed0d15d1ed40162197e9441714b5e6
+size 70778880
diff --git a/params_shard_156.bin b/params_shard_156.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9a5f23562e96b082b43b344da44ea21627a90b49
--- /dev/null
+++ b/params_shard_156.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3122907edbd10f494dc6571125a2738e9cc039e5d016324a38bbb51eeb1b1c60
+size 35389440
diff --git a/params_shard_157.bin b/params_shard_157.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0be5c8860e36e97b6ae1a390d25530ec2c0b55ff
--- /dev/null
+++ b/params_shard_157.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6842aa906012b8375b786f51e0cf7f5d294a77007ef2356ef7feb7b4c1ccd4a9
+size 18350080
diff --git a/params_shard_158.bin b/params_shard_158.bin
new file mode 100644
index 0000000000000000000000000000000000000000..be5c0593936ee3cca2f66ff2f3047d3dedea473f
--- /dev/null
+++ b/params_shard_158.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:56943f799951495bf6b118f1f5fd0cf792d662b0048f61d328fd4743caeb1a01
+size 30345216
diff --git a/params_shard_159.bin b/params_shard_159.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9db8b7c250d8d062ab57bb8146566be327844a80
--- /dev/null
+++ b/params_shard_159.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49dda371827b4dc79e0972309a4010e614d2ec5d4bffb8a87e28f00f58a533f6
+size 70778880
diff --git a/params_shard_16.bin b/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7e411d6c266743c680398715ac66b0472662e938
--- /dev/null
+++ b/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c2600736245bb5a0985538398d3475569b8fb428afec1cbeda45973023314672
+size 35389440
diff --git a/params_shard_160.bin b/params_shard_160.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cf562be2d93a402380421cbf2fd2e5e35c100df6
--- /dev/null
+++ b/params_shard_160.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7b93b0842d5cd5456cdc0bb48714eba144f23d70e47081091e6f8a44eecc75cc
+size 35389440
diff --git a/params_shard_161.bin b/params_shard_161.bin
new file mode 100644
index 0000000000000000000000000000000000000000..337b3ab9ed06b7d088c87d306458a29747659156
--- /dev/null
+++ b/params_shard_161.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a1ff6a43767f5b0d1e292d29e590c0927cb97c6212786869e51790eb19bbe9a
+size 18350080
diff --git a/params_shard_162.bin b/params_shard_162.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d18971fcb55dd3bc1ca14b15bf8714543c92495d
--- /dev/null
+++ b/params_shard_162.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:13586fbb97d42f1a145b3a0366fa863edf03d691e145da3e962922c7f9d46861
+size 30345216
diff --git a/params_shard_163.bin b/params_shard_163.bin
new file mode 100644
index 0000000000000000000000000000000000000000..12506981aade59ef96cf6ad982c210efda148759
--- /dev/null
+++ b/params_shard_163.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dd0f8b0c67cf3cee176de9fe7e64fe461171bd37419dc4b4ecdfaf071acbce82
+size 70778880
diff --git a/params_shard_164.bin b/params_shard_164.bin
new file mode 100644
index 0000000000000000000000000000000000000000..88260a3b33c79e5a30aacd3a7402195a5e3f43af
--- /dev/null
+++ b/params_shard_164.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:071f5db65e8489dfd8991539571f18d62c728cf7cd65b84bc56bed1d84d7b387
+size 35389440
diff --git a/params_shard_165.bin b/params_shard_165.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9bee080f991a201f9d9f1a82824602dab9ada4e9
--- /dev/null
+++ b/params_shard_165.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:32d006bfbe6547900d7ac210a6bd7f54e44de1f8d93978fe55159446601db81c
+size 18350080
diff --git a/params_shard_166.bin b/params_shard_166.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6dae78368fbdd3ea18d53fd18ba005dd49368616
--- /dev/null
+++ b/params_shard_166.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a955b3d745685c7c037b50f5b6ef8de1a5a1c7561b36d536afd201022cf68175
+size 30345216
diff --git a/params_shard_167.bin b/params_shard_167.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0cc3bcdbaefbcc8c3731d0624d706403ac02e17e
--- /dev/null
+++ b/params_shard_167.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9de5453887accc6e65942bb469ca00e5df1fed7623ea56f023ac169f2c331176
+size 70778880
diff --git a/params_shard_168.bin b/params_shard_168.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d46d7f8d0c8da8427853dd696189bfe0c1459ac9
--- /dev/null
+++ b/params_shard_168.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb61a90236f5e5dfa79d7c0d23ddcd82b0fb2e619c6b7b3641f86db660758abc
+size 35389440
diff --git a/params_shard_169.bin b/params_shard_169.bin
new file mode 100644
index 0000000000000000000000000000000000000000..efc0a531aea756a484e1d695d0b2bf2a1400509b
--- /dev/null
+++ b/params_shard_169.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b27761028b6a4794b6de45f5ff68e639d9068fbb6f098ae6f80e38ca89752ce6
+size 18350080
diff --git a/params_shard_17.bin b/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..36c60380581db7bf4b45f4f6b39ab78c0dbfa8ac
--- /dev/null
+++ b/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:14d982f8c8004da631c20551b941bf2e4299e8d59f70ddfaf6c422aa9a7b2847
+size 18350080
diff --git a/params_shard_170.bin b/params_shard_170.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f37c8e001f2ed7830ecee7f63ae317fce800560c
--- /dev/null
+++ b/params_shard_170.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fe11154ca7fbc4ef7748c3faf8d59ebcc2786fa6e61a8a42d7a3bba1fc13f3e2
+size 30345216
diff --git a/params_shard_171.bin b/params_shard_171.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4688ef6ba5ed9342d9c576d553014d08693dee53
--- /dev/null
+++ b/params_shard_171.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0e85de4e817a5fe8ebb702e7a64d47096c27d780f52c04deb5e0ef68ef2dcc2b
+size 70778880
diff --git a/params_shard_172.bin b/params_shard_172.bin
new file mode 100644
index 0000000000000000000000000000000000000000..460025ebb73a17511253a2da94fbf9e405d3a134
--- /dev/null
+++ b/params_shard_172.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2bb16857d719de5f079f18a80297d8d8f3d1065a3754a814cb2f12698d7b62a3
+size 35389440
diff --git a/params_shard_173.bin b/params_shard_173.bin
new file mode 100644
index 0000000000000000000000000000000000000000..17b8b6034b926c64dd2a793786f29a25b9002862
--- /dev/null
+++ b/params_shard_173.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:75f54ada1f995862493f4412ee7831e6df333ddad163deb6f039a20fcae4b536
+size 18350080
diff --git a/params_shard_174.bin b/params_shard_174.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5fe953c3e8041553cfdbf0a1399eb2b2355708d1
--- /dev/null
+++ b/params_shard_174.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:91f0a61acde603ac81650af77e8a5b8a005424ba865fb1a3a1897522947c5554
+size 30345216
diff --git a/params_shard_175.bin b/params_shard_175.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b1402caefbc6aded3ddde28a8b9106c1c9eb04a8
--- /dev/null
+++ b/params_shard_175.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0d70137f94fdd11d96ec57b71b3a5853b848d276ad6d6909b2e9d100678ec79a
+size 70778880
diff --git a/params_shard_176.bin b/params_shard_176.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6d00c147dfd50eab0f61bfafbb92729f44575cbf
--- /dev/null
+++ b/params_shard_176.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ce87af5fbddd357d8a43335fc725230047dc76bea6f84da239e535662cfd627e
+size 35389440
diff --git a/params_shard_177.bin b/params_shard_177.bin
new file mode 100644
index 0000000000000000000000000000000000000000..80f5ba34a2e8b68c8c45db92f2529e1b18964aee
--- /dev/null
+++ b/params_shard_177.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:abe227369d262d2e45861637c85c55236cb1b1e03b39b4eb613157537a9a5d5b
+size 18350080
diff --git a/params_shard_178.bin b/params_shard_178.bin
new file mode 100644
index 0000000000000000000000000000000000000000..631924c23f60721dc623dac145275f1fbbf0e28c
--- /dev/null
+++ b/params_shard_178.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:383cb3a6b901aaa94e66ba4b0e8046ec65218e760a751963a6a30ec94cd4360e
+size 30345216
diff --git a/params_shard_179.bin b/params_shard_179.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3200353a79fa917151fdb3a154693291069cae74
--- /dev/null
+++ b/params_shard_179.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a3a6f26384b42d3471e91e06bd924a797465686c3a91c0bebfe62daa65808ac4
+size 70778880
diff --git a/params_shard_18.bin b/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7c268b90bbd3885ad62d6a06db3bcb4f790c5f86
--- /dev/null
+++ b/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b38345b6887b797378f67482ce04360d2e0913584e601184776c9f5998c7a7f
+size 30345216
diff --git a/params_shard_180.bin b/params_shard_180.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf509a1bbc3f972a648dafc3a3ee6435200f609b
--- /dev/null
+++ b/params_shard_180.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:07afe75c283b6d52e2225912d562b1f5da85125afacf33321d9f3bcef818aea4
+size 35389440
diff --git a/params_shard_181.bin b/params_shard_181.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e448648662387100b84005496b7fddf6b7525e37
--- /dev/null
+++ b/params_shard_181.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:36fe3d6a1d8a2f180322bf1ac55068d77cd0473055b8c1e481333534e4be172e
+size 18350080
diff --git a/params_shard_182.bin b/params_shard_182.bin
new file mode 100644
index 0000000000000000000000000000000000000000..20b6aee38c39e3e7d0bea01003f9f07d4f3c1a52
--- /dev/null
+++ b/params_shard_182.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:21270cde6a786177765a05f75f4728c099e8599562da84c2a8c9b08113195a91
+size 30345216
diff --git a/params_shard_183.bin b/params_shard_183.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f025733d36f20127b5169a54143abdb59acf9a81
--- /dev/null
+++ b/params_shard_183.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:339ab3625d2863618deb8e1e5d750d5f8922f3f98fd293dca2b0e310ee2143aa
+size 70778880
diff --git a/params_shard_184.bin b/params_shard_184.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d9c03dd823b5b9378a514acf30835d54a498237a
--- /dev/null
+++ b/params_shard_184.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:67a8af4279428da135913f4969d98a6140bfb8cc8d9e6d1d3903d407aa2ea168
+size 35389440
diff --git a/params_shard_185.bin b/params_shard_185.bin
new file mode 100644
index 0000000000000000000000000000000000000000..222ee167f5137cace91edafc842cc27ff389305a
--- /dev/null
+++ b/params_shard_185.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d3674a077af3337c5494bb0edb70ebf3c0bc04cca488222c1ccd684a5e73e3e
+size 18350080
diff --git a/params_shard_186.bin b/params_shard_186.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a4f12072ce90aa8fcb7ef151b7363da1089d70d4
--- /dev/null
+++ b/params_shard_186.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7e9cef80a6cd0bd80565339fb1e2f86613ce11f0867cb9e11751bcf3b0f0ce58
+size 30345216
diff --git a/params_shard_187.bin b/params_shard_187.bin
new file mode 100644
index 0000000000000000000000000000000000000000..482750b7940d792d69d7e67f1c387e243535e80d
--- /dev/null
+++ b/params_shard_187.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:72ea88c90be66ccedc14347c8b7db53e9c21335cf6831a1263362245ec37271b
+size 70778880
diff --git a/params_shard_188.bin b/params_shard_188.bin
new file mode 100644
index 0000000000000000000000000000000000000000..23c62c9e0c35a080250f725e847d87361d532ec8
--- /dev/null
+++ b/params_shard_188.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:36e5f989bc2f62a6dc4323647514f9c1a19a6f8de13f68a1ee27ed786157d1e2
+size 35389440
diff --git a/params_shard_189.bin b/params_shard_189.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c67636fe0fda54d29e9c6e6e648d30a28cc34853
--- /dev/null
+++ b/params_shard_189.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d67c4d3e6d215915289b4cc5ca61e432a28ca0b8e095b4c227f16986d7421801
+size 18350080
diff --git a/params_shard_19.bin b/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..79fce1cfdd79727edc33a1e6da312108503e5410
--- /dev/null
+++ b/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:dc321a0638076bbb674f3e6f66f0e9b3ccc2c1140ff356e9a995212893c90f27
+size 70778880
diff --git a/params_shard_190.bin b/params_shard_190.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f8ba65180a7f68b67fd9c1ede2832ca309d59d1d
--- /dev/null
+++ b/params_shard_190.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:10561cda9827f21e639f8bff3353316a85ba673a200e95800fc135aa18abe7dd
+size 30345216
diff --git a/params_shard_191.bin b/params_shard_191.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1f517b010cd16c8706b0e29209710a479192428d
--- /dev/null
+++ b/params_shard_191.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e621269eb08036bf756be8b3c34a9036ddad132894324cc09b514aa0b0f89e2f
+size 70778880
diff --git a/params_shard_192.bin b/params_shard_192.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dcf33f762c1df4543e703ab80f29c1748d57b707
--- /dev/null
+++ b/params_shard_192.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:18a1284e379b69f1e57cb8164977fabdd4858cda253ed9e57d6257435f4740a0
+size 35389440
diff --git a/params_shard_193.bin b/params_shard_193.bin
new file mode 100644
index 0000000000000000000000000000000000000000..650c51012cb1b97db3f8fe6f4c23104f83e9ff15
--- /dev/null
+++ b/params_shard_193.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3cb9f56e0e2a68a98f58ac731c22aba970e7152294a6886cc060fed508b437a
+size 389283840
diff --git a/params_shard_194.bin b/params_shard_194.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a7671e1e5f5829b68b089aa72f5531a88c803222
--- /dev/null
+++ b/params_shard_194.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b59bd5b339acf7ac2460d066d88dc344a3b14a9219a6cdcd1c43de698cb5e1f7
+size 48660480
diff --git a/params_shard_195.bin b/params_shard_195.bin
new file mode 100644
index 0000000000000000000000000000000000000000..befd0912c0e0530db07cae77894a3cde451985e9
--- /dev/null
+++ b/params_shard_195.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3c3cc2e50c18335652ed225ff25e6ccb6a050b4c5dd74c0d263b491aa7c6c77a
+size 28047360
diff --git a/params_shard_2.bin b/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bbed3d6d72be6a338f1da6e017601b0f3a08466c
--- /dev/null
+++ b/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b901eb1c06db2750238a3e5821863d9d6868393050e78c5c7cec44b0d1b8fe34
+size 20658176
diff --git a/params_shard_20.bin b/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f9633d729d1bb98db6f2ecc4643c697dfb70dcca
--- /dev/null
+++ b/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:45c01618b8389d268d0b9f4bb78c67044f0df4aeb851fe7e7ad0b6c5f1b59e63
+size 35389440
diff --git a/params_shard_21.bin b/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..276d6c5ecc82626fef935f607b0704056ebe4290
--- /dev/null
+++ b/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2d81d9aea8104abecbb4987bba156d52e20aef165af1d556f70688ba03607f67
+size 18350080
diff --git a/params_shard_22.bin b/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9b6d3eb290625a7095fbc521f20b94c54010a5bc
--- /dev/null
+++ b/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b6a6ed477ff8e8467d35f37244054978d40a9a2a605752b683818fe82977f26
+size 30345216
diff --git a/params_shard_23.bin b/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1cb0e537a8ffa826c42706d26e2ddca8e4425643
--- /dev/null
+++ b/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cc26cddcede9709746957cff7811fe5dc3c5adfbba4e287950771293a9e64dd8
+size 70778880
diff --git a/params_shard_24.bin b/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..27e79f740820786cea8732f247b6d56b8d18e74b
--- /dev/null
+++ b/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a8151a51bbfd38e374888f6ef8d5c2d9cff5f5608861b861cfb158318096d782
+size 35389440
diff --git a/params_shard_25.bin b/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..06fd370d89dd0bd4296b0bef396a4051d9d32e53
--- /dev/null
+++ b/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bdd30f49b45d4c10c563b1a893be1f6e403468391737d99325ae1bd975114f42
+size 18350080
diff --git a/params_shard_26.bin b/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8724ca42282e447b546e06379796c9b896318021
--- /dev/null
+++ b/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cd2e641267d4e0e700afaaa3a671b9d2a4cb3fdcc8203ec02a2f28b3db3c7d65
+size 30345216
diff --git a/params_shard_27.bin b/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d48a7faa14e42158a7d11c465ff2ec1fc9d42ab3
--- /dev/null
+++ b/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:243d4d3fcf526f82e835ee84d581175f783bce0a399e3aafe5ea94288c45e366
+size 70778880
diff --git a/params_shard_28.bin b/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..af47fc2b9fcfafef995461a2bc404ba41c67b45d
--- /dev/null
+++ b/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:131a728b920114319999ecff20583d6915f07513de4f4e99409ec311745a98cc
+size 35389440
diff --git a/params_shard_29.bin b/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bf637f71136930525f98294eb46df576a9c71866
--- /dev/null
+++ b/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:59b17d5862db96011675b24aac514914c4b1f14a45c27f190fc9d3b9d751ab60
+size 18350080
diff --git a/params_shard_3.bin b/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a5a86d1eac48766f2cc5eb3afe70836cc8b30c91
--- /dev/null
+++ b/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9b00bd602c520b7be050873857d14514200fd2d6f83738e6ca9178b89127c1db
+size 70778880
diff --git a/params_shard_30.bin b/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..470ab921fc8d8cbd73267d3716e2e717cb58efcb
--- /dev/null
+++ b/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:080b8b3d93225b8ec76b487abcafe6df4ae6c8b0259106766cc4e75563346daa
+size 30345216
diff --git a/params_shard_31.bin b/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dc4f252e6bbe89ef804ea846375c3e9276cf3a07
--- /dev/null
+++ b/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6eb54a6755ced7c4a4be98ae103d2fe6d390ca12665054587f0ee3230a2f45af
+size 70778880
diff --git a/params_shard_32.bin b/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b48234e035e9d4a18cc46756e4b715da559741f
--- /dev/null
+++ b/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c52e14422e8a749c6003f025779be7fcde2a89ef86c087e315795a1f2fd30866
+size 35389440
diff --git a/params_shard_33.bin b/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8e3f041223bf5350383208e859e3c188bbbaf470
--- /dev/null
+++ b/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e2c16af1e3219168a88eddb0a72106eaa710d0cfd114a467b388ea71cf6786bc
+size 18350080
diff --git a/params_shard_34.bin b/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b5159900ea41bbad05535c11346eaf0faaa33b5
--- /dev/null
+++ b/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d94eced738525a76e8deed872c5aec82e0d0e3e9b513d6b52fc1faa2cf8baca7
+size 30345216
diff --git a/params_shard_35.bin b/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..810cbe11b8953489d6c361e0d2452ddf65e42e0c
--- /dev/null
+++ b/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d965b956ad78a8d275ace4d9bb23f9f1f08e71b2fed9b2a0bf131d6aa6f1f1c
+size 70778880
diff --git a/params_shard_36.bin b/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b36d700e296285cce31fd9ca049fcb3e79e009f
--- /dev/null
+++ b/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:560e7888629806a0f4f111e977b84cda37e580d21f17acea64d223f9bb5b90e4
+size 35389440
diff --git a/params_shard_37.bin b/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..96c948878a9e48aa2e20ff7c7fd4457e81b339e6
--- /dev/null
+++ b/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f7e547f6261899aa1ed9fba0dfd718acca733144be7af076f4317f25e033e278
+size 18350080
diff --git a/params_shard_38.bin b/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..720a6a86358f8286258e902d87bde81efc436fe1
--- /dev/null
+++ b/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f00109b948614e0b97e1f8a4392c0b81377f7ececf70c525c8b0da01c912b015
+size 30345216
diff --git a/params_shard_39.bin b/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..60195590a79df084d23922ae6b211a37918282e2
--- /dev/null
+++ b/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2313a1fbfd0adcfd4c5d000693b19b993d3c0389b211748b279c08a8b19ad614
+size 70778880
diff --git a/params_shard_4.bin b/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..53c26e06c31d9ae102e55e6b5eec2890b772f4ed
--- /dev/null
+++ b/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:12d35d6d60eb8fe1d5c5d6364287510ef4f71b063d490cdbec18144bbf8f4dd4
+size 35389440
diff --git a/params_shard_40.bin b/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..080a6633855eae2a3368621e822aa21b59f6d586
--- /dev/null
+++ b/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8030fec3eb14bc1a5547b39371efb4f51cfb722e5b829c839aebd2f20a180cc7
+size 35389440
diff --git a/params_shard_41.bin b/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a8d1957edb506de0571fd94e0b0a532ebaee2bff
--- /dev/null
+++ b/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a033e22a3fc24c50c84b5838279873bf4bfe6fa7330e92261372f930f078929c
+size 18350080
diff --git a/params_shard_42.bin b/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7cdc33938473a2068990fa5f9fc51af47e64f29f
--- /dev/null
+++ b/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfa9ad8c3a7df7912e84680af41bbca21cae7944f6e6d167ff555468ca280760
+size 30345216
diff --git a/params_shard_43.bin b/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9468e93aa04643fa9936e4fd73bd714f8740d3ae
--- /dev/null
+++ b/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6be2c55d2e6be837a094a067e7d75804140a307bf5ad3bd7a5d57897f3087482
+size 70778880
diff --git a/params_shard_44.bin b/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7bad2353bf8d9961496ca4c8391fe95bf620911e
--- /dev/null
+++ b/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e03f9675ded9e8ffdb9c0f65279cfda178a5218d430c047153580242bbb07046
+size 35389440
diff --git a/params_shard_45.bin b/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8cceb39debb7665159799ffe3c9fe7d896605c5e
--- /dev/null
+++ b/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b389f792f69a50286b91ca6bbe91b96595eec78051e4f646b9ec7eecc8488435
+size 18350080
diff --git a/params_shard_46.bin b/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..066e4e255f715dc989960250f814b2edae739a38
--- /dev/null
+++ b/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3230a5c114db87b546bb21f9839c59bfe7116e8612e334f303eeddc1c961ec0b
+size 30345216
diff --git a/params_shard_47.bin b/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..04de527e56cc1b297dbb4b49bd57ea70ae12af28
--- /dev/null
+++ b/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b8b9455b7e72301665ea43dfaa31366d13158276f30eab1834f0c8a49d480b87
+size 70778880
diff --git a/params_shard_48.bin b/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e7607049121293bc3ca820cebacbf971a0d38633
--- /dev/null
+++ b/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62166767b93de0482905c53df6c88a368c375e08de95e15cee3d0fca92e0d6ba
+size 35389440
diff --git a/params_shard_49.bin b/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c385050527ef0f48af3e82e0bee3d71d99abc43d
--- /dev/null
+++ b/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5a8e31bdb460b53dc35c412f7f1fd3ad841c64396fe4fd470767a6b4114814ed
+size 18350080
diff --git a/params_shard_5.bin b/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2d06651047d0b932d60e502fb282d66cc84c9798
--- /dev/null
+++ b/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b51af6446d3afb5d61461fbebf38a7135f424b0e0493b44f574f753dbe24074
+size 18350080
diff --git a/params_shard_50.bin b/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..770b92cd9c4384c04ba099493d8dcf65715bf794
--- /dev/null
+++ b/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1f61468c632f6386260f46baff11030ab35d729fa2e534465adafca449515814
+size 30345216
diff --git a/params_shard_51.bin b/params_shard_51.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a9a6da5812f8099b391157385dbab457efa21e28
--- /dev/null
+++ b/params_shard_51.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a15f1c37d3fef108b758f855642b4961f1166c0234d5545b00509d63b62dee73
+size 70778880
diff --git a/params_shard_52.bin b/params_shard_52.bin
new file mode 100644
index 0000000000000000000000000000000000000000..78bc3c946ec5d1777d6d9cb1962b99965dd7242c
--- /dev/null
+++ b/params_shard_52.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b6ef98f885d557c85aa32459e20969b1504dcd3f626e0aff9c8c0a89335e53e9
+size 35389440
diff --git a/params_shard_53.bin b/params_shard_53.bin
new file mode 100644
index 0000000000000000000000000000000000000000..938d3c6a672d846118f6f7a19abdbe4da783f93b
--- /dev/null
+++ b/params_shard_53.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e9c7d8d14f15cd98af5f1222cb5a8d481cffa60ac5804a88c50cd8a030930b57
+size 18350080
diff --git a/params_shard_54.bin b/params_shard_54.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8ad033f1dc99a8d7111f8440c848fca09e3d1cb1
--- /dev/null
+++ b/params_shard_54.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:00fa2e15a418b5ee3a0e8079c38fb218eeaf1cfdbcb662c63e4b54d2ac9346b1
+size 30345216
diff --git a/params_shard_55.bin b/params_shard_55.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c076c122a52957b01a9e92e8079a62fd6ee8e0b0
--- /dev/null
+++ b/params_shard_55.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ccc7ba4255f4213bdd2c9651daf909366ed9000dbc47ea310f0e5c84774187cc
+size 70778880
diff --git a/params_shard_56.bin b/params_shard_56.bin
new file mode 100644
index 0000000000000000000000000000000000000000..99218efc0aacba33af368d1867f55e26959f946e
--- /dev/null
+++ b/params_shard_56.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7288d5e2cbb1eba0d23834a4d8f1b944ff7d5eef18e2675a4ce1804e199dfa54
+size 35389440
diff --git a/params_shard_57.bin b/params_shard_57.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ebbfde91da1a2e271a31f964f47547a0b9344cc5
--- /dev/null
+++ b/params_shard_57.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bca338a4bc8d2a0cc57c842fd2db8b9c12f6ecc20753c2ab43871942a6f98d2a
+size 18350080
diff --git a/params_shard_58.bin b/params_shard_58.bin
new file mode 100644
index 0000000000000000000000000000000000000000..89cfd9d1d89812b9008f8bcec0ba54c000257e7c
--- /dev/null
+++ b/params_shard_58.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be0b0fd5c49b2af30f2871547b0ffa685d5e26a19a9c75c804ec32f3d49c4df0
+size 30345216
diff --git a/params_shard_59.bin b/params_shard_59.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3de2d73c64ea80d81ecea8496323b46113952997
--- /dev/null
+++ b/params_shard_59.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:45e0c57c43d2bf28062433266b4daddd7dae6516f876ca4cc87157cf4ea0a11b
+size 70778880
diff --git a/params_shard_6.bin b/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1cadc2fa1cffac5b3b226ca4d3f093221259d472
--- /dev/null
+++ b/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8bf7971cf88c65b4e9ef761f0ddb3265f1a0080dc35471340476f5f72a08f50a
+size 30345216
diff --git a/params_shard_60.bin b/params_shard_60.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b8f676b1551391e553d0f5b6cb247d418bb4bb9
--- /dev/null
+++ b/params_shard_60.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:812126f7a86f6015e24f4afccd5cf46e66f2df34b1b3632692ec1dd5af654d20
+size 35389440
diff --git a/params_shard_61.bin b/params_shard_61.bin
new file mode 100644
index 0000000000000000000000000000000000000000..302d4fa2e99803961737c1f2ea1fbc2197ecbd78
--- /dev/null
+++ b/params_shard_61.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d0f6ba3fd4f13b5facba10e9de50b4a65fb106f0366190e330b14f66ab60f34
+size 18350080
diff --git a/params_shard_62.bin b/params_shard_62.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e760b34e65d6452bbc39133ce4814c919b932aa1
--- /dev/null
+++ b/params_shard_62.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4e5855d580004ccd9dd67a821be242281d197167293f1ce74969c435aff50d1
+size 30345216
diff --git a/params_shard_63.bin b/params_shard_63.bin
new file mode 100644
index 0000000000000000000000000000000000000000..30403b56a34335dcf5a72075f354c54faead5923
--- /dev/null
+++ b/params_shard_63.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:388c3f5ceeeb07337792b0d5ed859720fb70b27c9f739c13f1702e5179dd18b1
+size 70778880
diff --git a/params_shard_64.bin b/params_shard_64.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ee025964c213293c619636d3c1c8785f3aa455a5
--- /dev/null
+++ b/params_shard_64.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bc21f169df07ac63b036cc346a5c39951f0f3058fd10840787a69e35e722d9ba
+size 35389440
diff --git a/params_shard_65.bin b/params_shard_65.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d441de451ef165f254fb090c8ac2fed0da901ce6
--- /dev/null
+++ b/params_shard_65.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bdf64aff55f0a2d75f2ac1410ca844a447b153bd17d9713e167b61df435224e2
+size 18350080
diff --git a/params_shard_66.bin b/params_shard_66.bin
new file mode 100644
index 0000000000000000000000000000000000000000..78f770c46d333484c2f85fc825a30b2cb4eb7ca8
--- /dev/null
+++ b/params_shard_66.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8e31db32720ee988a48111da881f8e1b7cc646f46fe18f8eb3d2dcdf27f0628f
+size 30345216
diff --git a/params_shard_67.bin b/params_shard_67.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bc6cdf2fc3e34b81d99fac175ef481a52ad5e967
--- /dev/null
+++ b/params_shard_67.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f08e914c5ccc44b333ba39387b998c3a2a449441483b75938a86591367bc8fb9
+size 70778880
diff --git a/params_shard_68.bin b/params_shard_68.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ff3a432242792aaab210989cf5c8f74261273526
--- /dev/null
+++ b/params_shard_68.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e0bc8dc677a0d79748b7f694659d6ca3428c72e60ccdc3bf1f816e0f929362b7
+size 35389440
diff --git a/params_shard_69.bin b/params_shard_69.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9e093b321aa06df655bef7a2e427fd8d599e316f
--- /dev/null
+++ b/params_shard_69.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:24298d891e18651867bbbe2753a2d5b8e0c204f56e7a61e3db1f187c201082e3
+size 18350080
diff --git a/params_shard_7.bin b/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..706b768dbe764c91a40a009502a2c2528a062df8
--- /dev/null
+++ b/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ff78660f4f6a6095a64da45c0c4888f7bddaa7d1724ad147e75531eaaa42bddb
+size 70778880
diff --git a/params_shard_70.bin b/params_shard_70.bin
new file mode 100644
index 0000000000000000000000000000000000000000..22743e588f27f93c084e151e574b8521ff05e1cc
--- /dev/null
+++ b/params_shard_70.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bab120e84526bc9f326d1eb32e18cfeea4da237de2d7da865b80a2ff98d85811
+size 30345216
diff --git a/params_shard_71.bin b/params_shard_71.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8ed0a9cb1c4e787b26d4751f1babbc08c6a51b4c
--- /dev/null
+++ b/params_shard_71.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e48bb1c23344405d6d6d50b945ad3c010c16f304a8936c49e27aa7bacfa192ee
+size 70778880
diff --git a/params_shard_72.bin b/params_shard_72.bin
new file mode 100644
index 0000000000000000000000000000000000000000..af1e74582b550c7f8695b4c4b3caa3e8b95d7f52
--- /dev/null
+++ b/params_shard_72.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9f379bca1902c003b60071985c311101eb9016ab8c8c5808f3339ed88215874d
+size 35389440
diff --git a/params_shard_73.bin b/params_shard_73.bin
new file mode 100644
index 0000000000000000000000000000000000000000..df7abaf6f4cd6a5359191f1e90c1d8c7ce72845b
--- /dev/null
+++ b/params_shard_73.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5dced7ea1c7cf8f88404c4c2f4acc19b556c1f6d7f1777037954979afbee3d7e
+size 18350080
diff --git a/params_shard_74.bin b/params_shard_74.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c711f558b05a4648a73e697eab5d9adff824d01b
--- /dev/null
+++ b/params_shard_74.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a0bd79a44efce9d763fbd5c3d658daf0370880a515c8b2f8173655b092ff6af7
+size 30345216
diff --git a/params_shard_75.bin b/params_shard_75.bin
new file mode 100644
index 0000000000000000000000000000000000000000..00ceb351211c96535335f854cf152cf675338cd8
--- /dev/null
+++ b/params_shard_75.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ebf85c4491ecdef74e5350fde6250a9a0e55a8dd421298c9c2813d11eca5f611
+size 70778880
diff --git a/params_shard_76.bin b/params_shard_76.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3b1345a42ab8e75f612627309ab51ad9d27e40b9
--- /dev/null
+++ b/params_shard_76.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d4584ac8c299748470ae635d4c1868ece908e7ec89d47a16030006af50b4615
+size 35389440
diff --git a/params_shard_77.bin b/params_shard_77.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ca223cb512d3d1ac9a16a332984f505877e86c49
--- /dev/null
+++ b/params_shard_77.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:47442dbdcd8be60d5e87f28fa0911d77b6c626671c5d64b9196e31b147350766
+size 18350080
diff --git a/params_shard_78.bin b/params_shard_78.bin
new file mode 100644
index 0000000000000000000000000000000000000000..59dcca15b7520156b4ea59980511f2ca6ff1c54f
--- /dev/null
+++ b/params_shard_78.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e86d1e9b2ecbfae8704b2a63b8895062a002fd9b7c5a880267ba459fd4237ac
+size 30345216
diff --git a/params_shard_79.bin b/params_shard_79.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e19a3ea40d152bd4cdfa9ab2cafd4933e9a23452
--- /dev/null
+++ b/params_shard_79.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:afbd0447e1f64366e168f9511c901f5adafb23d6f17df170e415b89254f0e6ea
+size 70778880
diff --git a/params_shard_8.bin b/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f2fba801d46cd15c1af26d1b25607290226b3960
--- /dev/null
+++ b/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ad77589bd0883954e50ada2650ec011acac5d7b510a95933afcf0d8ea348480
+size 35389440
diff --git a/params_shard_80.bin b/params_shard_80.bin
new file mode 100644
index 0000000000000000000000000000000000000000..99dc1af5db969e07824c45cc0ec4f9f558915713
--- /dev/null
+++ b/params_shard_80.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:da0626961b5484ce6a941c1ad28f5af8831c14bfd13b4a8edfd1ecb141f78548
+size 35389440
diff --git a/params_shard_81.bin b/params_shard_81.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bb5ad3707c4b01e742550b5cf6766d1d20dcb479
--- /dev/null
+++ b/params_shard_81.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0cc4923fe0ca92f2b26164c9ba80c5f1ddb979461b901e9c6ee9ab821837f26d
+size 18350080
diff --git a/params_shard_82.bin b/params_shard_82.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0b3a52be25b2107f770e92ac443023bf579ae2f1
--- /dev/null
+++ b/params_shard_82.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5cd4a58f9f1867f303023e7500287e740338695d8fcf70a219a846e0e9087c11
+size 30345216
diff --git a/params_shard_83.bin b/params_shard_83.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ad2d26ecac2fba94d8255522e9c118768ab143b1
--- /dev/null
+++ b/params_shard_83.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69e96cc7dfb5e974c42d1bfc68f43a28122a8d7a79da366e6fac3c9e838a2e94
+size 70778880
diff --git a/params_shard_84.bin b/params_shard_84.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dea85b48ddaba3c778cfe486b74519cb9bfa6957
--- /dev/null
+++ b/params_shard_84.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:36ef83a641820c808e840a47ce30896468da047ebf4698047e2cc2558c01feed
+size 35389440
diff --git a/params_shard_85.bin b/params_shard_85.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9fa62c7b2046f459267bc6f9e9cf15bf42afb9cd
--- /dev/null
+++ b/params_shard_85.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b895afdb81428795dacc6b22e55a3b292a1a49bbedd71ba3edf1d216bfa236c3
+size 18350080
diff --git a/params_shard_86.bin b/params_shard_86.bin
new file mode 100644
index 0000000000000000000000000000000000000000..48a4595c47406d9a6d796cefa3d220b05163c112
--- /dev/null
+++ b/params_shard_86.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:811a6f3718ebb29d6246f8e5f73f05b24e003a003bdbbe1d11f6375b2290c906
+size 30345216
diff --git a/params_shard_87.bin b/params_shard_87.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b5dd29d3d31238e1ba123d5ff3be8683ba74fee7
--- /dev/null
+++ b/params_shard_87.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:13c0490d91d76ad6a7ed5c80df45adda85876ea427855fd1b29b1a8fa3c78cb7
+size 70778880
diff --git a/params_shard_88.bin b/params_shard_88.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e7279ac2b15d6ce2cbbfc3e08188fc6c247abc55
--- /dev/null
+++ b/params_shard_88.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:19f2164d072472056e64172fac1f463eee28ab2d76b23eb61f515cf2e93c767a
+size 35389440
diff --git a/params_shard_89.bin b/params_shard_89.bin
new file mode 100644
index 0000000000000000000000000000000000000000..56cecc2e93d954ba28041b922dd308c5526e3f99
--- /dev/null
+++ b/params_shard_89.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7e452264bcc59473a69a8ecf96fcf40d83bbc8c772811cae438d8237fb4306ee
+size 18350080
diff --git a/params_shard_9.bin b/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..33a1e3a3f84f415506553e11dc364c584b7e36f8
--- /dev/null
+++ b/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df00002411349d094ce5395a42e9f4f6dbfd0aac885ac3d5ee2f6568a4f94550
+size 18350080
diff --git a/params_shard_90.bin b/params_shard_90.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b35230bd5f03a06f1b8167f7c8e406436f0970d8
--- /dev/null
+++ b/params_shard_90.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9cf42584378865985122a0d49354776daea73098c74cafa2da0ee224f084a356
+size 30345216
diff --git a/params_shard_91.bin b/params_shard_91.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f988c7dbeb956785d217e75a979919870ed451ac
--- /dev/null
+++ b/params_shard_91.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:37f3b22eca5d4399d0a2b3ea41dfac65f398e3a65631641dc2740e03ce43f661
+size 70778880
diff --git a/params_shard_92.bin b/params_shard_92.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fe555a439ef1780c8680a9b18873f8f82e840086
--- /dev/null
+++ b/params_shard_92.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:06350f8ad051a8138d0b35dddd9ac7737e6e83c53ac13681307e46f59ce02ebb
+size 35389440
diff --git a/params_shard_93.bin b/params_shard_93.bin
new file mode 100644
index 0000000000000000000000000000000000000000..10a11c7fd6bd70ec41e2c09413f67c729178481a
--- /dev/null
+++ b/params_shard_93.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3fbf0c228510511a9071c8143e975d79db89868edbc10e2dcca9dd5dfa718638
+size 18350080
diff --git a/params_shard_94.bin b/params_shard_94.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0936e6b45e52329f71bf66a2bba4b7582efbd5c8
--- /dev/null
+++ b/params_shard_94.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:322a8044e86a4588a283e8f4b7e676221fc66456a0590ddd8eb93b6ee8443d9d
+size 30345216
diff --git a/params_shard_95.bin b/params_shard_95.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eaa6042ecf3d918ff028c1bbea26f6c160239e0a
--- /dev/null
+++ b/params_shard_95.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3b865391d16a712738fa73a951b29d598f6d6e43a2aa8787ef8412fc67bc6370
+size 70778880
diff --git a/params_shard_96.bin b/params_shard_96.bin
new file mode 100644
index 0000000000000000000000000000000000000000..218e3fea00ce8a770d871959733afde1e12414a6
--- /dev/null
+++ b/params_shard_96.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:db058112d8371ac2705c5c96e370b29b0ae7059bbd9259daea10bd7c3945981b
+size 35389440
diff --git a/params_shard_97.bin b/params_shard_97.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7fb66b1a19c120abe6f3c9357930ae17e3acd61e
--- /dev/null
+++ b/params_shard_97.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69404a025d164277206175bec753bef2cd97b89d7707ea1c6fde36a08fe40713
+size 18350080
diff --git a/params_shard_98.bin b/params_shard_98.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e3ad0f44357916ded56a21b25e412e21a99c7b66
--- /dev/null
+++ b/params_shard_98.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:caaec4761a2b1e234f27faed925217973ede51c69b2e7818dc5ace6e89bd6297
+size 30345216
diff --git a/params_shard_99.bin b/params_shard_99.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4b627c9399e68be8838b2a8f6252c702a1678840
--- /dev/null
+++ b/params_shard_99.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb29eeeefd991f61792bf744289caee6b7ffa927168cff4ee0c8a7285860efe2
+size 70778880
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..a34650995da6939a945c330eadb0687147ac3ef8
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,303282 @@
+{
+ "version": "1.0",
+ "truncation": null,
+ "padding": null,
+ "added_tokens": [
+ {
+ "id": 151643,
+ "content": "<|end▁of▁sentence|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": true
+ },
+ {
+ "id": 151644,
+ "content": "<|User|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 151645,
+ "content": "<|Assistant|>",
+ "single_word": false,
+ "lstrip": false,
+ "rstrip": false,
+ "normalized": false,
+ "special": false
+ },
+ {
+ "id": 151646,
+ "content": "<|begin▁of▁sentence|>",
+ "normalized": false,
+ "lstrip": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ {
+ "id": 151647,
+ "content": "<|EOT|>",
+ "normalized": false,
+ "lstrip": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ {
+ "id": 151648,
+ "content": "
&": 5789, + "CON": 5790, + "Ġrepl": 5791, + "Ġregular": 5792, + "Storage": 5793, + "ramework": 5794, + "Ġgoal": 5795, + "Ġtouch": 5796, + ".widget": 5797, + "Ġbuilt": 5798, + "des": 5799, + "Part": 5800, + "(re": 5801, + "Ġworth": 5802, + "hib": 5803, + "game": 5804, + "Ġв": 5805, + "acion": 5806, + "ĠWhite": 5807, + "(type": 5808, + "(`": 5809, + "Ġnatural": 5810, + "Ġinj": 5811, + "Ġcalcul": 5812, + "ĠApril": 5813, + ".List": 5814, + "Ġassociated": 5815, + "ĉSystem": 5816, + "~~": 5817, + "=[": 5818, + "Ġstorage": 5819, + "Ġbytes": 5820, + "Ġtravel": 5821, + "Ġsou": 5822, + "Ġpassed": 5823, + "!=": 5824, + "ascript": 5825, + ".open": 5826, + "Ġgrid": 5827, + "Ġbus": 5828, + "Ġrecogn": 5829, + "Ab": 5830, + "Ġhon": 5831, + "ĠCenter": 5832, + "Ġprec": 5833, + "build": 5834, + "HTML": 5835, + "ĠSan": 5836, + "Ġcountries": 5837, + "aled": 5838, + "token": 5839, + "kt": 5840, + "Ġqual": 5841, + "Last": 5842, + "adow": 5843, + "Ġmanufact": 5844, + "idad": 5845, + "jango": 5846, + "Next": 5847, + "xf": 5848, + ".a": 5849, + "Ġporno": 5850, + "ĠPM": 5851, + "erve": 5852, + "iting": 5853, + "_th": 5854, + "ci": 5855, + "=None": 5856, + "gs": 5857, + "Ġlogin": 5858, + "atives": 5859, + "']);Ċ": 5860, + "Äħ": 5861, + "Ġill": 5862, + "IA": 5863, + "children": 5864, + "DO": 5865, + "Ġlevels": 5866, + "Ġ{{": 5867, + "Ġlooks": 5868, + "Ġ\"#": 5869, + "ToString": 5870, + "Ġnecessary": 5871, + "ĠĠĠĊ": 5872, + "cell": 5873, + "Entry": 5874, + "Ġ'#": 5875, + "Ġextrem": 5876, + "Selector": 5877, + "Ġplaceholder": 5878, + "Load": 5879, + "Ġreleased": 5880, + "ORE": 5881, + "Enumer": 5882, + "ĠTV": 5883, + "SET": 5884, + "inq": 5885, + "Press": 5886, + "ĠDepartment": 5887, + "Ġproperties": 5888, + "Ġrespond": 5889, + "Search": 5890, + "ael": 5891, + "Ġrequ": 5892, + "ĠBook": 5893, + "/Ċ": 5894, + "(st": 5895, + "Ġfinancial": 5896, + "icket": 5897, + "_input": 5898, + "Ġthreat": 5899, + "(in": 5900, + "Strip": 5901, + "ìĿ": 5902, + "ção": 5903, + "Ġevidence": 5904, + "));": 5905, + "ĠBro": 5906, + "Ġ[];Ċ": 5907, + "Ġou": 5908, + "buf": 5909, + "Script": 5910, + "dat": 5911, + "Ġrule": 5912, + "#import": 5913, + "=\"/": 5914, + "Serial": 5915, + "Ġstarting": 5916, + "[index": 5917, + "ae": 5918, + "Ġcontrib": 5919, + "session": 5920, + "_new": 5921, + "utable": 5922, + "ober": 5923, + "Ġ\"./": 5924, + "Ġlogger": 5925, + "Ġrecently": 5926, + "Ġreturned": 5927, + "ččĊ": 5928, + ")))Ċ": 5929, + "itions": 5930, + "Ġseek": 5931, + "Ġcommunic": 5932, + "Ġ\".": 5933, + "Ġusername": 5934, + "ECT": 5935, + "DS": 5936, + "Ġotherwise": 5937, + "ĠGerman": 5938, + ".aw": 5939, + "Adapter": 5940, + "ixel": 5941, + "Ġsystems": 5942, + "Ġdrop": 5943, + "Ġstructure": 5944, + "Ġ$(\"#": 5945, + "encies": 5946, + "anning": 5947, + "ĠLink": 5948, + "ĠResponse": 5949, + "Ġstri": 5950, + "ż": 5951, + "ĠDB": 5952, + "æĹ": 5953, + "android": 5954, + "submit": 5955, + "otion": 5956, + "(@": 5957, + ".test": 5958, + "ĊĊĊĊĊĊĊĊ": 5959, + "];čĊ": 5960, + "Ġdirectly": 5961, + "Ġ\"%": 5962, + "ris": 5963, + "elta": 5964, + "AIL": 5965, + "){čĊ": 5966, + "mine": 5967, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 5968, + "(k": 5969, + "bon": 5970, + "asic": 5971, + "pite": 5972, + "___": 5973, + "Max": 5974, + "Ġerrors": 5975, + "ĠWhile": 5976, + "Ġarguments": 5977, + "Ġensure": 5978, + "Right": 5979, + "-based": 5980, + "Web": 5981, + "Ġ-=": 5982, + "Ġintrodu": 5983, + "ĠInst": 5984, + "ĠWash": 5985, + "ordin": 5986, + "join": 5987, + "Database": 5988, + "Ġgrad": 5989, + "Ġusually": 5990, + "ITE": 5991, + "Props": 5992, + "?>Ċ": 5993, + "ĠGo": 5994, + "@Override": 5995, + "REF": 5996, + "Ġip": 5997, + "ĠAustral": 5998, + "Ġist": 5999, + "ViewById": 6000, + "Ġserious": 6001, + "Ġcustomer": 6002, + ".prototype": 6003, + "odo": 6004, + "cor": 6005, + "Ġdoor": 6006, + "ĠWITHOUT": 6007, + "Ġplant": 6008, + "Ġbegan": 6009, + "Ġdistance": 6010, + "()).": 6011, + "Ġchance": 6012, + "Ġord": 6013, + "came": 6014, + "pragma": 6015, + "Ġprotect": 6016, + "ragment": 6017, + "ĠNode": 6018, + "ening": 6019, + "Ñĩ": 6020, + "Ġroute": 6021, + "ĠSchool": 6022, + "hi": 6023, + "Ġneighb": 6024, + "After": 6025, + "licit": 6026, + "Ġcontr": 6027, + "Ġprimary": 6028, + "AA": 6029, + ".WriteLine": 6030, + "utils": 6031, + "Ġbi": 6032, + "Red": 6033, + ".Linq": 6034, + ".object": 6035, + "Ġleaders": 6036, + "unities": 6037, + "Ġgun": 6038, + "onth": 6039, + "ĠDev": 6040, + "FILE": 6041, + "Ġcomments": 6042, + "_len": 6043, + "arrow": 6044, + "amount": 6045, + "Range": 6046, + "sert": 6047, + "GridView": 6048, + "Ġupdated": 6049, + "ĠMo": 6050, + "Ġinform": 6051, + "ociety": 6052, + "ala": 6053, + "Access": 6054, + "Ġhab": 6055, + "Ġcreat": 6056, + "_arg": 6057, + "ĠJanuary": 6058, + "ĠDay": 6059, + "\")čĊ": 6060, + "uple": 6061, + "document": 6062, + "gorith": 6063, + "menu": 6064, + "ĠOver": 6065, + "bb": 6066, + ".title": 6067, + "_out": 6068, + "Ġled": 6069, + "uri": 6070, + "Ġ?>": 6071, + "gl": 6072, + "Ġbank": 6073, + "ayment": 6074, + "ĉprintf": 6075, + "MD": 6076, + "Ġsample": 6077, + "Ġhands": 6078, + "ĠVersion": 6079, + "uario": 6080, + "Ġoffers": 6081, + "ityEngine": 6082, + "Ġshape": 6083, + "Ġsleep": 6084, + "_point": 6085, + "Settings": 6086, + "Ġachie": 6087, + "Ġsold": 6088, + "ota": 6089, + ".bind": 6090, + "Am": 6091, + "Ġsafe": 6092, + "Store": 6093, + "Ġshared": 6094, + "Ġpriv": 6095, + "_VAL": 6096, + "Ġsens": 6097, + "){": 6098, + "Ġremember": 6099, + "shared": 6100, + "element": 6101, + "Ġshoot": 6102, + "Vert": 6103, + "cout": 6104, + "Ġenv": 6105, + "_label": 6106, + "Ġ>Ċ": 6107, + "run": 6108, + "Ġscene": 6109, + "(array": 6110, + "device": 6111, + "_title": 6112, + "agon": 6113, + "]čĊ": 6114, + "aby": 6115, + "Ġbecame": 6116, + "boolean": 6117, + "Ġpark": 6118, + "ĠCode": 6119, + "upload": 6120, + "riday": 6121, + "ĠSeptember": 6122, + "Fe": 6123, + "Ġsen": 6124, + "cing": 6125, + "FL": 6126, + "Col": 6127, + "uts": 6128, + "_page": 6129, + "inn": 6130, + "Ġimplied": 6131, + "aling": 6132, + "Ġyourself": 6133, + ".Count": 6134, + "conf": 6135, + "Ġaud": 6136, + "_init": 6137, + ".)": 6138, + "Ġwrote": 6139, + "NG": 6140, + ".Error": 6141, + "ä»": 6142, + ".for": 6143, + "Ġequal": 6144, + "ĠRequest": 6145, + "Ġserial": 6146, + "Ġallows": 6147, + "XX": 6148, + "Ġmiddle": 6149, + "chor": 6150, + "ø": 6151, + "erval": 6152, + ".Column": 6153, + "reading": 6154, + "Ġescort": 6155, + "ĠAugust": 6156, + "Ġquickly": 6157, + "Ġweap": 6158, + "ĠCG": 6159, + "ropri": 6160, + "ho": 6161, + "Ġcop": 6162, + "(struct": 6163, + "ĠBig": 6164, + "Ġvs": 6165, + "Ġfrequ": 6166, + ".Value": 6167, + "Ġactions": 6168, + "Ġproper": 6169, + "Ġinn": 6170, + "Ġobjects": 6171, + "Ġmatrix": 6172, + "avascript": 6173, + "Ġones": 6174, + ".group": 6175, + "Ġgreen": 6176, + "Ġpaint": 6177, + "ools": 6178, + "ycl": 6179, + "encode": 6180, + "olt": 6181, + "comment": 6182, + ".api": 6183, + "Dir": 6184, + "Ġune": 6185, + "izont": 6186, + ".position": 6187, + "Ġdesigned": 6188, + "_val": 6189, + "avi": 6190, + "iring": 6191, + "tab": 6192, + "Ġlayer": 6193, + "Ġviews": 6194, + "Ġreve": 6195, + "rael": 6196, + "ĠON": 6197, + "rics": 6198, + "np": 6199, + "Ġcore": 6200, + "());čĊ": 6201, + "Main": 6202, + "Ġexpert": 6203, + "ĉĉčĊ": 6204, + "_en": 6205, + "Ġ/>": 6206, + "utter": 6207, + "IAL": 6208, + "ails": 6209, + "ĠKing": 6210, + "*/ĊĊ": 6211, + "ĠMet": 6212, + "_end": 6213, + "addr": 6214, + "ora": 6215, + "Ġir": 6216, + "Min": 6217, + "Ġsurpr": 6218, + "Ġrepe": 6219, + "Ġdirectory": 6220, + "PUT": 6221, + "-S": 6222, + "Ġelection": 6223, + "haps": 6224, + ".pre": 6225, + "cm": 6226, + "Values": 6227, + "Ġ\"Ċ": 6228, + "column": 6229, + "ivil": 6230, + "Login": 6231, + "inue": 6232, + "Ġbeautiful": 6233, + "Ġsecret": 6234, + "(event": 6235, + "Ġchat": 6236, + "ums": 6237, + "Ġorigin": 6238, + "Ġeffects": 6239, + "Ġmanagement": 6240, + "illa": 6241, + "tk": 6242, + "Ġsetting": 6243, + "ĠCour": 6244, + "Ġmassage": 6245, + "ĉend": 6246, + "Ġhappy": 6247, + "Ġfinish": 6248, + "Ġcamera": 6249, + "ĠVer": 6250, + "ĠDemocr": 6251, + "ĠHer": 6252, + "(Q": 6253, + "cons": 6254, + "ita": 6255, + "Ġ'.": 6256, + "{}": 6257, + "ĉC": 6258, + "Ġstuff": 6259, + "Ġ:Ċ": 6260, + "ĠAR": 6261, + "Task": 6262, + "hidden": 6263, + "eros": 6264, + "IGN": 6265, + "atio": 6266, + "ĠHealth": 6267, + "olute": 6268, + "Enter": 6269, + "'>": 6270, + "ĠTwitter": 6271, + "ĠCounty": 6272, + "scribe": 6273, + "Ġ=>Ċ": 6274, + "Ġhy": 6275, + "fit": 6276, + "Ġmilitary": 6277, + "Ġsale": 6278, + "required": 6279, + "non": 6280, + "bootstrap": 6281, + "hold": 6282, + "rim": 6283, + "-old": 6284, + "ĠDown": 6285, + "Ġmention": 6286, + "contact": 6287, + "_group": 6288, + "oday": 6289, + "Ġtown": 6290, + "Ġsolution": 6291, + "uate": 6292, + "elling": 6293, + "]->": 6294, + "otes": 6295, + "ental": 6296, + "omen": 6297, + "ospital": 6298, + "ĠSup": 6299, + "_EN": 6300, + "Ġslow": 6301, + "SESSION": 6302, + "Ġblue": 6303, + "ago": 6304, + "Ġlives": 6305, + "Ġ^": 6306, + ".un": 6307, + "inst": 6308, + "enge": 6309, + "Ġcustomers": 6310, + "Ġcast": 6311, + "udget": 6312, + "ï¼ģ": 6313, + "icens": 6314, + "Ġdetermin": 6315, + "Selected": 6316, + "_pl": 6317, + "ueue": 6318, + "Ġdark": 6319, + "//ĊĊ": 6320, + "si": 6321, + "thern": 6322, + "ĠJapan": 6323, + "/w": 6324, + "PU": 6325, + "ĠEast": 6326, + "ovie": 6327, + "Ġpackage": 6328, + "Ġnor": 6329, + "Ġapi": 6330, + "bot": 6331, + "\"];Ċ": 6332, + "_post": 6333, + "ulate": 6334, + "Ġclub": 6335, + "'));Ċ": 6336, + "Ġloop": 6337, + "PIO": 6338, + "ione": 6339, + "shot": 6340, + "Initial": 6341, + "Ġplayed": 6342, + "register": 6343, + "rought": 6344, + "_max": 6345, + "acement": 6346, + "match": 6347, + "raphics": 6348, + "AST": 6349, + "Ġexisting": 6350, + "Ġcomplex": 6351, + "DA": 6352, + ".Ch": 6353, + ".common": 6354, + "mo": 6355, + "Ġ'../../": 6356, + "ito": 6357, + "Ġanalysis": 6358, + "Ġdeliver": 6359, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 6360, + "idx": 6361, + "Ãł": 6362, + "ongo": 6363, + "ĠEnglish": 6364, + "Ċ": 9992, + "_default": 9993, + "ĠDatabase": 9994, + "rep": 9995, + "ESS": 9996, + "nergy": 9997, + ".Find": 9998, + "_mask": 9999, + "Ġrise": 10000, + "Ġkernel": 10001, + "::$": 10002, + ".Q": 10003, + "Ġoffering": 10004, + "decl": 10005, + "ĠCS": 10006, + "Ġlisted": 10007, + "Ġmostly": 10008, + "enger": 10009, + "Ġblocks": 10010, + "olo": 10011, + "Ġgoverning": 10012, + "\\F": 10013, + "Ġconcent": 10014, + ".getText": 10015, + "Ġmb": 10016, + "Ġoccurred": 10017, + "Ġchanging": 10018, + "Scene": 10019, + "_CODE": 10020, + "Beh": 10021, + "\"The": 10022, + "Ġtile": 10023, + "ĠAssociation": 10024, + "ĉP": 10025, + "alty": 10026, + "_ad": 10027, + "odies": 10028, + "iated": 10029, + "Ġprepared": 10030, + "possible": 10031, + "Ġmort": 10032, + "TEST": 10033, + "Ġignore": 10034, + "Ġcalc": 10035, + "Ġrs": 10036, + "ĠassertEquals": 10037, + "Ġsz": 10038, + "ĠTHIS": 10039, + ".\"Ċ": 10040, + "Ġcanvas": 10041, + "java": 10042, + "Ġdut": 10043, + "VALID": 10044, + ".sql": 10045, + ".input": 10046, + "Ġaux": 10047, + "Sup": 10048, + "Ġartist": 10049, + "Vec": 10050, + "_TIME": 10051, + ".stringify": 10052, + "etween": 10053, + "ĠCategory": 10054, + "Ġ[-": 10055, + "ĠDevExpress": 10056, + "ĠJul": 10057, + "Ġring": 10058, + ".ed": 10059, + "YY": 10060, + "Let": 10061, + "TextField": 10062, + "Ġflat": 10063, + "_print": 10064, + "ĠOTHER": 10065, + "adian": 10066, + "Ġchecked": 10067, + "ele": 10068, + "Align": 10069, + "standing": 10070, + "Ġ[],": 10071, + "Ġlab": 10072, + "ucky": 10073, + "ĠChristmas": 10074, + "(image": 10075, + ".module": 10076, + "Ġlots": 10077, + "Ġslightly": 10078, + "(final": 10079, + "erge": 10080, + "è¿": 10081, + "ĠPolice": 10082, + "ĠRight": 10083, + "Ġaward": 10084, + "ĠOS": 10085, + "Ġ{}ĊĊ": 10086, + "Ġptr": 10087, + "oves": 10088, + "icated": 10089, + "ем": 10090, + "Ġmanage": 10091, + "oliday": 10092, + "Amount": 10093, + "oolStrip": 10094, + "tbody": 10095, + "Nav": 10096, + "wrap": 10097, + "BB": 10098, + "Ġwatching": 10099, + "arios": 10100, + "Ġoptional": 10101, + "_K": 10102, + "ĠLicensed": 10103, + ".Map": 10104, + "Timer": 10105, + "ĠAP": 10106, + "ĠRev": 10107, + "(o": 10108, + ",c": 10109, + "umin": 10110, + "etailed": 10111, + "ĠHy": 10112, + "Ġblank": 10113, + "agger": 10114, + "ĠSelf": 10115, + "()[": 10116, + ".make": 10117, + "earn": 10118, + "channel": 10119, + ";Ċ": 10133, + "World": 10134, + "Ġpython": 10135, + "Ġlif": 10136, + "Ġtrav": 10137, + "Ġconven": 10138, + "company": 10139, + "ĠClub": 10140, + "Ver": 10141, + "Btn": 10142, + "Ġzone": 10143, + "products": 10144, + "ĠEduc": 10145, + "Ġverify": 10146, + "ĠMil": 10147, + "ono": 10148, + "]);ĊĊ": 10149, + "ENCE": 10150, + "Ġpacket": 10151, + "Ġcer": 10152, + "Ġenumer": 10153, + "Ġpars": 10154, + "formed": 10155, + "Ġoccup": 10156, + "tre": 10157, + "Ġexercise": 10158, + "Day": 10159, + "_sum": 10160, + "Ġasking": 10161, + "aption": 10162, + "Ġorders": 10163, + "Ġspending": 10164, + "ĠERR": 10165, + ".Dis": 10166, + "ĠUtil": 10167, + "âĢľI": 10168, + "\\'": 10169, + "?)": 10170, + "/>Ċ": 10171, + "Ġemot": 10172, + "Ġinfluence": 10173, + "ĠAfrica": 10174, + "atters": 10175, + "Ùħ": 10176, + ".session": 10177, + "Ġchief": 10178, + "ĉĉĉĉĉĉĉĉĉĉĉ": 10179, + "Ġtom": 10180, + "cluded": 10181, + "serial": 10182, + "_handler": 10183, + ".Type": 10184, + "aped": 10185, + "Ġpolicies": 10186, + "-ex": 10187, + "-tr": 10188, + "blank": 10189, + "merce": 10190, + "Ġcoverage": 10191, + "Ġrc": 10192, + "_matrix": 10193, + "_box": 10194, + "Ġcharges": 10195, + "ĠBoston": 10196, + "Pe": 10197, + "Ġcircum": 10198, + "Ġfilled": 10199, + "Ġnorth": 10200, + "ictureBox": 10201, + "ĉres": 10202, + "è®": 10203, + "Ġtermin": 10204, + "Ġ[âĢ¦": 10205, + "IRECT": 10206, + "Ġber": 10207, + "Ġ\"../../": 10208, + "retch": 10209, + ".code": 10210, + "_col": 10211, + "ĠGovernment": 10212, + "Ġargv": 10213, + "ĠLord": 10214, + "asi": 10215, + "Exec": 10216, + "ĉlet": 10217, + "vertis": 10218, + "Ġdiscussion": 10219, + "enance": 10220, + "outube": 10221, + "typeof": 10222, + "Ġserved": 10223, + "ĠPut": 10224, + "ĉx": 10225, + "Ġsweet": 10226, + "Before": 10227, + "ategy": 10228, + ".of": 10229, + "ĠMaterial": 10230, + "Sort": 10231, + "ONT": 10232, + "igital": 10233, + "Why": 10234, + "Ġsust": 10235, + "Ġç": 10236, + "abet": 10237, + "Ġsegment": 10238, + "Ġ[],Ċ": 10239, + "ĠMuslim": 10240, + "ĠfindViewById": 10241, + "cut": 10242, + "_TEXT": 10243, + "ĠMary": 10244, + "Ġloved": 10245, + "Ġlie": 10246, + "ĠJO": 10247, + "Ġisset": 10248, + "month": 10249, + "Ġprime": 10250, + "ti": 10251, + "ĠCarol": 10252, + "Use": 10253, + "ĠPop": 10254, + "ĠSave": 10255, + "Interval": 10256, + "execute": 10257, + "dy": 10258, + "ĠIran": 10259, + "_cont": 10260, + "ĉT": 10261, + "Ġphase": 10262, + "checkbox": 10263, + "week": 10264, + "Ġhide": 10265, + "Ġtil": 10266, + "Ġju": 10267, + "Custom": 10268, + "burg": 10269, + "/M": 10270, + "TON": 10271, + "Ġquant": 10272, + "Ġrub": 10273, + "ixels": 10274, + "Ġinstalled": 10275, + "Ġdump": 10276, + "Ġproperly": 10277, + "(List": 10278, + "Ġdecide": 10279, + "apply": 10280, + "Has": 10281, + "Ġkeeping": 10282, + "Ġcitizens": 10283, + "Ġjoint": 10284, + "pool": 10285, + "Socket": 10286, + "_op": 10287, + "Ġweapon": 10288, + "gnore": 10289, + "ĠExec": 10290, + "otten": 10291, + "ĠMS": 10292, + "Ġ(-": 10293, + "ĠReview": 10294, + "Ġexamples": 10295, + "Ġtight": 10296, + "!(": 10297, + "DP": 10298, + "ĠMessageBox": 10299, + "Ġphotograph": 10300, + "URI": 10301, + "ét": 10302, + "low": 10303, + "ĠGrand": 10304, + ".persistence": 10305, + "Ġmaintain": 10306, + "Ġnums": 10307, + "Ġzip": 10308, + "ials": 10309, + "ĠGets": 10310, + "peg": 10311, + "ĠBuffer": 10312, + "~~~~": 10313, + "rastructure": 10314, + "ĠPL": 10315, + "uen": 10316, + "obby": 10317, + "sizeof": 10318, + "Ġpic": 10319, + "Ġseed": 10320, + "Ġexperienced": 10321, + "Ġodd": 10322, + "Ġkick": 10323, + "Ġprocedure": 10324, + "avigator": 10325, + "-on": 10326, + ",j": 10327, + "ĠAlthough": 10328, + "ĠuserId": 10329, + "accept": 10330, + "Blue": 10331, + "IColor": 10332, + "layer": 10333, + "available": 10334, + "Ġends": 10335, + ".table": 10336, + "Ġdataset": 10337, + "bus": 10338, + "Ġexplain": 10339, + "(pro": 10340, + "ĠCommittee": 10341, + "Ġnoted": 10342, + "]:Ċ": 10343, + "Dim": 10344, + "stdio": 10345, + ".\",Ċ": 10346, + "_source": 10347, + "ĠWeek": 10348, + "ĠEdge": 10349, + "Ġoperating": 10350, + "Ġeste": 10351, + "ipl": 10352, + "agination": 10353, + "Ġproceed": 10354, + "Ġanimation": 10355, + ".Models": 10356, + "ĠWatch": 10357, + "iat": 10358, + "Ġoppon": 10359, + "/A": 10360, + "Report": 10361, + "Ġsounds": 10362, + "_buf": 10363, + "IELD": 10364, + "Ġbund": 10365, + "ĉget": 10366, + ".pr": 10367, + "(tmp": 10368, + "Ġkid": 10369, + ">ĊĊĊ": 10370, + "Ġyang": 10371, + "NotFound": 10372, + "ÑĨ": 10373, + "math": 10374, + "@gmail": 10375, + "ĠLIMIT": 10376, + "redients": 10377, + "Ġvent": 10378, + "avigate": 10379, + "Look": 10380, + "Ġreligious": 10381, + "Ġrand": 10382, + "rio": 10383, + "(GL": 10384, + "_ip": 10385, + "uan": 10386, + "iciency": 10387, + "ĠChange": 10388, + ">čĊčĊ": 10389, + "ĠEntity": 10390, + "Ġrencontre": 10391, + "ĠRet": 10392, + "plan": 10393, + "én": 10394, + "BOOL": 10395, + "uries": 10396, + "train": 10397, + "Definition": 10398, + "============": 10399, + "zz": 10400, + "Animation": 10401, + "ĠOK": 10402, + "_menu": 10403, + ".bl": 10404, + "_score": 10405, + "Ġacad": 10406, + "(System": 10407, + "Ġrefresh": 10408, + "'=>$": 10409, + ".Graphics": 10410, + "amento": 10411, + "pid": 10412, + "tc": 10413, + "Ġtips": 10414, + "Ġhomes": 10415, + "Ġfuel": 10416, + "âĸ": 10417, + "_helper": 10418, + "ĠĠčĊ": 10419, + "ĠRoom": 10420, + ".Close": 10421, + "_attr": 10422, + "ĠMount": 10423, + "ĠEv": 10424, + "arser": 10425, + "_top": 10426, + "eah": 10427, + "ĠDelete": 10428, + "ãĢį": 10429, + "uke": 10430, + "Ġusage": 10431, + "aria": 10432, + "_dev": 10433, + "Ġtexture": 10434, + "Ġconversation": 10435, + "eper": 10436, + "Bean": 10437, + "done": 10438, + "nonatomic": 10439, + "ĠSecond": 10440, + "Ġshooting": 10441, + "_pre": 10442, + "Components": 10443, + "Ġ]ĊĊ": 10444, + "__,": 10445, + "stitution": 10446, + ".Char": 10447, + ">();ĊĊ": 10448, + "Ġpresented": 10449, + "Ġwa": 10450, + "oker": 10451, + "-ĊĊ": 10452, + "iner": 10453, + "Ġbecoming": 10454, + "Ġincident": 10455, + "Att": 10456, + "Ġrevealed": 10457, + "forc": 10458, + "Ġboot": 10459, + ".page": 10460, + "Enumerator": 10461, + "_->": 10462, + "Photo": 10463, + "Ġspring": 10464, + ".\",": 10465, + "ĠDictionary": 10466, + "BJECT": 10467, + "Ġlocations": 10468, + "Ġsamples": 10469, + "InputStream": 10470, + "ĠBrown": 10471, + "Ġstats": 10472, + "quality": 10473, + "Ñħ": 10474, + "-dis": 10475, + "Ġhelping": 10476, + "Ġped": 10477, + "(se": 10478, + "ĠWho": 10479, + "alian": 10480, + "internal": 10481, + "Ġft": 10482, + ">().": 10483, + "->{": 10484, + "Ġmine": 10485, + "Ġsector": 10486, + "Ġgro": 10487, + "Ġopportunities": 10488, + "Ġü": 10489, + "Ġmp": 10490, + "Ġalleged": 10491, + "Ġdoubt": 10492, + "Mouse": 10493, + "About": 10494, + "_part": 10495, + "Ġchair": 10496, + "Ġstopped": 10497, + "loop": 10498, + "entities": 10499, + "Ġapps": 10500, + "ansion": 10501, + "Ġmental": 10502, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10503, + "FR": 10504, + "Ġdefend": 10505, + "care": 10506, + "Ġideal": 10507, + "/api": 10508, + "urface": 10509, + "Ġele": 10510, + "ulator": 10511, + "ĠRights": 10512, + "anguages": 10513, + "Ġfunds": 10514, + "Ġadapt": 10515, + "Attributes": 10516, + "Ġdeploy": 10517, + "opts": 10518, + "Ġvalidation": 10519, + "Ġconcerns": 10520, + "uce": 10521, + ".num": 10522, + "ulture": 10523, + "ila": 10524, + "Ġcup": 10525, + "Ġpure": 10526, + ".Fore": 10527, + "ĠHashMap": 10528, + ".valueOf": 10529, + "asm": 10530, + "MO": 10531, + "Ġcs": 10532, + "Ġstores": 10533, + "Ġ************************************************************************": 10534, + "Ġcommunication": 10535, + "mem": 10536, + ".EventHandler": 10537, + ".Status": 10538, + "_right": 10539, + ".setOn": 10540, + "Sheet": 10541, + "Ġidentify": 10542, + "enerated": 10543, + "ordered": 10544, + "Ġ\"[": 10545, + "Ġswe": 10546, + "Condition": 10547, + "ĠAccording": 10548, + "Ġprepare": 10549, + "Ġrob": 10550, + "Pool": 10551, + "Ġsport": 10552, + "rv": 10553, + "ĠRouter": 10554, + "Ġalternative": 10555, + "([]": 10556, + "ĠChicago": 10557, + "ipher": 10558, + "ische": 10559, + "ĠDirector": 10560, + "kl": 10561, + "ĠWil": 10562, + "keys": 10563, + "Ġmysql": 10564, + "Ġwelcome": 10565, + "king": 10566, + "ĠManager": 10567, + "Ġcaught": 10568, + ")}Ċ": 10569, + "Score": 10570, + "_PR": 10571, + "Ġsurvey": 10572, + "hab": 10573, + "Headers": 10574, + "ADER": 10575, + "Ġdecor": 10576, + "Ġturns": 10577, + "Ġradius": 10578, + "errupt": 10579, + "Cor": 10580, + "Ġmel": 10581, + "Ġintr": 10582, + "(q": 10583, + "ĠAC": 10584, + "amos": 10585, + "MAX": 10586, + "ĠGrid": 10587, + "ĠJesus": 10588, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10589, + ".DE": 10590, + "Ġts": 10591, + "Ġlinked": 10592, + "free": 10593, + "ĠQt": 10594, + "Ġ/**čĊ": 10595, + "Ġfaster": 10596, + "ctr": 10597, + "_J": 10598, + "DT": 10599, + ".Check": 10600, + "Ġcombination": 10601, + "Ġintended": 10602, + "-the": 10603, + "-type": 10604, + "ectors": 10605, + "ami": 10606, + "uting": 10607, + "Ġuma": 10608, + "XML": 10609, + "UCT": 10610, + "Ap": 10611, + "ĠRandom": 10612, + "Ġran": 10613, + ".sort": 10614, + "Ġsorted": 10615, + ".Un": 10616, + "_PER": 10617, + "itory": 10618, + "Ġpriority": 10619, + "ĠGal": 10620, + "ĠOld": 10621, + "hot": 10622, + "ĠDisplay": 10623, + "(sub": 10624, + "_TH": 10625, + "_Y": 10626, + "ĠCare": 10627, + "loading": 10628, + "Kind": 10629, + "_handle": 10630, + ",,": 10631, + "rase": 10632, + "_replace": 10633, + ".addEventListener": 10634, + "ĠRT": 10635, + "Ġentered": 10636, + "gers": 10637, + "Ġich": 10638, + "(start": 10639, + "/app": 10640, + "Ġbrother": 10641, + "Memory": 10642, + "Outlet": 10643, + "Ġutf": 10644, + "prec": 10645, + "Ġnavigation": 10646, + "ORK": 10647, + "Ġdst": 10648, + "Detail": 10649, + "Ġaudience": 10650, + "Ġdur": 10651, + "Ġcluster": 10652, + "unched": 10653, + "Ġ],": 10654, + "Ġcomfortable": 10655, + ".values": 10656, + "ĠTotal": 10657, + "Ġsnap": 10658, + "Ġstandards": 10659, + "Ġperformed": 10660, + "hand": 10661, + "(\"@": 10662, + "åŃ": 10663, + "Ġphil": 10664, + "ibr": 10665, + "trim": 10666, + "Ġforget": 10667, + "Ġdoctor": 10668, + ".TextBox": 10669, + "icons": 10670, + ",s": 10671, + "ĠOp": 10672, + "Sm": 10673, + "Stop": 10674, + "ĉList": 10675, + "ĉu": 10676, + "Comment": 10677, + "_VERSION": 10678, + ".Xtra": 10679, + "Person": 10680, + "rb": 10681, + "LOB": 10682, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 10683, + "ĠCentral": 10684, + "ICK": 10685, + "raq": 10686, + "Ġputting": 10687, + "Ġmd": 10688, + "ĠLove": 10689, + "Program": 10690, + "Border": 10691, + "oor": 10692, + "Ġallowing": 10693, + "after": 10694, + "Ġentries": 10695, + "ĠMaybe": 10696, + "]).": 10697, + "ĠShort": 10698, + ")\\": 10699, + ".now": 10700, + "friend": 10701, + "Ġprefer": 10702, + "ĠGPIO": 10703, + "osis": 10704, + "ĠGameObject": 10705, + "Ġskip": 10706, + "Ġcompetition": 10707, + "_match": 10708, + "lications": 10709, + "_CONT": 10710, + ".groupBox": 10711, + "Ġals": 10712, + "\"We": 10713, + "_eq": 10714, + "lan": 10715, + "_search": 10716, + "ĠMusic": 10717, + "asis": 10718, + "Ġbind": 10719, + "ĠIsland": 10720, + "rum": 10721, + "(E": 10722, + "Ġseat": 10723, + "Video": 10724, + "Ġack": 10725, + "reek": 10726, + "={()": 10727, + "Ġrating": 10728, + "Ġrestaurant": 10729, + "DEX": 10730, + "(buf": 10731, + "pping": 10732, + "uality": 10733, + "Ġleague": 10734, + "Ġfocused": 10735, + "apon": 10736, + "$data": 10737, + "CLUD": 10738, + "CLUDING": 10739, + "Ġabsolute": 10740, + "(query": 10741, + "Ġtells": 10742, + "Ang": 10743, + "Ġcommunities": 10744, + "Ġhonest": 10745, + "oking": 10746, + "Ġapart": 10747, + "arity": 10748, + "/$": 10749, + "_module": 10750, + "ĠEnc": 10751, + ".an": 10752, + ".Config": 10753, + "Cre": 10754, + "Ġshock": 10755, + "ĠArab": 10756, + "IENT": 10757, + "/re": 10758, + "Ġretrie": 10759, + "ycler": 10760, + "isa": 10761, + "ĠOrgan": 10762, + ".graph": 10763, + "Ġí": 10764, + "ĠBAS": 10765, + "Enum": 10766, + "Ġpossibly": 10767, + "ÑĢаÐ": 10768, + "ĠJapanese": 10769, + "Ġcraft": 10770, + "ĠPlace": 10771, + "Ġtalent": 10772, + "Ġfunding": 10773, + "Ġconfirmed": 10774, + "Ġcycle": 10775, + "/x": 10776, + "GE": 10777, + "Ġhearing": 10778, + "Ġplants": 10779, + "Ġmouth": 10780, + "pages": 10781, + "oria": 10782, + "ĠRemove": 10783, + "_total": 10784, + "Ġod": 10785, + "ollapse": 10786, + "door": 10787, + "Ġbought": 10788, + "Ġaddr": 10789, + "ARCH": 10790, + "_dim": 10791, + "dden": 10792, + "Ġdecades": 10793, + "REQUEST": 10794, + "Ġversions": 10795, + "fire": 10796, + "Ġmoves": 10797, + "fb": 10798, + "Ġcoffee": 10799, + ".connect": 10800, + "ĠRow": 10801, + "Ġschema": 10802, + "Scope": 10803, + "-Type": 10804, + "Ġfighting": 10805, + "Ġretail": 10806, + "Ġmodified": 10807, + "TF": 10808, + "Files": 10809, + "nie": 10810, + "_command": 10811, + "stone": 10812, + "ĠÑĤ": 10813, + "_thread": 10814, + "Ġbond": 10815, + "ĠDevelopment": 10816, + "Ġpt": 10817, + "FORM": 10818, + "plet": 10819, + "Ġidentified": 10820, + "cpp": 10821, + "Ġcoding": 10822, + "oked": 10823, + "ĠMaster": 10824, + "IDTH": 10825, + "Ġresidents": 10826, + "redit": 10827, + "ĠPhoto": 10828, + "=-": 10829, + "unte": 10830, + "ateur": 10831, + "_STATE": 10832, + "ĠSing": 10833, + "Ġsheet": 10834, + ".val": 10835, + "orse": 10836, + "Ġhers": 10837, + "Ġdetermined": 10838, + "Common": 10839, + "Ġwed": 10840, + "_queue": 10841, + "PH": 10842, + "ĠAtl": 10843, + "cred": 10844, + "/LICENSE": 10845, + "Ġmes": 10846, + "Ġadvanced": 10847, + ".java": 10848, + ".Sh": 10849, + "Go": 10850, + "kill": 10851, + "fp": 10852, + "_settings": 10853, + "Ġpal": 10854, + "Ġtruck": 10855, + "Ġcombined": 10856, + "Ġ\"${": 10857, + "ĠCorpor": 10858, + "Ġjoined": 10859, + "ĠJose": 10860, + "ĠCup": 10861, + "uns": 10862, + "estival": 10863, + "levision": 10864, + "Ġbroken": 10865, + "Ġmarriage": 10866, + "ĠWestern": 10867, + "Ġrepresents": 10868, + "ĠTitle": 10869, + "Ġss": 10870, + ".Ass": 10871, + "ongoose": 10872, + "iento": 10873, + "<>();Ċ": 10874, + "Ġabsolutely": 10875, + "Ġsmooth": 10876, + "TERN": 10877, + "ĠUnless": 10878, + "Word": 10879, + "Ġmerge": 10880, + "igan": 10881, + "ĠVol": 10882, + "Ġnn": 10883, + ".getId": 10884, + "Ġз": 10885, + "Ġsexy": 10886, + "Ġseeking": 10887, + "Single": 10888, + ".this": 10889, + "Ġkom": 10890, + "bound": 10891, + ";\"": 10892, + "ĠfontSize": 10893, + "_df": 10894, + "Ġinjury": 10895, + "(H": 10896, + "Ġissued": 10897, + "_END": 10898, + ":self": 10899, + "Ġpatch": 10900, + "Ġleaves": 10901, + "Ġadopt": 10902, + "FileName": 10903, + "ãĢIJ": 10904, + "Ġexecutive": 10905, + "ĠByte": 10906, + "]))Ċ": 10907, + "Ġnu": 10908, + "outing": 10909, + "cluding": 10910, + "-R": 10911, + ".options": 10912, + "Ġsubstant": 10913, + "avax": 10914, + "ĠBUT": 10915, + "Ġtechnical": 10916, + "Ġtwice": 10917, + "Ġmás": 10918, + "Ġunivers": 10919, + "yr": 10920, + "Ġdrag": 10921, + "ĠDC": 10922, + "Ġsed": 10923, + "Ġbot": 10924, + "ĠPal": 10925, + "ĠHall": 10926, + "forcement": 10927, + "Ġauch": 10928, + ".mod": 10929, + "notation": 10930, + "_files": 10931, + ".line": 10932, + "_flag": 10933, + "[name": 10934, + "Ġresolution": 10935, + "Ġbott": 10936, + "(\"[": 10937, + "ende": 10938, + "(arr": 10939, + "Free": 10940, + "(@\"": 10941, + "ĠDistrict": 10942, + "PEC": 10943, + ":-": 10944, + "Picker": 10945, + "ĠJo": 10946, + "ĠĠĠĠĠĊ": 10947, + "ĠRiver": 10948, + "_rows": 10949, + "Ġhelpful": 10950, + "Ġmassive": 10951, + "---Ċ": 10952, + "Ġmeasures": 10953, + "ĠRuntime": 10954, + "Ġworry": 10955, + "ĠSpec": 10956, + "ĉD": 10957, + "ãĢij": 10958, + "Ġ){Ċ": 10959, + "Ġworse": 10960, + "(filename": 10961, + "Ġlay": 10962, + "Ġmagic": 10963, + "ĠTheir": 10964, + "oul": 10965, + "stroy": 10966, + "ĠWhere": 10967, + "Ġsudden": 10968, + "Ġdefe": 10969, + "Ġbinding": 10970, + "Ġflight": 10971, + "ĠOnInit": 10972, + "ĠWomen": 10973, + "ĠPolicy": 10974, + "Ġdrugs": 10975, + "ishing": 10976, + "('../": 10977, + "ĠMel": 10978, + "peat": 10979, + "tor": 10980, + "Ġproposed": 10981, + "Ġstated": 10982, + "_RES": 10983, + "Ġeast": 10984, + "ĠCONDITION": 10985, + "_desc": 10986, + "Ġwinning": 10987, + "folio": 10988, + "Mapper": 10989, + "ĠPan": 10990, + "ĠAnge": 10991, + ".servlet": 10992, + "Ġcopies": 10993, + "LM": 10994, + "Ġvm": 10995, + "åį": 10996, + "Ġdictionary": 10997, + "Seg": 10998, + "elines": 10999, + "ĠSend": 11000, + "Ġiron": 11001, + "ĠFort": 11002, + ".domain": 11003, + "Ġdebate": 11004, + "NotNull": 11005, + "eq": 11006, + "acher": 11007, + "lf": 11008, + "ĉfmt": 11009, + "Ġlawy": 11010, + "ÄŁ": 11011, + "ĠMen": 11012, + "Ġtrim": 11013, + "(NULL": 11014, + "Ġ!!": 11015, + "Ġpad": 11016, + "Ġfollows": 11017, + "\"][\"": 11018, + "requ": 11019, + "ĠEp": 11020, + ".github": 11021, + "(img": 11022, + "eto": 11023, + "('\\": 11024, + "Services": 11025, + "umbnail": 11026, + "_main": 11027, + "pleted": 11028, + "fortunately": 11029, + "Ġwindows": 11030, + "Ġplane": 11031, + "ĠConnection": 11032, + ".local": 11033, + "uard": 11034, + "}\\": 11035, + "==\"": 11036, + "andon": 11037, + "ĠRoy": 11038, + "west": 11039, + "iginal": 11040, + "emies": 11041, + "itz": 11042, + "'):Ċ": 11043, + "ĠPeter": 11044, + "Ġtough": 11045, + "Ġreduced": 11046, + "Ġcalculate": 11047, + "Ġrapid": 11048, + "customer": 11049, + "Ġefficient": 11050, + "Ġmedium": 11051, + "Ġfell": 11052, + ".ref": 11053, + "ĠCas": 11054, + "Ġfeedback": 11055, + "Speed": 11056, + "(output": 11057, + "aje": 11058, + "Ġcategories": 11059, + "Ġfee": 11060, + "};": 11061, + "Ġdeleted": 11062, + "reh": 11063, + "Ġproof": 11064, + "Desc": 11065, + "Build": 11066, + "Ġsides": 11067, + ".ArrayList": 11068, + "-%": 11069, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 11070, + "ر": 11071, + ".match": 11072, + "ли": 11073, + "Ġfeels": 11074, + "Ġachieve": 11075, + "Ġclim": 11076, + "_ON": 11077, + "ĠCD": 11078, + "Ġteacher": 11079, + "_current": 11080, + "bn": 11081, + "_PL": 11082, + "isting": 11083, + "Enable": 11084, + "GEN": 11085, + "Ġtv": 11086, + "Ġsock": 11087, + "Ġplays": 11088, + "Ġdiscount": 11089, + "ĠKE": 11090, + "ĠDebug": 11091, + "Fore": 11092, + "ĠIraq": 11093, + "Ġappearance": 11094, + "Mon": 11095, + "Ġstyled": 11096, + "ĠHuman": 11097, + "iot": 11098, + "ĠHistory": 11099, + "Ġsac": 11100, + "ĠCollection": 11101, + "Ġrecommended": 11102, + ".Selected": 11103, + "Ġorganizations": 11104, + "Ġdiscovered": 11105, + "cohol": 11106, + "adas": 11107, + "ĠThomas": 11108, + "May": 11109, + "Ġconserv": 11110, + "Ġdomin": 11111, + "ĠFollow": 11112, + "ĠSection": 11113, + "ĠThanks": 11114, + "Username": 11115, + "Ġrecipe": 11116, + "Ġwonderful": 11117, + ".sleep": 11118, + "_if": 11119, + "ĉĊĉĊ": 11120, + "orno": 11121, + "Ġru": 11122, + "_target": 11123, + ".\"\"": 11124, + "à¦": 11125, + "EventArgs": 11126, + "Ġinputs": 11127, + "Ġfif": 11128, + "Ġvision": 11129, + "cy": 11130, + "ĠSeries": 11131, + ")(((": 11132, + "Ġtrading": 11133, + "Ġmarker": 11134, + "Begin": 11135, + "Ġtypically": 11136, + "Ġcauses": 11137, + "dropdown": 11138, + "_DEBUG": 11139, + "Ġdetect": 11140, + "country": 11141, + "!\");Ċ": 11142, + "ĉR": 11143, + "appy": 11144, + "Ġcref": 11145, + "('<": 11146, + "\"=>": 11147, + "ĠLE": 11148, + "reader": 11149, + "Ġadministr": 11150, + "õ": 11151, + "ucket": 11152, + "Ġfashion": 11153, + ".char": 11154, + "izar": 11155, + "Ġdisable": 11156, + "Ġsuc": 11157, + "ĠLive": 11158, + "issue": 11159, + "Ġmetadata": 11160, + "flags": 11161, + "ĠðŁ": 11162, + "Ġcommitted": 11163, + "Ġva": 11164, + "Ġrough": 11165, + "Ġ'''Ċ": 11166, + "Ġhighlight": 11167, + "_vars": 11168, + "VO": 11169, + "Ġencoding": 11170, + "-Z": 11171, + "_sign": 11172, + "$(\"#": 11173, + "Ġrain": 11174, + "reatest": 11175, + "ĠEND": 11176, + "Selection": 11177, + "Ġcandidates": 11178, + "Ġsav": 11179, + ".Empty": 11180, + "Ġdecisions": 11181, + "Ġcollabor": 11182, + "ridge": 11183, + "feed": 11184, + "ression": 11185, + "Ġpersons": 11186, + "VM": 11187, + "ega": 11188, + "_BIT": 11189, + "According": 11190, + "acked": 11191, + "Ġdollars": 11192, + "_loss": 11193, + "ĠCost": 11194, + "}\"Ċ": 11195, + "Notification": 11196, + "Ġprostit": 11197, + "Ġauthority": 11198, + ".rec": 11199, + "Ġspokes": 11200, + "ĠToday": 11201, + "istant": 11202, + "ĠHead": 11203, + "âĢĿ.": 11204, + "ertainment": 11205, + "cean": 11206, + "culate": 11207, + "Ġven": 11208, + "However": 11209, + "_arr": 11210, + "Ġtokens": 11211, + "Graph": 11212, + "ĠJud": 11213, + "ĠVirgin": 11214, + "ĠSerial": 11215, + "unning": 11216, + "Mutable": 11217, + "agers": 11218, + ".csv": 11219, + "Ġdeveloping": 11220, + "Ġinstructions": 11221, + "Ġpromise": 11222, + "Ġrequested": 11223, + "_encode": 11224, + "/\"": 11225, + "ĠIcon": 11226, + "uilt": 11227, + "-day": 11228, + "Ġintelligence": 11229, + ".IS": 11230, + "ĠObservable": 11231, + "ĠHard": 11232, + "Bool": 11233, + "idential": 11234, + ".Anchor": 11235, + "Ġselling": 11236, + "CI": 11237, + "AGES": 11238, + "tle": 11239, + "bur": 11240, + "UFFER": 11241, + "RY": 11242, + "Ġbigger": 11243, + "Ġrat": 11244, + "Ġfamous": 11245, + "Ġtypename": 11246, + "Ġexplained": 11247, + "}}Ċ": 11248, + "Ġnuclear": 11249, + "-N": 11250, + "Ġcrisis": 11251, + "ĠEnter": 11252, + "Ġanswers": 11253, + "/${": 11254, + "/pl": 11255, + "Ġsequ": 11256, + "_next": 11257, + "mask": 11258, + "Ġstanding": 11259, + "Ġplenty": 11260, + "ĠCross": 11261, + "ĉret": 11262, + "dro": 11263, + "ĠCast": 11264, + "=true": 11265, + "ĠChris": 11266, + "icio": 11267, + "ĠMike": 11268, + "Decimal": 11269, + "addComponent": 11270, + "Len": 11271, + "Ġcock": 11272, + "Ġ#{": 11273, + "URN": 11274, + "": 11403, + "Ġ*=": 11404, + "ĠPS": 11405, + "Ġdangerous": 11406, + "[p": 11407, + "OME": 11408, + "Other": 11409, + "ĠStringBuilder": 11410, + "Points": 11411, + "heading": 11412, + "Ġcurrency": 11413, + "Ġpercentage": 11414, + "_API": 11415, + "Ġclassic": 11416, + "thead": 11417, + "ĠMO": 11418, + "FE": 11419, + "Idx": 11420, + "await": 11421, + "Ġè": 11422, + "Ġaccident": 11423, + "Ġvariant": 11424, + "Ġmyst": 11425, + "ĠLand": 11426, + "ĠBre": 11427, + "Ġharm": 11428, + "ĠAcc": 11429, + "Ġcharged": 11430, + "iones": 11431, + "Visibility": 11432, + "arry": 11433, + "ĠLanguage": 11434, + "Ġwalking": 11435, + "\".ĊĊ": 11436, + "ifer": 11437, + "Ġleadership": 11438, + ".From": 11439, + "ynam": 11440, + "Ġtimestamp": 11441, + "ipt": 11442, + "ĠHas": 11443, + "REFER": 11444, + "ĠIts": 11445, + "Ġlistener": 11446, + "UTE": 11447, + "_description": 11448, + "Ġexperiences": 11449, + "Ġcreates": 11450, + "RS": 11451, + "cart": 11452, + "black": 11453, + "Ġchoices": 11454, + "war": 11455, + "Ġ'''": 11456, + "Ġordered": 11457, + "Ġevening": 11458, + "Ġpil": 11459, + "Ġtun": 11460, + "ĠBad": 11461, + "(app": 11462, + "random": 11463, + "Ġexplicit": 11464, + "Ġarrived": 11465, + "Ġfly": 11466, + "Ġeconom": 11467, + "-mail": 11468, + "Ġlists": 11469, + "Ġarchitect": 11470, + "ĠPay": 11471, + "Ġds": 11472, + "ĠSol": 11473, + "Ġvehicles": 11474, + "Hz": 11475, + "-com": 11476, + "Ġking": 11477, + "_equal": 11478, + "ĠHelp": 11479, + "Ġabuse": 11480, + "--;Ċ": 11481, + "Ġextr": 11482, + "Ġchemical": 11483, + "ä¿": 11484, + "Ġorient": 11485, + "Ġbreath": 11486, + "ĠSpace": 11487, + "(element": 11488, + "wait": 11489, + "DED": 11490, + "igma": 11491, + "Ġentr": 11492, + "Ġsob": 11493, + "-name": 11494, + "Ġaffected": 11495, + "ika": 11496, + "Ġcoal": 11497, + "_work": 11498, + "Ġhundreds": 11499, + "Ġpolitics": 11500, + "subject": 11501, + "Ġconsumer": 11502, + "ANGE": 11503, + "Ġrepeated": 11504, + "Send": 11505, + "Ġ#[": 11506, + "Ġprotocol": 11507, + "Ġleads": 11508, + "useum": 11509, + "Every": 11510, + "Import": 11511, + "(count": 11512, + "Ġchallenges": 11513, + "Ġnovel": 11514, + "Ġdepart": 11515, + "bits": 11516, + ".Current": 11517, + "Ġ`${": 11518, + "oting": 11519, + "(\\": 11520, + "Ġcreative": 11521, + "Ġbuff": 11522, + "Ġintroduced": 11523, + "usic": 11524, + "modules": 11525, + "Are": 11526, + "-doc": 11527, + "language": 11528, + "_cache": 11529, + "Ġtod": 11530, + "?>": 11531, + "omething": 11532, + "Ġhun": 11533, + "åº": 11534, + "aters": 11535, + "Intent": 11536, + "Ġimplemented": 11537, + "ĠCase": 11538, + "Children": 11539, + "Ġnotification": 11540, + "Renderer": 11541, + "Wrapper": 11542, + "Objects": 11543, + "tl": 11544, + ".Contains": 11545, + "Plugin": 11546, + ".row": 11547, + "Ġforg": 11548, + "Ġpermit": 11549, + "Ġtargets": 11550, + "ĠIF": 11551, + "Ġtip": 11552, + "sex": 11553, + "Ġsupports": 11554, + "Ġfold": 11555, + "photo": 11556, + "},čĊ": 11557, + "Ġgoogle": 11558, + "$('#": 11559, + "Ġsharing": 11560, + "Ġgoods": 11561, + "vs": 11562, + "ĠDan": 11563, + "Rate": 11564, + "ĠMartin": 11565, + "Ġmanner": 11566, + "lie": 11567, + ".The": 11568, + "Internal": 11569, + "ĠCONTR": 11570, + "Mock": 11571, + "RIGHT": 11572, + "Ġ'{": 11573, + "Ġcontrols": 11574, + "Mat": 11575, + "Ġmand": 11576, + "Ġextended": 11577, + "Ok": 11578, + "Ġembed": 11579, + "Ġplanet": 11580, + "ĠNon": 11581, + "-ch": 11582, + ")\",": 11583, + "epar": 11584, + "Ġbelieved": 11585, + "ĠEnvironment": 11586, + "ĠFriend": 11587, + "-res": 11588, + "Ġhandling": 11589, + "nic": 11590, + "-level": 11591, + "scri": 11592, + "Xml": 11593, + "BE": 11594, + "ungen": 11595, + "Ġalter": 11596, + "[idx": 11597, + "Pop": 11598, + "cam": 11599, + "Ġ(((": 11600, + "Ġshipping": 11601, + "Ġbattery": 11602, + "iddleware": 11603, + "MC": 11604, + "Ġimpl": 11605, + "otation": 11606, + "ĠLab": 11607, + "