diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md index 32ad602907d459ebc21681dc2b44508106bb1e63..6dcb24b7356f9f233e4eb2fb29abd14b185cb702 100644 --- a/README.md +++ b/README.md @@ -1,5 +1,19 @@ ---- -license: other -license_name: eva-llama3.3 -license_link: LICENSE ---- +--- +license: other +license_name: eva-llama3.3 +language: +- en +- fr +- it +- pt +- hi +- es +- th +- de +base_model: EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1 +base_model_relation: quantized +library_name: mlc-llm +pipeline_tag: text-generation +--- + +4-bit [OmniQuant](https://arxiv.org/abs/2308.13137) quantized version of [EVA-LLaMA-3.33-70B-v0.1](https://huggingface.co/EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1) for inference with the [Private LLM](https://privatellm.app/) app. diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d9e7e08f5c8e277065c653a7c72987d064f55208 --- /dev/null +++ b/config.json @@ -0,0 +1,5 @@ +{ + "quantization_config": { + "bits": 4 + } +} diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..11427aacb947edc6a3a654eab3c19103729f767a --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,11583 @@ +{ + "metadata": { + "ParamSize": 805, + "ParamBytes": 36381212672.0, + "BitsPerParam": 3.4891900844756822 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 525336576, + "records": [ + { + "name": "lm_head.q_weight", + "shape": [ + 1024, + 128256 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 525336576, + "byteOffset": 0 + } + ], + "md5sum": "9463c11aa916e8d00f7dba9df437be96" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.78.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ed7c6a6aa0e7ecf5f2fa84a744493480" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.78.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "96591622319bc56ba3fc23f88fdd6988" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.79.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "836a7b1d15472af2955c36b2a2704e84" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.79.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "ebc84cfbb1196e973893664323866b11" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 31145984, + "records": [ + { + "name": "lm_head.q_scale", + "shape": [ + 64, + 128256 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16416768, + "byteOffset": 0 + }, + { + "name": "model.layers.78.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 16416768 + }, + { + "name": "model.layers.78.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 16433152 + }, + { + "name": "model.layers.78.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 20103168 + }, + { + "name": "model.layers.78.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 27443200 + }, + { + "name": "model.layers.79.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 27459584 + }, + { + "name": "model.layers.79.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27475968 + } + ], + "md5sum": "98b5509835bd226703116d5b5437ee97" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.79.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "d48ecc4031adcef3b3cacb2773a49d2a" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.79.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "039e74bd1c029cad09492fb8f478d387" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 525336576, + "records": [ + { + "name": "model.embed_tokens.q_weight", + "shape": [ + 128256, + 1024 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 525336576, + "byteOffset": 0 + } + ], + "md5sum": "8f8eddcc9ecfb86aa2d20f11302df877" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.0.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "75be48e4828226b49a686983bf19da7c" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.0.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "14a8323db5942e10d6c9d7c082ef5919" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 29835264, + "records": [ + { + "name": "model.layers.79.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.79.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.79.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.79.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.norm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.embed_tokens.q_scale", + "shape": [ + 128256, + 64 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16416768, + "byteOffset": 9732096 + }, + { + "name": "model.layers.0.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26148864 + }, + { + "name": "model.layers.0.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 26165248 + } + ], + "md5sum": "e1ae687f6f46baeb959691e67f278535" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.0.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a61e7dc69e390c5722e95abef11c3919" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.0.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "170ab3acde005cf530ab4af89f90561b" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.1.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "72058bf8eb33f6afdb4a7ad4c1018e67" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.1.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "c465c5a8766bfa331e36efdb7355e4d2" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.1.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "03c0a14e892c15b9a559358863f5f680" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.1.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "e851a1af5ef295b14d3703a8e9f54665" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.2.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "e61b2efb815401069f9b2def978b9c58" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.2.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "a51d10f24fa3dae3d25c9f80e11a2e07" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.0.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.0.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.0.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.0.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.1.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 9715712 + }, + { + "name": "model.layers.1.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 17055744 + }, + { + "name": "model.layers.1.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 18366464 + }, + { + "name": "model.layers.1.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19415040 + }, + { + "name": "model.layers.1.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 19431424 + }, + { + "name": "model.layers.1.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.2.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.2.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "4ef1c66d880072fde28b623097a9a82e" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.2.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "1a8d4a91be2d07b406bbc8a398c104fc" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.2.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "ffe437f39fb0fd5bdb0563732471f6e2" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.3.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "9910ab20f5288c7a10c9240dd53e2840" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.3.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "053a01bd5ba0ea0089351408f2d2fac3" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.3.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "0ea75cab611b013e5ec914701b652b00" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.3.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "2e779970b8f3e0c9e15f823c032e2ae9" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.4.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "39cb198be9582dd0b93450149768572c" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.4.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a76cd7efa74c6848756e2d18322723fc" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.10.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d48e56ce14fcd80c2a189be5b0bbd84a" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.10.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "9b86501ed22a1d4f60619c8e1960b435" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 29163520, + "records": [ + { + "name": "model.layers.2.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.2.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.2.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.2.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.3.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.3.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.3.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.3.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.3.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.3.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.4.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.4.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 24428544 + }, + { + "name": "model.layers.10.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.10.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 25493504 + } + ], + "md5sum": "10909fdc28b653a1ee61ee6bd4b38119" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.10.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "7614b099ca5481ab63a6bc16c3a44a7a" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.10.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "b7cbd80f25c950b5297659b7f9f3642f" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.11.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "f5d7cee300d3e1443056ddb36ff25764" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.11.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "cea13a18f7cf6d4781637ba5215283be" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.11.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "88d6b5ddf048904f11ba671ea629e431" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.11.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0521100d3106a90ef3d68369088e7a45" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.12.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "fefb6a17acc74300c6201b57165c483a" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.12.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b22b73437223d77a27cb9672b1056fb5" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.12.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "aa7d59eef0f5b396e6e0c4240ce9b9f4" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.9.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "7e4bdb0dd12c535ecba955795fc97adb" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 32833536, + "records": [ + { + "name": "model.layers.10.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.10.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.10.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.10.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.11.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.11.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.11.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.11.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.11.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.11.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.12.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 23117824 + }, + { + "name": "model.layers.12.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 30457856 + }, + { + "name": "model.layers.12.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 31768576 + }, + { + "name": "model.layers.9.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 32817152 + } + ], + "md5sum": "7d7ec284e1a04f1f10733cdee2f1a915" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.12.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d3c7a2e67c4e974df61f1baa780ecf6c" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.13.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b6e5216430fce77ea62ae1ec339d953e" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.13.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "9f37218f60cdab63fd474903ed63a483" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.13.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b2ca3eb5185917614cac1a09c6e90c2a" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.13.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "f17cc8be7388e8f8a63b617b517746ac" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.14.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3d9142aea1586a0d4383c9c989955ddc" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.14.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "8e9b30b04e68a3d3c9057932aa719c53" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 28147712, + "records": [ + { + "name": "model.layers.9.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.9.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.12.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.12.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.12.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11042816 + }, + { + "name": "model.layers.13.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11059200 + }, + { + "name": "model.layers.13.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 11075584 + }, + { + "name": "model.layers.13.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 14745600 + }, + { + "name": "model.layers.13.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22085632 + }, + { + "name": "model.layers.13.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 22102016 + }, + { + "name": "model.layers.13.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 23412736 + }, + { + "name": "model.layers.14.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24461312 + }, + { + "name": "model.layers.14.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 24477696 + } + ], + "md5sum": "151329e58eb34245d0b45cdb57b6414e" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.14.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "60c14a93ac696715e35bf87f2fe5a956" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.14.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "7fa3898a42c9bbf9c0dd9434a6d86586" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.15.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "933ba78b8804de5d3780329c40cee34e" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.15.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a59dbac06a2b3b3d0f95900f6e7ec653" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.15.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "56ceef031e350f3e864da3a1058d9177" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.15.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "cb709bc130af8c8e2290d9ab27ead341" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.16.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "15935204d95b65d883b7916ca6024c19" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.16.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "0a75725c10e90e1de64f30fa60505c9d" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.14.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.14.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.14.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.14.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.15.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 9715712 + }, + { + "name": "model.layers.15.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 11026432 + }, + { + "name": "model.layers.15.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 12075008 + }, + { + "name": "model.layers.15.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 12091392 + }, + { + "name": "model.layers.15.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 15761408 + }, + { + "name": "model.layers.15.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.16.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.16.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "ceac4c3955102971e8ce86ac844fbeb0" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.16.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "4635280724b64d65ebd9b5209e38fd38" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.16.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0021bdb179372cfab669e8f5fd107525" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.17.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ec2f99476978296b9ac03440f7c4f431" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.17.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "5895ca03e0d55b89df3c4e78840d3712" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.17.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "6836e5629c040b6f7514bcc792ef2c68" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.17.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c9552b20adb7a72f6534630f4f9aa02e" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.18.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "e9c18750ceff68937b1dec5da8602d91" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.18.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "80b7d2e0d45a01288472ae1eacf4c790" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.18.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "42dcef1be1f8217cec575de9eb9e74ec" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 28114944, + "records": [ + { + "name": "model.layers.16.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.16.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.16.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.16.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.17.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.17.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.17.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.17.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.17.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.17.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.18.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.18.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.18.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 24444928 + } + ], + "md5sum": "3e30468d43bdd5b716945849c81d4c57" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.18.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "4c31b81b5446af31aa7189d0c1b7f844" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.19.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "bc340a9903caf93c28a20aae8d7c0ae9" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.19.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "2a8678e207a6c4279e76592a18e985a3" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.19.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "1a59ecd95e8fe2e908aa5a91d31adb1b" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.19.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "65ca1d34ea5f8aa6c0d0e0b53e139131" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.20.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "010df8f484ac575fb6502c7dd01f026a" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.20.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "630091234e54fb223b3c9eb9787d5f0f" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.20.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "1f731b4c5dc1816ae2b95a070401e833" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 32817152, + "records": [ + { + "name": "model.layers.18.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.18.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.18.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 7356416 + }, + { + "name": "model.layers.19.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 8404992 + }, + { + "name": "model.layers.19.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 8421376 + }, + { + "name": "model.layers.19.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 12091392 + }, + { + "name": "model.layers.19.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19431424 + }, + { + "name": "model.layers.19.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 19447808 + }, + { + "name": "model.layers.19.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 20758528 + }, + { + "name": "model.layers.20.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 21807104 + }, + { + "name": "model.layers.20.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 25477120 + } + ], + "md5sum": "79688258c802dc121ac0a78b529f37d9" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.20.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "e96945208ed586940098d622f91a5b48" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.21.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "4b393c3a59fa0ce73eea3d08ec4e5b77" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.21.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "3679ccfc69f518a8de2f3dec63bd417d" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.21.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "2b9b304498ea65115cedf45554850c30" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.21.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "1edc3bb2e97234c0eed88e2955b6b170" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.22.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ea21ce201eec8bdc4d7a0d4918be4a1b" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.22.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "d7d8aadc1cc3a62125634088153ee503" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.22.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "3550792111bb0424df33618a8faa7b57" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.22.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a570279de6e39c435e910f28b58353e2" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.23.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "7caeb3316a204ba318af2d52731eef75" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 29196288, + "records": [ + { + "name": "model.layers.20.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 0 + }, + { + "name": "model.layers.20.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 1310720 + }, + { + "name": "model.layers.20.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.20.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2375680 + }, + { + "name": "model.layers.21.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2392064 + }, + { + "name": "model.layers.21.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2408448 + }, + { + "name": "model.layers.21.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6078464 + }, + { + "name": "model.layers.21.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13418496 + }, + { + "name": "model.layers.21.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 13434880 + }, + { + "name": "model.layers.21.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 14745600 + }, + { + "name": "model.layers.22.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15794176 + }, + { + "name": "model.layers.22.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 15810560 + }, + { + "name": "model.layers.22.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 19480576 + }, + { + "name": "model.layers.22.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26820608 + }, + { + "name": "model.layers.22.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 26836992 + }, + { + "name": "model.layers.22.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 28147712 + } + ], + "md5sum": "189df3a85696d86f5ce3fca83043b7ef" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.23.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "3c091a5e9984759c70c1c0bbf58b8e19" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.23.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "31a27e8c43f07df555b2318e3ae2c909" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.23.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "5ff5ba383668363838bd90d1fc688d21" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.24.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "970d01ef8652ccf4df674264fb71d7d2" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.24.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "e19e9db80c6adc3b6ff0df7458b0c127" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.24.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "23ae674530ee524c1d072bc6994f3dc3" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.24.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "91bf0a9b4a02999f875e90794e7f6dd2" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.25.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "50e37eb46ad932cc31e1ad5fce518efd" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.25.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "7d85ebc352904600a0390c04a830101d" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 30490624, + "records": [ + { + "name": "model.layers.23.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.23.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.23.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.23.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.23.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9715712 + }, + { + "name": "model.layers.23.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.24.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13402112 + }, + { + "name": "model.layers.24.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 13418496 + }, + { + "name": "model.layers.24.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 17088512 + }, + { + "name": "model.layers.24.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.24.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 24444928 + }, + { + "name": "model.layers.24.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 25755648 + }, + { + "name": "model.layers.25.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26804224 + }, + { + "name": "model.layers.25.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 26820608 + } + ], + "md5sum": "372ee7207b97ba716e1ea93f4d7d3258" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.25.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "9b2dd74c359bfedd1975ee02f391e234" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.25.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "120dd5add6e56a533e83f60bff8693f0" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.26.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "3b66b8d870ce2862714e1c0039f9c61b" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.26.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c0e4f6819ec4982e9312c7e93d1fbb5c" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.26.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "77f30e6789dc3dbfcd6498ef92a319e0" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.26.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "3ba4cae978f181aeb8398644ea57b561" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.27.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d0f222932599d53165c75e42720f2c7e" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.27.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "b44395d95f38257dd6b2f01d6b9660a4" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.25.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.25.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.25.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.25.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.26.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 9715712 + }, + { + "name": "model.layers.26.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 11026432 + }, + { + "name": "model.layers.26.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 12075008 + }, + { + "name": "model.layers.26.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 12091392 + }, + { + "name": "model.layers.26.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 15761408 + }, + { + "name": "model.layers.26.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.27.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.27.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "76c947f32d1300e408c38b724b3e6190" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.27.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "ced86524c28229e45b8d1a1ef53c6523" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.27.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "1c93a8af0a3f34438d478a05137634a9" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.28.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d9c15ef70b407d48c51469862f649a0c" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.28.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "8e4600f0aaf41c072abf4eeb6e55c67e" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.28.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "826dd27d74509d2ad0721f9f59e3d0f0" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.28.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "029262ab189adb910837b274bca9c845" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.29.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "4c893f39e4d7031beb843dc1a443786b" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.29.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "61b063176aaba9411fc0b8afc08dcbb8" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.29.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "f2bc8e6c74b185609dd30333eff49111" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 28114944, + "records": [ + { + "name": "model.layers.27.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.27.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.27.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.27.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.28.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.28.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.28.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.28.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.28.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.28.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.29.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.29.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.29.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 24444928 + } + ], + "md5sum": "a3b5bd2cc43e04a4fc8047123800ad95" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.29.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "8d7315be2425acacf783aeadc07f876b" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.30.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2ba7006a9018e6c3844c102030e2d68b" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.30.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "ef149f2020c32fb00431bef8df5c8506" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.30.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "61a08e7f6b75dc9c74df5709c1e997c3" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.30.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "282011a8944301090e76ee10dca86d48" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.31.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "83a16aabd66f70c7a6b842279b2209dd" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.31.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "03417ca73a25756be970e3e850957455" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.31.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "d0b109f35fb8fff0fa2eaf978188db30" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 32817152, + "records": [ + { + "name": "model.layers.29.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.29.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.29.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 7356416 + }, + { + "name": "model.layers.30.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 8404992 + }, + { + "name": "model.layers.30.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 8421376 + }, + { + "name": "model.layers.30.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 12091392 + }, + { + "name": "model.layers.30.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19431424 + }, + { + "name": "model.layers.30.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 19447808 + }, + { + "name": "model.layers.30.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 20758528 + }, + { + "name": "model.layers.31.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 21807104 + }, + { + "name": "model.layers.31.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 25477120 + } + ], + "md5sum": "f0dfdeb73d7dfcf557c52a2b880ee90e" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.31.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "82bd7f8f22a50a107999b660dd4050ce" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.32.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "753772091e7dcbfabcc065344301d5f5" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.32.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "90ee38e5508b6694d8fd920083ba416c" + }, + { + "dataPath": "params_shard_131.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.32.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "40655e1a879075e1483a9ae9b96dab38" + }, + { + "dataPath": "params_shard_132.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.32.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "89b46bcccbb84d51917ad46a5c7274cf" + }, + { + "dataPath": "params_shard_133.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.33.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "426593d25df1a6f0cd644cdca9143aa9" + }, + { + "dataPath": "params_shard_134.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.33.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "0ebbcdec6abce06835aded9cd2060f8f" + }, + { + "dataPath": "params_shard_135.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.33.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "4be47783032c0810a55c24d1096ac558" + }, + { + "dataPath": "params_shard_136.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.33.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c5014906cdb7610a6d380e7fe52248ac" + }, + { + "dataPath": "params_shard_137.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.34.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "a29881669a7da2317cbcfc3139687bb0" + }, + { + "dataPath": "params_shard_138.bin", + "format": "raw-shard", + "nbytes": 29196288, + "records": [ + { + "name": "model.layers.31.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 0 + }, + { + "name": "model.layers.31.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 1310720 + }, + { + "name": "model.layers.31.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.31.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2375680 + }, + { + "name": "model.layers.32.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2392064 + }, + { + "name": "model.layers.32.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2408448 + }, + { + "name": "model.layers.32.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6078464 + }, + { + "name": "model.layers.32.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13418496 + }, + { + "name": "model.layers.32.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 13434880 + }, + { + "name": "model.layers.32.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 14745600 + }, + { + "name": "model.layers.33.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15794176 + }, + { + "name": "model.layers.33.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 15810560 + }, + { + "name": "model.layers.33.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 19480576 + }, + { + "name": "model.layers.33.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26820608 + }, + { + "name": "model.layers.33.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 26836992 + }, + { + "name": "model.layers.33.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 28147712 + } + ], + "md5sum": "663d3ea5f79a75908464348acb765e8e" + }, + { + "dataPath": "params_shard_139.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.34.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "77aa1ddafd191694e2276564819ba799" + }, + { + "dataPath": "params_shard_140.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.34.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "5bd086430fe6f3cc2e30b6acb6e67445" + }, + { + "dataPath": "params_shard_141.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.34.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3deac5887425daa9cfd51f96750046db" + }, + { + "dataPath": "params_shard_142.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.35.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2bec1b5a0b3b1d723dd5e6379c4edf19" + }, + { + "dataPath": "params_shard_143.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.35.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "485f512b0e06f534d70519b130c3e916" + }, + { + "dataPath": "params_shard_144.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.35.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "8f4c7cf4e3c36d0e6c54f0a129e80a26" + }, + { + "dataPath": "params_shard_145.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.35.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "d5bd5e47a5d4cfdb2af72392637b0b4b" + }, + { + "dataPath": "params_shard_146.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.36.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "e19354f1776a32641e4e8c2a8e0b6672" + }, + { + "dataPath": "params_shard_147.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.36.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "640784ade41a60fe229d272addc4b46f" + }, + { + "dataPath": "params_shard_148.bin", + "format": "raw-shard", + "nbytes": 30490624, + "records": [ + { + "name": "model.layers.34.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.34.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.34.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.34.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.34.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9715712 + }, + { + "name": "model.layers.34.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.35.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13402112 + }, + { + "name": "model.layers.35.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 13418496 + }, + { + "name": "model.layers.35.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 17088512 + }, + { + "name": "model.layers.35.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.35.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 24444928 + }, + { + "name": "model.layers.35.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 25755648 + }, + { + "name": "model.layers.36.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26804224 + }, + { + "name": "model.layers.36.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 26820608 + } + ], + "md5sum": "d586f5d8ca62622166e25e2a8e8f4956" + }, + { + "dataPath": "params_shard_149.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.36.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "7f3909da8cb310b5e5189b16499ec26e" + }, + { + "dataPath": "params_shard_150.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.36.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "4ad60e8b457bed9a04d0ddaf1619895a" + }, + { + "dataPath": "params_shard_151.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.37.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "1e67e4ac8eb1a87c9a30a7a9ba32367a" + }, + { + "dataPath": "params_shard_152.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.37.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "75d8700f0063d0908f63cff8f5fb9c0a" + }, + { + "dataPath": "params_shard_153.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.37.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c2d06a0ccb749276be578e2eb936674c" + }, + { + "dataPath": "params_shard_154.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.37.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "e29f6d10bdebdd6331becbf8a9cab7eb" + }, + { + "dataPath": "params_shard_155.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.38.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "8461d5551bcf1879743f3c343b7fa4bd" + }, + { + "dataPath": "params_shard_156.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.38.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "6b0e2961f8575695eceda7da9d0f37f2" + }, + { + "dataPath": "params_shard_157.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.36.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.36.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.36.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.36.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.37.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 9715712 + }, + { + "name": "model.layers.37.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 11026432 + }, + { + "name": "model.layers.37.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 12075008 + }, + { + "name": "model.layers.37.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 12091392 + }, + { + "name": "model.layers.37.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 15761408 + }, + { + "name": "model.layers.37.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.38.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.38.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "316df4deccd7162dd6e30c2092474bc8" + }, + { + "dataPath": "params_shard_158.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.38.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "81d410a47b6cac2426f6f07950e877f8" + }, + { + "dataPath": "params_shard_159.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.38.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "f39227cdf637de8cbd097c5f0a0d99bd" + }, + { + "dataPath": "params_shard_160.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.39.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c1e46448472daf986a929aebf05d4f4e" + }, + { + "dataPath": "params_shard_161.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.39.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "de7c5bb6475035ab7a180fc2e017ebba" + }, + { + "dataPath": "params_shard_162.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.39.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b5b0f55068dea712df0e8ba8004c6b65" + }, + { + "dataPath": "params_shard_163.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.39.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "26ace1cb06dbd77d13c298d8b82c0f9a" + }, + { + "dataPath": "params_shard_164.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.40.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "79794fc05c8bc5aca1041ae559c6347e" + }, + { + "dataPath": "params_shard_165.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.4.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2c686523f9431d5fa6bc5db9408fea67" + }, + { + "dataPath": "params_shard_166.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.4.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "9ce6b6cd14b48055171830eebe8f9df8" + }, + { + "dataPath": "params_shard_167.bin", + "format": "raw-shard", + "nbytes": 28114944, + "records": [ + { + "name": "model.layers.38.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.38.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.38.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.38.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.39.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.39.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.39.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.39.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.39.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.39.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.40.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.4.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 24428544 + }, + { + "name": "model.layers.4.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 24444928 + } + ], + "md5sum": "b409dc54596956045d0f2013365e66f9" + }, + { + "dataPath": "params_shard_168.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.5.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "191ad6585549931365b82d2939134c40" + }, + { + "dataPath": "params_shard_169.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.5.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "fb84db30c70c25d2113b2336ab1ab225" + }, + { + "dataPath": "params_shard_170.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.5.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "e720da8276c1de86caad1c080f54f9e7" + }, + { + "dataPath": "params_shard_171.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.5.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "3c08c5d13cf8103e2747bab19e4e05e5" + }, + { + "dataPath": "params_shard_172.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.6.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3a4e6d152b292e1e29d0d74998048145" + }, + { + "dataPath": "params_shard_173.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.6.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "a5d661aed048bedbd0e7f35142eff7d5" + }, + { + "dataPath": "params_shard_174.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.6.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "f397fab706e9d6ccb0d644b441d9008e" + }, + { + "dataPath": "params_shard_175.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.6.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "8b81771cdb143052502875bcf7a3ef98" + }, + { + "dataPath": "params_shard_176.bin", + "format": "raw-shard", + "nbytes": 33112064, + "records": [ + { + "name": "model.layers.4.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.4.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.5.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.5.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.5.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 11042816 + }, + { + "name": "model.layers.5.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 18382848 + }, + { + "name": "model.layers.5.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 18399232 + }, + { + "name": "model.layers.5.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 19709952 + }, + { + "name": "model.layers.6.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.6.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 20774912 + }, + { + "name": "model.layers.6.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 24444928 + }, + { + "name": "model.layers.6.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31784960 + }, + { + "name": "model.layers.6.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 31801344 + } + ], + "md5sum": "f49b36e162d1e5b17137044a41769b47" + }, + { + "dataPath": "params_shard_177.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.7.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "06451d52a9500921ccc360709a8e2714" + }, + { + "dataPath": "params_shard_178.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.40.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "17f4a68fd756d3ed6be4579bbfae3bb3" + }, + { + "dataPath": "params_shard_179.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.40.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "f2bf1cebb48b24a0abb1f49eecbe1799" + }, + { + "dataPath": "params_shard_180.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.40.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "530182c82d9beab2a0e368096986b3bb" + }, + { + "dataPath": "params_shard_181.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.41.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3d011576606c0a00e2746c6afb881fb0" + }, + { + "dataPath": "params_shard_182.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.41.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "3dec439d891afa5ad12373c854944763" + }, + { + "dataPath": "params_shard_183.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.41.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "c7d950dcbb3a5b46997819685d0795cc" + }, + { + "dataPath": "params_shard_184.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.41.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "b29643ef87dfc30a32f0d0a67291e777" + }, + { + "dataPath": "params_shard_185.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.42.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "70a98791b86571e1641232dbb985c0a5" + }, + { + "dataPath": "params_shard_186.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.42.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "26d211ba334f1a1921acdffcf68497e2" + }, + { + "dataPath": "params_shard_187.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.6.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "model.layers.7.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 1048576 + }, + { + "name": "model.layers.40.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.40.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2375680 + }, + { + "name": "model.layers.40.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6045696 + }, + { + "name": "model.layers.40.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.40.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 13402112 + }, + { + "name": "model.layers.41.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 14450688 + }, + { + "name": "model.layers.41.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 14467072 + }, + { + "name": "model.layers.41.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 18137088 + }, + { + "name": "model.layers.41.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.41.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25493504 + }, + { + "name": "model.layers.41.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26804224 + }, + { + "name": "model.layers.42.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "61605444fe236d9509650de778f667fa" + }, + { + "dataPath": "params_shard_188.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.42.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b03c085a6e1c0b9d35a3bc75b2ff7d25" + }, + { + "dataPath": "params_shard_189.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.42.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "6c5299fbd419d58db5e6963fa58a19a1" + }, + { + "dataPath": "params_shard_190.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.43.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "5929c338eb01797036979835857dff10" + }, + { + "dataPath": "params_shard_191.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.43.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "b7d999778853421d617cb2567e98aaf9" + }, + { + "dataPath": "params_shard_192.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.43.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "667f3883c9e285f161b602b8927e931d" + }, + { + "dataPath": "params_shard_193.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.43.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c408bb0c9004ea2d423d09d50e91289d" + }, + { + "dataPath": "params_shard_194.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.44.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "23c17a07a11417c8da222d9cbbf449db" + }, + { + "dataPath": "params_shard_195.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.44.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "fdfb6d673bae818c84a13212c54eda0a" + }, + { + "dataPath": "params_shard_196.bin", + "format": "raw-shard", + "nbytes": 26820608, + "records": [ + { + "name": "model.layers.42.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.42.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.42.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.42.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.42.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.43.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9732096 + }, + { + "name": "model.layers.43.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9748480 + }, + { + "name": "model.layers.43.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13418496 + }, + { + "name": "model.layers.43.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.43.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20774912 + }, + { + "name": "model.layers.43.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22085632 + }, + { + "name": "model.layers.44.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23134208 + }, + { + "name": "model.layers.44.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23150592 + } + ], + "md5sum": "f3350cf0719a56a1615ce1239073084c" + }, + { + "dataPath": "params_shard_197.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.44.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "8ea00796a378d243cd0212722fbdfefc" + }, + { + "dataPath": "params_shard_198.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.44.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "60111112a0f357fb526cd8b4b401ece0" + }, + { + "dataPath": "params_shard_199.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.45.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "d8f2b085821bea719f49ee86bad9fb26" + }, + { + "dataPath": "params_shard_200.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.45.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "163e4ea6728c35daca4b775aad18acd7" + }, + { + "dataPath": "params_shard_201.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.45.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "abc7682ebf421676e907352aa3edc549" + }, + { + "dataPath": "params_shard_202.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.45.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "9282478cca6ad4022b24926a5a093d41" + }, + { + "dataPath": "params_shard_203.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.46.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d9a6c0e52ed014a2dfa765ad36ad80d0" + }, + { + "dataPath": "params_shard_204.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.46.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "0dc6fc0c29d8dd6888cd6ec007f4154e" + }, + { + "dataPath": "params_shard_205.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.44.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.44.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.44.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.44.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.45.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 9715712 + }, + { + "name": "model.layers.45.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 17055744 + }, + { + "name": "model.layers.45.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 18366464 + }, + { + "name": "model.layers.45.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19415040 + }, + { + "name": "model.layers.45.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 19431424 + }, + { + "name": "model.layers.45.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.46.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.46.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "cb3601147ddd64ed931971fdabcd17a9" + }, + { + "dataPath": "params_shard_206.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.46.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "9fea46687b47aa1d525b56d876821c6f" + }, + { + "dataPath": "params_shard_207.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.46.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "d2cc008dc7a06027665281bd5a3458b9" + }, + { + "dataPath": "params_shard_208.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.47.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ff283919686d5effb41b0b0a37f9e190" + }, + { + "dataPath": "params_shard_209.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.47.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "1d44aef620d24a8578556968c8a97d9a" + }, + { + "dataPath": "params_shard_210.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.47.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a5c391467bef959560969b342a3462b8" + }, + { + "dataPath": "params_shard_211.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.47.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "1d3239614c2b771277a3ce7a21f9646d" + }, + { + "dataPath": "params_shard_212.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.48.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a69e7c99b0508def4718f35bcd108243" + }, + { + "dataPath": "params_shard_213.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.48.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "8ae38a6431d1ec71845e43b7d3f3ab4f" + }, + { + "dataPath": "params_shard_214.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.48.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b848b12413a2f7c220964b44103ce95c" + }, + { + "dataPath": "params_shard_215.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.48.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "db3b18ba3ccdc784bc44d890fc31f40f" + }, + { + "dataPath": "params_shard_216.bin", + "format": "raw-shard", + "nbytes": 29163520, + "records": [ + { + "name": "model.layers.46.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.46.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.46.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.46.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.47.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.47.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.47.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.47.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.47.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.47.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.48.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.48.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 24428544 + }, + { + "name": "model.layers.48.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.48.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 25493504 + } + ], + "md5sum": "6f1858db3d43073a9cf086d680d0c73c" + }, + { + "dataPath": "params_shard_217.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.49.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d3b4da709fb461d6273ce453f7946049" + }, + { + "dataPath": "params_shard_218.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.49.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "85b28cab6d3a92f8466d4a6657b93de7" + }, + { + "dataPath": "params_shard_219.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.49.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "cb38faf29da247131332a862faa187ab" + }, + { + "dataPath": "params_shard_220.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.49.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "482c120959ba08527f9725dccec951a4" + }, + { + "dataPath": "params_shard_221.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.50.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "f5c9ca431a0abebc89a97d808594ba20" + }, + { + "dataPath": "params_shard_222.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.50.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "800cd945dcc3c12c23909bba1d8724b0" + }, + { + "dataPath": "params_shard_223.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.50.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "4b4e1a79642e0f0cd8570689014cb6cf" + }, + { + "dataPath": "params_shard_224.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.50.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "6916c12ccde77524a0e734d6f42f099f" + }, + { + "dataPath": "params_shard_225.bin", + "format": "raw-shard", + "nbytes": 33112064, + "records": [ + { + "name": "model.layers.48.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.48.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.49.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.49.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.49.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 11042816 + }, + { + "name": "model.layers.49.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 18382848 + }, + { + "name": "model.layers.49.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 18399232 + }, + { + "name": "model.layers.49.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 19709952 + }, + { + "name": "model.layers.50.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.50.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 20774912 + }, + { + "name": "model.layers.50.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 24444928 + }, + { + "name": "model.layers.50.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31784960 + }, + { + "name": "model.layers.50.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 31801344 + } + ], + "md5sum": "d771479e7942ea53084885b8759a7bb3" + }, + { + "dataPath": "params_shard_226.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.51.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "0ddc2f5bc25c37d01bc9d8f93c24fb8f" + }, + { + "dataPath": "params_shard_227.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.51.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "14de0b66d528cf885ccb94340b3d98a2" + }, + { + "dataPath": "params_shard_228.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.51.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "d665ad055d7477f47125aa03eef5ba0f" + }, + { + "dataPath": "params_shard_229.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.51.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "5ef196f87911faa89f84938a6c7ebb4b" + }, + { + "dataPath": "params_shard_230.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.52.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "1db79a68b971390382ea97fd69a9eb51" + }, + { + "dataPath": "params_shard_231.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.52.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "5fc8c490f03482279c099cbfc7a1ea11" + }, + { + "dataPath": "params_shard_232.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.52.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "72ef00b9dfd0ed8c4245cdebba0600f2" + }, + { + "dataPath": "params_shard_233.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.52.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "64b626ef74280aa70b05841254329b3f" + }, + { + "dataPath": "params_shard_234.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.53.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b8954120824feba5b85e3412fea947b1" + }, + { + "dataPath": "params_shard_235.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.53.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "03cc1ee790d09f972d50aea55ee08cc8" + }, + { + "dataPath": "params_shard_236.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.50.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "model.layers.51.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 1048576 + }, + { + "name": "model.layers.51.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.51.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2375680 + }, + { + "name": "model.layers.51.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6045696 + }, + { + "name": "model.layers.51.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.51.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 13402112 + }, + { + "name": "model.layers.52.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 14450688 + }, + { + "name": "model.layers.52.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 14467072 + }, + { + "name": "model.layers.52.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 18137088 + }, + { + "name": "model.layers.52.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.52.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25493504 + }, + { + "name": "model.layers.52.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26804224 + }, + { + "name": "model.layers.53.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "d28ea9cc567e78232cc12b5fc3fc05c0" + }, + { + "dataPath": "params_shard_237.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.53.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "3e5132e7db9b37f0f163ad32c2e662f9" + }, + { + "dataPath": "params_shard_238.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.53.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "dc3d44d37d005d1d91fa09f9e9212eea" + }, + { + "dataPath": "params_shard_239.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.54.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "5cb3e5bf84ca2e445edf8c07a172bd9d" + }, + { + "dataPath": "params_shard_240.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.54.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "b487174f550a12a29413cff95b33f8a1" + }, + { + "dataPath": "params_shard_241.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.54.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "ebcc56ce54f3d62bfa4e4967f2069e43" + }, + { + "dataPath": "params_shard_242.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.54.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "01eec3599893e412eaa96d2261969f07" + }, + { + "dataPath": "params_shard_243.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.55.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "40353563945bf09bc27bc19e34117619" + }, + { + "dataPath": "params_shard_244.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.55.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "66914c19b6601cf2a6a54f72e1aa244a" + }, + { + "dataPath": "params_shard_245.bin", + "format": "raw-shard", + "nbytes": 26820608, + "records": [ + { + "name": "model.layers.53.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.53.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.53.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.53.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.53.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.54.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9732096 + }, + { + "name": "model.layers.54.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9748480 + }, + { + "name": "model.layers.54.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13418496 + }, + { + "name": "model.layers.54.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.54.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20774912 + }, + { + "name": "model.layers.54.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22085632 + }, + { + "name": "model.layers.55.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23134208 + }, + { + "name": "model.layers.55.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23150592 + } + ], + "md5sum": "8113da9a83fd07a9c8ef903e35ccb010" + }, + { + "dataPath": "params_shard_246.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.55.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a1c1e26163299aa7af2a33f7696daf90" + }, + { + "dataPath": "params_shard_247.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.55.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "aa7b58fd9277d2b7476a1e53176b0330" + }, + { + "dataPath": "params_shard_248.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.56.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "afa3a9d800546f9ce59b8077819118df" + }, + { + "dataPath": "params_shard_249.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.56.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "eaf19ec8ed914ac77914094de94bf424" + }, + { + "dataPath": "params_shard_250.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.56.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "25c12572c958c206f5f3693388fe9e27" + }, + { + "dataPath": "params_shard_251.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.56.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ca8dc7a29d2709de52b18da815e20e51" + }, + { + "dataPath": "params_shard_252.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.57.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c257be2b35e2cbf48bc7cad5a2df95be" + }, + { + "dataPath": "params_shard_253.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.57.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "ec6035c36d50ffaf2b5f78d4637e6155" + }, + { + "dataPath": "params_shard_254.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.55.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.55.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.55.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.55.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.56.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 9715712 + }, + { + "name": "model.layers.56.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 17055744 + }, + { + "name": "model.layers.56.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 18366464 + }, + { + "name": "model.layers.56.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19415040 + }, + { + "name": "model.layers.56.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 19431424 + }, + { + "name": "model.layers.56.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.57.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.57.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "d71be3e68748a7ae68507ad4e02f40e0" + }, + { + "dataPath": "params_shard_255.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.57.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "75e455e948ff6f8d85ac27980ac360b2" + }, + { + "dataPath": "params_shard_256.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.57.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "309798ce26b05daa9f3f8ecfe45d0a2f" + }, + { + "dataPath": "params_shard_257.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.58.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c53a86f522aed4a394a8674561a752c3" + }, + { + "dataPath": "params_shard_258.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.58.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "f5b93d0226f4f741d3fdd496a44d192c" + }, + { + "dataPath": "params_shard_259.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.58.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "388a10c79fa4096b8e1487472528f097" + }, + { + "dataPath": "params_shard_260.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.58.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "46fad40110c820f00e2b233cb8673585" + }, + { + "dataPath": "params_shard_261.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.59.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "5a07670e70b6cede22a91ee102f0182b" + }, + { + "dataPath": "params_shard_262.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.59.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a0b9cf65a8dd57f201dde5ae2b4659e1" + }, + { + "dataPath": "params_shard_263.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.59.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "cf67d6e45299c98c5ee5729e3917c6bd" + }, + { + "dataPath": "params_shard_264.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.59.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "240dddfc43bd0b6f129331e44b44a821" + }, + { + "dataPath": "params_shard_265.bin", + "format": "raw-shard", + "nbytes": 29163520, + "records": [ + { + "name": "model.layers.57.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.57.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.57.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.57.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.58.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.58.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.58.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.58.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.58.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.58.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.59.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.59.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 24428544 + }, + { + "name": "model.layers.59.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.59.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 25493504 + } + ], + "md5sum": "b60202c47fac3afd632d9ac670faac5f" + }, + { + "dataPath": "params_shard_266.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.60.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "6e34b66c4e59c0172071fb2ef4a2dc95" + }, + { + "dataPath": "params_shard_267.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.60.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "e94fd11141927d86902e41531ec43fc5" + }, + { + "dataPath": "params_shard_268.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.60.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "8104a6a6d98751f4a807c9a025f03c89" + }, + { + "dataPath": "params_shard_269.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.60.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "9ed3ce7d2929688676fdc89137183356" + }, + { + "dataPath": "params_shard_270.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.61.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "aaa387bb67acfdb1fe626989b43cdda3" + }, + { + "dataPath": "params_shard_271.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.61.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "f8d64b92139f6b8d19ad553ecb9ec71c" + }, + { + "dataPath": "params_shard_272.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.61.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "eb8be11590793ffb76a9f5a92a30b1a7" + }, + { + "dataPath": "params_shard_273.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.61.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "2e2004200274040f5d334ceb81234ad1" + }, + { + "dataPath": "params_shard_274.bin", + "format": "raw-shard", + "nbytes": 33112064, + "records": [ + { + "name": "model.layers.59.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.59.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.60.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.60.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.60.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 11042816 + }, + { + "name": "model.layers.60.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 18382848 + }, + { + "name": "model.layers.60.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 18399232 + }, + { + "name": "model.layers.60.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 19709952 + }, + { + "name": "model.layers.61.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.61.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 20774912 + }, + { + "name": "model.layers.61.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 24444928 + }, + { + "name": "model.layers.61.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31784960 + }, + { + "name": "model.layers.61.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 31801344 + } + ], + "md5sum": "8e34af529454fa3352481dd821a9db0a" + }, + { + "dataPath": "params_shard_275.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.62.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "39acc7ea0f22d30103f6683c1558fc1c" + }, + { + "dataPath": "params_shard_276.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.62.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "f9226be6c1ee5fa4e90909b780c88d06" + }, + { + "dataPath": "params_shard_277.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.62.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "5485a1fe880ee563e255a78a0796cfdd" + }, + { + "dataPath": "params_shard_278.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.62.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "3da09a5a12edf8267ae626c32351b995" + }, + { + "dataPath": "params_shard_279.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.63.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "7696e752f0a375154df695ea40c5d1ee" + }, + { + "dataPath": "params_shard_280.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.63.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "5160edc8ab8df92a51661d32b46b48cd" + }, + { + "dataPath": "params_shard_281.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.63.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "51dbf305e24ce01c3ba4dabaf2f9dfc6" + }, + { + "dataPath": "params_shard_282.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.63.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "08701a83c2806de0ff0f081911bea6e3" + }, + { + "dataPath": "params_shard_283.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.64.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "844fa12a9c50d1641eacb57a723eaa65" + }, + { + "dataPath": "params_shard_284.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.64.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "5fdf1a1ddabf0b395da4254cf874bfe4" + }, + { + "dataPath": "params_shard_285.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.61.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "model.layers.62.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 1048576 + }, + { + "name": "model.layers.62.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.62.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2375680 + }, + { + "name": "model.layers.62.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6045696 + }, + { + "name": "model.layers.62.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.62.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 13402112 + }, + { + "name": "model.layers.63.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 14450688 + }, + { + "name": "model.layers.63.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 14467072 + }, + { + "name": "model.layers.63.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 18137088 + }, + { + "name": "model.layers.63.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.63.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25493504 + }, + { + "name": "model.layers.63.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26804224 + }, + { + "name": "model.layers.64.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "7849f3bd1b9f7dee4e3402861c421cc0" + }, + { + "dataPath": "params_shard_286.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.64.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "3198e3354ffa3dc45a8ae53ce6c2c591" + }, + { + "dataPath": "params_shard_287.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.64.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "b086d32c90d2988a2d996fd675d206b1" + }, + { + "dataPath": "params_shard_288.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.65.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "e7a565ecce03d60d4bc860084308d39c" + }, + { + "dataPath": "params_shard_289.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.65.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "973588fb4b511437a274a8e7bd9d201a" + }, + { + "dataPath": "params_shard_290.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.65.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "75eb23877198ad6af29814170fecd8f0" + }, + { + "dataPath": "params_shard_291.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.65.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "cc912ad7a52e9c3ddbd1d4ce4a7ffec1" + }, + { + "dataPath": "params_shard_292.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.66.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "71dacccef95774e715c90b92db1571fe" + }, + { + "dataPath": "params_shard_293.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.66.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "9df55d7b6c36a50b07c9814fa06193ee" + }, + { + "dataPath": "params_shard_294.bin", + "format": "raw-shard", + "nbytes": 26820608, + "records": [ + { + "name": "model.layers.64.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.64.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.64.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.64.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.64.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.65.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9732096 + }, + { + "name": "model.layers.65.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9748480 + }, + { + "name": "model.layers.65.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13418496 + }, + { + "name": "model.layers.65.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.65.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20774912 + }, + { + "name": "model.layers.65.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22085632 + }, + { + "name": "model.layers.66.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23134208 + }, + { + "name": "model.layers.66.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23150592 + } + ], + "md5sum": "e84f6cd9b973d7dde01506ecf3407207" + }, + { + "dataPath": "params_shard_295.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.66.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "9c714c911c2d8abdb2661ed87aba1cb3" + }, + { + "dataPath": "params_shard_296.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.66.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "b64f04d0654d63e32b448c2a35e51ff6" + }, + { + "dataPath": "params_shard_297.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.67.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "8bd9e65bdf0058d9991c8ca3ac2cd1b0" + }, + { + "dataPath": "params_shard_298.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.67.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "bf62b4d766acd4457ed09ee9a13ea4bc" + }, + { + "dataPath": "params_shard_299.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.67.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "ed484bf3521d49669465e2a430771163" + }, + { + "dataPath": "params_shard_300.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.67.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b4b54e96016a9d90f631014e66cb92ac" + }, + { + "dataPath": "params_shard_301.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.68.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2a7d4a5ad9519436c196faa12991bbe1" + }, + { + "dataPath": "params_shard_302.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.68.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "77146290bcf8dc7b0e650b84fe9b3514" + }, + { + "dataPath": "params_shard_303.bin", + "format": "raw-shard", + "nbytes": 26804224, + "records": [ + { + "name": "model.layers.66.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.66.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.66.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.66.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.67.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 9715712 + }, + { + "name": "model.layers.67.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 17055744 + }, + { + "name": "model.layers.67.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 18366464 + }, + { + "name": "model.layers.67.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19415040 + }, + { + "name": "model.layers.67.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 19431424 + }, + { + "name": "model.layers.67.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23101440 + }, + { + "name": "model.layers.68.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23117824 + }, + { + "name": "model.layers.68.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23134208 + } + ], + "md5sum": "b466c1c505d6445311505c896dfbf8d0" + }, + { + "dataPath": "params_shard_304.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.68.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "ef8efe822e0f5a9e7ae34d4294f02f91" + }, + { + "dataPath": "params_shard_305.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.68.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "acd5bdc67c47ff71c307070e93309a24" + }, + { + "dataPath": "params_shard_306.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.69.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "23ffbfe400ac6f7fb0e6667c7a26e0bf" + }, + { + "dataPath": "params_shard_307.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.69.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "5291d8d1e732387e76d9e47fcc766362" + }, + { + "dataPath": "params_shard_308.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.69.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "9394c0d2ccd24a2439b0f75a511bf373" + }, + { + "dataPath": "params_shard_309.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.69.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "b0dda348500720cc0f8ba9086fe081fc" + }, + { + "dataPath": "params_shard_310.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.70.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "a36977944c96bbce927f64253ca1b30d" + }, + { + "dataPath": "params_shard_311.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.70.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "e167c0083ca579a217342c054063ea5d" + }, + { + "dataPath": "params_shard_312.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.7.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "a7d5853cb219e9981a1db91075cbdaa5" + }, + { + "dataPath": "params_shard_313.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.7.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "fd58597b45ce3193e6ebfed16b961416" + }, + { + "dataPath": "params_shard_314.bin", + "format": "raw-shard", + "nbytes": 29163520, + "records": [ + { + "name": "model.layers.68.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.68.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.68.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.68.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.69.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.69.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9732096 + }, + { + "name": "model.layers.69.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13402112 + }, + { + "name": "model.layers.69.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20742144 + }, + { + "name": "model.layers.69.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20758528 + }, + { + "name": "model.layers.69.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22069248 + }, + { + "name": "model.layers.70.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 23117824 + }, + { + "name": "model.layers.70.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 24428544 + }, + { + "name": "model.layers.7.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.7.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 25493504 + } + ], + "md5sum": "6544824af6890180ad570760a0e68750" + }, + { + "dataPath": "params_shard_315.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.7.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c2e70de44e732c98a7a109bb8dc55bf8" + }, + { + "dataPath": "params_shard_316.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.8.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "a36445b35d1080521d8aaff7173f7f69" + }, + { + "dataPath": "params_shard_317.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.8.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "711b0d6503cdce79d66bef836b6e614c" + }, + { + "dataPath": "params_shard_318.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.8.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "0ef48c31c99e1b75c6e26bb23dbbffda" + }, + { + "dataPath": "params_shard_319.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.8.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "413687e3f3f2a7adfd0cced58d248755" + }, + { + "dataPath": "params_shard_320.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.9.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2da288b879a5730832cd70a2a7c49de4" + }, + { + "dataPath": "params_shard_321.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.9.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "4d8258d73c1f1a8f545e1a528833358a" + }, + { + "dataPath": "params_shard_322.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.9.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "9b947ae875b144e76f616d47e7053b05" + }, + { + "dataPath": "params_shard_323.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.70.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "c7145ffe90194b0ce33b0916eeddf0f9" + }, + { + "dataPath": "params_shard_324.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.70.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "b1ef06c807f90c676603f4987c7ddbc1" + }, + { + "dataPath": "params_shard_325.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.7.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.7.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.7.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 7356416 + }, + { + "name": "model.layers.8.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 8404992 + }, + { + "name": "model.layers.8.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 8421376 + }, + { + "name": "model.layers.8.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 12091392 + }, + { + "name": "model.layers.8.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19431424 + }, + { + "name": "model.layers.8.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 19447808 + }, + { + "name": "model.layers.8.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 20758528 + }, + { + "name": "model.layers.9.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 21807104 + }, + { + "name": "model.layers.9.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25477120 + }, + { + "name": "model.layers.9.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26787840 + }, + { + "name": "model.layers.70.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 27836416 + }, + { + "name": "model.layers.70.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "b5629095d878e41adf439a5076962c2e" + }, + { + "dataPath": "params_shard_326.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.71.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "0f08a4e5c794fbad4611fdde2365eb1c" + }, + { + "dataPath": "params_shard_327.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.71.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "7b43e8c2333ce395f0846ead7313724e" + }, + { + "dataPath": "params_shard_328.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.71.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "7f38ff1848412a95f1d1be2d26acb0cf" + }, + { + "dataPath": "params_shard_329.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.71.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "bc173e6cd7b7751ff8b4570d4c8c9174" + }, + { + "dataPath": "params_shard_330.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.72.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b256e3504519c2452433c594656ba553" + }, + { + "dataPath": "params_shard_331.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.72.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "8968eff5f05cd68013f5705e0d4a49ee" + }, + { + "dataPath": "params_shard_332.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.72.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "da2950c6995e41cbba14bd60c2e6f092" + }, + { + "dataPath": "params_shard_333.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.72.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "b602f3a5f7fa1dc0ca0a83910010076f" + }, + { + "dataPath": "params_shard_334.bin", + "format": "raw-shard", + "nbytes": 33112064, + "records": [ + { + "name": "model.layers.70.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.70.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.71.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7356416 + }, + { + "name": "model.layers.71.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 7372800 + }, + { + "name": "model.layers.71.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 11042816 + }, + { + "name": "model.layers.71.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 18382848 + }, + { + "name": "model.layers.71.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 18399232 + }, + { + "name": "model.layers.71.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 19709952 + }, + { + "name": "model.layers.72.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.72.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 20774912 + }, + { + "name": "model.layers.72.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 24444928 + }, + { + "name": "model.layers.72.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31784960 + }, + { + "name": "model.layers.72.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 31801344 + } + ], + "md5sum": "e769dae7e61d12e566ce44d3e6bbe51b" + }, + { + "dataPath": "params_shard_335.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.73.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "b383a4776a7115b15a25c49e47222447" + }, + { + "dataPath": "params_shard_336.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.73.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "1ab5040953bcf2c1aeabb37ca72eb229" + }, + { + "dataPath": "params_shard_337.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.73.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "0df09c626c1c2a8babe4a89d336629f0" + }, + { + "dataPath": "params_shard_338.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.73.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0b0857cd8b8806639720028dbf2d3cb4" + }, + { + "dataPath": "params_shard_339.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.74.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3d2dff8e34c6d7a4396084e081914c49" + }, + { + "dataPath": "params_shard_340.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.74.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "5ecc150fce6c0b1c44eb2a0d227c546b" + }, + { + "dataPath": "params_shard_341.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.74.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "8e394dd30221178614e8a3ea06c42b5f" + }, + { + "dataPath": "params_shard_342.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.74.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0e0520a12868ce01cf97054f0efb5cb8" + }, + { + "dataPath": "params_shard_343.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.75.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2544d206107765e464ab361af06f93af" + }, + { + "dataPath": "params_shard_344.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.75.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "26337721be31f3513a39c529535e6920" + }, + { + "dataPath": "params_shard_345.bin", + "format": "raw-shard", + "nbytes": 31522816, + "records": [ + { + "name": "model.layers.72.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "model.layers.73.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 1048576 + }, + { + "name": "model.layers.73.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 2359296 + }, + { + "name": "model.layers.73.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 2375680 + }, + { + "name": "model.layers.73.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 6045696 + }, + { + "name": "model.layers.73.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 13385728 + }, + { + "name": "model.layers.73.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 13402112 + }, + { + "name": "model.layers.74.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 14450688 + }, + { + "name": "model.layers.74.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 14467072 + }, + { + "name": "model.layers.74.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 18137088 + }, + { + "name": "model.layers.74.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 25477120 + }, + { + "name": "model.layers.74.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 25493504 + }, + { + "name": "model.layers.74.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 26804224 + }, + { + "name": "model.layers.75.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 27852800 + } + ], + "md5sum": "4810cb81d5430512fb09a6ee4d6df179" + }, + { + "dataPath": "params_shard_346.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.75.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "527362986d09c2430207fb66198e3494" + }, + { + "dataPath": "params_shard_347.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.75.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "be706ca3e35941c460fe1beda72fe693" + }, + { + "dataPath": "params_shard_348.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.76.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "05f7770c809284c57f11ca14c120df2c" + }, + { + "dataPath": "params_shard_349.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.76.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "28161ff0ab2f11a9596370e304e90744" + }, + { + "dataPath": "params_shard_350.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.76.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "54dd52650eb66031520b4a2e51309c91" + }, + { + "dataPath": "params_shard_351.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.76.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "3d17d20f8f91a9d776252cbf4f1158eb" + }, + { + "dataPath": "params_shard_352.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "model.layers.77.mlp.down_proj.q_weight", + "shape": [ + 3584, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "38fd8aa4329b81f5502faf19fc6e3557" + }, + { + "dataPath": "params_shard_353.bin", + "format": "raw-shard", + "nbytes": 234881024, + "records": [ + { + "name": "model.layers.77.mlp.gate_up_proj.q_weight", + "shape": [ + 1024, + 57344 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 234881024, + "byteOffset": 0 + } + ], + "md5sum": "291b59c89611851656a7ab796121afe0" + }, + { + "dataPath": "params_shard_354.bin", + "format": "raw-shard", + "nbytes": 26820608, + "records": [ + { + "name": "model.layers.75.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.75.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7340032 + }, + { + "name": "model.layers.75.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8650752 + }, + { + "name": "model.layers.75.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9699328 + }, + { + "name": "model.layers.75.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9715712 + }, + { + "name": "model.layers.76.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 9732096 + }, + { + "name": "model.layers.76.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 9748480 + }, + { + "name": "model.layers.76.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 13418496 + }, + { + "name": "model.layers.76.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 20758528 + }, + { + "name": "model.layers.76.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 20774912 + }, + { + "name": "model.layers.76.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 22085632 + }, + { + "name": "model.layers.77.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23134208 + }, + { + "name": "model.layers.77.mlp.down_proj.q_scale", + "shape": [ + 224, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3670016, + "byteOffset": 23150592 + } + ], + "md5sum": "9f1d7e43338d2e1f3fc5660262fb081d" + }, + { + "dataPath": "params_shard_355.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.77.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "99efb87bbeecc42b76de491a669e3e20" + }, + { + "dataPath": "params_shard_356.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.77.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "e386d2414bdf25b64218e6c24b8d1c4c" + }, + { + "dataPath": "params_shard_357.bin", + "format": "raw-shard", + "nbytes": 41943040, + "records": [ + { + "name": "model.layers.78.self_attn.qkv_proj.q_weight", + "shape": [ + 1024, + 10240 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 41943040, + "byteOffset": 0 + } + ], + "md5sum": "7cbcb504c9c7c77a5a37a388bae51440" + }, + { + "dataPath": "params_shard_358.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.78.self_attn.o_proj.q_weight", + "shape": [ + 1024, + 8192 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "ba6e448fbf3b8acc11a7b19d320dd063" + }, + { + "dataPath": "params_shard_359.bin", + "format": "raw-shard", + "nbytes": 12075008, + "records": [ + { + "name": "model.layers.77.mlp.gate_up_proj.q_scale", + "shape": [ + 64, + 57344 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "model.layers.77.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 7340032 + }, + { + "name": "model.layers.77.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 7356416 + }, + { + "name": "model.layers.77.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 8667136 + }, + { + "name": "model.layers.78.self_attn.qkv_proj.q_scale", + "shape": [ + 64, + 10240 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1310720, + "byteOffset": 9715712 + }, + { + "name": "model.layers.78.self_attn.o_proj.q_scale", + "shape": [ + 64, + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1048576, + "byteOffset": 11026432 + } + ], + "md5sum": "84f23e4428dcadd4329d359bd990870b" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..f39d5693d4ce83d5d28cafa0bf961007f510bb2b --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337105c253138d50df4883c961cb6922a124ea2948623330d0996eac132b8d00 +size 525336576 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..62c021842f4d09fddb1e9227a309e49929da4a5e --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4325a8402afe94a7fc0fc550caaa0ab9245898bdccfcc230d4ffbd94aa924a6e +size 117440512 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d7c6ccdfe958f1c72e00bb93a54d304bc6650a8 --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5594b03b2becb3b8270c655ccffc01c9be0e8344428df00551799f22befd44e7 +size 234881024 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..db0244e977c3e82cb3a1910e1255a1cd3fd29dce --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:221cefc95ea3fbd1afdb2e182208e072aca03870128c48767649bcd1745521f1 +size 41943040 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..0dbe3d481ea4b0266c45796bec5c0f64c612bca4 --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e5801b61045c08c7d827643cb86b36e670b2b310652ae303addb3a5f153863a +size 33554432 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..735c9ddb8be7e73c29f08a7868cc25591d37c742 --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1416a5b909ad024f5902f1d4dc3545cf1baf80e364c621f634d68085e9e7ac7b +size 41943040 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0a2d7fafb93832a8042b7232b8559afcc724ef8 --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73e404debe7c5b72650cea02835c7608c78d37959bb95d6ef420768dce4d2a8 +size 33554432 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..efe1ad4269844c0a17c3815c2fc31ac397c76a17 --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2f7819a0becadd493fc4579ff946b12f3f89f544d0df25e2f129953c233169 +size 117440512 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..aa30744a51dcf2c5d64057f44148fed36fae0dd3 --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eb53df9ae08d172b8f419e41a8efdd3641eb378711a48cb0aa19dfc0335500a +size 234881024 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..f4397c4f1a86845c59ee7385c1af23fe5da479e6 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd89c8664d8c675be89bdcc70699e3a832b0128ac240a12838f722098b8bf80 +size 117440512 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8787fa6f97c0de85706b23ace7106d1ef967c7e --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb675a56ec0eba2a560172f15974d2a64993380a7d24ba234c5e6be7a3b7affa +size 234881024 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..c2f76b386592cf755edd4f0d32574270f47e02ec --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b64fe3d42fb57a064083303a7ff18da6f25c96db18a5aa142229ce8c2fb8b5 +size 26804224 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..333009fe0b1ab8649d2879cd70ce998a63ae5220 --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:387105d11fa6339fc5f071659521d20612f8b2239c64e15c74e9aa75357b8adb +size 41943040 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d9585209f792c8ea6a3ec88f1c94d56693d43f6 --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769dfa534abdc2c115bc14f3b9e2864678821315829eead2d679e10739be4db5 +size 29835264 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..474ba5bca6a5814e649df0fd2c5947167b1a7c01 --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f69422d3fbe73cf03dc02ccda9dfe928546c58812388a216bc7783d66807440 +size 33554432 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..756281d73f91343a561f56eb94c0e311e85ae9ff --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98446efef79f0ababd454f3df6aa419abce8e8416f833cd3b52cf85280b9028 +size 117440512 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..5ec3a6c60455e885f5932984ef0ce5c64dcd274d --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8182ec3185df815ff0a97401cae02a71fdb0217ac0430bc60a79cc33ed5c6b1e +size 234881024 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..79dce0c20edb865a9462b03a74dc2d8b7c6f0a1b --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58078d52a7beed4656edc85e1fc16e573f2e68fe89a9011a1e445befe4c5b78f +size 41943040 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..d78d56c36a1b71c53c370618e2438b0c372fcf05 --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc52a43d7bab36ff4e6fbc03b1066182845ac845544c537d3ddf7a5ea1763c1 +size 33554432 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7bb9491e6ce6bf2353695751a0a9a7b94af3767 --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c934648a8c0f8056be8e13f69f427adb8b4921b50fdc3a9583bf322e477a0c30 +size 41943040 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee767186d9d8d55681b96a1cb76416b84941b84c --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:912b4dd66e7e992ba727db45660d054b08f2d438c9893d1960fd67e198552bdb +size 117440512 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..29fcbbde986562c868bb2c67e6863073c23b89f8 --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a7e3949c108238fe2bd80f65c5ef45d11c0fecd9cf508c8b47ae2f2c454ec82 +size 234881024 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..4198b43581260e0e4f89f5de7a4734cf991daaec --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f5b8f567147f4553d7ceb99d1ada3a9c6ec7c737b1440802bf82de0fc9b5c59 +size 28114944 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..ddb409a612aabe86c0d2d948140b79945f5c81d1 --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:554b72b00d743439d077a411dda6e036d9e0c4b91332dc3fd1e2d528c3570666 +size 33554432 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6c92f5ce4f57a674c1d71d380cb005fa1e692e2 --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dce2c4ee5803fe5ff34c97b4cb2f6c98a7b24fc454a30a24710bc0fdae68bc31 +size 41943040 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a49f24bc947464d284187c038d65ce078350c92 --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6387a9a8b8650f564066a14fcce8aae382f6ba9074ef876c5295ad8425a1d5a +size 117440512 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..797ef780ad44d1dbe20f545132182be171c472da --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15951016d229c1a7cde8c1a2220b3f8141b42a7019a1a44d7629bdee7c38dbc8 +size 234881024 diff --git a/params_shard_122.bin b/params_shard_122.bin new file mode 100644 index 0000000000000000000000000000000000000000..2aa7e2ed1ded4825b7adc39724c812d6dec283ed --- /dev/null +++ b/params_shard_122.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3a693abef2d8413cac0e5b34dd61c3bb218f0b5de579a181cd208a76dbf1858 +size 41943040 diff --git a/params_shard_123.bin b/params_shard_123.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1278203722b0c331660be1d95ed0e8ff04162c1 --- /dev/null +++ b/params_shard_123.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae46f8f97e012b2d406dd6222056314e87aeec1d4059bb2f09b7101315cd2cc8 +size 33554432 diff --git a/params_shard_124.bin b/params_shard_124.bin new file mode 100644 index 0000000000000000000000000000000000000000..032c011bfab6984687e9e8d2b18d4ba0db3a22e8 --- /dev/null +++ b/params_shard_124.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c0e334acc1a4c9b86b7663843c4b4f171c9526b084bc2395a7fbe5197777d8 +size 117440512 diff --git a/params_shard_125.bin b/params_shard_125.bin new file mode 100644 index 0000000000000000000000000000000000000000..926620f718ab51577d0a8c6d965adef366bd770c --- /dev/null +++ b/params_shard_125.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631326819663f8f89261456c91730aa3e7c24434030ae3160d9403e3ab410667 +size 234881024 diff --git a/params_shard_126.bin b/params_shard_126.bin new file mode 100644 index 0000000000000000000000000000000000000000..d3aefb36dc659806501e32fb728b699377b649d4 --- /dev/null +++ b/params_shard_126.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25c9fc46f7e848e771dd9ea6e8b8b334769239036c2019c5aa5e0df2d36f5c84 +size 41943040 diff --git a/params_shard_127.bin b/params_shard_127.bin new file mode 100644 index 0000000000000000000000000000000000000000..d932c567e945cf3c3204b88224d9a9f8f0bd9cb5 --- /dev/null +++ b/params_shard_127.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f555bd2c974b12cde910e94844c74da6d487b6fb1f48941d5c8e6e72f36e77a1 +size 32817152 diff --git a/params_shard_128.bin b/params_shard_128.bin new file mode 100644 index 0000000000000000000000000000000000000000..b9f99acba14cb95f3d15aed671e90c945384e64a --- /dev/null +++ b/params_shard_128.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057e300580e7a88baa3f7680557ad1ac60690712fd49109f2b60ad13024e8b8a +size 33554432 diff --git a/params_shard_129.bin b/params_shard_129.bin new file mode 100644 index 0000000000000000000000000000000000000000..947e8c0a34faeda33e697be5f736a9841bf7f2d7 --- /dev/null +++ b/params_shard_129.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e198d53f3463374e3493bed21b0326c9dc7b094b806bf1b9a9525885c2172a0 +size 117440512 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..0066fe2ff741201834e7831419f107459b7f5ca1 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d75ef128909f6df193c3dcb3735e78a135727cb3f961642ceeac4f36657c5ae +size 33554432 diff --git a/params_shard_130.bin b/params_shard_130.bin new file mode 100644 index 0000000000000000000000000000000000000000..2934a3ed6047d19d8bd259198728ef29fcc7956d --- /dev/null +++ b/params_shard_130.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfaab7461fa3fa05e8fe068d9ae1f031813be5b08363162bcc68555a48aa1d7a +size 234881024 diff --git a/params_shard_131.bin b/params_shard_131.bin new file mode 100644 index 0000000000000000000000000000000000000000..7856a8b628482589f074cc19a23b7a8775b93c29 --- /dev/null +++ b/params_shard_131.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c125f7fc18afefe525a03344e5bea9606084bc318384ec59ab63b6367a044103 +size 41943040 diff --git a/params_shard_132.bin b/params_shard_132.bin new file mode 100644 index 0000000000000000000000000000000000000000..92b75fc914a648da3152e76410a9e88d240b08e4 --- /dev/null +++ b/params_shard_132.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb639e124cb13db5892d60abb1686e56de1d99d8734b93293051d9cfaa8c777 +size 33554432 diff --git a/params_shard_133.bin b/params_shard_133.bin new file mode 100644 index 0000000000000000000000000000000000000000..3045fc9141df9169e51e59dff14b02ade81ac0f2 --- /dev/null +++ b/params_shard_133.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97957b47ecad9b6ab20ec2b4c1506927232700c5938ae2fb16a054d1149ad5b4 +size 117440512 diff --git a/params_shard_134.bin b/params_shard_134.bin new file mode 100644 index 0000000000000000000000000000000000000000..95d2404e57d5a5f0b3802a34ae962be22190524c --- /dev/null +++ b/params_shard_134.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b33671550635e718d877e329b4f9d1ae49c9286678df0136d9ca607b36196a20 +size 234881024 diff --git a/params_shard_135.bin b/params_shard_135.bin new file mode 100644 index 0000000000000000000000000000000000000000..d77aae2da5198e4fe69bc137dc929c398f8ffb01 --- /dev/null +++ b/params_shard_135.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44cab61b5db127baf1a7927b78281310062cfa0dd36ddd8240839c1f5845547b +size 41943040 diff --git a/params_shard_136.bin b/params_shard_136.bin new file mode 100644 index 0000000000000000000000000000000000000000..22e468b7c213c2e1512891360215039b125f1700 --- /dev/null +++ b/params_shard_136.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc5797fc748aa3f8801c75396e7a77f88acca7c5667a32dffec035f95accf7a +size 33554432 diff --git a/params_shard_137.bin b/params_shard_137.bin new file mode 100644 index 0000000000000000000000000000000000000000..635eea3b21c042b537f2ff597e2766562d40f8a6 --- /dev/null +++ b/params_shard_137.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be28418ecd03b9feeed864adc234e63834bc741ef3593e78b0d4db0a857c6c9a +size 234881024 diff --git a/params_shard_138.bin b/params_shard_138.bin new file mode 100644 index 0000000000000000000000000000000000000000..9914f3f4334b079ed13d057283ff27a1227cc0f2 --- /dev/null +++ b/params_shard_138.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f085dc6304b6c105936dca34dde68d04e1d539213fa8b2f4a3490171fb5efa93 +size 29196288 diff --git a/params_shard_139.bin b/params_shard_139.bin new file mode 100644 index 0000000000000000000000000000000000000000..29e893e79a59512c8dae9730636a6c73ca6f2983 --- /dev/null +++ b/params_shard_139.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf0d5239da0549929cf1bc94cb75fd1100a2bc4e70919bbb775b22fb250c0a4 +size 41943040 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..fe2cc6d561ad9c2dfb6c32ea6336fa881b103855 --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32275468dcb60ce8933fa02195456f6b1ed8ebfb17ab4c85855e6d26c91e29f5 +size 234881024 diff --git a/params_shard_140.bin b/params_shard_140.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1171de102e509311f719931f957899a78e5c988 --- /dev/null +++ b/params_shard_140.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e399553f3f6c922bf014034363ea4c843671e060455dd5644a8d1c8365eefbe0 +size 33554432 diff --git a/params_shard_141.bin b/params_shard_141.bin new file mode 100644 index 0000000000000000000000000000000000000000..2aae975d250c6e5ca3134dbd3692a858c67308b9 --- /dev/null +++ b/params_shard_141.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d303f1c7a01ef88135bda19d291fadc6ddd50221d6800889357079c0549de314 +size 117440512 diff --git a/params_shard_142.bin b/params_shard_142.bin new file mode 100644 index 0000000000000000000000000000000000000000..284e0a59e85e3c933c2aa3c1819c3d6eab51cd5c --- /dev/null +++ b/params_shard_142.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dcf965487b667534bfd333b86462e2497f49a075466e2d4b58eebe4682e461b +size 117440512 diff --git a/params_shard_143.bin b/params_shard_143.bin new file mode 100644 index 0000000000000000000000000000000000000000..9e1b7ce3dc47de002fbc55fc109eeb318d90dd2a --- /dev/null +++ b/params_shard_143.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a814486d7291ea71b51ed21c8474016d84ed97e4f83d240c2df317d4096b1b9d +size 234881024 diff --git a/params_shard_144.bin b/params_shard_144.bin new file mode 100644 index 0000000000000000000000000000000000000000..73ba359ca2095245d3a874a51dff7a36c6769842 --- /dev/null +++ b/params_shard_144.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fea02f2be004f5f1bdf0a73407e7d86e57d606801d2e65fcf17f1697a0c0da5 +size 41943040 diff --git a/params_shard_145.bin b/params_shard_145.bin new file mode 100644 index 0000000000000000000000000000000000000000..cedcb16be930359e6c3bcb8b45dd66a38a81454b --- /dev/null +++ b/params_shard_145.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfacf659bcccdb8280842e4c7e073efe18103b5e164c581893f2ee7d653482ea +size 33554432 diff --git a/params_shard_146.bin b/params_shard_146.bin new file mode 100644 index 0000000000000000000000000000000000000000..0532b1f2931a5d34407fb6ba8ec29bb3cc6e34a2 --- /dev/null +++ b/params_shard_146.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7e604aa0d78281dca02aacc907945a223d3e3221a76a7f293804dee5363fd37 +size 117440512 diff --git a/params_shard_147.bin b/params_shard_147.bin new file mode 100644 index 0000000000000000000000000000000000000000..61b6b39be48430c43d581edfbccbe596be9c4d7d --- /dev/null +++ b/params_shard_147.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e9d5dfa08805402ce06b9a501da35bf64af413f74357121e164843bb1a61e0 +size 234881024 diff --git a/params_shard_148.bin b/params_shard_148.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2f00f47b70f25b0790215b15d3fd4ed1ac0aa6a --- /dev/null +++ b/params_shard_148.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3395910123741ba76e952f66b05f23afae1c506517f815af000993ae03b0b7f5 +size 30490624 diff --git a/params_shard_149.bin b/params_shard_149.bin new file mode 100644 index 0000000000000000000000000000000000000000..95d5ea304426a226b15f9d3e7abfb38b327a1412 --- /dev/null +++ b/params_shard_149.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c285b78040f5a3f8d1e24e93665641aada4a782152de7f186e781602883780c8 +size 41943040 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..0f87e077d040896f541c982b509b8d2ad6fafee1 --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46144db6864d60274158dc60bc6c6b9c1eec6de0de73559f660f914a3befbd18 +size 41943040 diff --git a/params_shard_150.bin b/params_shard_150.bin new file mode 100644 index 0000000000000000000000000000000000000000..d80570879ee9ddd5c9276f0fb8a43b08b58011f3 --- /dev/null +++ b/params_shard_150.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55e4abb18d0e92008e6ebebc4adbbcd82fc65afac497924d4daeec70a15f1802 +size 33554432 diff --git a/params_shard_151.bin b/params_shard_151.bin new file mode 100644 index 0000000000000000000000000000000000000000..a1cd46b9d8e0c030171dedf5a7232deb02dc37cd --- /dev/null +++ b/params_shard_151.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f48f1072a2d9abaf82bb8d58873bbc44ae066e77e7ead2ec1fb922721a323dba +size 41943040 diff --git a/params_shard_152.bin b/params_shard_152.bin new file mode 100644 index 0000000000000000000000000000000000000000..376354469c6eb8dcee159d75f4f64ace6cf5a19d --- /dev/null +++ b/params_shard_152.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:474a4a2580cead402a58fa855380409e056ed520c946aeb32cbc5481d67c841f +size 33554432 diff --git a/params_shard_153.bin b/params_shard_153.bin new file mode 100644 index 0000000000000000000000000000000000000000..2e00539d1b72e975a57bb5011036c44a44254d5f --- /dev/null +++ b/params_shard_153.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8176c0f9cd6941bcf29bb45ca2e6fb655cc7fd0cfa35fa9bc74c9c5e52515d4 +size 117440512 diff --git a/params_shard_154.bin b/params_shard_154.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff6e4eb29ca96454367e82b7e7c96aca64fe3c38 --- /dev/null +++ b/params_shard_154.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98f6fbfe0f87c84d7c04b6882a03d3a615be4089b03a5fad8d845c83a653bdee +size 234881024 diff --git a/params_shard_155.bin b/params_shard_155.bin new file mode 100644 index 0000000000000000000000000000000000000000..b24225046a6c910b5b3093e39711d7526c72e078 --- /dev/null +++ b/params_shard_155.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b01c2453a8c7713c3a3bfe79aa69b5810d251d2c5ec45c955a1b6e08893dfbc +size 117440512 diff --git a/params_shard_156.bin b/params_shard_156.bin new file mode 100644 index 0000000000000000000000000000000000000000..b32a507d7715be2d31394806a99ca228a95787e5 --- /dev/null +++ b/params_shard_156.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:267f98eeb8680c6d3921f405d8e09028908c0396074b3c7e41bee465f6995ad4 +size 234881024 diff --git a/params_shard_157.bin b/params_shard_157.bin new file mode 100644 index 0000000000000000000000000000000000000000..4c58dfef1ced15108201a50da5aa2667c23fb5e0 --- /dev/null +++ b/params_shard_157.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c493ec2b18207a6fc2352154c76f91925bd7a70f89c7ea48dfe0bd41930916a0 +size 26804224 diff --git a/params_shard_158.bin b/params_shard_158.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d002503428b64107e79a2645d393471710a6671 --- /dev/null +++ b/params_shard_158.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:317da61d5d1649b7fd305d3f10de895d4fd5e94f072b36973d061c0bb7c19e5a +size 41943040 diff --git a/params_shard_159.bin b/params_shard_159.bin new file mode 100644 index 0000000000000000000000000000000000000000..953e6a2cbf104ee1bf7605b2d8589adfa12d8725 --- /dev/null +++ b/params_shard_159.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:558ce6faed2fd3f8a925b5aecabb7b221bc7a417ea6828603dd98868e75a498a +size 33554432 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..77f51bc0d0f4434bcd6884dfb810ae5fa353987d --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25fc7fddc15c5861c6a4f460f0ebb338bb939ed30fcd2b200688abfbb92a3535 +size 33554432 diff --git a/params_shard_160.bin b/params_shard_160.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d92401ae7220f299621af4afcaaf5cd3a790c92 --- /dev/null +++ b/params_shard_160.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f08321409f9596dcc25f4b39e10a2a645e0f4b9caf47259a9c1abe8b2bebe88 +size 117440512 diff --git a/params_shard_161.bin b/params_shard_161.bin new file mode 100644 index 0000000000000000000000000000000000000000..804c06dc3d40efd37279cdc2dc694b788c4532cb --- /dev/null +++ b/params_shard_161.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e3f166c093ee17eb9406427913c791c99377c8a480e0091fd7327c3412f72e +size 234881024 diff --git a/params_shard_162.bin b/params_shard_162.bin new file mode 100644 index 0000000000000000000000000000000000000000..111743484e74edf074438d435aa1e54c266ecfca --- /dev/null +++ b/params_shard_162.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134c3ea15b37731bfff68bacf19b600c13210b4dfc6036bf2ebd64e15b531bb9 +size 41943040 diff --git a/params_shard_163.bin b/params_shard_163.bin new file mode 100644 index 0000000000000000000000000000000000000000..f613b873cb2082ddfe1a587d9a6a2a3161c6cf84 --- /dev/null +++ b/params_shard_163.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ecda3fdee5363f3874dd8d58de476a28c30381ea2f3b1a9e131759e2d41efa1 +size 33554432 diff --git a/params_shard_164.bin b/params_shard_164.bin new file mode 100644 index 0000000000000000000000000000000000000000..d713b974357274235f7bdb1014756714dc63625d --- /dev/null +++ b/params_shard_164.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4093ca4be606597dd0c9e46fab783296fd09ce6093096327a9345bf921ad36c +size 41943040 diff --git a/params_shard_165.bin b/params_shard_165.bin new file mode 100644 index 0000000000000000000000000000000000000000..49636a90f3585a8ee76c9f83c765a04c7a274a42 --- /dev/null +++ b/params_shard_165.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7230cadeab807494b615e17387e730a092205c8ce7d3daa663686693cf6a3706 +size 117440512 diff --git a/params_shard_166.bin b/params_shard_166.bin new file mode 100644 index 0000000000000000000000000000000000000000..40b54ac15ab9e02eaaceec563a84d2b602b6235f --- /dev/null +++ b/params_shard_166.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c8e9dd5d964e31af86400cd22248edd69e211cac925100376351b486bc4677a +size 234881024 diff --git a/params_shard_167.bin b/params_shard_167.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc2349a0402e8e03fd95522e187073fe1704b787 --- /dev/null +++ b/params_shard_167.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8e2928d3a711b332b0caec3617e2ab4e82e98db09674e55a22f0cd044f045f2 +size 28114944 diff --git a/params_shard_168.bin b/params_shard_168.bin new file mode 100644 index 0000000000000000000000000000000000000000..b42b6546e0ccf4741bbb5925c4851e1be1501140 --- /dev/null +++ b/params_shard_168.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3706b364a2ae2f43c2e09bd5857233ac3ca85934c8ac36cf179993e0c9111cf5 +size 117440512 diff --git a/params_shard_169.bin b/params_shard_169.bin new file mode 100644 index 0000000000000000000000000000000000000000..86fecc6a3f8b0003515027a3c0a7a94e717635f3 --- /dev/null +++ b/params_shard_169.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe9bc616d856021d6c21e22553fde53b79f08ec188fb758721410f3048093ba2 +size 234881024 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..3b03c527da2337986a117eed45c451e2fd333824 --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:951f48a3f6c8370b7224bda2a4684f1b85c77bd8ad1f43729c35f41c7b9eaeaf +size 117440512 diff --git a/params_shard_170.bin b/params_shard_170.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d217e9718e09d8089446f0836336be9ae91889c --- /dev/null +++ b/params_shard_170.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79f746a9a405bfc6df3d08cb42ca0f868e5de3916e795a4608899bd9523f4e16 +size 41943040 diff --git a/params_shard_171.bin b/params_shard_171.bin new file mode 100644 index 0000000000000000000000000000000000000000..ec914d24f9232b6dd2ab164a387b8d618b6b1d1f --- /dev/null +++ b/params_shard_171.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fb2673c386439e28274956e48995c3b3710b82800afea9be012519a58aaf58 +size 33554432 diff --git a/params_shard_172.bin b/params_shard_172.bin new file mode 100644 index 0000000000000000000000000000000000000000..131659063e5ff14cf37932e8674d0437bca451a1 --- /dev/null +++ b/params_shard_172.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1109a2534e07eb2e043a8a7680b3fff652d3b10ec359dfb38a4c36020eea11da +size 117440512 diff --git a/params_shard_173.bin b/params_shard_173.bin new file mode 100644 index 0000000000000000000000000000000000000000..67fd8c97b61dcf5ab741e3f5c8f9ba6bd39e5c58 --- /dev/null +++ b/params_shard_173.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d0e3e43c5f24a0dde5f442a22cfa5056d4e2eaeae99d551fc2ccd43b057be70 +size 234881024 diff --git a/params_shard_174.bin b/params_shard_174.bin new file mode 100644 index 0000000000000000000000000000000000000000..c490c29cc147a908af74093afed8a330d6e53628 --- /dev/null +++ b/params_shard_174.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f68a8b342ad72c6c8ac3e62fc852a025c7aa45340418b5388fa1848fe7fe7885 +size 41943040 diff --git a/params_shard_175.bin b/params_shard_175.bin new file mode 100644 index 0000000000000000000000000000000000000000..927074740e28dba3a4fdfd175b2c2c35e5194414 --- /dev/null +++ b/params_shard_175.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:018fe18b0c959fa78147325f5e689874588b394d6bbef9de437d273afa4488d6 +size 33554432 diff --git a/params_shard_176.bin b/params_shard_176.bin new file mode 100644 index 0000000000000000000000000000000000000000..9adedc01bc36c72fe13c4655c86c2bd32ad3a615 --- /dev/null +++ b/params_shard_176.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6769238cd63fc580622242080080cb2917fcd64350692cdacb1949e59d028d26 +size 33112064 diff --git a/params_shard_177.bin b/params_shard_177.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa4223ff841d0d5eb5e7e8dc5cc0b85b2c8877c0 --- /dev/null +++ b/params_shard_177.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1370f422a280f55f372e389b4f5d37c7b1aed9de91c17f186b44cf703f2211b +size 41943040 diff --git a/params_shard_178.bin b/params_shard_178.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed35d9f0dc0febcda31f82f6a170611fad15a75a --- /dev/null +++ b/params_shard_178.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c49015a5bdf61f63e6c76acf6f65d2c47c177ebc417cadda4ea96365ac419d0 +size 117440512 diff --git a/params_shard_179.bin b/params_shard_179.bin new file mode 100644 index 0000000000000000000000000000000000000000..372f708ad811f7ef7812f95b96eb1624df1495ce --- /dev/null +++ b/params_shard_179.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac17e7c36cb9deb16778a4d686edbd6803c2df9a5cdae28ecf9460abffb4593f +size 234881024 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..c20ecccee1fb327549ddd5ffa15e08c15342ac80 --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e348959aff0eb0b1fd42f2a276e2971fcf54557dc6a8f00fdb17d3acf6cffa8 +size 117440512 diff --git a/params_shard_180.bin b/params_shard_180.bin new file mode 100644 index 0000000000000000000000000000000000000000..923a720470db8bb933750b67ba078d8c1652f602 --- /dev/null +++ b/params_shard_180.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4871c8a41f50218d8ec2a1f51d2ff1ed270b88f6aea99f1c9d833e2ad26f623 +size 33554432 diff --git a/params_shard_181.bin b/params_shard_181.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c3203644091a5488aa9b968ba57c997b509989c --- /dev/null +++ b/params_shard_181.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:022a7299c84a245cfc971d796999e00946ac5980442a5335757f26fe147a76e6 +size 117440512 diff --git a/params_shard_182.bin b/params_shard_182.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ecfb073dd09d51dfed986699cbe91f96537d33a --- /dev/null +++ b/params_shard_182.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14d25bd2461b069f7fc466bf4a96ea0822b27ed9fd5e08cdad67db45af7ccd63 +size 234881024 diff --git a/params_shard_183.bin b/params_shard_183.bin new file mode 100644 index 0000000000000000000000000000000000000000..04cadf910dbbddfb47edc27c3bffd274376db179 --- /dev/null +++ b/params_shard_183.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:081f3425fc46714c56648e76745a447170a1e0e79df93e76a6b3868e0084f88d +size 41943040 diff --git a/params_shard_184.bin b/params_shard_184.bin new file mode 100644 index 0000000000000000000000000000000000000000..d46a110dce0093cfc1064af4e976aac6cfb43ba1 --- /dev/null +++ b/params_shard_184.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5bea0e120e962642f47a75fbb702afc7739ccd89a4843854f2f39308d37822e +size 33554432 diff --git a/params_shard_185.bin b/params_shard_185.bin new file mode 100644 index 0000000000000000000000000000000000000000..cfb8336d1c1c74f54c2193706520a95cd32005d0 --- /dev/null +++ b/params_shard_185.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f604fc876abbc206b09d4f9c54cff366b2309699ec134ddbe4aed4dde590b10e +size 117440512 diff --git a/params_shard_186.bin b/params_shard_186.bin new file mode 100644 index 0000000000000000000000000000000000000000..bb3e5fec35225d140686ecb21ee27806be741439 --- /dev/null +++ b/params_shard_186.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3826ee6bfb01ce3f82e06627163baad3667ea9ccbb20a44e722d126b748d09a4 +size 234881024 diff --git a/params_shard_187.bin b/params_shard_187.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d79471e5820a32d884747cd50ea7017ad38c039 --- /dev/null +++ b/params_shard_187.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7a2707f926f5aced031a5e18b85317133913b834d080fd90172d645e8f0f2c +size 31522816 diff --git a/params_shard_188.bin b/params_shard_188.bin new file mode 100644 index 0000000000000000000000000000000000000000..93d6183d9921cd46d46abc36c6717bfdee6ab81e --- /dev/null +++ b/params_shard_188.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:924b8addcc60efb3c34bab38a86cc2d46776e5abfd286a376b43b4e6568aa23c +size 41943040 diff --git a/params_shard_189.bin b/params_shard_189.bin new file mode 100644 index 0000000000000000000000000000000000000000..46014f7a01928e1baf1658ed27b7a3f2b8a1670e --- /dev/null +++ b/params_shard_189.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89a96a1b53948635e011743e9e527343b9d781b7b37adfdb7998f7718561da9f +size 33554432 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..49832725e33c202a68e10f581575d808b160df6d --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36306e267971333d5379dbf579310c5d578af9cc271422848675bb03c725676a +size 234881024 diff --git a/params_shard_190.bin b/params_shard_190.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2cae9c2bf95f71eb49bc0564f90f615c196a998 --- /dev/null +++ b/params_shard_190.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4deea26b6985fc520b5e450309175cb583a47d2f53d9f349f96f189c6246be30 +size 117440512 diff --git a/params_shard_191.bin b/params_shard_191.bin new file mode 100644 index 0000000000000000000000000000000000000000..70d2991529d042b1a3186e6513775e9252f30a6a --- /dev/null +++ b/params_shard_191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b45787f9c96ddee0dd9b076d8bda35f5f4e9b2bfce12e0cf947d97bd08ed28 +size 234881024 diff --git a/params_shard_192.bin b/params_shard_192.bin new file mode 100644 index 0000000000000000000000000000000000000000..d79e3517ddc59041b443cb5e9c987ac79d44db30 --- /dev/null +++ b/params_shard_192.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee8186c9f4ae16884b3390c65c3176da8431cfdb279a2f4ef1272da8a22d0e6b +size 41943040 diff --git a/params_shard_193.bin b/params_shard_193.bin new file mode 100644 index 0000000000000000000000000000000000000000..6dc458ed818d015cb95935694ec33d62f7d1f697 --- /dev/null +++ b/params_shard_193.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff17eded9eb9bc5c767d4596d4d457e0897571a11038e7c2a0e3424c9331d80a +size 33554432 diff --git a/params_shard_194.bin b/params_shard_194.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d5f7fc06ff153916771d45164618de98ca3a9f7 --- /dev/null +++ b/params_shard_194.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd29fa1a4bf4d7d91b4f1c04ce2a9afd3620a6d950eaff9417945343e50d82b6 +size 117440512 diff --git a/params_shard_195.bin b/params_shard_195.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d03964fd7d32170c58cca6b9e7a82107aea719d --- /dev/null +++ b/params_shard_195.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ed2dc79cbafc5a5efd59858ad365b75aade8b0d852015c1d615855651506c9 +size 234881024 diff --git a/params_shard_196.bin b/params_shard_196.bin new file mode 100644 index 0000000000000000000000000000000000000000..3de6adf51aebae6430ffde45ccdcad9a2b9a5123 --- /dev/null +++ b/params_shard_196.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cde6778e067131362cdf148772344e11a4b0e731d957f4f1ac9c3521d68e2c1a +size 26820608 diff --git a/params_shard_197.bin b/params_shard_197.bin new file mode 100644 index 0000000000000000000000000000000000000000..e764335198d5699a0e0d35e53f9b6c3ed05c698f --- /dev/null +++ b/params_shard_197.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7dd922bb649750513d23c40a0b3b1fd28dd95f33847179933e48ac2297b0f24 +size 41943040 diff --git a/params_shard_198.bin b/params_shard_198.bin new file mode 100644 index 0000000000000000000000000000000000000000..dd5d870d3f30f3b77db44f0de44e64af35b0b864 --- /dev/null +++ b/params_shard_198.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a97350b60cb66f62776e7913cf924fd9138e3e64752df18a4fd05bae0d1093a +size 33554432 diff --git a/params_shard_199.bin b/params_shard_199.bin new file mode 100644 index 0000000000000000000000000000000000000000..c09f6dda6efb601af970c48f1a38fb286f810c21 --- /dev/null +++ b/params_shard_199.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7404e944723693e922673e086ad99c2fe0b01ac099eddd3b5ffdf386249888c +size 234881024 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..328aa09056ef87ebb0f0d687ed06d27bccca5371 --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e8e95a90df4f4afcb92053422671a1e4bcaf7ad3dd1bbf8eca50d0c29204a91 +size 234881024 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8d3574c908c6ae6ad6dd90b256272583c8b38c3 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:154ba3d996caaf8fb0bb526cde204715f5a0fc5eaa25aabd85d450c7965f54cb +size 26804224 diff --git a/params_shard_200.bin b/params_shard_200.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f31175b5c3aa6096c44260274339e60bcea14c2 --- /dev/null +++ b/params_shard_200.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b39b7cd5dc0151e1264d964e37a70bfb7ada70f02f245239532ca160bde2fc49 +size 41943040 diff --git a/params_shard_201.bin b/params_shard_201.bin new file mode 100644 index 0000000000000000000000000000000000000000..74d030c8a71393cda493874d35c4f6bd8f718997 --- /dev/null +++ b/params_shard_201.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb132a97da8e8b7db28f17f0e0e32907670e7debe38155681864bd4817d6d545 +size 33554432 diff --git a/params_shard_202.bin b/params_shard_202.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c343d368e97ddc80c8223ba62c179826d841398 --- /dev/null +++ b/params_shard_202.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a4db6b23c4f3d03b34ca72cb816411ac4e399ae6e7ee6c569af79e246900335 +size 117440512 diff --git a/params_shard_203.bin b/params_shard_203.bin new file mode 100644 index 0000000000000000000000000000000000000000..b6c618521ec4fa2f79796c4ee99d8d33ff873104 --- /dev/null +++ b/params_shard_203.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05a26184c26702f1d66025a0c42cfd25f2e4f83898831eb1a98bb3382a184057 +size 117440512 diff --git a/params_shard_204.bin b/params_shard_204.bin new file mode 100644 index 0000000000000000000000000000000000000000..d83b777f455c3e9aaac5c7a714188696cbb62c7b --- /dev/null +++ b/params_shard_204.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee7945461204b41284290593cf18af5f09176847dc1ad4aad727a6ba0121c1c4 +size 234881024 diff --git a/params_shard_205.bin b/params_shard_205.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1c738ac0a438102469d23cfa3f99a4583aa19af --- /dev/null +++ b/params_shard_205.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcd8ef0f273c57f0f25e7974e7c49de956b389a0502d4ce61eb14b6ee8b8a4d6 +size 26804224 diff --git a/params_shard_206.bin b/params_shard_206.bin new file mode 100644 index 0000000000000000000000000000000000000000..e5a3030175a10ee591337b2237def8f45487ea63 --- /dev/null +++ b/params_shard_206.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44bb4c6dd95af1187c4e3d6b114a2be232a5733ae63cdec29274aac6ebfac79d +size 41943040 diff --git a/params_shard_207.bin b/params_shard_207.bin new file mode 100644 index 0000000000000000000000000000000000000000..cda71db45d9e944bf459d0cf69179c388b19e7fa --- /dev/null +++ b/params_shard_207.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe93e46a7b88a486d26d72f0d86c81dcdf5b86db817b794363e339c2ba9b732 +size 33554432 diff --git a/params_shard_208.bin b/params_shard_208.bin new file mode 100644 index 0000000000000000000000000000000000000000..e15d5013f3cbd66fcd4b8de8827934674ac8819a --- /dev/null +++ b/params_shard_208.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c294a0ab7307f640ffc0481d883a7074b804d0b8b517f88fd25d080b3fde5707 +size 117440512 diff --git a/params_shard_209.bin b/params_shard_209.bin new file mode 100644 index 0000000000000000000000000000000000000000..bfa15ba74b31756a38284d523db7ca5c7e580ae3 --- /dev/null +++ b/params_shard_209.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7c5d333ac59c0bb3e87d9d38a103f8ad14893bdcd08364af83003c01bbc0020 +size 234881024 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..38ef032b90495a1230b4249852c65b7544afc33e --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01b12e2728bb05ce7ffa2b81b1f5991b0e725444687c3ec9cb116e60663cb03f +size 41943040 diff --git a/params_shard_210.bin b/params_shard_210.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2bcb91d0f9529b511612f614e352ec78a5a0f93 --- /dev/null +++ b/params_shard_210.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:078ae19ed5a14cc4f39c4d68b834ea0674cfdf6e43f07798eeb8910b5d43efaa +size 41943040 diff --git a/params_shard_211.bin b/params_shard_211.bin new file mode 100644 index 0000000000000000000000000000000000000000..11e87f517b095d1c18ce500f73a6f22f2bce3830 --- /dev/null +++ b/params_shard_211.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29a603ef21435e508cf2dd7345bff50c6fed617e8ea0c9befbfa77139e09f56d +size 33554432 diff --git a/params_shard_212.bin b/params_shard_212.bin new file mode 100644 index 0000000000000000000000000000000000000000..fd868bd5ad0e33497327bf66b754f93b3c0a1206 --- /dev/null +++ b/params_shard_212.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b7536d4def1d19a93b0b1472636e18f9f754d3897a9015e22958fc651104cff +size 41943040 diff --git a/params_shard_213.bin b/params_shard_213.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e40527072e723edb2e92804a8665def710e6638 --- /dev/null +++ b/params_shard_213.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b2209b73c7d2c157ab3faff2121817cf6be83aafa64b9ec53bf1c83d6cf2c1c +size 33554432 diff --git a/params_shard_214.bin b/params_shard_214.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc80273017b57db56462614236754d299cf07fd7 --- /dev/null +++ b/params_shard_214.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e782be60f24d93ea663584811724a22bb2e57a30d690e3ec20b32b6fa21a37 +size 117440512 diff --git a/params_shard_215.bin b/params_shard_215.bin new file mode 100644 index 0000000000000000000000000000000000000000..0144513ae7ed83f7c76851e1ca4b25f36d126287 --- /dev/null +++ b/params_shard_215.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61817efbfbfee06e81ce1639b003ff48591eb93c105456a20b3c94cf94b30f6c +size 234881024 diff --git a/params_shard_216.bin b/params_shard_216.bin new file mode 100644 index 0000000000000000000000000000000000000000..7ad1035f519fcebeef4bd402fb04548e2c07c104 --- /dev/null +++ b/params_shard_216.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a025aae9b0f7d681f79eb01d5b2b64b61a9edebe01699c0bcd1b1b647f62974 +size 29163520 diff --git a/params_shard_217.bin b/params_shard_217.bin new file mode 100644 index 0000000000000000000000000000000000000000..9fabe948ecb525b79182046aca062e1e10b7c46c --- /dev/null +++ b/params_shard_217.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca195bdc73c893e94aabc4bdc186af39e0f899be455ac85617869ec4d15fd832 +size 117440512 diff --git a/params_shard_218.bin b/params_shard_218.bin new file mode 100644 index 0000000000000000000000000000000000000000..231c38a7774cb8f9aaa8e5f63f913a1bf8d2f475 --- /dev/null +++ b/params_shard_218.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e235c0cfdb7ecee121a165125ec2cddc72519c8a2b1ee957c8410c525662de6a +size 234881024 diff --git a/params_shard_219.bin b/params_shard_219.bin new file mode 100644 index 0000000000000000000000000000000000000000..11e8a9507195478d6cb6d77ceecbeaf0eb6e6988 --- /dev/null +++ b/params_shard_219.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a272161b1f237423671f2f545a7c4bf99960a33a6cd0719c2220261b793be2cd +size 41943040 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..fba7f701ef73a2f966b8d59874df58e9b222cf44 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7ccab9d5c0387dd53fc4012eeba7c57d64d60a5d4ec6dd969362e7b5cfe5166 +size 33554432 diff --git a/params_shard_220.bin b/params_shard_220.bin new file mode 100644 index 0000000000000000000000000000000000000000..fefa56d4de475ff6e0773d780ccda952a0405607 --- /dev/null +++ b/params_shard_220.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb6d368cf39dc704f358ac2510187ad08f1d6f83c4578ff224f5fe2ed3ca587 +size 33554432 diff --git a/params_shard_221.bin b/params_shard_221.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc4f06c77c33f56095a02ebaf2617889aaf5ce70 --- /dev/null +++ b/params_shard_221.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05fa28f24501bd233c29d22093dfc72557d0b512947cd63c50525d6045eceee5 +size 117440512 diff --git a/params_shard_222.bin b/params_shard_222.bin new file mode 100644 index 0000000000000000000000000000000000000000..397be5719f3ccb54ae816516c9b96a10a4147a1f --- /dev/null +++ b/params_shard_222.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d5a1865e55289d418c5b52997b3ee36b17e91201699095f715d335964605318 +size 234881024 diff --git a/params_shard_223.bin b/params_shard_223.bin new file mode 100644 index 0000000000000000000000000000000000000000..c01a53ca23dc487e9fdc8ae0b6e40637c52b46ba --- /dev/null +++ b/params_shard_223.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c8e682cf7c99a6653fc42fa99727934cab97286f62f2d831fa95d339d941ba3 +size 41943040 diff --git a/params_shard_224.bin b/params_shard_224.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c763ffb1412443e6cf49a316aab6fab91b33ee6 --- /dev/null +++ b/params_shard_224.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80aa198af6f6643fefa27cf94b567897abccd3de97ef4e4aa1fe09cd486f5ec7 +size 33554432 diff --git a/params_shard_225.bin b/params_shard_225.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c8f7f5dfbdb1d7f7b181a5ddfab0c677be8e7fb --- /dev/null +++ b/params_shard_225.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8817bd8cca2f8d1f45e5e1941add9957e648507a4ecd452a0247a2bd545b9dc +size 33112064 diff --git a/params_shard_226.bin b/params_shard_226.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c72bb5ac9ca8e3d2ccc272c11571ca8191bbed9 --- /dev/null +++ b/params_shard_226.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc0e35d66b9c78d2ac2783322e5951e34d192b06d27c9351507516f5643e662 +size 41943040 diff --git a/params_shard_227.bin b/params_shard_227.bin new file mode 100644 index 0000000000000000000000000000000000000000..0da742a5a949b6073a7a53000bb61e27fea1afa4 --- /dev/null +++ b/params_shard_227.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e4caff7a94c16bff69741409b5704cd8d114e2aabd87ed0342388eab078bc4f +size 117440512 diff --git a/params_shard_228.bin b/params_shard_228.bin new file mode 100644 index 0000000000000000000000000000000000000000..8700a366d609eb613c414d3e6bb0eecc6e5ca60b --- /dev/null +++ b/params_shard_228.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1d557e935b205f783b253bb85922f72e5f7b471edac842c146d742b3c069b2a +size 234881024 diff --git a/params_shard_229.bin b/params_shard_229.bin new file mode 100644 index 0000000000000000000000000000000000000000..24cc56b3915b27f87d580522f2e5648efb74aac0 --- /dev/null +++ b/params_shard_229.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca97d9dfc8f5ab520379d41de14cca97092045e761d42efd3ca73ec7c00deda +size 33554432 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..7b9c6418d71bb4f08863aa872370230d92585768 --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7bbb1d4a0846b0e2eef3024092b5dfc717a0d12ce12b1977f8f0d96a0975fd +size 117440512 diff --git a/params_shard_230.bin b/params_shard_230.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a9cbef5537d5954d9b7a590833fdc864a4300ef --- /dev/null +++ b/params_shard_230.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fefa02fef20f9ef4d43c1655e404414ab18005ae07fd71981ef0052122900da +size 117440512 diff --git a/params_shard_231.bin b/params_shard_231.bin new file mode 100644 index 0000000000000000000000000000000000000000..deed43008a914f3153664551900b577d0c1cbd4c --- /dev/null +++ b/params_shard_231.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddf2e453a3b9fcf4e3f34b8216ceb04a5a2ae8e7ebbdd52962e71447dbecfd1f +size 234881024 diff --git a/params_shard_232.bin b/params_shard_232.bin new file mode 100644 index 0000000000000000000000000000000000000000..f15c09e9116b801a35993dd19e3d0fce48691988 --- /dev/null +++ b/params_shard_232.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db21c9be8609b473a80cd416d2d3ef44c6727866c2fe01c9724039278f9bfd59 +size 41943040 diff --git a/params_shard_233.bin b/params_shard_233.bin new file mode 100644 index 0000000000000000000000000000000000000000..592781a835628536fb111bd1529ccd2c0e95b596 --- /dev/null +++ b/params_shard_233.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0c5c358d42fea2be50fdf10533cf371c2788bfc1ad9b378b957192bf14ff84c +size 33554432 diff --git a/params_shard_234.bin b/params_shard_234.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d02d87a8bcb01374b53cfb19d0d1af99f1de186 --- /dev/null +++ b/params_shard_234.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8727f911e6da0dcbbf5360b847e3a670a844d069996f63288c0bf7608c285e67 +size 117440512 diff --git a/params_shard_235.bin b/params_shard_235.bin new file mode 100644 index 0000000000000000000000000000000000000000..cd4063c9b3f0bbbe0cb96772ff6910799f22b1b1 --- /dev/null +++ b/params_shard_235.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78fc4cf4e82ee050be7b4d00e5ecc55445c9ef1d47330155cf199eb0cb8814aa +size 234881024 diff --git a/params_shard_236.bin b/params_shard_236.bin new file mode 100644 index 0000000000000000000000000000000000000000..2cd608e9f76501da60d0e6ffb628cebec21789f2 --- /dev/null +++ b/params_shard_236.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdf4d30073f000eeda99d77d4302297d88bbc7601565b383c88d23fc8fad4eed +size 31522816 diff --git a/params_shard_237.bin b/params_shard_237.bin new file mode 100644 index 0000000000000000000000000000000000000000..0db85f5927216314a3a4c3c2b3045cf1edbdbae1 --- /dev/null +++ b/params_shard_237.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9ee3a732d62e9762ec0f3fecac6a614555ae1cb8fa6034cf740a13213db5234 +size 41943040 diff --git a/params_shard_238.bin b/params_shard_238.bin new file mode 100644 index 0000000000000000000000000000000000000000..cdc8c1459c31b1866a05a9f0a99ff465e11ecacf --- /dev/null +++ b/params_shard_238.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de7afd2854f997c34bafcbddb0fea4fc6b8f29ec71456fab7d8be10d90507eaa +size 33554432 diff --git a/params_shard_239.bin b/params_shard_239.bin new file mode 100644 index 0000000000000000000000000000000000000000..317012d2cbf83eab5300f10e48dff6e61fc6ee88 --- /dev/null +++ b/params_shard_239.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28a88d2e1571c5105ebdd55ec3b494f55c914e53d35771a35a5077f8ec56917b +size 117440512 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..1802bbf5811feeeb8f3c666ee52fb6a3445252b2 --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b5bbd84358985d5d2604d72c9f97484b510efa561c940ce9878759e3767401e +size 234881024 diff --git a/params_shard_240.bin b/params_shard_240.bin new file mode 100644 index 0000000000000000000000000000000000000000..17444bac3092a66c917d84a1966be0065ae917b9 --- /dev/null +++ b/params_shard_240.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe33712a837e19e14e51fcb0434ea50c0fe613e9a49603337b7e12db05d7d413 +size 234881024 diff --git a/params_shard_241.bin b/params_shard_241.bin new file mode 100644 index 0000000000000000000000000000000000000000..e0cbee012d2469a9f67ea2be162963ca5667f348 --- /dev/null +++ b/params_shard_241.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3456d7038b5ea5996f7922701226b0adf76dc8673db309ea4d09f68b885676cd +size 41943040 diff --git a/params_shard_242.bin b/params_shard_242.bin new file mode 100644 index 0000000000000000000000000000000000000000..bb1989ed362218a3fb9276979a38c61d5e178901 --- /dev/null +++ b/params_shard_242.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b87f58b06d8beb8b122da4614467e360f9bb7b1b58762e596dd8337549368b0 +size 33554432 diff --git a/params_shard_243.bin b/params_shard_243.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e7e6245751c3467a2317bb659ce17beee7be652 --- /dev/null +++ b/params_shard_243.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c300fb5f9d1e0afa3a0b6d3ada1241497644bc335e7e30b267cb6870f4c2f87 +size 117440512 diff --git a/params_shard_244.bin b/params_shard_244.bin new file mode 100644 index 0000000000000000000000000000000000000000..c0e1878594d19beee34f186901e0a37e35db0ac9 --- /dev/null +++ b/params_shard_244.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71591442fdce447362caa4e2f0bb6d74b371ceba078ba637665eb1f1c1de4804 +size 234881024 diff --git a/params_shard_245.bin b/params_shard_245.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7526bfbe376aae7ad5ce881829f670992df6c53 --- /dev/null +++ b/params_shard_245.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b949f282d9180f2d760c5be01c86933aff5ed838bdd7c73716d92906fe689c9 +size 26820608 diff --git a/params_shard_246.bin b/params_shard_246.bin new file mode 100644 index 0000000000000000000000000000000000000000..794fd3675f1a7ff5361d66a5abf92e55d3c9a59d --- /dev/null +++ b/params_shard_246.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d48427de71ac0a3a2e6df1af5153e16500a301edb7bb97511a719601bac511 +size 41943040 diff --git a/params_shard_247.bin b/params_shard_247.bin new file mode 100644 index 0000000000000000000000000000000000000000..71fdd4b6730cad2dc8e148a28de3a85ee5e3b467 --- /dev/null +++ b/params_shard_247.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13e9a13cc79a99361b9807f34c78a7ed3f9f59b5c3df205fd1e7e063e18f2cdc +size 33554432 diff --git a/params_shard_248.bin b/params_shard_248.bin new file mode 100644 index 0000000000000000000000000000000000000000..3cb4f7aa1a8a57b31992d44608714f4c8feed795 --- /dev/null +++ b/params_shard_248.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68cb32ccf61ff7a5dcffc7fa3c46c9f96e91bd2dd6e8a9089d66015cec2c7dd4 +size 234881024 diff --git a/params_shard_249.bin b/params_shard_249.bin new file mode 100644 index 0000000000000000000000000000000000000000..53e3e474be5c03d222dedc937b2d64218224dd4b --- /dev/null +++ b/params_shard_249.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0b44ff8a066c7ce4192df2294b1c4dd3280ecb8c81785568fe33488a9efae26 +size 41943040 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..6ac286248333a674b509ed2daaf5daca061bb56f --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c36fd0aa11b6d83684df435049b8d469a67009ffb63577878d5d295a006e449 +size 41943040 diff --git a/params_shard_250.bin b/params_shard_250.bin new file mode 100644 index 0000000000000000000000000000000000000000..9f382a1b76f37c57cc84f93be6de1f53735d14dc --- /dev/null +++ b/params_shard_250.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d9f45b2f62c84a0c1674be8529519f47f92be7c29952be6d068c27d837b19f4 +size 33554432 diff --git a/params_shard_251.bin b/params_shard_251.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c370fb042e5ffd7b469ec7a35a616d55f9fc8f6 --- /dev/null +++ b/params_shard_251.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f23aa4178976517563f4a91b151704426504d49767dd37406e66c3a20d2ce6e9 +size 117440512 diff --git a/params_shard_252.bin b/params_shard_252.bin new file mode 100644 index 0000000000000000000000000000000000000000..60fc9d713cf87fadd67735cd4506f1c969ae61f5 --- /dev/null +++ b/params_shard_252.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1351a1a05bf9df047c7956a5f18337d0b9099f9641c9a33c5635102b727d42 +size 117440512 diff --git a/params_shard_253.bin b/params_shard_253.bin new file mode 100644 index 0000000000000000000000000000000000000000..562d30539f945acd2af912d188625af58a7159ee --- /dev/null +++ b/params_shard_253.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c55902cf16b5bc4156b6f19340697e484ecceb12481ea6cd5e2a48cf1a9a8aa2 +size 234881024 diff --git a/params_shard_254.bin b/params_shard_254.bin new file mode 100644 index 0000000000000000000000000000000000000000..11cfbccde38e2fe828f195a47764a618c8101b82 --- /dev/null +++ b/params_shard_254.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:097344c840646d923c66988e99390647a6325f084f7a2c451f0afaf47c426fbb +size 26804224 diff --git a/params_shard_255.bin b/params_shard_255.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf529f052392d377b8404d061e7be2ddd9c9bb11 --- /dev/null +++ b/params_shard_255.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe7eb266fa1c94073999484bc0dca42d44c4a43b16cdddd34f3dfe619b74912f +size 41943040 diff --git a/params_shard_256.bin b/params_shard_256.bin new file mode 100644 index 0000000000000000000000000000000000000000..d92783e6ef8265cc9dcf24d6595378eccc819f34 --- /dev/null +++ b/params_shard_256.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ec7f28b74d8f6e0182bc7e4ca8021939120768614c4520caa5998d71a3b951b +size 33554432 diff --git a/params_shard_257.bin b/params_shard_257.bin new file mode 100644 index 0000000000000000000000000000000000000000..c99fa5905adf2576eee4edaee02b0656275d2aac --- /dev/null +++ b/params_shard_257.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4033bec6fbe70c2b26baafcfc3ede5cd7cdc54b8d3dab9c6d8a37edee744c06 +size 117440512 diff --git a/params_shard_258.bin b/params_shard_258.bin new file mode 100644 index 0000000000000000000000000000000000000000..2015a644497bcb4bdb694f5406e0c2fb80ec997e --- /dev/null +++ b/params_shard_258.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4038e1cd5f7328dff454e862e3e5a3737fd14c569a6d1a99bf8329f69ec65e1 +size 234881024 diff --git a/params_shard_259.bin b/params_shard_259.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8c541e201374b4788ab16a31899b1ca9f8b2ab9 --- /dev/null +++ b/params_shard_259.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec6141a20c4228032e64b2fd549b7973261caadb2aa38455705bc30293fecb2c +size 41943040 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..8b88c86f0132da4d01f5a1b7c57648a39c9b3e6b --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b066d87ee2625b3b5f82c961616431f0d59d975776d581cf329e7d73e918c63 +size 33554432 diff --git a/params_shard_260.bin b/params_shard_260.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c53f0b556185fedc4a8855b64d2259c7389fd6a --- /dev/null +++ b/params_shard_260.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dd14e5cebb0456728ef86829fc8c87f21a52349235f788a2cbcb391abbc052a +size 33554432 diff --git a/params_shard_261.bin b/params_shard_261.bin new file mode 100644 index 0000000000000000000000000000000000000000..0993acc9f52e10f8cb814b7837eb171309f47270 --- /dev/null +++ b/params_shard_261.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91810d1cc424a790d559f673ff8deaf885a076451d866f227f39ec640632aea +size 41943040 diff --git a/params_shard_262.bin b/params_shard_262.bin new file mode 100644 index 0000000000000000000000000000000000000000..fdcc03dd3dcbf464ee604257cc3c499e4dff06e2 --- /dev/null +++ b/params_shard_262.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acf8351632e21221a352c816a0c7b2c55d5c1d022e174a7a52bea671ecc72eef +size 33554432 diff --git a/params_shard_263.bin b/params_shard_263.bin new file mode 100644 index 0000000000000000000000000000000000000000..700d7f02de13b18ad5826982f000885bef491ccf --- /dev/null +++ b/params_shard_263.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5265bfd34ca68d1f2970d5d2384616304cf4cb2942fd57b4c836e05c6e0140e8 +size 117440512 diff --git a/params_shard_264.bin b/params_shard_264.bin new file mode 100644 index 0000000000000000000000000000000000000000..ae979dca353fdf0af6499a11211a78e3fe6ef683 --- /dev/null +++ b/params_shard_264.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be5533908427f3ac7052128034f3b6549c57f73c01334802527f239025e6ca74 +size 234881024 diff --git a/params_shard_265.bin b/params_shard_265.bin new file mode 100644 index 0000000000000000000000000000000000000000..76783520ba94dc2dd2030796aa5f9888e8c177fd --- /dev/null +++ b/params_shard_265.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cb0fb390a71c2ebd16a3c0c7b868032aceb21271c10e7ad089bae95a2f94886 +size 29163520 diff --git a/params_shard_266.bin b/params_shard_266.bin new file mode 100644 index 0000000000000000000000000000000000000000..d824553bf5205c40f3ac9657e4030638ef38ac15 --- /dev/null +++ b/params_shard_266.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e42ee246c89c7d4ca4854c77aea719ad998955f89aa22436d1b9a3ea3a2f528 +size 117440512 diff --git a/params_shard_267.bin b/params_shard_267.bin new file mode 100644 index 0000000000000000000000000000000000000000..4d0cfc43561400fc2260f63ffb206c8ccc5f7ea5 --- /dev/null +++ b/params_shard_267.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb34939d2710eba757ffce8240d1f7182b38c784a76ba1800d0ad1b3d276a85 +size 234881024 diff --git a/params_shard_268.bin b/params_shard_268.bin new file mode 100644 index 0000000000000000000000000000000000000000..5e30fb2fbf65191459459de126b8e84ed84a8375 --- /dev/null +++ b/params_shard_268.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac499203596764600eb357a46369860982ca444c47a7b8b5495d076a7a3de93 +size 41943040 diff --git a/params_shard_269.bin b/params_shard_269.bin new file mode 100644 index 0000000000000000000000000000000000000000..a500b9bea3cb20ebb1b653a8c233780f485f7016 --- /dev/null +++ b/params_shard_269.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44802c83594c3ebc67204febeec67b84e79477969c674e29d71e9932dd4d6f32 +size 33554432 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ac2dcdb4e4962445db9b9eb9b62bcdd9dc81836 --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539b3ad0ac1407d4550d881ee609d3e9842faeba01eff867d9378563b58cf354 +size 41943040 diff --git a/params_shard_270.bin b/params_shard_270.bin new file mode 100644 index 0000000000000000000000000000000000000000..68c9a74eebd935b61c920239b8e834674de2ba9d --- /dev/null +++ b/params_shard_270.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07a71193eff3aabed73e51fc08e7e87f7acb22cd1620257fb4826730429e95d5 +size 117440512 diff --git a/params_shard_271.bin b/params_shard_271.bin new file mode 100644 index 0000000000000000000000000000000000000000..c02117365aafb208e3ca9d474fe776372b18a541 --- /dev/null +++ b/params_shard_271.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd4018f5e9a22b9eecd63cd11fe134ca2948584b183440b4e4f721db9b25765d +size 234881024 diff --git a/params_shard_272.bin b/params_shard_272.bin new file mode 100644 index 0000000000000000000000000000000000000000..97c22d949415848b6aa59cc39dd452123256a4f4 --- /dev/null +++ b/params_shard_272.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da1d3b1a29c69518541b118246110f8b519cc850fe4a340da46d56c5769e1f24 +size 41943040 diff --git a/params_shard_273.bin b/params_shard_273.bin new file mode 100644 index 0000000000000000000000000000000000000000..907fab2013d084ada2cd3961b6f7196f3e1ac931 --- /dev/null +++ b/params_shard_273.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bfed6bb8262a9388d9e1e397a1ddfacd531a188526128ba141023329a5782dd +size 33554432 diff --git a/params_shard_274.bin b/params_shard_274.bin new file mode 100644 index 0000000000000000000000000000000000000000..ffd2b76deaa19d72c081b165a4c253e1fe3b5645 --- /dev/null +++ b/params_shard_274.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a20ba8345e80297274f5a194bd97659256ba0b82ebe6fb6e078d0b20472b1506 +size 33112064 diff --git a/params_shard_275.bin b/params_shard_275.bin new file mode 100644 index 0000000000000000000000000000000000000000..95bef8b6ed6ab94ca5f8e01aa987458d383ffa04 --- /dev/null +++ b/params_shard_275.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c05725c117bb2a5b7617873b1062b9e345e6bc954ccbb0630694d1f3e6da31 +size 41943040 diff --git a/params_shard_276.bin b/params_shard_276.bin new file mode 100644 index 0000000000000000000000000000000000000000..d21708073744e7af1d1a23ccd6d3de095cd910a4 --- /dev/null +++ b/params_shard_276.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c472029bddf709dd7239af659846edd95dbb3aa130617eb05a2434de7822a9 +size 117440512 diff --git a/params_shard_277.bin b/params_shard_277.bin new file mode 100644 index 0000000000000000000000000000000000000000..535ffc982e8046e5d8cdbe5d6cff865f9602abb3 --- /dev/null +++ b/params_shard_277.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3473dd1b6ce98874a8031e0e738551fdd67ef236d8a87e60cc13120b48ba955 +size 234881024 diff --git a/params_shard_278.bin b/params_shard_278.bin new file mode 100644 index 0000000000000000000000000000000000000000..a50ac1b488dd69ff932a3cc849e0346dc58bd2e0 --- /dev/null +++ b/params_shard_278.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e536082aff6f781acc5f800140fd45125e9b7dcf7aca4e286c9a299fd42ecdf5 +size 33554432 diff --git a/params_shard_279.bin b/params_shard_279.bin new file mode 100644 index 0000000000000000000000000000000000000000..a298fe6e78ab163524e1a07f787b270ff3eb77e4 --- /dev/null +++ b/params_shard_279.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:655231f9e6233b5cf1e97e7e9b91a678b4959154560ac8fe7271a764064c5965 +size 117440512 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb9200eb6fcd2830d779163f38e8233e4563bbaf --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb461e62e0f2186d6f47647cfccc2d844224e40eed8272cc1b14e8094eaa679 +size 33554432 diff --git a/params_shard_280.bin b/params_shard_280.bin new file mode 100644 index 0000000000000000000000000000000000000000..1825ed2c9a4d2ea8a3026977e949f47c4393e48b --- /dev/null +++ b/params_shard_280.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07ffb3811430bcdf68ea4b041fbd9ca7452707c93e656262affd086bc3e51b91 +size 234881024 diff --git a/params_shard_281.bin b/params_shard_281.bin new file mode 100644 index 0000000000000000000000000000000000000000..0c6934b8646292f71133692c4c1bf3e72811f57f --- /dev/null +++ b/params_shard_281.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f17fb56ecd58884dbca77cdfafe94d7dacdbb835f7b7272acd0b429935adfa +size 41943040 diff --git a/params_shard_282.bin b/params_shard_282.bin new file mode 100644 index 0000000000000000000000000000000000000000..41c5f45e14209c07a3bf76e0c7fc1f0f82de3050 --- /dev/null +++ b/params_shard_282.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4c325ece2a2cff00ab52b29c0df482d0af9ca15f67e404666712aa94768fb24 +size 33554432 diff --git a/params_shard_283.bin b/params_shard_283.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c674cbd94d03492b81cc99d38c4e9b03c5cad19 --- /dev/null +++ b/params_shard_283.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec5a166f270e23eb0d4894a4c6bab83bfb706dd9ea349302e4e64d4720ab19ec +size 117440512 diff --git a/params_shard_284.bin b/params_shard_284.bin new file mode 100644 index 0000000000000000000000000000000000000000..0c14894bc3fc8dc4c39dcca52740f2bbd9f606cd --- /dev/null +++ b/params_shard_284.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe04da17cccf4435df04ae97ef8ba744891733b3e2e642a77d29ebd221bfc75b +size 234881024 diff --git a/params_shard_285.bin b/params_shard_285.bin new file mode 100644 index 0000000000000000000000000000000000000000..9382a834adbe09ada379b8b044552891445bbbdf --- /dev/null +++ b/params_shard_285.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90cea0cdbf64920e82cdfde5f7c1dda2f533f468017d6d0bf61876fb2e9732b5 +size 31522816 diff --git a/params_shard_286.bin b/params_shard_286.bin new file mode 100644 index 0000000000000000000000000000000000000000..855d739be926a29929f7c8557ce0d84d23aa07df --- /dev/null +++ b/params_shard_286.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a50b15516603537db8251755e0596fe5375f287590cbcd92ebe07f1ffa4b8e1 +size 41943040 diff --git a/params_shard_287.bin b/params_shard_287.bin new file mode 100644 index 0000000000000000000000000000000000000000..341b8170d0a18bd65a1f0522b7a65c0076bce11c --- /dev/null +++ b/params_shard_287.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0eb356b86c4f43e6b8b08bce4824765743bf48e4b945f6737de9f6b2ffa331 +size 33554432 diff --git a/params_shard_288.bin b/params_shard_288.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea378a5f878e4812b23560bde157aa6f54f573f5 --- /dev/null +++ b/params_shard_288.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d025ddda3edfba5843e8a9b7bf4f487ae8c7a73fc00055aeb969c478461f83f3 +size 117440512 diff --git a/params_shard_289.bin b/params_shard_289.bin new file mode 100644 index 0000000000000000000000000000000000000000..156c328ebf45a47b848d224175ba1ab09f2f2eb1 --- /dev/null +++ b/params_shard_289.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eea91a6465c84ef8a2455358758562f83f0a5474317838bfc6ae722e25f37aa7 +size 234881024 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..b69dbf7240f393b166c7b7312c55c9f51514d4db --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa4757d70130a3b385ef1ced55d66ad24cf2502399b40d99937698ad1b0ab92c +size 117440512 diff --git a/params_shard_290.bin b/params_shard_290.bin new file mode 100644 index 0000000000000000000000000000000000000000..54ab76135e7e6c0ec8669a378c3362a12b0a1287 --- /dev/null +++ b/params_shard_290.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ba365088902541b89b1be35cab62f39e406cdfc1ac88e60c99ad11914e1b9c +size 41943040 diff --git a/params_shard_291.bin b/params_shard_291.bin new file mode 100644 index 0000000000000000000000000000000000000000..bc134e4f74bb2a0e2903abb97b427edeebd9ba57 --- /dev/null +++ b/params_shard_291.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5014383628c93530443089f33f6b5127ad9f8d7f9ab6f98b72967b94122b4b3a +size 33554432 diff --git a/params_shard_292.bin b/params_shard_292.bin new file mode 100644 index 0000000000000000000000000000000000000000..103c20b1189a162edeefc702cdc6fb55e14641a7 --- /dev/null +++ b/params_shard_292.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4600d63230ebd1524fa158d4c0f7c630193f442c9c90eb6160524990d924ed19 +size 117440512 diff --git a/params_shard_293.bin b/params_shard_293.bin new file mode 100644 index 0000000000000000000000000000000000000000..aad6e8bf09c0a9c74cf6c8b7edca9ae360c0a9e5 --- /dev/null +++ b/params_shard_293.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16dd8297a2db3c8172b77a0bd97362edf840a508a7f72c702916a014688acacb +size 234881024 diff --git a/params_shard_294.bin b/params_shard_294.bin new file mode 100644 index 0000000000000000000000000000000000000000..072302161f7069409f9bb37b4830ca46aafad9fc --- /dev/null +++ b/params_shard_294.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aa8214d6649027a9cdd0461f0f1027c459fbbefdec5bd791998e28d23e7be27 +size 26820608 diff --git a/params_shard_295.bin b/params_shard_295.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc8c16e25ee2339755056ddfbb1b15db662f9558 --- /dev/null +++ b/params_shard_295.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6c4258ccb99bb55ca9ab96d711c21a5a4a0bbb76f4117c4bd7a2ccc59e5bf15 +size 41943040 diff --git a/params_shard_296.bin b/params_shard_296.bin new file mode 100644 index 0000000000000000000000000000000000000000..98af255950b92fea4f6848f04420f674a5887176 --- /dev/null +++ b/params_shard_296.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb1da0fb3cbff801daa4706d60c5058236c50b1aca439e54680e58285a8de6e +size 33554432 diff --git a/params_shard_297.bin b/params_shard_297.bin new file mode 100644 index 0000000000000000000000000000000000000000..4ab500fba972257cc61ba907e2289406c84afbdf --- /dev/null +++ b/params_shard_297.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f157fc953002fe8c6a022ae14a671c608b876e83127f3feb1343259b667d188 +size 234881024 diff --git a/params_shard_298.bin b/params_shard_298.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c83a9c3e6e9693404b541a7d4396327f50e36e8 --- /dev/null +++ b/params_shard_298.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c15563a980c0c8ea40d1b2126312d3fa238b255f1db6dd96087de9101313160 +size 41943040 diff --git a/params_shard_299.bin b/params_shard_299.bin new file mode 100644 index 0000000000000000000000000000000000000000..527c10b14e7f345a16c07fe61b7e2792f076024f --- /dev/null +++ b/params_shard_299.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:642ce108e92223bce1e0be206e524de9822d72aa9d0abe28e8f058611f2cf8f7 +size 33554432 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..f3e5947acf59d68c682ac28805cbe90873e41a3f --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a08a8921e32a85ab2e981965274fc20b15f954dd8b5582b29e3204ffefaeedb6 +size 117440512 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..593baa11df18a1737b096eaf20386f89106f6209 --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:847a3c160431662f537df53d0e90ee873163fa846e07de947c69d197ccbf80a0 +size 234881024 diff --git a/params_shard_300.bin b/params_shard_300.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee1a25883f31626d4658510a8ffcad5d635c2405 --- /dev/null +++ b/params_shard_300.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7d6c4e3ef174210a6488867cc188df09277d4e5f1922a3296c3110be9d1881 +size 117440512 diff --git a/params_shard_301.bin b/params_shard_301.bin new file mode 100644 index 0000000000000000000000000000000000000000..8c48bc3dadd1f435c3d8e25d130df081e1f562e1 --- /dev/null +++ b/params_shard_301.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf95a523d891572f1bf72a1c90cdcc9790abb21f3249a03d13582befa46b920 +size 117440512 diff --git a/params_shard_302.bin b/params_shard_302.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7da87baa6555295c59a02072e67ba6904f65ae4 --- /dev/null +++ b/params_shard_302.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5056c2c36275ed1408e2125b32221aefa6fb996fc3cc7c4323be88bf391ee6 +size 234881024 diff --git a/params_shard_303.bin b/params_shard_303.bin new file mode 100644 index 0000000000000000000000000000000000000000..44980cbbfafd485197fa70e73f72e026a30d8de4 --- /dev/null +++ b/params_shard_303.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d4b2cd367e81b4073b2ff2a3d97fc19b29aa735f2f443a1e36fb06a7772f16 +size 26804224 diff --git a/params_shard_304.bin b/params_shard_304.bin new file mode 100644 index 0000000000000000000000000000000000000000..40d30923d800cf82dc95ab00fa67d9276d74b606 --- /dev/null +++ b/params_shard_304.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36e60cd1d2f428c6a2f256656b363bf2168082647432c9324bfd64e3c14c260 +size 41943040 diff --git a/params_shard_305.bin b/params_shard_305.bin new file mode 100644 index 0000000000000000000000000000000000000000..31eda068492918832739dde6178b5644dff413de --- /dev/null +++ b/params_shard_305.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a5b00e471bf4424d5df61c48bb404c576a16468fc92c95ac53a333bc40fcad1 +size 33554432 diff --git a/params_shard_306.bin b/params_shard_306.bin new file mode 100644 index 0000000000000000000000000000000000000000..58955c5ea1437d44579ca45d87cc32060552220a --- /dev/null +++ b/params_shard_306.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cd641f2aeeaf36080f6fd23e8f9057be227ca19d5fac1b564d1c612263f0b36 +size 117440512 diff --git a/params_shard_307.bin b/params_shard_307.bin new file mode 100644 index 0000000000000000000000000000000000000000..4eb3189067920d6bc5563ec21708548f4efa49cf --- /dev/null +++ b/params_shard_307.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5868cfed19fa86aec38fcaaadd1462dc9abfd1fe782a3ba8073de537f3eaad +size 234881024 diff --git a/params_shard_308.bin b/params_shard_308.bin new file mode 100644 index 0000000000000000000000000000000000000000..c9006cb51edd9ed4d5fffe6413b2a1cc53a23d41 --- /dev/null +++ b/params_shard_308.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbfb4c43dd435bf743d0e6c25f1a34a1bd999f276ceedafaa1644b4e22908e8b +size 41943040 diff --git a/params_shard_309.bin b/params_shard_309.bin new file mode 100644 index 0000000000000000000000000000000000000000..af656d3c0942d28b08c461751a12d2ac41e3b443 --- /dev/null +++ b/params_shard_309.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06db93f528d9360b0bf107da3d8ec704303e692e51d5252a22f5c94422c93197 +size 33554432 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..831de71f61c88a67068a1f1cff802cfc3403fb16 --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cdc5016bd734130ecb5f82dad6dc07dd5811b382d5dce78b9bfb1590b767f55 +size 29163520 diff --git a/params_shard_310.bin b/params_shard_310.bin new file mode 100644 index 0000000000000000000000000000000000000000..8bd00aaf21d4dc59aa9c232fcd069c4e634872dc --- /dev/null +++ b/params_shard_310.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b3c84bd51c6f6692f9a41076d2113de927bc379388dc50b904dfcfb53c9bba +size 41943040 diff --git a/params_shard_311.bin b/params_shard_311.bin new file mode 100644 index 0000000000000000000000000000000000000000..a472620fa0407fa9240ef7264b1d7074d8412803 --- /dev/null +++ b/params_shard_311.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67a9e2a5182b06558e2e8172c233b5312084b4e4a9fd28f9ebf7827fd2b25e43 +size 33554432 diff --git a/params_shard_312.bin b/params_shard_312.bin new file mode 100644 index 0000000000000000000000000000000000000000..47b57f69d952134a15bc71cf8bc97d3e0da76306 --- /dev/null +++ b/params_shard_312.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e2ee48ace01e6df079b969641c5696b6336607a8b033505528b359c058b4beb +size 117440512 diff --git a/params_shard_313.bin b/params_shard_313.bin new file mode 100644 index 0000000000000000000000000000000000000000..5a57bbb4cfba1c994590d579682492572250ca02 --- /dev/null +++ b/params_shard_313.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7060b104f7cbaedd9e01217a4ef082ad379957b9841d14dad22a2945738d5bf +size 234881024 diff --git a/params_shard_314.bin b/params_shard_314.bin new file mode 100644 index 0000000000000000000000000000000000000000..abba0bde4ba7f96ecd355a5eca42f0994f1d5549 --- /dev/null +++ b/params_shard_314.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042992b6bae397c4ed7aef715dfa680634b35c8c5521b9204701a8191fe711dc +size 29163520 diff --git a/params_shard_315.bin b/params_shard_315.bin new file mode 100644 index 0000000000000000000000000000000000000000..f70a024e9dd1a5ec31c257607e9468207c063b3b --- /dev/null +++ b/params_shard_315.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f05eaf06d34071c83069661381356edf03efb219940c19bfa73d20009e1129d5 +size 33554432 diff --git a/params_shard_316.bin b/params_shard_316.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c754c74529a5d7d995d4ce1c19e0e6420dd614c --- /dev/null +++ b/params_shard_316.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9420a5441789d13e3da6fc8c98cca1937387153cdef55aa063b5a0507527c3c +size 117440512 diff --git a/params_shard_317.bin b/params_shard_317.bin new file mode 100644 index 0000000000000000000000000000000000000000..713593fb644634d79045ff15c2fd1d6f17f71420 --- /dev/null +++ b/params_shard_317.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48176a9920d0ba12b426baa557efe2ad5503a5c09efbbe9115a38d4dc18c652f +size 234881024 diff --git a/params_shard_318.bin b/params_shard_318.bin new file mode 100644 index 0000000000000000000000000000000000000000..50979036cdb12f7b482bcc3216c01a80d6af80db --- /dev/null +++ b/params_shard_318.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b7b784521c533ff65e5e974b00144760c164ff9419ed5f86a92d0ff6f29445b +size 41943040 diff --git a/params_shard_319.bin b/params_shard_319.bin new file mode 100644 index 0000000000000000000000000000000000000000..ca5b5205e2a39ad97b5db532a1fae5f725865d42 --- /dev/null +++ b/params_shard_319.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2095888b0e20298a36e720e1ef456b73f8c233fe5b9c4b45e49f9a66cfb9d11c +size 33554432 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad848128c81961ee26ae976e6dce753a2306f4e5 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd0fe89c512615d1aee93c46d4b0f0d54e61779cbbb8aa62b4710fe364ffb3f8 +size 41943040 diff --git a/params_shard_320.bin b/params_shard_320.bin new file mode 100644 index 0000000000000000000000000000000000000000..b922f391b208e3eb25a480894c1c33e5a37bdf9f --- /dev/null +++ b/params_shard_320.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56c821278d06b33acc36174a12189a552e09aeaaefa9037b606d565a06b6219 +size 117440512 diff --git a/params_shard_321.bin b/params_shard_321.bin new file mode 100644 index 0000000000000000000000000000000000000000..87b452e3c20f99e24f3b57cfb36cde6a8acaa909 --- /dev/null +++ b/params_shard_321.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a997095720319d88e3c2b4d715fc69b587f1ea520d86bcc25ac3b51f27c74b5 +size 41943040 diff --git a/params_shard_322.bin b/params_shard_322.bin new file mode 100644 index 0000000000000000000000000000000000000000..46868efcfa125bdb31b4bd11b1a3be295930ca16 --- /dev/null +++ b/params_shard_322.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e6a3ae1c64607cbde334cdc0c7c8774c95452c3a187c56bdb9dd2d02034328f +size 33554432 diff --git a/params_shard_323.bin b/params_shard_323.bin new file mode 100644 index 0000000000000000000000000000000000000000..810f31b5ffb307813c3dfe42b071c56afa3c61e2 --- /dev/null +++ b/params_shard_323.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bafb4d7eaf2dfb7846f5cd707eaf2523ee4e2695a4efd788a67c89b2cbdf664 +size 117440512 diff --git a/params_shard_324.bin b/params_shard_324.bin new file mode 100644 index 0000000000000000000000000000000000000000..39f83ed3fba9568d4025859209e8bfbc11f5e652 --- /dev/null +++ b/params_shard_324.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50fcf0d0c856fd3541ef0f5bdd74435bf1489ebeb0f59699c2511ee7292b17b3 +size 234881024 diff --git a/params_shard_325.bin b/params_shard_325.bin new file mode 100644 index 0000000000000000000000000000000000000000..941e09d35d461a45280dd6d590a117c4a38eef59 --- /dev/null +++ b/params_shard_325.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9ac2c8b9d63144fc9d6496a3e75412d3465221d3b728e91777d90df7e4aec99 +size 31522816 diff --git a/params_shard_326.bin b/params_shard_326.bin new file mode 100644 index 0000000000000000000000000000000000000000..54feda3f3a2b804d859760b6551439b4dfc649db --- /dev/null +++ b/params_shard_326.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce713bf813104a6f2f7f9413ad9f66a8013b0eea2edf433fce434fc631c0c8e7 +size 117440512 diff --git a/params_shard_327.bin b/params_shard_327.bin new file mode 100644 index 0000000000000000000000000000000000000000..10996de03586b9fe8f1ab707d60026ac720092cc --- /dev/null +++ b/params_shard_327.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fae48d32d33508209f813c6e22433fcb77042b603fb89c945fbcf6bed6e6f86 +size 234881024 diff --git a/params_shard_328.bin b/params_shard_328.bin new file mode 100644 index 0000000000000000000000000000000000000000..cdebab1e60431949caa51636346daae5b654c0c6 --- /dev/null +++ b/params_shard_328.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b63d1ee3bec5108a044932fd7fc5c752b25a75d3d479829683653800dc311ac +size 41943040 diff --git a/params_shard_329.bin b/params_shard_329.bin new file mode 100644 index 0000000000000000000000000000000000000000..870beb60b92d10e3d6278594a1d006691b17341e --- /dev/null +++ b/params_shard_329.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a2afffba14987df04adf88663978cf43681b706fa5e319da7c258bb964a0fd5 +size 33554432 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..72e9a3263c0fbda6866ebc52f7324b1381e6d2c9 --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98e15b65d09cc7fc2ecac35ed755014a8c9c822458a38987de87a87c57f0062d +size 33554432 diff --git a/params_shard_330.bin b/params_shard_330.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff1ea04bb72b81111263d974d388d03feedb5bc3 --- /dev/null +++ b/params_shard_330.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b4eb34fd62f63fb48a8d562f4828147bf8b980b1a9610ab765d851722f48e8 +size 117440512 diff --git a/params_shard_331.bin b/params_shard_331.bin new file mode 100644 index 0000000000000000000000000000000000000000..88dbccdcad7f1f68e96f2a9b9b31cdd9ce5d9cea --- /dev/null +++ b/params_shard_331.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:186ef2e78888054246d60fe6cac0565da0d5a35fb6120d6ff828327e17f6e091 +size 234881024 diff --git a/params_shard_332.bin b/params_shard_332.bin new file mode 100644 index 0000000000000000000000000000000000000000..67cbbdedb8a3bda5c6aa82fd7a2a24820698872f --- /dev/null +++ b/params_shard_332.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d9da10ee4ca9e4692b7209893de35f319906581c221c9452f5042e73438afa +size 41943040 diff --git a/params_shard_333.bin b/params_shard_333.bin new file mode 100644 index 0000000000000000000000000000000000000000..b870c6d589b36d2cfb2acfa12d87871047db641a --- /dev/null +++ b/params_shard_333.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c29d50848e76c45b9c707fdb487e127b0a7b4e6674ef548a3e164e9f435ea50 +size 33554432 diff --git a/params_shard_334.bin b/params_shard_334.bin new file mode 100644 index 0000000000000000000000000000000000000000..6afe24824ee220f05a33a683696fc842cbde0939 --- /dev/null +++ b/params_shard_334.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:117fc429290102034bd5b6b349a0dd05bd4f6f97c67278a9e9feb056478b5cce +size 33112064 diff --git a/params_shard_335.bin b/params_shard_335.bin new file mode 100644 index 0000000000000000000000000000000000000000..2e9ab496e9742e9caecd0217e32c4dc6f9aaedad --- /dev/null +++ b/params_shard_335.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f28d165fd96ce407a56ddf71c020442c76cef389de98de0a14dbac0edf556d9 +size 41943040 diff --git a/params_shard_336.bin b/params_shard_336.bin new file mode 100644 index 0000000000000000000000000000000000000000..eecd8aa2282191f491f2e67ed9e0e5549606375a --- /dev/null +++ b/params_shard_336.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8a7400cb0febfab25ca7a0b7a3621b3496442fc3a16bd4e484bbc1b32175384 +size 117440512 diff --git a/params_shard_337.bin b/params_shard_337.bin new file mode 100644 index 0000000000000000000000000000000000000000..47499a4ed6ca70380d6a09dd3ff71d490a19959d --- /dev/null +++ b/params_shard_337.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d8d1db948e558bc21bdf9abbb4fce2419856c328c910b51c271dff64f5edb0e +size 234881024 diff --git a/params_shard_338.bin b/params_shard_338.bin new file mode 100644 index 0000000000000000000000000000000000000000..bb98ec30b1637c8e2cd55e50dacb6b0e8226cbb9 --- /dev/null +++ b/params_shard_338.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e512fa96592132cd6b9e855bfc34e82c5a32224a60fdc09595bcbe3ca4a780c6 +size 33554432 diff --git a/params_shard_339.bin b/params_shard_339.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7023767815408dbdb664816061a5d9277d87af3 --- /dev/null +++ b/params_shard_339.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae59199ff1d0f051fcaceb00c96d486623552e635ef58336171582a10062ed1 +size 117440512 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e08678e45115c11daeb9c983c65910661481c58 --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c84e8f2deabff5e7951c08b3ddcadc00956adb40feee274090e157b93339b1f +size 117440512 diff --git a/params_shard_340.bin b/params_shard_340.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e27e5d5b0a1495ae78c3fdb884d1c29b02a473e --- /dev/null +++ b/params_shard_340.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:328dde3e486a738e7ea5219ede465bc1dc0444554d84faeab16726163d926da2 +size 234881024 diff --git a/params_shard_341.bin b/params_shard_341.bin new file mode 100644 index 0000000000000000000000000000000000000000..32961f864496ba37a8c25a851d1829476318509e --- /dev/null +++ b/params_shard_341.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de0b8d00dbeb3aa86cc0667cc2e6e46fcad82e29b19f515a0f812a361a967c83 +size 41943040 diff --git a/params_shard_342.bin b/params_shard_342.bin new file mode 100644 index 0000000000000000000000000000000000000000..58fd747d8bc3a024ac173970a7614e7dc45b57d8 --- /dev/null +++ b/params_shard_342.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e75e589cd9dc9d5566988d8bfef6677cbd4501f910a16dfda6b3e10173d92c94 +size 33554432 diff --git a/params_shard_343.bin b/params_shard_343.bin new file mode 100644 index 0000000000000000000000000000000000000000..322c156002f5aea6a574eb3fa51c4b83b6b2b233 --- /dev/null +++ b/params_shard_343.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2278c52b86793d8eab60fa21482026d191129d3923ff0c56334b2ec885d0fee +size 117440512 diff --git a/params_shard_344.bin b/params_shard_344.bin new file mode 100644 index 0000000000000000000000000000000000000000..bb3cdd655f3ef512464afda5c2bb32a3d305f9a1 --- /dev/null +++ b/params_shard_344.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77eca453dd9c96f304a41ff47cf1af529d3dec5a798a4246a2c1494184a91e3d +size 234881024 diff --git a/params_shard_345.bin b/params_shard_345.bin new file mode 100644 index 0000000000000000000000000000000000000000..af94b647cfc1cb1e07c23b4e3085646ab8f7982d --- /dev/null +++ b/params_shard_345.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:955015a1e6eb7645c7cf3e2ee7d64c4bf86ef2bd3912a6b8c92026865f2d2226 +size 31522816 diff --git a/params_shard_346.bin b/params_shard_346.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b11c5702cf8f091d90bf77728bb1bd0049861ce --- /dev/null +++ b/params_shard_346.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917828e730e62e5e91caeeebbdb9e467e936156255749664058faadd651b3604 +size 41943040 diff --git a/params_shard_347.bin b/params_shard_347.bin new file mode 100644 index 0000000000000000000000000000000000000000..71cadad42c59bf6f32c6219980c4a8393fe04512 --- /dev/null +++ b/params_shard_347.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54195477c10a0154ef2be5e5506e8dbbf75ed5182789c014d5b4ceba684915ca +size 33554432 diff --git a/params_shard_348.bin b/params_shard_348.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c87c19038125bc0315d8441310244aed33f759c --- /dev/null +++ b/params_shard_348.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76120368b38a469e9c0e3d857fae2970aef2fa952318d09ef8740a0ad1bf341f +size 117440512 diff --git a/params_shard_349.bin b/params_shard_349.bin new file mode 100644 index 0000000000000000000000000000000000000000..10749703e76073e058bf3089b06a7040c7d10bc1 --- /dev/null +++ b/params_shard_349.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5678e1c2eb9ff6d8e991b2cf0607fb0d489bf5622096e47a9526cf46955dff80 +size 234881024 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..35421fe428cbcc6e8abc0a0066d487dd70f20328 --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb99668452e2b2c6da6fead358bba0cf70cc38f453e71f29c02cd7dbbe2d370 +size 234881024 diff --git a/params_shard_350.bin b/params_shard_350.bin new file mode 100644 index 0000000000000000000000000000000000000000..6eea79f525a606bcdb315974fb7c1cd5bdac3f5b --- /dev/null +++ b/params_shard_350.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efa4e4029c3fb1940c3be948930a58a9b11148b0ebda8d18c265df5d599b9982 +size 41943040 diff --git a/params_shard_351.bin b/params_shard_351.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff029445f321d87ee016800d3840414f518940fd --- /dev/null +++ b/params_shard_351.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a6662be5998966f3e2b71a0fa47862d8cf3c631bb46a1a58060b0e667b9ca72 +size 33554432 diff --git a/params_shard_352.bin b/params_shard_352.bin new file mode 100644 index 0000000000000000000000000000000000000000..2fe8be91b64d507ffd6bd933c73f9aedecd4027d --- /dev/null +++ b/params_shard_352.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e7a73c345935243a72d469ff49e825197b605c1ab286ce01819d64b9259bc1b +size 117440512 diff --git a/params_shard_353.bin b/params_shard_353.bin new file mode 100644 index 0000000000000000000000000000000000000000..bbc64336226dc3501ea4a3e573561242b41324fc --- /dev/null +++ b/params_shard_353.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9352e78cbd74be60302dc03ee73c7b4e94d404048edb04387e60745cc65ff9c8 +size 234881024 diff --git a/params_shard_354.bin b/params_shard_354.bin new file mode 100644 index 0000000000000000000000000000000000000000..b967cd48673c3ab2d756bb3553391a5935cfa7ad --- /dev/null +++ b/params_shard_354.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3def78c04f062a57c74d880b85bba11c144eeb1ce38212426cdc6c774a110b6a +size 26820608 diff --git a/params_shard_355.bin b/params_shard_355.bin new file mode 100644 index 0000000000000000000000000000000000000000..67bdf8d90e91ea300bf62aaeab04cb8bc782cfab --- /dev/null +++ b/params_shard_355.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a9346a8988163dbc799d0886e7293fd252ef37c784b433837060854aecd3b67 +size 41943040 diff --git a/params_shard_356.bin b/params_shard_356.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ba3545d0657e3d9397787bb481655148df9d749 --- /dev/null +++ b/params_shard_356.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85775629eefcfa48d6ef1602d285624df7419175c8b9ca4e9b09687844d0f7d1 +size 33554432 diff --git a/params_shard_357.bin b/params_shard_357.bin new file mode 100644 index 0000000000000000000000000000000000000000..31171d0c889ae2fc5a1e2f749b36457fc7be2855 --- /dev/null +++ b/params_shard_357.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d8cd80874c4c29c5731014ba1ad282a1939ac4fb91f5c4c31c2a14f311a5184 +size 41943040 diff --git a/params_shard_358.bin b/params_shard_358.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea67242da32a0c4f6efc46a3ba14c842ec2aab97 --- /dev/null +++ b/params_shard_358.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a68209688e36230645dced217e7c54d625c02be050d36839107260373182ea7 +size 33554432 diff --git a/params_shard_359.bin b/params_shard_359.bin new file mode 100644 index 0000000000000000000000000000000000000000..71574154338869eb22c7883a7f2f186b4eea1a4d --- /dev/null +++ b/params_shard_359.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27635af0b6ce9710ea619bc59ceaeef54e1348e311683c3b51b9cece47d0eaf3 +size 12075008 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..e1c419d7519366c37d674bd78de26e253ff7b132 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbc71c91a0ccda7f9f7776a3f148d41ead2f098bc87653ecf31485b2ef5b029 +size 41943040 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..29df90e96f0ee6e5c6a541d78a2fb25399c46234 --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac099bdf9c743337b5bc5cf5dd1c87dc0c0c63cc752824832167b08073306ca +size 33554432 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..b5d6e90c2bc75e8468fee26b6e07128593380209 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5234ea1e2140576a284308402beeecffb40dd9146c8eddd289fc35f83273dc58 +size 234881024 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..9186499ada5600f91967cbb53a5ac9df9b3ec393 --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1afcf955c0a295da8a4710cc1e04d5511bfbb1c4a16516d007320e8ca78ff6f +size 41943040 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..7643c073eff42653968a89b81c2a21c4630b149d --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c9e6f830eef04b569265318b9e8c6b3bdb0ad9a4421f3e77578c104da2dcb9c +size 234881024 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..41f123cf6391aa7ac77f9c632ad24162cd6b08e2 --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f52f6a5597e72118865fb8a9f599d5e94cba5bebcbaacb5f3d28df91024812e7 +size 33554432 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..10fe03293e3b90842fbbf4e25cec20c43e17235b --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38d26b80b3eca040fb0234a958a4cc19b8260c67628049ac68ca506025d5096d +size 234881024 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..495d489ad43441a41e0cac2546cbf037a50c84e8 --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c299ea878ce999c6b8a187a9890efce0f6da5664d1ba5b014b94c6347c44b8 +size 32833536 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..363b5cd031d3a0678ca60fc6a6e7998b6f938597 --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1168742671c4c1ecb6dd33d8b3d27b53125ffb340df8621b932f649b9bf4fe39 +size 117440512 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..fcf90ffc34c55b85bc5b5387b686804564e58d0d --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f273b9eb27418c14453001e650621dc440a32fd7b5f0aebe2f21d0b331f0c1 +size 117440512 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..e5bf3651b4580bf4fb1d5354d12172b3c0f83ca2 --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ef3fea00cd65956274276fdb4f07a871c01f8900d93fe72fa610cef208f369f +size 234881024 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..877c9d5b24d9e9a91a792286ae832d0a2c81a4c6 --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3860409b5cdd1fdc9577cea07d566ad0c49098a4f123880e66b87bd606f337 +size 41943040 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..c69d25f3f03eeef64dbd6ea206297ba981a2674d --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03ad9da89036cd0a90fd6d87ab9c81e015fe0ccc064c8b29ee47842703331434 +size 33554432 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..64ca71fe0e172c3e73fb39a46fa0b11754c96469 --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91dc14abf5825680bd0603b87937632fc7793083935eb6d0768e1450e84780ac +size 117440512 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..9bfc727543ebfd36d059bf2a904983d066054f45 --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2336ac54c0ee65a328f0279bff3e3ea08161f96cc11134392775daf6d169ee9b +size 234881024 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed76a6f77dfeaa96b9d41dfc753490d73d50b113 --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e32ba11bf9cf299562a3accc01055efdfbcdadca866adf97ec0f7d2105ded52f +size 31145984 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..df9e0e08d7647e1d2512b4e3f53fa52c87d146d9 --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59934046eaf1feeaf816abd3047b8fcd74dc889f8be9f3f9887a2bab0c77f2ac +size 28147712 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..9b2f1c93f06acc4e2b6045442bc1927cd55e4a56 --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72781bb9df2811744c6f7b70b8f379c755767b665a98ba54c666efd05c84c490 +size 41943040 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..73e74e5cf8a25d82bb5306740992e822fb89d121 --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93d9a2353ecabf959d9034731617f6e9bc9726bd20707e86cb98bb82c40922b4 +size 33554432 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..b61b4e7a8bcc1237cec47488c86ef8b5f7d469c3 --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79e8aa393da1d2048fe4f2ba865194d51a24fc63711b6e171e2a2ea9960c0a2e +size 41943040 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0521a14e79155bf719ce9b2a8ce8f9ef9f05f5a --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91a0c4ea0d056664bcb0bcf9b9d181630fdfaf2192f1d11cf2c032ebd833769 +size 33554432 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..876e0cb15135af83b7632f19d78e4ee8fb593be3 --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f0e062d559f3fb093154c02569085f33c8c51340fd1ab4f9553ab78a72c3d2 +size 117440512 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab3b05b2e343f74eaa4c2e65d608a5ae927b320d --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe3186e8745613cb1cfa96fbd9685a3b6df222c49827bcb8f33e2d0cfb2a15c +size 234881024 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..e741d92ed547649dbcb5b88073d48c9aa2eeca4f --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67feca80518f7c7d76f59ebe3604709f16eb09ae32327580f1ce0d6e92170ef2 +size 117440512 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff40117ae23394e0643708eaef432a6991583dbd --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd87fd9c18a5591ca33ec3dc1490f5b1327724a589425e660e50f23cad798e8a +size 234881024 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..cce86363f047c7afd7b3dbd86a142705b36e6dba --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9bed849e4a8d800bb31762146782f0d35b0a6a416c6aaa5ad8e50ae4d431e5 +size 26804224 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..fcefb0b63769deb755eec7d6424e02969d6d3618 --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ba8bb6c1f57bd43c68a0b9e3a9236d0cec400c8a6479386f2d60bcc99125d1 +size 41943040 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..a9374679741990040a7bdb96af29ad023f6431c6 --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:558fa2d1ba99af549dc70c4a44864302963edf685f09208dbaf5ea357c312fd1 +size 41943040 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..6967b652741f8d160fafe7dae86073fb857fd57b --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:536ce6dfb55ffdaacac83be4e56ea07e3d1c810791e98d8ae33398e6f92d0a16 +size 33554432 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5b2b60f3086c0eb305799e2e1dafb9828a83bfb --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a84d3178bf59166b615b015cfd63006d0cd9903c3b5cf68ffb18ebb2becec515 +size 117440512 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..852c0ce3d44b5b7e456d956e31249cceb5ad0688 --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14fb91842192012a9a8323c5779108c5934bd1d1d2b951a14702dd635b291394 +size 234881024 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..d56c481b95a2408ffb97d50525880b6aaf252d91 --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9ce2ac83c5d5149939d8a7ab7f2612b87fed0edc7ef5aeccb124a26f862074d +size 41943040 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..ccbc7e9f7c74fcba3f6550cacd93531bd91731be --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b34b22be26213fe9258b64e423e55122a630c5f8d9e79fba8f5177ea3bc755 +size 33554432 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..735c4180c732f0937e1f493fc3845b1557a87faa --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f03974aff66ebba2379d5dcb608c1e3d94b951a00a7bf1441c1ccebb15e74113 +size 41943040 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7b88a18dff0421cec24702952f4623626733aa1 --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d11238be32cf9b16b5d6ecabf0b0065e866fe95f91d504c0b81f8ba80845ff +size 117440512 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..c3bc659cb922aa9c83067ec21c639a83a438417c --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60989fb9876af533dfec5901af323deda42b31e28fcc167b1609be489f514e09 +size 234881024 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..edbafa0202a30b5259505f3077e1bb6d5f426f0d --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d243a546ccba5f7761f81d5043f3b1bd24b6e766dec6a4f8760b44ecc47f24 +size 28114944 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..6046a7b4a3cd04c21c6cf19e4f2bbb9ac9cf38b0 --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36e4893fda2f237daeceb8cd885329fe988e49c58c9d646cdefb08ddf1b0f189 +size 33554432 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2849ed0b082ada0464ed11e69241c53299fe0e0 --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3302c4d7614e6d9ce29c32d9e824936afeaaed0d62e267218734190314c9dfa +size 33554432 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5f58ae80527a17f8e8d3bd07bbb4bea1adf155b --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cdde489cd52f57f6409ed7bbfbefb5e44b1c59d5ff3bbda60f8c4db16e3cced +size 117440512 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac42b8bd012c1020f5e116917603ea0cc23cee6e --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:433faf697d61c48ea1ad1d864097172085b086d4990e63ea3b025a1a5faea96c +size 234881024 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..5852fe0c0668d3fa16c59bd160b05a7f7396fd60 --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8042627ecba85a515022f0783ff703ce898649ff7c504aeeccb9ebc986d979c +size 41943040 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf1d0f6f9c4af23d451702288a4348cfc5fa2da0 --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb12471a31ecb8ad906d4491ea7c4c375559b700e834fae3705fb18c9e53f058 +size 33554432 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..ec06511420b3c3cd0a287cc7cd21171e10c2a057 --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76cbe57a2e6508ac32f280e84ce0d2c49ca28f82c3c827a907ac9b5fccf53e1a +size 117440512 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..a3c8275b6c6544d13011200c271c6f0c8277ec2a --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c76d04caccb03dd217ebaa88b63ed5ff2a202235fa81c1e37dde711cf17963c +size 234881024 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..c3c8383689e9c68ec9619901919c45d9bad39814 --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3d16561b8b30a09427220a30bfd434da6420b52c96d4872777e39264d0ac5b +size 41943040 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..12ef5111080ed802e45434f01b24bee078aba658 --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7180cec17090465541d71c188c4e46a5cdf26ebb74a33f5a7d3600b0d270bfc1 +size 32817152 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..ebfbcf6fc68f5f8685b67c66e0ef6b25bf0d5a3c --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fe64623f055d2a2e3127cf5cd28d1292e00e75a7782aab550efc9584303c858 +size 33554432 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..301e9113a56e3faa82f555da405b5164b37f246e --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a69c553a7ec861438bb990b21b88739f276c2832d1cd1b6c27cb4143c8e86278 +size 525336576 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..67c04c172892136a16dada8c398e3ef7f1fd58f7 --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:408a6afd445554e59bebaa9440af8eab5d60d3186ac65a4a8da6d999b1062366 +size 117440512 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..895de1ac9d15c0c430628357083e4b355edd9564 --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f859ba1e58f7aa4e6136eab24058171602a213a1678fddf5d8bc96836c717b95 +size 234881024 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..ec60f7dbc8618298e2ab9ae7018dae556b4475e1 --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315a731ef118c1277d3173f1fc29003aaba8a057d5042e16e390c8f9f0a6d7f1 +size 41943040 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..b02e6a321de61ed01f3f2069e2e9acb5c0babdd2 --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59095c521ccbd479fe6c1dcf5170bfdea10e878b0ec2220038099ee8caee43b7 +size 33554432 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..511c81f6f0cf543aa528bc2c2a85b71da77064fc --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f4fda4c4b24eec382d2fc27294a904d93631324734d7a84a3892f36ec4971e0 +size 117440512 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..aa46eb7c4c25d1452ad967aa8526806d22ff6394 --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23f9a4114b83bcda69261ed36c787628c97d629d70b170a3500f87dc4dbb5df +size 234881024 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..46eaf83fb14d7da49d1dd884551907b79cb919e2 --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb612f3381730049e2a85ed822d3ac57af2cbb02a174e0359c4c8892fb40e49 +size 41943040 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..1429d39abbb8b3556ad004a0aa9f6a479a6660e5 --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb63b0467cb4dbfbc525035be7ceed18adc3164a50d3d7d4575dbcac02504af +size 33554432 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..78d89ebc1d9444e2f4a1bc295e345824ccc4a3df --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963d9835ae4798abad330d3a779792df11c0a56dcfca85ad8b3e188928e289f0 +size 234881024 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..95e572a8420c581d691db7ba490d4bcdf51a1b47 --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cfa5c3a370d4f3939cfcc5069f354dab82b4b9150f49cfb98326531ccc81f55 +size 29196288 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..06d13d44e21e3a2941acdaf9acac712ba3bf78b2 --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153ee5c270bd894efd71b9d171f1c7b052d316904b785c0eb8764cdeeb6ff1f5 +size 117440512 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..827b57d8d352cb27f0e761a6e7c6f80baaf6318e --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3105fe4c1719599459dfca2ae65b6c3ef70c519d7cd3c7ca90df45ea6343833d +size 41943040 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..3453f7e298140fa3a3ec3201bccf95ef429ba9b6 --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91be415440e8ffbb94bba8e684372c8e2e97ea736e1b87d3751e13b807f9a783 +size 33554432 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..f631dd4ef8dde70e809ccce595b7a0d64aa41a34 --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73387875fe3f3f87cf54ebb9b75dffee43d63ec6b624c60ed14558728a16af57 +size 117440512 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..505c2290adaa14da54b856d19a1cc2022b84f444 --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61544e691bd4abf1e54f547c54b681dd41512fd01556e02127f8ac6c0896199a +size 117440512 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..73c8ed1cdb1d322473f77681f48e567781af1e29 --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16d4244803460ceed4ae7283b5e41ec8638fcb93329d7c7d36d8131867419550 +size 234881024 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..0fcd9c46d384062f87887fd7e66e8c264df3b9b4 --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:014b8e333d07f04b470deb25a6278ee0e266695f90f3594467ee7187d757fd70 +size 41943040 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..299c2cde93202070b537df53fa5ac675c8063a43 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ccc121d77af4a69db9c7d45bdc8fb4caf10ac69bda9b0e4dc385cb6a471d39d +size 33554432 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c0df2f7c8e244ab06ad25780b98845c428c3866 --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95361d380d9d961c48452ea9ca552867a74cb554c6fc4418cd4fc1f22d97ded0 +size 117440512 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..661350bda0f3eef6af72bb694f59159678425907 --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5572eba7d050c4c0838260d4730501996ebbc95c2320f1b19dfc101333edd44b +size 234881024 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..eca254efbca967aae94a0f2a79c00a438db9b15a --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfb083685361b58a30371eed4ee937616058e1e3722d9ddc0e8df3c004867cf1 +size 30490624 diff --git a/private-llm-config.json b/private-llm-config.json new file mode 100644 index 0000000000000000000000000000000000000000..3f0100e662aa3cfcac4a91c70dfc701e93952572 --- /dev/null +++ b/private-llm-config.json @@ -0,0 +1,51 @@ +{ + "model_type": "llama", + "quantization": "w4a16g128sym", + "model_config": { + "hidden_size": 8192, + "intermediate_size": 28672, + "num_attention_heads": 64, + "num_hidden_layers": 80, + "rms_norm_eps": 1e-05, + "vocab_size": 128256, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "context_window_size": 4096, + "prefill_chunk_size": 128, + "num_key_value_heads": 8, + "head_dim": 128, + "tensor_parallel_shards": 1, + "pipeline_parallel_stages": 1, + "max_batch_size": 80 + }, + "vocab_size": 128256, + "context_window_size": 4096, + "sliding_window_size": -1, + "prefill_chunk_size": 128, + "attention_sink_size": -1, + "tensor_parallel_shards": 1, + "mean_gen_len": 128, + "max_gen_len": 512, + "shift_fill_factor": 0.3, + "temperature": 0.7, + "presence_penalty": 0.0, + "frequency_penalty": 0.0, + "repetition_penalty": 1.0, + "top_p": 0.95, + "conv_template": "llama-3", + "pad_token_id": 0, + "bos_token_id": 128000, + "eos_token_id": 128001, + "tokenizer_files": [ + "tokenizer.json", + "tokenizer_config.json" + ], + "version": "0.1.0" +} \ No newline at end of file diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1c1d8d5c9024994f1d3b00f9662b8dd89ca13cf2 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b +size 17209920 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c91fde4f2240d14fb005a6ab3a9e6fd9245d069e --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2064 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "bos_token": "<|begin_of_text|>", + "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}", + "clean_up_tokenization_spaces": true, + "eos_token": "<|end_of_text|>", + "extra_special_tokens": {}, + "legacy": false, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 131072, + "tokenizer_class": "PreTrainedTokenizerFast" +}