diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md index 20004291aacfa6744c64d8bdf192378d39ff1d78..444c44b0cc4665aca8709ec09689c36535abcb0d 100644 --- a/README.md +++ b/README.md @@ -1,3 +1,26 @@ ---- -license: llama3.3 ---- +--- +language: +- en +- fr +- it +- pt +- hi +- es +- th +- de +license: llama3.3 +base_model: huihui-ai/Llama-3.3-70B-Instruct-abliterated +base_model_relation: quantized +library_name: mlc-llm +pipeline_tag: text-generation +tags: + - facebook + - meta + - pytorch + - llama + - llama-3 + - abliterated + - uncensored +--- + +3-bit [OmniQuant](https://arxiv.org/abs/2308.13137) quantized version of [Llama-3.3-70B-Instruct-abliterated](https://huggingface.co/huihui-ai/Llama-3.3-70B-Instruct-abliterated) for use with the [Private LLM app](https://privatellm.app/). diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2f98e357c05745bf2cf79816dbac3b1d79de5789 --- /dev/null +++ b/config.json @@ -0,0 +1,5 @@ +{ + "quantization_config": { + "bits": 3 + } +} diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..3552cabe7f17b994f8cfcf2eb945692c0d504061 --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,12343 @@ +{ + "metadata": { + "ParamSize": 805, + "ParamBytes": 31776318464.0, + "BitsPerParam": 3.04023285660184 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 420679680, + "records": [ + { + "name": "lm_head.q_weight", + "shape": [ + 128256, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 420679680, + "byteOffset": 0 + } + ], + "md5sum": "79cdbbd110de7ccddb1a2f1e20de7ac6" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 52584960, + "records": [ + { + "name": "lm_head.q_scale", + "shape": [ + 128256, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 52584960, + "byteOffset": 0 + } + ], + "md5sum": "3b30e9c6343f50a2014db07dfbe274f1" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.78.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "73afa85da1905264dc494d9e6b27fe4d" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.79.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "fea5dbcf103f48516c8f992cfe9c9575" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 23560192, + "records": [ + { + "name": "model.layers.78.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 0 + }, + { + "name": "model.layers.78.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 16384 + }, + { + "name": "model.layers.78.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.79.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23543808 + } + ], + "md5sum": "3f3e891011ff2117488cdbb65bd8b20b" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.79.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "1d69e1a70629f31d4d7b3906b749a2ca" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.79.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "72598d1cd490b1c5a3423a7c56609137" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.79.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "1ffaa645f81e45117969cecf8d61627a" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.79.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "dc90cceb96db03b52d379ee6f6a3b52b" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 420679680, + "records": [ + { + "name": "model.embed_tokens.q_weight", + "shape": [ + 128256, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 420679680, + "byteOffset": 0 + } + ], + "md5sum": "8b8a02a0c14245a32993c53a4df286b0" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 52584960, + "records": [ + { + "name": "model.embed_tokens.q_scale", + "shape": [ + 128256, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 52584960, + "byteOffset": 0 + } + ], + "md5sum": "8c3f7f6a3dadd8a3303d0c97575306d9" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.0.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "7f8b25a32cc9aadfd2c87f0c0e59bccc" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.0.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "aab0ca339f72c50187d60563bbd7318d" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.0.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "c6ff248935c2a0444ae2dd7c271ebfee" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.0.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "19a47b56cded04eea6bd8c59333d173d" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.79.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.79.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.79.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.79.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.norm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.0.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19337216 + }, + { + "name": "model.layers.0.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19353600 + }, + { + "name": "model.layers.0.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "73c4d00dd11db7bb97cca6cc8a4df70f" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.0.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.0.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "d11d3db0404829f9a95ad8626bee65a2" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.1.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "eee14a06a7ff8af2a8a40e956758fad4" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.1.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "b1c8cebefc9c968a444e9167da2658b2" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.1.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "acb6d7c6b6cad9bdbf93ea365149d943" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.0.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.1.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 3358720 + }, + { + "name": "model.layers.1.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26869760 + } + ], + "md5sum": "bff83f5d3bbf0c238c3aff0f71fc7c22" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.1.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "8fd57c1ab7c515ccc9d180251f05e96e" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.2.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "3950726b590b1cf44e282aca0cee203a" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.2.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "d4bd3675e51b116621a8a011f6d699d5" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.2.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "7893e49b7700cedd34b78f0ded01211a" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.2.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "bb9076571ea32f2b22768019986360f2" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.2.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "e9bd9281a3528e7de2f40529c184e050" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.1.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.1.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.1.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.1.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.2.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15138816 + }, + { + "name": "model.layers.2.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 15155200 + }, + { + "name": "model.layers.2.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26902528 + }, + { + "name": "model.layers.2.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 26918912 + } + ], + "md5sum": "8cefd0e01f539422ecd756f645029cff" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.3.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "b9e8c1fed47f5ed78084f975e257e6b9" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.3.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "ed5351207ae2d2f93434474176bc60d4" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.3.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "30c9135385eca92a09052d4a1a40a11d" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.3.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "52acf9ad2eb65cbbead8833ae08ba4ff" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.3.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "560e4911bbdb076d77ba9b7c7d824fe2" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.4.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "ef1901213aab8b10d5f3846b5e648fd2" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.4.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "77423014c7b04cc8269583c2f31c712c" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.10.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "34e3abf0288ff2556dc3d426bb4337fd" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.2.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.3.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.3.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.3.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.3.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.3.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.4.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.4.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.10.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "13fd53f828807211798fb01ff489c6ef" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.10.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "77a44838a2538159967ed4e986d45083" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.10.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "74136ce030ad261791a4b2f4a8a33c25" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.10.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "972d38d1ec185f63ceb2baff1a643d11" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.10.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "657dad5739760faf063989ea173a0864" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.11.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "ae3b24e223102febc95780075a2647d6" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.11.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "6626430a4961902989c450819a8208b5" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.11.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "bf76abfddc38f962757761b58c835d06" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.11.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "a28391fcf030500e1ced11075b08db7c" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.10.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.10.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.10.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.10.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.11.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.11.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19337216 + }, + { + "name": "model.layers.11.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31084544 + } + ], + "md5sum": "4bb1ab4e35c086dffb10b2214dc16d23" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.11.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.11.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "27a675ae250b21a7debdcac72e157608" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.12.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "1fb0d9f80999338b005cf740b0d1997f" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.12.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "7034ceb1471d7bae370eed99753368cd" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.9.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "d42e207414d06ef06202a524048e8cd7" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.9.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "ede5f88a50c6708023f9ab7d8806653c" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.9.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "1bd0479b9e5ea6bf744ccd0aca10cab5" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.12.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "1e1559106ebe2e3dfc67d6ca8935b8df" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 22712320, + "records": [ + { + "name": "model.layers.11.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.12.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 3358720 + }, + { + "name": "model.layers.12.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 7557120 + }, + { + "name": "model.layers.9.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 10915840 + }, + { + "name": "model.layers.9.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 10932224 + }, + { + "name": "model.layers.9.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22679552 + }, + { + "name": "model.layers.12.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22695936 + } + ], + "md5sum": "7060216ec8e25ddad90cbca1e0f0a017" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.12.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "4554e588ce60dd0776a2f8f590aba283" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.12.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "7c6290747eb0837939e65b9684872654" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.13.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "2dc2d8498a8e729231ec2c05293a2a7a" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.13.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "d16373f3773e88a201a761146f3227ef" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.13.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "f79983ec7047f10d23edaff868355e6d" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.13.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "dfa85fc4b233ae245a00de31104d671a" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.13.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "4e279f740836b9f1601cdb8da1248a9b" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.14.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "42726d916108ca5eccb87f034cad8b42" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.12.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.12.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.13.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.13.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.13.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.13.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.13.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + } + ], + "md5sum": "2ab51983af8b3308c8e43cf1970004cd" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.14.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "4107ee6fbc8ada79d728ad42d4af4202" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.14.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "d827e6b3eb081af0fc7ca68b3dddf20b" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.14.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "733730caa8431bf71e3b08f2eddb1ce8" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.14.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "8883f23dc41d8b30be6a46c985884bd5" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.15.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "e771f1d324e81284d2f85bcd8353459a" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.15.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "06ed877cc2761a7b68f1e7b1bdb56490" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.15.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "0c139f1cf2678ee739e77a6ed0560600" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.15.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "fa0ec91bf67686e46eed3a7a6405df98" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.14.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.14.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11747328 + }, + { + "name": "model.layers.14.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15945728 + }, + { + "name": "model.layers.14.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19304448 + }, + { + "name": "model.layers.14.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.15.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19337216 + }, + { + "name": "model.layers.15.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19353600 + }, + { + "name": "model.layers.15.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "e0cc343e9d18554ffb9ac22c123a5e13" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.15.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.15.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "5e8b568fecf31fa66dae3de8ad59de2a" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.16.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "1c62e8fbbeece15d69fa010101fd9009" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.16.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "f75212c3073b66d6e43fdc2baf02aa03" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.16.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "e4ccf08bd8ce0d2a289fe1639b1a9681" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.16.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "15434de9ef0a03014ac6922b152cab18" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.16.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "82ede31818a5ad43c679755818cd1eda" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.17.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "2a1e45ddd474e838bdf9a0e01e9e83bc" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.17.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "6b8eef6484c95ae8a1eb9c743bcafe1e" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.17.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "38f347e549881ec4705dcdbf9f11e15a" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.17.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "116bc51485415aeaa3760cc74b3837c1" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.17.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "557b36a7739a2ccd3320595ca7ba1ef9" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.15.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.16.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.16.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.16.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.16.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.16.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.17.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.17.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.17.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "48c634e846ad22e37e66f11edc0909b1" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.18.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "fce103e779fcf2fc25e605ab0b9719b1" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.18.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "0e96004e82864c3a44fb0aa566ad272c" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.18.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "e41c80aab30b365fcbf2261902b12ef0" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.18.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "8aee3ca82772e10ed899a75a182ecfc1" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.18.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "9552c968bbd9d7cbf71bfdbb5c32aca2" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.19.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "2a4f64366952c05c9f7b4090d082fa05" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.17.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.17.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.18.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.18.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.18.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.18.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.18.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.19.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "55d87dd44a6d4153fe807481ceae10eb" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.19.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "044fc57468a87eed6d5b9b1f27f53e13" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.19.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "a504fa51980120b0dea15944c174353e" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.19.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "dfba4273d180d805f1c26a52b4ad4cb5" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.19.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "d8e3b6eb73844418284e411fcb215940" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.20.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "8757948dc951c523a2c7f8cdffb35420" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.20.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "28d19ccc96b3480b6ad84971607c9d41" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.20.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "811b2a6d6494701b3f2c5b4c75dc1f65" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.19.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.19.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.19.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.19.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.20.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.20.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.20.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "0b5c11cd5febae92836f7abfd2233d5d" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.20.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "409b1146445b3ec3395477bd50ae31d1" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.20.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "b136aaf524bcf1e64e0e0bb8be4d163f" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.21.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "38fe372c888a0e55f78670ea65bd162c" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.21.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "ccdd3faf44a28fd66ccac9ed1438710b" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.21.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "89247e3964cd17cfb39d6e5f81cc4f3d" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.21.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "bae35fb14b2e3417dc1568c6fa159127" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.21.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "da1bcedbc7af6f1d95ea23c485402166" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.22.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "3f6f010ec02f644ba41790347c24f309" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.20.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.20.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.21.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.21.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.21.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.21.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.21.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + } + ], + "md5sum": "d1ab16f4899c40176bd0559cb52620cc" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.22.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "d5c980b81d56bd3716e105cd09427b8b" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.22.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "890932abedb47da48c4aeaf77d6850b9" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.22.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "6040914fd07bf53d6a865963e8543e56" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.22.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "5338d53633a4664ffb1c5b6067b84f53" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.23.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "b782df8b4fd6a6a4d49b820386e46524" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.23.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "6783b1a38db73a66450572fa80abd038" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.23.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "919c1f404a543b91b388961e0b3c9222" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.23.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "bf73c81ca01a9ca68c9a33a5bef6801a" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.22.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.22.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11747328 + }, + { + "name": "model.layers.22.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15945728 + }, + { + "name": "model.layers.22.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19304448 + }, + { + "name": "model.layers.22.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.23.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19337216 + }, + { + "name": "model.layers.23.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19353600 + }, + { + "name": "model.layers.23.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "2ecdb3ad81bbd5f299d7740ae66ef0e4" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.23.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.23.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "847c02737b894f8f1fa15381a32e4b5f" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.24.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "767cfd5e3921ef9528d6ff2fcab36be6" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.24.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "3d31c061900a657fb26bc71db482a82c" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.24.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "33d787d60b7fa2bb6932eb90575ba68d" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.24.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "44800e0c022e224492528e44ee2a72fc" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.24.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "15582b67dac4f8fdc91b5850b8b736f7" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.25.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "e1c15283254b90f5f7b7071e586da128" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.25.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "1b27b8841e3d58d28f74ef0ad67ce2e2" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.25.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "73873fa14c0d9690ab5d97d26e258c33" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.25.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "dc799bed5066067e3e12e1b6627daa3c" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.25.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "414cbb6300129ec9a9d86d0327dfb4f4" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.23.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.24.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.24.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.24.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.24.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.24.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.25.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.25.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.25.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "039374e6388f810e54b0060ebea2008b" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.26.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "0b31b640bcc95c439871debb05fb2b26" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.26.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "81f34db7fc818292f4630d0206ebf848" + }, + { + "dataPath": "params_shard_131.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.26.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "bf67d719623382151aab27cfc7e7eaf8" + }, + { + "dataPath": "params_shard_132.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.26.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "abe7c0a89c76991d579e9e138598a9ee" + }, + { + "dataPath": "params_shard_133.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.26.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "59c42d3ffb93b713eaa80cf41a7f1e0f" + }, + { + "dataPath": "params_shard_134.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.27.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "fbb56783657958f741befc81e5c58255" + }, + { + "dataPath": "params_shard_135.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.25.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.25.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.26.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.26.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.26.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.26.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.26.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.27.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "61abc2f2703a8de2727c9b5678dc9e78" + }, + { + "dataPath": "params_shard_136.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.27.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "fc5ba546e621fd7d196e8808220d68f8" + }, + { + "dataPath": "params_shard_137.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.27.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "31ad68dd4f8914073c010688027d7b15" + }, + { + "dataPath": "params_shard_138.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.27.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "84f6dfe6a21846674a10d096467612db" + }, + { + "dataPath": "params_shard_139.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.27.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "330b196b258c59fc58b34d51ffdba490" + }, + { + "dataPath": "params_shard_140.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.28.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "b7928cdfc1370099217e29501fa14776" + }, + { + "dataPath": "params_shard_141.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.28.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "6297587dbbd0abe8b39ef64f9b8a1cd0" + }, + { + "dataPath": "params_shard_142.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.28.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "bfe95a9d453512b2e6df9f12c520a09a" + }, + { + "dataPath": "params_shard_143.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.27.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.27.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.27.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.27.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.28.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.28.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.28.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "51a60d2e23ff96a676597261187bd658" + }, + { + "dataPath": "params_shard_144.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.28.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "18904d992b8941ba6fabc70af54fe53f" + }, + { + "dataPath": "params_shard_145.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.28.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "c7aad44c325219963f66ee5cfdae8f66" + }, + { + "dataPath": "params_shard_146.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.29.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "9e070f920ca578585ab6797574a50c95" + }, + { + "dataPath": "params_shard_147.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.29.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "036e0ecc074ced034806b9bb4e917f49" + }, + { + "dataPath": "params_shard_148.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.29.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "5234ba0e1be023147060485fa0e89a71" + }, + { + "dataPath": "params_shard_149.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.29.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "bdf8f9257332b384867adf898332315d" + }, + { + "dataPath": "params_shard_150.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.29.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "bb2085c7a09bbfc1f97ddf3531042e73" + }, + { + "dataPath": "params_shard_151.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.30.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "197dec5bbf297aee089dad3b25870fb9" + }, + { + "dataPath": "params_shard_152.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.28.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.28.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.29.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.29.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.29.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.29.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.29.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + } + ], + "md5sum": "9c6f90b857cd79a3c642b2a9365c21ea" + }, + { + "dataPath": "params_shard_153.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.30.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "ff0bb771603f7cd9abef78cffc538b04" + }, + { + "dataPath": "params_shard_154.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.30.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "19203a078527f7756731c95d01d5ae5f" + }, + { + "dataPath": "params_shard_155.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.30.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "d8455fc821167782b36d093563217abc" + }, + { + "dataPath": "params_shard_156.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.30.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "26c5cc1bd2067294788e43e47b3c78a8" + }, + { + "dataPath": "params_shard_157.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.31.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "28b4123e235184465c7e98acacd837c8" + }, + { + "dataPath": "params_shard_158.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.31.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "2f1917eedf33690b7b4cb8a807d098dc" + }, + { + "dataPath": "params_shard_159.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.31.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "46316e9040239d462713e0d5d4af8c9d" + }, + { + "dataPath": "params_shard_160.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.31.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "f67bd1df2853b51a8e551d03d092e9e2" + }, + { + "dataPath": "params_shard_161.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.30.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.30.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11747328 + }, + { + "name": "model.layers.30.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15945728 + }, + { + "name": "model.layers.30.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19304448 + }, + { + "name": "model.layers.30.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.31.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19337216 + }, + { + "name": "model.layers.31.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19353600 + }, + { + "name": "model.layers.31.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "f40ea5121e4d0c325c112e133493059a" + }, + { + "dataPath": "params_shard_162.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.31.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.31.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "d65a708e8cbf48c46ac3d7bd2685d9ba" + }, + { + "dataPath": "params_shard_163.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.32.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "5db234e48602acc8a5ada0e4a52924cc" + }, + { + "dataPath": "params_shard_164.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.32.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "2ea0e51323e65853b0c0fb548d46d941" + }, + { + "dataPath": "params_shard_165.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.32.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "245ff2ca45128c54a060d149824a8362" + }, + { + "dataPath": "params_shard_166.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.32.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "f5bdb67257a8d0ec9783a318ee1e58ea" + }, + { + "dataPath": "params_shard_167.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.32.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "86acc0412c23c80669b732370f374777" + }, + { + "dataPath": "params_shard_168.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.33.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "20c105ee4cbd3c31fc96c17ecc560c46" + }, + { + "dataPath": "params_shard_169.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.33.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "e01bcad0105bfa6745812ff36aa15486" + }, + { + "dataPath": "params_shard_170.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.33.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "79b84e83d19d148b79158e9ea5f22673" + }, + { + "dataPath": "params_shard_171.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.33.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "6f21ca093c9837e35a81757c2ef22bab" + }, + { + "dataPath": "params_shard_172.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.33.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "4971a35d6332f0eb661275c23305b329" + }, + { + "dataPath": "params_shard_173.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.31.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.32.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.32.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.32.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.32.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.32.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.33.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.33.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.33.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "16e0f7922ab7e78f8b86b6b63482f526" + }, + { + "dataPath": "params_shard_174.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.34.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "be4e0a758dd7b59ded8259969a1d68ad" + }, + { + "dataPath": "params_shard_175.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.34.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "8a9b9b18937edb39a2a359275ef6a868" + }, + { + "dataPath": "params_shard_176.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.34.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "bacec05aa7ec75fd7c8392ffe6d117c7" + }, + { + "dataPath": "params_shard_177.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.34.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "fa111b95be1e677e8b11c64fd5055ce6" + }, + { + "dataPath": "params_shard_178.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.34.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "17dc0633a62503a6b949acedd22c7b05" + }, + { + "dataPath": "params_shard_179.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.35.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "dfc09530d6f2c2bfb31b69a593025f96" + }, + { + "dataPath": "params_shard_180.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.33.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.33.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.34.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.34.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.34.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.34.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.34.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.35.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "bbf4d3e2c5231c260aa2da93f0a8e8da" + }, + { + "dataPath": "params_shard_181.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.35.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "33792b7e0c0ee1ba0dae7973e9eb52da" + }, + { + "dataPath": "params_shard_182.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.35.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "35265bb7012ae9434ed01be6485a2cf7" + }, + { + "dataPath": "params_shard_183.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.35.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "4aca80513a06bbc992c557a00fb5c7af" + }, + { + "dataPath": "params_shard_184.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.35.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "d39e4b92b05390b409a5a8c83f28054d" + }, + { + "dataPath": "params_shard_185.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.36.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "207f4907ea1704d6d4e9e927d6a7ff4a" + }, + { + "dataPath": "params_shard_186.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.36.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "49e50b2597b2408afd8189876cac8dbd" + }, + { + "dataPath": "params_shard_187.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.36.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "6574e7c83ea56706f5f9d405662c5dd6" + }, + { + "dataPath": "params_shard_188.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.35.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.35.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.35.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.35.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.36.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.36.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.36.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "00563dc3d84838b21e73eec3b8e2ba0d" + }, + { + "dataPath": "params_shard_189.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.36.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "91c8736a199ccbf25e822965989e420a" + }, + { + "dataPath": "params_shard_190.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.36.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "5d3e27b481bfe6846d72dfc549ff8461" + }, + { + "dataPath": "params_shard_191.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.37.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "11af5d4f1631aece0a6910c6992438ca" + }, + { + "dataPath": "params_shard_192.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.37.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "09190a20dc3c98dbefc34999e1b5a4c2" + }, + { + "dataPath": "params_shard_193.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.37.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "181463c091cf44b9612f82e73b252db4" + }, + { + "dataPath": "params_shard_194.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.37.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "7104e69e0e99c84e7a2381e21bbc3c3e" + }, + { + "dataPath": "params_shard_195.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.37.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "aa25b7c436049ef72550b663079a2f8e" + }, + { + "dataPath": "params_shard_196.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.38.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "a6d1f4bddf59aee06efff4812a8581d5" + }, + { + "dataPath": "params_shard_197.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.36.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.36.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.37.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.37.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.37.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.37.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.37.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + } + ], + "md5sum": "8eb8bac431847c3cff1073c91a0781de" + }, + { + "dataPath": "params_shard_198.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.38.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "cfe30a1ef82e78e26f0e52fce425a14f" + }, + { + "dataPath": "params_shard_199.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.38.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "ee5d08fb6bce0bb757323e34621741dc" + }, + { + "dataPath": "params_shard_200.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.38.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "6c193ebe9758e5c43956f712a27e7e8a" + }, + { + "dataPath": "params_shard_201.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.38.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "bbd26233a0b167f39e4cb504b37b5da6" + }, + { + "dataPath": "params_shard_202.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.39.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "d7606c54081045ba45fea0dc92bf4c48" + }, + { + "dataPath": "params_shard_203.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.39.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "c2e1ca98b7748ce8dc80125be667b84c" + }, + { + "dataPath": "params_shard_204.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.39.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "3a10f801f546e74245df9314c315a7aa" + }, + { + "dataPath": "params_shard_205.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.39.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e97b4a84970a292885220b0e38d1e0a4" + }, + { + "dataPath": "params_shard_206.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.38.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.38.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11747328 + }, + { + "name": "model.layers.38.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15945728 + }, + { + "name": "model.layers.38.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19304448 + }, + { + "name": "model.layers.38.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.39.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19337216 + }, + { + "name": "model.layers.39.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19353600 + }, + { + "name": "model.layers.39.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "aa83e2fe057a478a62f6bc1ee07334cc" + }, + { + "dataPath": "params_shard_207.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.39.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.39.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "6281cb6f33aeb77a8084e7fb5a7f3e57" + }, + { + "dataPath": "params_shard_208.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.40.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "c4d0087e3410f3dc7fc14fae946c89c7" + }, + { + "dataPath": "params_shard_209.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.40.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "88b2114358229e6968c43423a52faee3" + }, + { + "dataPath": "params_shard_210.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.40.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "b716d0d619321e8fa87df19932ad2cf6" + }, + { + "dataPath": "params_shard_211.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.40.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "ea770c4b55a9ee2fa3d6cb902a9697da" + }, + { + "dataPath": "params_shard_212.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.40.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "f0c4f1819933e919a2b3e3ca3df0fe93" + }, + { + "dataPath": "params_shard_213.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.41.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "f9ea880fe6c16b165a5eb9a8684b0094" + }, + { + "dataPath": "params_shard_214.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.41.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "be3e208ea9fbe3ef644bc07f7a728a6e" + }, + { + "dataPath": "params_shard_215.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.41.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "316a5103795dc7bd210d660f986723c3" + }, + { + "dataPath": "params_shard_216.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.41.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "35e08612d6db8a744e3c38ef5120cdc8" + }, + { + "dataPath": "params_shard_217.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.4.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "88fe4aa2b32b6436fe25e8b44d7767e1" + }, + { + "dataPath": "params_shard_218.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.39.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.40.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.40.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.40.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.40.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.40.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.41.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.41.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.4.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "6b9430683697ec232906e9fb20bd3ce2" + }, + { + "dataPath": "params_shard_219.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.4.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "a194f7bb6c9edfdd1205ecdda4c39428" + }, + { + "dataPath": "params_shard_220.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.4.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "d2fa94c3d61a46fb92f90ef40cc4894f" + }, + { + "dataPath": "params_shard_221.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.5.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "489af120e1a665501194bda6563b4ea4" + }, + { + "dataPath": "params_shard_222.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.5.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "f8136254944e0e70f44d7d7ba7e24054" + }, + { + "dataPath": "params_shard_223.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.5.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "249e781a11c6d9532355cff4c105dcee" + }, + { + "dataPath": "params_shard_224.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.5.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "ad94a15d9ab0695acc54889543abdcb0" + }, + { + "dataPath": "params_shard_225.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.5.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "146c8bc753cc5ee9b1b9a96cea850c42" + }, + { + "dataPath": "params_shard_226.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.6.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "c3a62d9564c953486d3ddc04c89c3123" + }, + { + "dataPath": "params_shard_227.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.4.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.4.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.5.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.5.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.5.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.5.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.5.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + } + ], + "md5sum": "45941108f09b68d900186c00aba2a94b" + }, + { + "dataPath": "params_shard_228.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.6.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "06e710a4e6ea3916b07bbe59a367a03d" + }, + { + "dataPath": "params_shard_229.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.6.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "baeb79f75b9ab4dceaeb2ab9b658aac7" + }, + { + "dataPath": "params_shard_230.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.6.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "b60fdd552522027a671c38921ea0bf50" + }, + { + "dataPath": "params_shard_231.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.6.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "8f9c6368777bc501ca0b9077a050d1d6" + }, + { + "dataPath": "params_shard_232.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.41.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "06fa823c373a137caefa1a0519c14e35" + }, + { + "dataPath": "params_shard_233.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.42.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "bed715c96f069b24f17c46b0f6e83250" + }, + { + "dataPath": "params_shard_234.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.6.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.6.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11747328 + }, + { + "name": "model.layers.6.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15945728 + }, + { + "name": "model.layers.41.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19304448 + }, + { + "name": "model.layers.41.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19320832 + }, + { + "name": "model.layers.41.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31068160 + }, + { + "name": "model.layers.42.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31084544 + } + ], + "md5sum": "94f891372465568577d24d0d11f18913" + }, + { + "dataPath": "params_shard_235.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.42.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "37e5b208d8e02af2f21cb088fba03b74" + }, + { + "dataPath": "params_shard_236.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.42.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "faebfbdbdc772dee10f29c6e17f2e71e" + }, + { + "dataPath": "params_shard_237.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.42.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "10324289083c13e446eb323f06604e3e" + }, + { + "dataPath": "params_shard_238.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.42.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "f0d22ba32d7ac290647e5300e1cced7e" + }, + { + "dataPath": "params_shard_239.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.43.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "74922fa9a66d01ad977200d5cbb27cd6" + }, + { + "dataPath": "params_shard_240.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.43.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "6cf196012e229f76303ab52a2d2c491e" + }, + { + "dataPath": "params_shard_241.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.43.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "6863ed98e66bb4042df4f98786db2999" + }, + { + "dataPath": "params_shard_242.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.43.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "ba48b4a862551a1e1eb21db4c922004b" + }, + { + "dataPath": "params_shard_243.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.42.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.42.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.42.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.42.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.43.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.43.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19337216 + }, + { + "name": "model.layers.43.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31084544 + } + ], + "md5sum": "8d7afe9b58ce7a229878d9b80c9d29e3" + }, + { + "dataPath": "params_shard_244.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.43.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.43.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "402e6d30b16daef35b91c69540b2acbb" + }, + { + "dataPath": "params_shard_245.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.44.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "c8bf53f3412f223b9e382f6a8853a516" + }, + { + "dataPath": "params_shard_246.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.44.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "89b48ea6b70c8b07ec51c02bf84f9d65" + }, + { + "dataPath": "params_shard_247.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.44.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "e43023d3d3e2d742a18d41e63fc0bba6" + }, + { + "dataPath": "params_shard_248.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.44.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "b595941e0febfec805dad92e87b80941" + }, + { + "dataPath": "params_shard_249.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.44.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "0e479116e203772da3ceb8bb2ae24e9c" + }, + { + "dataPath": "params_shard_250.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.45.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "6bba03fc6d27c49611571282c882a0ab" + }, + { + "dataPath": "params_shard_251.bin", + "format": "raw-shard", + "nbytes": 22712320, + "records": [ + { + "name": "model.layers.43.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.44.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 3358720 + }, + { + "name": "model.layers.44.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 7557120 + }, + { + "name": "model.layers.44.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 10915840 + }, + { + "name": "model.layers.44.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 10932224 + }, + { + "name": "model.layers.44.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22679552 + }, + { + "name": "model.layers.45.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22695936 + } + ], + "md5sum": "fc94756a5a9aec91716b2f1a2eae1eec" + }, + { + "dataPath": "params_shard_252.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.45.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "dda85b84cf5fd0ea915e48ccb8ce753a" + }, + { + "dataPath": "params_shard_253.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.45.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "b110a651e266403ea92edb07226f3a70" + }, + { + "dataPath": "params_shard_254.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.45.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "29c15be99e1359ad2f4f023b2bb139b0" + }, + { + "dataPath": "params_shard_255.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.45.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "1272d48cb8a2f8be96fe82cfba6d8e8f" + }, + { + "dataPath": "params_shard_256.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.46.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "75bcb8ebd2408201c9ab30bcf2f807c8" + }, + { + "dataPath": "params_shard_257.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.46.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "777c765c7a1af35382672dab65e3804d" + }, + { + "dataPath": "params_shard_258.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.46.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "1144ad87f491865586430b6d688a4e11" + }, + { + "dataPath": "params_shard_259.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.46.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "0d3f1ba5f3d0d43071874b68c306bfe1" + }, + { + "dataPath": "params_shard_260.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.45.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.45.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.45.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.45.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.46.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19320832 + } + ], + "md5sum": "16a6affab016d42a28ec94d6e30c1cea" + }, + { + "dataPath": "params_shard_261.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.46.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.46.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "f9a8320a43b2bb2f275f53af197730b0" + }, + { + "dataPath": "params_shard_262.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.47.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "2213dac164533de1b3c0f30904de9d7d" + }, + { + "dataPath": "params_shard_263.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.47.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "728d2a72e60c96048d8757874a02fe30" + }, + { + "dataPath": "params_shard_264.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.47.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "b11c3f71b25764498a53b74e79b1a7d2" + }, + { + "dataPath": "params_shard_265.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.47.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "c88506aaba44183d6df84a4d361a9920" + }, + { + "dataPath": "params_shard_266.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.47.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "040c732d1d561c015b244b9e40a0109f" + }, + { + "dataPath": "params_shard_267.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.48.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "b0097fdc592c33c3516cd795ad887b59" + }, + { + "dataPath": "params_shard_268.bin", + "format": "raw-shard", + "nbytes": 22745088, + "records": [ + { + "name": "model.layers.46.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.46.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.46.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3375104 + }, + { + "name": "model.layers.47.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3391488 + }, + { + "name": "model.layers.47.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3407872 + }, + { + "name": "model.layers.47.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15155200 + }, + { + "name": "model.layers.47.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15171584 + }, + { + "name": "model.layers.47.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19369984 + }, + { + "name": "model.layers.48.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22728704 + } + ], + "md5sum": "4fab0bed53a347c07db8a06cfe3a195d" + }, + { + "dataPath": "params_shard_269.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.48.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "cb7ec1195eefa871d875515d5c7d37a8" + }, + { + "dataPath": "params_shard_270.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.48.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "ccfe6aa0dae82846de4d0b18dbe394af" + }, + { + "dataPath": "params_shard_271.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.48.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "4b3ee0e08045d658459dd4c697617e0e" + }, + { + "dataPath": "params_shard_272.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.48.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "b110e4bfe38869fd0dc2a307471a1325" + }, + { + "dataPath": "params_shard_273.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.49.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "8cd1ca77cad8a418e188853134f62597" + }, + { + "dataPath": "params_shard_274.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.49.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "d307892b2ffd48d1f6bf9a37e01d7b9c" + }, + { + "dataPath": "params_shard_275.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.49.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "c0fa6ee6a47fc8432f69433ad5e9b860" + }, + { + "dataPath": "params_shard_276.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.49.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "f3ab1dc7c843bab266ddf278118a0cba" + }, + { + "dataPath": "params_shard_277.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.49.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "7cffe00103e964ad9a7ac8daacc44d85" + }, + { + "dataPath": "params_shard_278.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.48.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.48.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.48.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.48.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.49.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.49.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.49.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "83ebf5b207f97051485fd611e2d08e74" + }, + { + "dataPath": "params_shard_279.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.50.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "3a9107d68b48aba9f28f6f61ba96969d" + }, + { + "dataPath": "params_shard_280.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.50.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "efbf40c3521af1971c4c9254ea8534ed" + }, + { + "dataPath": "params_shard_281.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.50.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "9b71eb119f716f542fcde2273a33cc2a" + }, + { + "dataPath": "params_shard_282.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.50.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "7df80668daf5f08a67b12b767b826a5a" + }, + { + "dataPath": "params_shard_283.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.50.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "edf1d2ebb7838fa2246c98cdb97c2dff" + }, + { + "dataPath": "params_shard_284.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.51.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "5fd789175927ab7c5cd1931434d78dab" + }, + { + "dataPath": "params_shard_285.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.49.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.49.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.50.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.50.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.50.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.50.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.50.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.51.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "5a3cb81296c9a107c3056dfb10f1456f" + }, + { + "dataPath": "params_shard_286.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.51.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "81bd2e5217f3b24051048faa3bd7ba4b" + }, + { + "dataPath": "params_shard_287.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.51.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "a707b6ca1eef3dfbef49c655e8a38189" + }, + { + "dataPath": "params_shard_288.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.51.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "a63fea962cee79dfb1303eb847f65f18" + }, + { + "dataPath": "params_shard_289.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.51.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "76e64cbc0e07e1fa5ba51f99c933db73" + }, + { + "dataPath": "params_shard_290.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.52.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "19dfe77405e442e7c710d4bd648d70a7" + }, + { + "dataPath": "params_shard_291.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.52.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "15ef1063531fb566ed04306757f350a2" + }, + { + "dataPath": "params_shard_292.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.52.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "459d170a7b147cdd0b46c041125f66c0" + }, + { + "dataPath": "params_shard_293.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.51.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.51.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.51.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.51.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.52.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.52.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.52.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "1c7decffa65f466debf15246aa7d34ad" + }, + { + "dataPath": "params_shard_294.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.52.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "f95966390189acd6f90863537477b293" + }, + { + "dataPath": "params_shard_295.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.52.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "41cb5bb91ef5a509969a4970aa5f5b22" + }, + { + "dataPath": "params_shard_296.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.53.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "744e8e2c54a95f3475252da0655fe3a3" + }, + { + "dataPath": "params_shard_297.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.53.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "0a8f876baefa316e53e9e90663d4f3db" + }, + { + "dataPath": "params_shard_298.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.53.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "0658b6efb7ac5cbd626ad06be8877dc0" + }, + { + "dataPath": "params_shard_299.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.53.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "4ac075ff11a12b39458bbe2531e7e7dd" + }, + { + "dataPath": "params_shard_300.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.53.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "d6382e4aa66038ec97caf207573956b2" + }, + { + "dataPath": "params_shard_301.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.54.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "ae72177b00631fad04bd24c204712716" + }, + { + "dataPath": "params_shard_302.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.52.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.52.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.53.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.53.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.53.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.53.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.53.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + } + ], + "md5sum": "b98b45b606596cf440114c8b3af73468" + }, + { + "dataPath": "params_shard_303.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.54.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "5af5b2369730fd2b39869ef24b1f6bcd" + }, + { + "dataPath": "params_shard_304.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.54.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "648cab0559350a81111fbb1db6b4e5b0" + }, + { + "dataPath": "params_shard_305.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.54.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e3c0b6058dab6ca0196a1acc67b43d74" + }, + { + "dataPath": "params_shard_306.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.54.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "e118d8c7adfbc9aae2fda211a8f1995b" + }, + { + "dataPath": "params_shard_307.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.55.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "b781cb4b812a55d924c0d6cf77bb187e" + }, + { + "dataPath": "params_shard_308.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.55.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "886fa0be360455e0ff18982ff27cef12" + }, + { + "dataPath": "params_shard_309.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.55.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "f74fbf24019964166f2063d51b9459ec" + }, + { + "dataPath": "params_shard_310.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.55.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "d3b7b62c037fcc6f7b41cb7fe57b6cae" + }, + { + "dataPath": "params_shard_311.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.54.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.54.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11747328 + }, + { + "name": "model.layers.54.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15945728 + }, + { + "name": "model.layers.54.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19304448 + }, + { + "name": "model.layers.54.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.55.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19337216 + }, + { + "name": "model.layers.55.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19353600 + }, + { + "name": "model.layers.55.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "c14779f4408cdfecf96311a4680a4fe6" + }, + { + "dataPath": "params_shard_312.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.55.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.55.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "e65ac71373ecab1fde6abe6fa8eae8f2" + }, + { + "dataPath": "params_shard_313.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.56.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "cb0053f7163e9320952efb12797dce2c" + }, + { + "dataPath": "params_shard_314.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.56.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "7a259312665ad6aa036031ac8f408a0f" + }, + { + "dataPath": "params_shard_315.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.56.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "a36f56ea4d75755a0e5aa9f6b85de953" + }, + { + "dataPath": "params_shard_316.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.56.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e671438e6097c7109b845bd8b47ae5ac" + }, + { + "dataPath": "params_shard_317.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.56.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "6274b508d0669005c02dab612862a3a9" + }, + { + "dataPath": "params_shard_318.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.57.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "6c69c7eba33f852ed949a9988199b2da" + }, + { + "dataPath": "params_shard_319.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.57.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "b7ca576cbf672be908480f3c02fe369d" + }, + { + "dataPath": "params_shard_320.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.57.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "5a042da84404d2c6d6adc62c7204ff50" + }, + { + "dataPath": "params_shard_321.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.57.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "25200225ae8538c73cbaa81d172c1078" + }, + { + "dataPath": "params_shard_322.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.57.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "6bfe7a5bc4987e6395d3373bf13dd77b" + }, + { + "dataPath": "params_shard_323.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.55.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.56.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.56.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.56.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.56.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.56.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.57.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.57.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.57.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "9dbc5c3e1cb2d8f24e88f8bae8665000" + }, + { + "dataPath": "params_shard_324.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.58.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "cdd05a3b8fa72b2722590682c31318da" + }, + { + "dataPath": "params_shard_325.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.58.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "751e1950c44dca8c6c0a49d6c1674d8b" + }, + { + "dataPath": "params_shard_326.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.58.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "3817f806d12cba763f41b13bcabe61bf" + }, + { + "dataPath": "params_shard_327.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.58.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e1f3514df8130ff4305e68f917864b4f" + }, + { + "dataPath": "params_shard_328.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.58.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "aa7207864ef3970b99fda49810e7384e" + }, + { + "dataPath": "params_shard_329.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.59.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "1737a3142f9def8fbd6b54c83fda2616" + }, + { + "dataPath": "params_shard_330.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.57.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.57.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.58.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.58.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.58.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.58.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.58.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.59.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "a3fb00eddae71d294b35189aedda9056" + }, + { + "dataPath": "params_shard_331.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.59.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "0189be740712437c41b83f619bcaeedb" + }, + { + "dataPath": "params_shard_332.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.59.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "d44f64eec2d90e478bf715d28873b7b8" + }, + { + "dataPath": "params_shard_333.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.59.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "762015935c4e0b5e58dfc83c5ef099f2" + }, + { + "dataPath": "params_shard_334.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.59.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "e4c5959cc6794a66cf9e304b8fbaf9fa" + }, + { + "dataPath": "params_shard_335.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.60.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "446b0c09cbc6e8dd4cae13217136a95c" + }, + { + "dataPath": "params_shard_336.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.60.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "9951d3caa7255d44583550ed2a14d23b" + }, + { + "dataPath": "params_shard_337.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.7.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "4667e0d02a83dd1bab4fb341b326102a" + }, + { + "dataPath": "params_shard_338.bin", + "format": "raw-shard", + "nbytes": 26927104, + "records": [ + { + "name": "model.layers.59.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.59.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.59.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.59.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.60.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.60.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.6.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + }, + { + "name": "model.layers.6.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26894336 + }, + { + "name": "model.layers.7.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26910720 + } + ], + "md5sum": "c0fb71c1bcca08c8d7035b19997a605c" + }, + { + "dataPath": "params_shard_339.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.7.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "87f9b1ccec25a88ad6a85b25d078e746" + }, + { + "dataPath": "params_shard_340.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.7.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "c1293b91143ab5ae0b6c9bf9f90462b7" + }, + { + "dataPath": "params_shard_341.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.7.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "6e4e75d2bdea5bdf85712852601b4e41" + }, + { + "dataPath": "params_shard_342.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.7.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "2023ddf4527240a9f58099d0797229d7" + }, + { + "dataPath": "params_shard_343.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.8.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "9ee8a7c22da25c3d7af7b9f6f7f84f21" + }, + { + "dataPath": "params_shard_344.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.8.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "c6d6291d120982f79dde12fa7540cb10" + }, + { + "dataPath": "params_shard_345.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.8.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "d99e6be5707aabfd4c63ce9c06b1c174" + }, + { + "dataPath": "params_shard_346.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.8.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "23d1d03b5ebce3346cda87063f003910" + }, + { + "dataPath": "params_shard_347.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.7.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.7.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.7.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.7.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.8.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.8.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19337216 + }, + { + "name": "model.layers.8.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31084544 + } + ], + "md5sum": "b563c3a24800396f720383d4855c53c9" + }, + { + "dataPath": "params_shard_348.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.8.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.8.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "e8790c045a58c694ef741b15f2469058" + }, + { + "dataPath": "params_shard_349.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.9.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "662a560332a9dede932e4c39922336f0" + }, + { + "dataPath": "params_shard_350.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.9.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "953ba7a7cd61f13c163e52bf3ac1302c" + }, + { + "dataPath": "params_shard_351.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.60.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "b37237f68fc391314f6c037dcf6df226" + }, + { + "dataPath": "params_shard_352.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.60.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "fde0853993310bd6005d4f8dd42a7536" + }, + { + "dataPath": "params_shard_353.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.60.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "1f1e80cfdcdf264cc95ae669e97b6f53" + }, + { + "dataPath": "params_shard_354.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.61.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "33dbc2cde8ac393aacecacd6f148a4fd" + }, + { + "dataPath": "params_shard_355.bin", + "format": "raw-shard", + "nbytes": 22712320, + "records": [ + { + "name": "model.layers.8.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.9.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 3358720 + }, + { + "name": "model.layers.9.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 7557120 + }, + { + "name": "model.layers.60.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 10915840 + }, + { + "name": "model.layers.60.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 10932224 + }, + { + "name": "model.layers.60.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22679552 + }, + { + "name": "model.layers.61.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22695936 + } + ], + "md5sum": "7306dd969da1c3ebe997b7249c6e0488" + }, + { + "dataPath": "params_shard_356.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.61.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "e1c9cd039ea87de7e0fab2e9082273c2" + }, + { + "dataPath": "params_shard_357.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.61.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "abb8202049197d4073124d449b22f114" + }, + { + "dataPath": "params_shard_358.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.61.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "2d04334289ae754a0ba8c8f005740c02" + }, + { + "dataPath": "params_shard_359.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.61.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "dcacdc81d33fad9e268473a6ee88aed0" + }, + { + "dataPath": "params_shard_360.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.62.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "b018e1310dd16a90eb0e12e97f5efcac" + }, + { + "dataPath": "params_shard_361.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.62.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "b5fed6e979f8a62d0f71e9d10ccb4182" + }, + { + "dataPath": "params_shard_362.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.62.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "683edcb23cea67fd3dc37932050ddabd" + }, + { + "dataPath": "params_shard_363.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.62.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e4b0096a509cba19045562b1ce391222" + }, + { + "dataPath": "params_shard_364.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.61.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.61.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.61.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.61.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.62.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19320832 + } + ], + "md5sum": "1254dcf3649d3583c038ac244fd0847f" + }, + { + "dataPath": "params_shard_365.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.62.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.62.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "f5f86152e455e7df4b1ba2993918d61a" + }, + { + "dataPath": "params_shard_366.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.63.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "152f836ced39e8d4be6b26fd35f9a152" + }, + { + "dataPath": "params_shard_367.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.63.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "99a448fb0f31e72d93afbba5aad0cbcc" + }, + { + "dataPath": "params_shard_368.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.63.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "92d2d65dfd78d2929dbcab9103c07a64" + }, + { + "dataPath": "params_shard_369.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.63.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "44a49955b5c02ae6bc604d4909fd0bf0" + }, + { + "dataPath": "params_shard_370.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.63.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "9ebaf0819e18eca140e12190d346bc4b" + }, + { + "dataPath": "params_shard_371.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.64.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "c3231c8afc65961385d88be0654caeac" + }, + { + "dataPath": "params_shard_372.bin", + "format": "raw-shard", + "nbytes": 22745088, + "records": [ + { + "name": "model.layers.62.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.62.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.62.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3375104 + }, + { + "name": "model.layers.63.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3391488 + }, + { + "name": "model.layers.63.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3407872 + }, + { + "name": "model.layers.63.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15155200 + }, + { + "name": "model.layers.63.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15171584 + }, + { + "name": "model.layers.63.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19369984 + }, + { + "name": "model.layers.64.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 22728704 + } + ], + "md5sum": "647b0ee82354fa4f10900672bdc3ba6d" + }, + { + "dataPath": "params_shard_373.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.64.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "3eb99d1c90c0a53a9f095a49fc09fa64" + }, + { + "dataPath": "params_shard_374.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.64.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "09c921a28614bcb7380128fc2e0157d9" + }, + { + "dataPath": "params_shard_375.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.64.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "a8aa673d5a001ba8fb9f86b5eb62611a" + }, + { + "dataPath": "params_shard_376.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.64.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "b86b2994a37bb9c00731ef2d0dda539b" + }, + { + "dataPath": "params_shard_377.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.65.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "6210dfed1ea62936cffad1daf6fae108" + }, + { + "dataPath": "params_shard_378.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.65.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "a8fdddd90db43512f731364f9aad279b" + }, + { + "dataPath": "params_shard_379.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.65.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "a854339a32af1f0c5ef51aa58eda688f" + }, + { + "dataPath": "params_shard_380.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.65.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "38f53003a3609ada142abd21a6d28bc0" + }, + { + "dataPath": "params_shard_381.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.65.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "296e824b39f20afe7d2654eb7363bfea" + }, + { + "dataPath": "params_shard_382.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.64.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.64.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.64.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.64.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.65.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.65.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.65.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "c17c596b2739c1769996b534933b982d" + }, + { + "dataPath": "params_shard_383.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.66.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "68d5042279e6ec60aa8944be6aa3c27e" + }, + { + "dataPath": "params_shard_384.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.66.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "94eb47e929bc7aab401d3371c8bbac79" + }, + { + "dataPath": "params_shard_385.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.66.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "241673a2708f5438b2ecf560edd6ded5" + }, + { + "dataPath": "params_shard_386.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.66.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "f13735e836f79c8afb8df28b484fef8c" + }, + { + "dataPath": "params_shard_387.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.66.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "5620a21ca85a0d7ff64d3fa8fbb00295" + }, + { + "dataPath": "params_shard_388.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.67.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "99a0a843106946bd0d7ea335e223e7d7" + }, + { + "dataPath": "params_shard_389.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.65.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.65.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.66.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.66.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.66.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.66.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.66.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.67.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "c59517d6689edeebb9b679f9a7600ff1" + }, + { + "dataPath": "params_shard_390.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.67.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "2c1e9046d8b630c3289e84ffdc092500" + }, + { + "dataPath": "params_shard_391.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.67.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "912d0cf53aec6185f39f63793a287493" + }, + { + "dataPath": "params_shard_392.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.67.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "646d1b1f7e502c577883d301c7cc1ec3" + }, + { + "dataPath": "params_shard_393.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.67.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "880bebebff9c1cca6429cdebc072e5e0" + }, + { + "dataPath": "params_shard_394.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.68.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "b83c294c10c704b554190f599b2cdb1e" + }, + { + "dataPath": "params_shard_395.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.68.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "5c46bcb9044420eb1a544ff3aa1c48cf" + }, + { + "dataPath": "params_shard_396.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.68.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "d507bf4a646ded61091ce49bcd5dbfa1" + }, + { + "dataPath": "params_shard_397.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.67.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.67.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.67.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.67.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.68.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.68.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.68.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "079f11849863c6ac245b494bb3e0ae70" + }, + { + "dataPath": "params_shard_398.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.68.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "6fd4f1ca3b7ac1066d1ba8b2f33bc063" + }, + { + "dataPath": "params_shard_399.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.68.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "4943762c16fa049047b11532fcb28cec" + }, + { + "dataPath": "params_shard_400.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.69.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "e78d6f4d00ce09fd09ce9a2d14623793" + }, + { + "dataPath": "params_shard_401.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.69.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "f10bd8b08e1bf71f052e8036a0ee79db" + }, + { + "dataPath": "params_shard_402.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.69.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "9211825a8aec27805522c0235ad2d778" + }, + { + "dataPath": "params_shard_403.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.69.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "7b3989eca3addb150345b7a641eddd53" + }, + { + "dataPath": "params_shard_404.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.69.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "42b3290a330a22da61f070ea790b4522" + }, + { + "dataPath": "params_shard_405.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.70.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "84d7ce8100278122933bb61ceced82c6" + }, + { + "dataPath": "params_shard_406.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.68.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.68.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.69.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.69.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.69.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.69.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.69.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + } + ], + "md5sum": "9eb56e63f8d1fc81c43cc5e2905b1071" + }, + { + "dataPath": "params_shard_407.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.70.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "07aac6375f7d9612894ddf3daab94f92" + }, + { + "dataPath": "params_shard_408.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.70.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "bded2f04ef76d585d15cbc3a2ab4c745" + }, + { + "dataPath": "params_shard_409.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.70.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "6d16279eb95d7d3a8ed1b90c122d919b" + }, + { + "dataPath": "params_shard_410.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.70.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "8ab51a22eac05f788b16588480cb6177" + }, + { + "dataPath": "params_shard_411.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.71.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "73c34fccfbad831dae264c9c26da8269" + }, + { + "dataPath": "params_shard_412.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.71.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "762623061e9801fbfa9b2379f109db06" + }, + { + "dataPath": "params_shard_413.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.71.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "10f9cee642b8be8c72229cf6175734a2" + }, + { + "dataPath": "params_shard_414.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.71.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "ae475a394cbc37b6d0f01b569a290b45" + }, + { + "dataPath": "params_shard_415.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.70.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.70.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11747328 + }, + { + "name": "model.layers.70.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15945728 + }, + { + "name": "model.layers.70.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19304448 + }, + { + "name": "model.layers.70.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19320832 + }, + { + "name": "model.layers.71.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 19337216 + }, + { + "name": "model.layers.71.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 19353600 + }, + { + "name": "model.layers.71.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "9b986f4ccdd3d8652d4f6240ef8b5b04" + }, + { + "dataPath": "params_shard_416.bin", + "format": "raw-shard", + "nbytes": 31068160, + "records": [ + { + "name": "model.layers.71.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 0 + }, + { + "name": "model.layers.71.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 4198400 + } + ], + "md5sum": "78ffcc950147d9859a41558994a25b1b" + }, + { + "dataPath": "params_shard_417.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.72.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "9200787421ae6b7b2366eed844770e7e" + }, + { + "dataPath": "params_shard_418.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.72.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "e469ed30655dd20b7693ff7515956d7c" + }, + { + "dataPath": "params_shard_419.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.72.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "cd6215285d09156a8654022ce4271b33" + }, + { + "dataPath": "params_shard_420.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.72.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "6dab4486bc615e050daba042e038b8a9" + }, + { + "dataPath": "params_shard_421.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.72.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "d9c25e8fda3e0340e89655c4e5df3415" + }, + { + "dataPath": "params_shard_422.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.73.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "e1be5e9905a727fdbe114df4f9396d89" + }, + { + "dataPath": "params_shard_423.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.73.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "f3f77732e53f2a4505a0123f48b7e9cb" + }, + { + "dataPath": "params_shard_424.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.73.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "e22c192922902fba9ad3fbc1437a9643" + }, + { + "dataPath": "params_shard_425.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.73.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "55bcab4f47040d999b123e2dd8d32d84" + }, + { + "dataPath": "params_shard_426.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.73.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "2120925b10523ff20a4273235fdacbb7" + }, + { + "dataPath": "params_shard_427.bin", + "format": "raw-shard", + "nbytes": 30269440, + "records": [ + { + "name": "model.layers.71.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 0 + }, + { + "name": "model.layers.72.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 3358720 + }, + { + "name": "model.layers.72.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 3375104 + }, + { + "name": "model.layers.72.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 15122432 + }, + { + "name": "model.layers.72.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 15138816 + }, + { + "name": "model.layers.72.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 19337216 + }, + { + "name": "model.layers.73.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 22695936 + }, + { + "name": "model.layers.73.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 26894336 + }, + { + "name": "model.layers.73.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 30253056 + } + ], + "md5sum": "a0e6891c0518c227c74637249a23f534" + }, + { + "dataPath": "params_shard_428.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.74.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "3269b4f1a016fb81c930409747ff83c4" + }, + { + "dataPath": "params_shard_429.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.74.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "eaf85026c17fd3d6c11ef3591f28d1c2" + }, + { + "dataPath": "params_shard_430.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.74.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "75bc7026f230836b6575f66870012412" + }, + { + "dataPath": "params_shard_431.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.74.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "288cfa3562e13e2db1eda557bc8e5a6b" + }, + { + "dataPath": "params_shard_432.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.74.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "287269deac3d37fb6ee0070b207497e6" + }, + { + "dataPath": "params_shard_433.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.75.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "3874921a218ef383945be2b5f30b06fa" + }, + { + "dataPath": "params_shard_434.bin", + "format": "raw-shard", + "nbytes": 31117312, + "records": [ + { + "name": "model.layers.73.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.73.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.74.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.74.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.74.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.74.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.74.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + }, + { + "name": "model.layers.75.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 31100928 + } + ], + "md5sum": "bcf1bb95ce730782806ed46218e58935" + }, + { + "dataPath": "params_shard_435.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.75.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "cbd384c04400d8096923ca8718a8b2fc" + }, + { + "dataPath": "params_shard_436.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.75.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "0d43411773653ebcfd3110c5a116d583" + }, + { + "dataPath": "params_shard_437.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.75.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "a67b2f3c5fe028d6422373ed2c72cd5e" + }, + { + "dataPath": "params_shard_438.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.75.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "3f9d2ce23bd31e5ae8688ab323561179" + }, + { + "dataPath": "params_shard_439.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.76.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "6e7a78abdba3445d672b3d70a9dfef10" + }, + { + "dataPath": "params_shard_440.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.76.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "26a993446541ac84d90f0532645d0096" + }, + { + "dataPath": "params_shard_441.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.76.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "7bdc9b1f3c4e4a3ddfda571eff97e015" + }, + { + "dataPath": "params_shard_442.bin", + "format": "raw-shard", + "nbytes": 26894336, + "records": [ + { + "name": "model.layers.75.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.75.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.75.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11763712 + }, + { + "name": "model.layers.75.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15962112 + }, + { + "name": "model.layers.76.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 19320832 + }, + { + "name": "model.layers.76.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 23519232 + }, + { + "name": "model.layers.76.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 26877952 + } + ], + "md5sum": "4ef3fd46bd28ac700e3de2df00982741" + }, + { + "dataPath": "params_shard_443.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.76.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "4b9708a470c627b39afa81b0835fa35e" + }, + { + "dataPath": "params_shard_444.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.76.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "5b12a93c61c7b1331170ea937b24343c" + }, + { + "dataPath": "params_shard_445.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.77.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "7045fe94e8f2233f001440bd858f48ae" + }, + { + "dataPath": "params_shard_446.bin", + "format": "raw-shard", + "nbytes": 188088320, + "records": [ + { + "name": "model.layers.77.mlp.gate_up_proj.q_weight", + "shape": [ + 57344, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 188088320, + "byteOffset": 0 + } + ], + "md5sum": "b664affea57f5fe94adf02f2348c0941" + }, + { + "dataPath": "params_shard_447.bin", + "format": "raw-shard", + "nbytes": 23511040, + "records": [ + { + "name": "model.layers.77.mlp.gate_up_proj.q_scale", + "shape": [ + 57344, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 23511040, + "byteOffset": 0 + } + ], + "md5sum": "edde67e4b7d45c1b7d56b75ee2de3088" + }, + { + "dataPath": "params_shard_448.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.77.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "4dceacfd05ab66a0957e2b5ff2f5b487" + }, + { + "dataPath": "params_shard_449.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.77.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "dfd3b2fb6fa58c97062352e320bbb410" + }, + { + "dataPath": "params_shard_450.bin", + "format": "raw-shard", + "nbytes": 93978624, + "records": [ + { + "name": "model.layers.78.mlp.down_proj.q_weight", + "shape": [ + 8192, + 2868 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 93978624, + "byteOffset": 0 + } + ], + "md5sum": "26e15707f2a1a62436b65aaa1440fc1b" + }, + { + "dataPath": "params_shard_451.bin", + "format": "raw-shard", + "nbytes": 31100928, + "records": [ + { + "name": "model.layers.76.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.76.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11747328 + }, + { + "name": "model.layers.77.input_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 11763712 + }, + { + "name": "model.layers.77.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 11780096 + }, + { + "name": "model.layers.77.post_attention_layernorm.weight", + "shape": [ + 8192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 16384, + "byteOffset": 23527424 + }, + { + "name": "model.layers.77.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 23543808 + }, + { + "name": "model.layers.77.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 27742208 + } + ], + "md5sum": "6181ecb751235ee96894c279856ed024" + }, + { + "dataPath": "params_shard_452.bin", + "format": "raw-shard", + "nbytes": 33587200, + "records": [ + { + "name": "model.layers.78.self_attn.qkv_proj.q_weight", + "shape": [ + 10240, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 33587200, + "byteOffset": 0 + } + ], + "md5sum": "8b01a9d49ea5849c6c347843512845e3" + }, + { + "dataPath": "params_shard_453.bin", + "format": "raw-shard", + "nbytes": 26869760, + "records": [ + { + "name": "model.layers.78.self_attn.o_proj.q_weight", + "shape": [ + 8192, + 820 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 26869760, + "byteOffset": 0 + } + ], + "md5sum": "68347252bd94011bf38374dde220b720" + }, + { + "dataPath": "params_shard_454.bin", + "format": "raw-shard", + "nbytes": 19304448, + "records": [ + { + "name": "model.layers.78.mlp.down_proj.q_scale", + "shape": [ + 8192, + 717 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 11747328, + "byteOffset": 0 + }, + { + "name": "model.layers.78.self_attn.qkv_proj.q_scale", + "shape": [ + 10240, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 4198400, + "byteOffset": 11747328 + }, + { + "name": "model.layers.78.self_attn.o_proj.q_scale", + "shape": [ + 8192, + 205 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3358720, + "byteOffset": 15945728 + } + ], + "md5sum": "9716d55fa609e6f60cc57f2e9f6ef526" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..ddfa968cf7b25f36fd20cde9f2177ffc795c706d --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a2c920c6bf5c104bb79707055f466fd8994501321c94519e2ed7c83b55706c5 +size 420679680 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..5bb3e59c56269f6c7ac35af59f2ef756f60006e5 --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d649e7f8f35c4029219d64a807f706eee519f419ad0ab3a158f9487aefb0d5d +size 52584960 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..bec29a03a26ebcbd7cd755cdd47fcf90c6ea80fb --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36b788d52556ba992a8325b50f6fe9c054e3578f8deaa07b1db8c633f97ff293 +size 52584960 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..50c83d844d60783b8b7cf3d57891ffb0497803a0 --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b206232e032bec38ec39111e9ab22af159c3d189f49dbd553275f310b300b92 +size 23511040 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..008f5623b827643e4fe3b1012026a7df272a5e2e --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9ff2ba0d38ac9f60fc7bb6e3c43156abb2f6192f35c192e5f4c50dd5e33d3a +size 93978624 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..017b6f8924e4d9962eab59304b3b0d9868f8aa8d --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:063673645290f02373f8f3355fcc7a0cc0170b7302d4dc08148b7f0ebe119175 +size 188088320 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..1468c26e56fc868a7e236ebd17442aab1c9d182c --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4087b45e7cd5a8c8fe4cb122bf3885c6939644851f68d87cc02950a5321ee63 +size 23511040 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..c132000f2da1d0a2b76f75f0c3f9495ca9d0a86a --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:304b850ef47e8921919fa6a8f6f040f0b98d562c3676edb05662e0169b665a85 +size 33587200 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..21f9ebd2f516f02258d840e0a0ea1ae937e9b34c --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94db35ee96812b8fb1d1047afe654a9971395e5f9001b10339b8a0f08aa27b4 +size 26869760 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..96e5717a25cc341dfed5cc7f5cfe355a93f767f4 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268ffb3dc01d0fb9aa1cca160d9ea2eefb955e68e8b1d9722c15c71080a7773e +size 93978624 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..56620a79283e6b59f7bd935f89a0dee9e32cb21e --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb836df0fa7abe829c2d9bbc84781f54c0582b22723f00ae5fd0136ac94da1e2 +size 31100928 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a4a67328a02abd47f5cb2c61729b87ec48d6850 --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b204461c4dcd943acf03632e136be90cca1c29d61a0995966f9c80693598a5 +size 188088320 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..75e84c8e2e629f0711ab00e0970681b87aee9f4f --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad58533ccae3d27afe1beca1cb4824f38cf24f42a24766713123851da7fdb3b +size 23511040 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a73d24b1a8260091322892a1ab6f421af5c5a0b --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de4042ae00c20cd1996f6c8ad7c9f8848b05878a4474399967eb14698b44e48d +size 93978624 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..15a0de782e92101159909017123577d5d41af4be --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97fe24718b26428881ed1cbc7c9835220be1c81735d2cf3ed2ad2949fcaf34e0 +size 33587200 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..c65070e44ae2aaa98a94a4c76c29bf769a276d8f --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27251681bfc7f5e82b9f580895a55376acba9fd13857261aa9ea81cff72aa140 +size 26869760 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..3cc6b74ec3136d0c3f7283b7a9fdcd3767024730 --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d69f24c1e58af877f7517cde1485ada2226926da26f1edb3a076a56688ee4eec +size 93978624 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..1bb2a9c819ddc618c834e4662619b168eeaba532 --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f282054ac2b8a6d425e4b533a7d3d612eb18f42399aabb427cb087ad179e5aa +size 188088320 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..403fb81f3ddfd6c3052f9489929114db5e7269d0 --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ac466517f0e2069cda0999a6d26d594bc369cf19c27ba871a4dd905e23c1743 +size 23511040 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..375dbc5da71a44d06b20e539de7cb3e554ea5a8c --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ebd4628f8d1beb9e942953ac54f7d8150cdc93e4fb2c10e60e4ec4cd1bd2b1 +size 33587200 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..cd5b20e297a4266ce4bdaf31efec3f85a170e373 --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eee39cd443e63a9a5f271fa6de122f28219389ecd16eb2c63c604998969c584 +size 31117312 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..74d6921eff2e6da136937aba41a0f8a0fc01c3bf --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e44343f685e4bb2f0e3c2d985b55b251105bed6257a0248f7e55d35475c587 +size 31068160 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..544435e54ecbfdb8c76645046d359da691d7cb1c --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80d7eee7ffee33c2c62ee544eeeb49711a443d07bb102f327609438c3364cbbc +size 93978624 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..8eaf829012e6149eb6e68d051a3a00545bfe011f --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71a827077a18a270c0426e0eca925882d70b72a6df6009496320f13d4c74cee +size 188088320 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..a09db55fde002bbfdd32b98149fc9b0cfa63a578 --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbf793124732639cc7371a41e88b62c3eb61a15013a6141edc3edcf09a0b7fc3 +size 188088320 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..733a2a82d3cf05912a901a1f5630521fcdb4cd2b --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:393b301c296ba1729ddf2f7d25b4cba59e02611fba21be4b9297a66398fedc0c +size 23511040 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b07c00f35f40256ad7c46688f4c5e4161974abe --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e1dc1ace2b6850ff08e581a8207fd62f2a223959facb360ab8e437b86758a5c +size 33587200 diff --git a/params_shard_122.bin b/params_shard_122.bin new file mode 100644 index 0000000000000000000000000000000000000000..1500090f79772e8f97e7d8473a0c36459d8b3cc1 --- /dev/null +++ b/params_shard_122.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b065a70d951dc621aff741c6eb2de9ef9dc86e2601e518057f5aed6ef1cf3ccd +size 26869760 diff --git a/params_shard_123.bin b/params_shard_123.bin new file mode 100644 index 0000000000000000000000000000000000000000..21510743202e22f08868a9903b70084027acb5df --- /dev/null +++ b/params_shard_123.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f7b8eb0357eda73a24c69c719a0a2274fa497980828bc05437193ca044543d0 +size 188088320 diff --git a/params_shard_124.bin b/params_shard_124.bin new file mode 100644 index 0000000000000000000000000000000000000000..6313e7a324dd4467a98730dcbdc91bc1d9f52b9d --- /dev/null +++ b/params_shard_124.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a715ff7caa913994e828190523cb12a44668db9658c37d18a73d41b676e19364 +size 23511040 diff --git a/params_shard_125.bin b/params_shard_125.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7fb71f91dfc59e155c9ac0237126ae5c5c6dce7 --- /dev/null +++ b/params_shard_125.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae731188fd7899259c1ecf18ffd42e14daeb5099c0a8c6e6e228f10ea39768c +size 33587200 diff --git a/params_shard_126.bin b/params_shard_126.bin new file mode 100644 index 0000000000000000000000000000000000000000..00f5bcc667a07ce29a3dd05c6acdec932a13b930 --- /dev/null +++ b/params_shard_126.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6db9950cee2acb4ed72dcb1676b48d6a078c463f928ef2872abb351b77b361 +size 26869760 diff --git a/params_shard_127.bin b/params_shard_127.bin new file mode 100644 index 0000000000000000000000000000000000000000..60980f7310f850e23e390edaad731a13735891cd --- /dev/null +++ b/params_shard_127.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae89e7ead49c86cfc632e0de3c8bc127e0d36e50ad8d57ef1c451b79a29d327 +size 93978624 diff --git a/params_shard_128.bin b/params_shard_128.bin new file mode 100644 index 0000000000000000000000000000000000000000..f1f90478bef89d8c5fa970a01d7d0d596d41b8f9 --- /dev/null +++ b/params_shard_128.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cfa0d29adfa8611b2a462cbbbef634e92699f472c77ff23c58a678ed59f7daf +size 30269440 diff --git a/params_shard_129.bin b/params_shard_129.bin new file mode 100644 index 0000000000000000000000000000000000000000..0c62ff77e7d11bf259cef80b98d2772be8b50830 --- /dev/null +++ b/params_shard_129.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d5fbad29da8000a1257d8ab8ca7ab7704aa09686cf9ef8af0f665262e3e4582 +size 93978624 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..018dd3170e96254cbbfb54705d55b3094736c719 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b98856ffcdeb15c94ff15afe0960199219630c5d3b2844947380b8920291e5f +size 23511040 diff --git a/params_shard_130.bin b/params_shard_130.bin new file mode 100644 index 0000000000000000000000000000000000000000..37bf909491168024f2f972e8776d187d647de337 --- /dev/null +++ b/params_shard_130.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad26c77c7ef84b3eaa871bca574ba6f00dcf4c71862d9265650e3b464f9844d3 +size 188088320 diff --git a/params_shard_131.bin b/params_shard_131.bin new file mode 100644 index 0000000000000000000000000000000000000000..0ba3293c33bc952950e63463308021d6a1a01adc --- /dev/null +++ b/params_shard_131.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0499cbb76426b1dc103f9e23ad7fc7bbd0e13cf943e9f4c5729a5c83270e2d9 +size 23511040 diff --git a/params_shard_132.bin b/params_shard_132.bin new file mode 100644 index 0000000000000000000000000000000000000000..53bc9752b0f0f0beaf4a75804a708ef31016dd23 --- /dev/null +++ b/params_shard_132.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c6c82b55221ab0e2bc5c1d1833250f0ac155df1dd1f9ea74cf4aa5e19fbf597 +size 33587200 diff --git a/params_shard_133.bin b/params_shard_133.bin new file mode 100644 index 0000000000000000000000000000000000000000..33d3db8331f10aebdae5e5dab1b98db6d8d90bf3 --- /dev/null +++ b/params_shard_133.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00f22c9134f4ab9b3178140fd7ccf70f491d25d2628473988af1f96df7147b09 +size 26869760 diff --git a/params_shard_134.bin b/params_shard_134.bin new file mode 100644 index 0000000000000000000000000000000000000000..49af25cb11277541364165fb8a201f1d2032aa56 --- /dev/null +++ b/params_shard_134.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37f2eed1ee5c4baf0a09facb9815ec5cfc54e762e540c19180f050b6d3c8a17b +size 93978624 diff --git a/params_shard_135.bin b/params_shard_135.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b5a6865a67272373cbf5871118ae8507cee74b0 --- /dev/null +++ b/params_shard_135.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97309c6b0f2570f074a978be85044a776a3c32324c06dfabf03acc194be79b67 +size 31117312 diff --git a/params_shard_136.bin b/params_shard_136.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2ac2a42adf14a361b1847ca254ef68fdc6bc73b --- /dev/null +++ b/params_shard_136.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae19ba0b308b752a2f85ce458cb61127b449c0bad6cc55e0b7b1d70ba29035ed +size 188088320 diff --git a/params_shard_137.bin b/params_shard_137.bin new file mode 100644 index 0000000000000000000000000000000000000000..78bfd07d6829f8179f5812226dca455a70b9b035 --- /dev/null +++ b/params_shard_137.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07942ca49445c61f39aa5e06c7ea8dea0a0cf6518701541131f3d7007d984556 +size 23511040 diff --git a/params_shard_138.bin b/params_shard_138.bin new file mode 100644 index 0000000000000000000000000000000000000000..0fd278b2e69faae7b9631f9775c2164e9158a5e2 --- /dev/null +++ b/params_shard_138.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc374572fc853c39a823991e924c28b15b0fd49fbf98c0c7874425f3d8e50a6b +size 33587200 diff --git a/params_shard_139.bin b/params_shard_139.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff3252db601e8f3cbfaf012bc8a866f1d50496ca --- /dev/null +++ b/params_shard_139.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c3eb9717ae3da5d43cedd99798ac61e3f7fa29a0338f5e5418a7a18837f7d8 +size 26869760 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..018f4789bcc6f83658f7778f3dbf272fc2066bf6 --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2cc9b9bb4f3ef09ad9b20bc657abd73c6401177383867d949adb92c76ee1bf3 +size 33587200 diff --git a/params_shard_140.bin b/params_shard_140.bin new file mode 100644 index 0000000000000000000000000000000000000000..9b3e8dc3a4998b8e402bfe28134b85e19ef6ec7d --- /dev/null +++ b/params_shard_140.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:747571bc2515f167dab82cbeb186c349a6adb518f9d107911a2a96a962be2a8a +size 33587200 diff --git a/params_shard_141.bin b/params_shard_141.bin new file mode 100644 index 0000000000000000000000000000000000000000..304af29b0ef609226024e48657e113db23f9dab0 --- /dev/null +++ b/params_shard_141.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577ef1b4a0ad6a6b6e5f0b87cd77aead9deac30171ca0c82b1598bbba7548353 +size 26869760 diff --git a/params_shard_142.bin b/params_shard_142.bin new file mode 100644 index 0000000000000000000000000000000000000000..99f0db7b003587e2c3e68b82e9169f1557142b89 --- /dev/null +++ b/params_shard_142.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd3113e03fca644bcecb9e7ef5dfe27201a4a951b73225ed1fe733eacd6bfd4a +size 93978624 diff --git a/params_shard_143.bin b/params_shard_143.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8635226a9749570cca5757723f6c958713fb847 --- /dev/null +++ b/params_shard_143.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:228be67af43065b28a03aa549c661812d2d62e28f936c731ebd1a54eaa5b2686 +size 26894336 diff --git a/params_shard_144.bin b/params_shard_144.bin new file mode 100644 index 0000000000000000000000000000000000000000..69d8bf3e95816b34827f00603bc7fd613ccfa142 --- /dev/null +++ b/params_shard_144.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4b11c7ef720d8bf45ed458213a99328cf0b092b129e0fbb94fc5217de475cc1 +size 188088320 diff --git a/params_shard_145.bin b/params_shard_145.bin new file mode 100644 index 0000000000000000000000000000000000000000..8fe449e22222267a65cc1a3529b69719da7f41fe --- /dev/null +++ b/params_shard_145.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68c48f09facef4b5de9e9cc5450b0a600ba5d9a712ad631eee6d32958d69f745 +size 23511040 diff --git a/params_shard_146.bin b/params_shard_146.bin new file mode 100644 index 0000000000000000000000000000000000000000..d42b12c6a32a991d81160f0cce36db24da96032c --- /dev/null +++ b/params_shard_146.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ddd0131a77fc4d4439647b2a6ea6b13a8a1e6d860cd118cd6fa391b410b1c5 +size 93978624 diff --git a/params_shard_147.bin b/params_shard_147.bin new file mode 100644 index 0000000000000000000000000000000000000000..482af91ef7a6d54bf9776758907e5e202f88e216 --- /dev/null +++ b/params_shard_147.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e03d4065c30a570b9bb4b102ace29f948eae975cbbf10f4297397c957e3a834 +size 188088320 diff --git a/params_shard_148.bin b/params_shard_148.bin new file mode 100644 index 0000000000000000000000000000000000000000..6943984481358b4064710ecf32dc95648b0e2552 --- /dev/null +++ b/params_shard_148.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62700817179990428398e6348c6818e92393dd0ec1c2243bcc19201101258ca1 +size 23511040 diff --git a/params_shard_149.bin b/params_shard_149.bin new file mode 100644 index 0000000000000000000000000000000000000000..45793b11f71e4376209dca014ba224d0ed52217b --- /dev/null +++ b/params_shard_149.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b9e58bdbcca2d4632a2d96cc01937afd173a24759ff12fd9b8e3c9507ded73 +size 33587200 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ecccd60713cfde52767239acac4393227439ca8 --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:345376c3f175dfa69d8edf249f19eb0aa62e312583a72b7fc177ce8dfa54e1a9 +size 31117312 diff --git a/params_shard_150.bin b/params_shard_150.bin new file mode 100644 index 0000000000000000000000000000000000000000..e23faa8722b1ac4ab66c0ed7ef4c8e7455a430d3 --- /dev/null +++ b/params_shard_150.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0e0f747e1d973798e918d969b6bb06a016622a30fb42620e500fef8121ae640 +size 26869760 diff --git a/params_shard_151.bin b/params_shard_151.bin new file mode 100644 index 0000000000000000000000000000000000000000..2f40f6c09c1473209a699a7cdb7ce31c1e23b692 --- /dev/null +++ b/params_shard_151.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bc60eab30ccdcf44a85d80fbe2c7ca2bd683a8f32a09e20c4b61f2ec1f70642 +size 93978624 diff --git a/params_shard_152.bin b/params_shard_152.bin new file mode 100644 index 0000000000000000000000000000000000000000..fbf1e56ec42e540c9c057963a0cc74b8f2e4867c --- /dev/null +++ b/params_shard_152.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0e069e13a96a26d429ffa4e5535ecb1ff56dd73076d69d47f2766a3f4702d46 +size 31100928 diff --git a/params_shard_153.bin b/params_shard_153.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1733253cdcd70035e18d2eab727af09d1c668c8 --- /dev/null +++ b/params_shard_153.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e33ce0d970a635766393f2b4c4f6fe832fe62edc57c9568f8c9f2177f631d51 +size 188088320 diff --git a/params_shard_154.bin b/params_shard_154.bin new file mode 100644 index 0000000000000000000000000000000000000000..6f0d9b5c3ef75252965fd22352b76e14476248be --- /dev/null +++ b/params_shard_154.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ed16a52cff0fccd2b6393b51a2ec5c16888025239310c7619397d08ca439a0 +size 23511040 diff --git a/params_shard_155.bin b/params_shard_155.bin new file mode 100644 index 0000000000000000000000000000000000000000..5216cd64d1932e29db67f9eeb3c399128126b2df --- /dev/null +++ b/params_shard_155.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd7a9d16e12930d0e2c3432c0896c283e5447ef422e0b810753fb69c1169a96 +size 33587200 diff --git a/params_shard_156.bin b/params_shard_156.bin new file mode 100644 index 0000000000000000000000000000000000000000..66efb673b9c7a5781020f2d52d31dd58151def1e --- /dev/null +++ b/params_shard_156.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c89499d7b4d3c3551f30f9f5f9b72b177369640fef3e9398e3c53fee9ee5a94 +size 26869760 diff --git a/params_shard_157.bin b/params_shard_157.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c201d316ecee74727e5853d6f4fb0417785e878 --- /dev/null +++ b/params_shard_157.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cd6292e20ae73cd74a5201200c2c6e83b8cb938f6d4b64d09a24d7f319ff9da +size 93978624 diff --git a/params_shard_158.bin b/params_shard_158.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d0d2fbfa2c81aabf6cf98a0bce99bd07685b07f --- /dev/null +++ b/params_shard_158.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b1a1b1beecf95aea0407fe1ffbf50805082535af68603e55aa1a6649ad7f9af +size 188088320 diff --git a/params_shard_159.bin b/params_shard_159.bin new file mode 100644 index 0000000000000000000000000000000000000000..188631564f365bcd55699f3e7eaa250e4017353f --- /dev/null +++ b/params_shard_159.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e1e08fcb5c0600a4e65ddf01fe2441b56e0a75f84fd74e5403414b35fb9318 +size 23511040 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..1084110859b72fda35c857f3e6294eb96f78704b --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f0326c459780afe0eb63a2f93dd81ea1ddf5da9726282a590037ad748e302f8 +size 31068160 diff --git a/params_shard_160.bin b/params_shard_160.bin new file mode 100644 index 0000000000000000000000000000000000000000..f43cc4d93d217a05109f9f0dec08c02ecf7ae363 --- /dev/null +++ b/params_shard_160.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:468aade889f57d825ef6caaa62215a6fd3b56d63c3b3ba894d8ba49146dd96d5 +size 33587200 diff --git a/params_shard_161.bin b/params_shard_161.bin new file mode 100644 index 0000000000000000000000000000000000000000..49243d406013a879d9a3491edf27e8adba862942 --- /dev/null +++ b/params_shard_161.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c8e71b89cef93cae8aa325b1e372440898659f3e50431afb780b5687bc65a3e +size 31117312 diff --git a/params_shard_162.bin b/params_shard_162.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7e5a2b5cb2ecaba685809d51ce0b428a4c77b22 --- /dev/null +++ b/params_shard_162.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d25e4ecb7ab2f6b30cb8a687d2d8a92c8d2fde2b3fe04fa670ad5e4f8bfae7 +size 31068160 diff --git a/params_shard_163.bin b/params_shard_163.bin new file mode 100644 index 0000000000000000000000000000000000000000..d87c832f4d8247facde6e8de94c7d64d9d0d7fef --- /dev/null +++ b/params_shard_163.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9138114c783e7ecd59eec596bc00c9f3f1f3a115be620c2543676a857ca0e6 +size 93978624 diff --git a/params_shard_164.bin b/params_shard_164.bin new file mode 100644 index 0000000000000000000000000000000000000000..5461b9203c5717a15962680fa58c0038a8d93546 --- /dev/null +++ b/params_shard_164.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b7d1bfe770911af75c99356de4d19798765d829c271a9f185b58b92b217828f +size 188088320 diff --git a/params_shard_165.bin b/params_shard_165.bin new file mode 100644 index 0000000000000000000000000000000000000000..edc24550f694a367ba63a5a7849421b947f874fd --- /dev/null +++ b/params_shard_165.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ea3d25943bb149de4bf12bd1fb547afa83eaf7f2933c210fc5517a2c3e850a +size 23511040 diff --git a/params_shard_166.bin b/params_shard_166.bin new file mode 100644 index 0000000000000000000000000000000000000000..e2a908d237754d1f383a5992208fe8d1f1d317c0 --- /dev/null +++ b/params_shard_166.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd3be73c8b923a781dbd27e32e84f9d19fa272eee912061203f4ea42ed8ecac4 +size 33587200 diff --git a/params_shard_167.bin b/params_shard_167.bin new file mode 100644 index 0000000000000000000000000000000000000000..91d186f362fab08e5953ba1926e3d54a5a81b146 --- /dev/null +++ b/params_shard_167.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b6955ab0ab17aff1137a4612340b093e202d1d9e30bc94b723e752c5ef8d2c +size 26869760 diff --git a/params_shard_168.bin b/params_shard_168.bin new file mode 100644 index 0000000000000000000000000000000000000000..48258922b9ec7ec9c7de6e976ea0b994bc3efa65 --- /dev/null +++ b/params_shard_168.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e87a6629bc6bc51d781f57045a970a973358a24333eee30e1bc5527978e498c +size 188088320 diff --git a/params_shard_169.bin b/params_shard_169.bin new file mode 100644 index 0000000000000000000000000000000000000000..2844a7ae422bcdf14c45d3a8ed347b94bacbdb0a --- /dev/null +++ b/params_shard_169.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02bd1875a9dad20f9e2e33fb97850dff28c1f96199fd3c7c2396d7036202cc81 +size 23511040 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..975dcfc9850e1e1d1ef81aa631ccc8d81c9b6f2f --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e87d47a39906d247cae0c1f0aa53695c1354eeabaf04b9d40058093ff5d52085 +size 188088320 diff --git a/params_shard_170.bin b/params_shard_170.bin new file mode 100644 index 0000000000000000000000000000000000000000..36ca62dc30848ed4690e146bac0cfca8759858a0 --- /dev/null +++ b/params_shard_170.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60e9ecf06c29458f3dc9a458fabd844a00b78b43fd9d812302d5f9e804bc79e0 +size 33587200 diff --git a/params_shard_171.bin b/params_shard_171.bin new file mode 100644 index 0000000000000000000000000000000000000000..aff454874ac116d473750b5612468c8d66d574a2 --- /dev/null +++ b/params_shard_171.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25078eb1bf22f777ef85c2688ef698bc1ce53632df9bc3f6226f456596687cc5 +size 26869760 diff --git a/params_shard_172.bin b/params_shard_172.bin new file mode 100644 index 0000000000000000000000000000000000000000..85c727ed3ce89d5cd73d95497c2005ec51a9a1c4 --- /dev/null +++ b/params_shard_172.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651a0efa43daa450ce227f3ace29f76f684e3534e08b6b9a82726d7f0bbc9daa +size 93978624 diff --git a/params_shard_173.bin b/params_shard_173.bin new file mode 100644 index 0000000000000000000000000000000000000000..96399fe5db9a5e35a8f8552acf01454087bd5db1 --- /dev/null +++ b/params_shard_173.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21f1049af379b133da068bbeed505101e9f4aba12cc2c75df1a12fdafc40638e +size 30269440 diff --git a/params_shard_174.bin b/params_shard_174.bin new file mode 100644 index 0000000000000000000000000000000000000000..1d2dd1022036d624bc247a6a79b8f51e0b54251f --- /dev/null +++ b/params_shard_174.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4768df5b2ce0d1642f422da9d1a2d1fe7ae1d8865138881a50cd5e3b3dc1b17 +size 93978624 diff --git a/params_shard_175.bin b/params_shard_175.bin new file mode 100644 index 0000000000000000000000000000000000000000..6718b9f3fa0740cc3e46e9ef075de94fe92fb14b --- /dev/null +++ b/params_shard_175.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd366b08fd46dc0d0d35d49736ea9c72619db4d84d61598609df6b66f8cb4ab8 +size 188088320 diff --git a/params_shard_176.bin b/params_shard_176.bin new file mode 100644 index 0000000000000000000000000000000000000000..941448a23af08f62b9acd8a969a22a99cbe1dd7b --- /dev/null +++ b/params_shard_176.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bba99e30943598ead7393c6ddfb697f9b6460cb02d8939d02f9278811df11c0 +size 23511040 diff --git a/params_shard_177.bin b/params_shard_177.bin new file mode 100644 index 0000000000000000000000000000000000000000..b32f1bdab2a0b492c78dfd69a281cf8f62600f30 --- /dev/null +++ b/params_shard_177.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02df718512daebb9b18df7933e34ad374cfe0a2a8a77f3dd5ab8b0649e8972e3 +size 33587200 diff --git a/params_shard_178.bin b/params_shard_178.bin new file mode 100644 index 0000000000000000000000000000000000000000..596b828cdea962e7dc27a2fd7178b2a2530a64f1 --- /dev/null +++ b/params_shard_178.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a95e3c2f5a9fefbbd9f435e7d8575af94a623afc56a8ef3d9c3112ac2950dd57 +size 26869760 diff --git a/params_shard_179.bin b/params_shard_179.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7c4ba971d2b74d94247de383fd9918ce39c179b --- /dev/null +++ b/params_shard_179.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f644d2a209a8566f938e861fe587ae6ed565871e157e18bcf3263ac148b140 +size 93978624 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee94feba37075b23f5a1556b85602f25584b4c1a --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37f639147a2777163e50eb17248a6931194b56382a61535cf9d8cc4bb3841845 +size 33587200 diff --git a/params_shard_180.bin b/params_shard_180.bin new file mode 100644 index 0000000000000000000000000000000000000000..25df8c9645ae8eba854ffa792c0d83a34a8ded11 --- /dev/null +++ b/params_shard_180.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4a76c409579621b803c549dcfc562fa989691d681f64566db506a9a7b5068d +size 31117312 diff --git a/params_shard_181.bin b/params_shard_181.bin new file mode 100644 index 0000000000000000000000000000000000000000..67562b8d23b7b2610f6701e6e9bbec1185290896 --- /dev/null +++ b/params_shard_181.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b7aa57b5c803af347aaa16dfb422eafaff6e9c2b40db2b5332dcc4362379f6 +size 188088320 diff --git a/params_shard_182.bin b/params_shard_182.bin new file mode 100644 index 0000000000000000000000000000000000000000..e529f010c25a446ae8b3c5ac2729c88539774a81 --- /dev/null +++ b/params_shard_182.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8243d63a08dae5dee2885ca6cbb86235d762e2ebaa3deebde2014d22ef487a5 +size 23511040 diff --git a/params_shard_183.bin b/params_shard_183.bin new file mode 100644 index 0000000000000000000000000000000000000000..5799b05a3d732086356179c9e8e364af29d4bfc7 --- /dev/null +++ b/params_shard_183.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaff60586727f8c0b976eb34f9f34820900c55ab924c89c1f425701e809634fa +size 33587200 diff --git a/params_shard_184.bin b/params_shard_184.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7d19f56ff2d54fa6865bb87314d4a167baf8ea4 --- /dev/null +++ b/params_shard_184.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69295d06f066e71d815b17b470715a444dd5aeb89a968f55180e9493ce07648d +size 26869760 diff --git a/params_shard_185.bin b/params_shard_185.bin new file mode 100644 index 0000000000000000000000000000000000000000..2419ac70381f647a631cd316cd8ace27ab351c05 --- /dev/null +++ b/params_shard_185.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:822729b5d9fe869dee07d40ee0eefcc81dda5032718df2366dd8a4e29b103f64 +size 33587200 diff --git a/params_shard_186.bin b/params_shard_186.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb165d0a7ba6dc92f916590f91abe8385139a45a --- /dev/null +++ b/params_shard_186.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087d4f3d9f150cb81915dfdf4eb4da47735ab8b8c359e5c056426315c24a9816 +size 26869760 diff --git a/params_shard_187.bin b/params_shard_187.bin new file mode 100644 index 0000000000000000000000000000000000000000..dd61ea762244bbfb5bb2d0e185249bc155486940 --- /dev/null +++ b/params_shard_187.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22ed92b9351ca83bd5128724d85960d4f17b1e57f9e20fc544b6e2dee14bfec5 +size 93978624 diff --git a/params_shard_188.bin b/params_shard_188.bin new file mode 100644 index 0000000000000000000000000000000000000000..bdbb05baa2eaf5ce3e0f2a51d03069d283670b6c --- /dev/null +++ b/params_shard_188.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7f846d4e38bd7e64117bc459ee1a5f082a46cdba4ec1eda4ac2f29c607106b3 +size 26894336 diff --git a/params_shard_189.bin b/params_shard_189.bin new file mode 100644 index 0000000000000000000000000000000000000000..f3af48cab34f3e9916b052a8911f4fe03a358eb0 --- /dev/null +++ b/params_shard_189.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20b44a9c0414eeade6e3c8bb3c84ca3a05e87e29cee417b4a3c87c2ac822d349 +size 188088320 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..812b3bb967dbbaee314a4545f7f9cd680d3b2c0b --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9776da79e8b96da4490ad47204f5fc137ee4dd485e4dc0075081c37b55940fd1 +size 26869760 diff --git a/params_shard_190.bin b/params_shard_190.bin new file mode 100644 index 0000000000000000000000000000000000000000..690bc2c1e3c2cdae9115a915158588d2273cbab3 --- /dev/null +++ b/params_shard_190.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4de229afea33c6c1aa717e4082e7aeb1c09d7579a10151cf0e87784fcde8ffd4 +size 23511040 diff --git a/params_shard_191.bin b/params_shard_191.bin new file mode 100644 index 0000000000000000000000000000000000000000..502d51835914b65fe03f07c2753ace8a66a06f24 --- /dev/null +++ b/params_shard_191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99781b23ef1a6efe8158738b56d49f58782eaf24642535322d1d09be6dbbb31f +size 93978624 diff --git a/params_shard_192.bin b/params_shard_192.bin new file mode 100644 index 0000000000000000000000000000000000000000..6ac1ca1c320015680fd6f08c9320fe9dacf18299 --- /dev/null +++ b/params_shard_192.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6365ee443e8206adc0b8477aae270092dd3c55309e3fd01e2c70f003e0ed25af +size 188088320 diff --git a/params_shard_193.bin b/params_shard_193.bin new file mode 100644 index 0000000000000000000000000000000000000000..48bf77d194b497851a39bd6145a9e3d953ffcf42 --- /dev/null +++ b/params_shard_193.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ef7cc315dcfce49e55f2521093ca35e051bdc2a2a4031bdc8cf51938ca8c402 +size 23511040 diff --git a/params_shard_194.bin b/params_shard_194.bin new file mode 100644 index 0000000000000000000000000000000000000000..b50ee8aab82da97e28f1664cd9015a983adb9f6d --- /dev/null +++ b/params_shard_194.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3423d4d6b51be4aee54defd752c00d3ba3ff5cb0b2f2400a2f460a8da717e0c3 +size 33587200 diff --git a/params_shard_195.bin b/params_shard_195.bin new file mode 100644 index 0000000000000000000000000000000000000000..75f3676f5ba4fafb9de88dd8b10097abd33f6f18 --- /dev/null +++ b/params_shard_195.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e31ce41e62b18245caf830a4ddb9b2162ab308d371169b34ec0af557f9896ed +size 26869760 diff --git a/params_shard_196.bin b/params_shard_196.bin new file mode 100644 index 0000000000000000000000000000000000000000..29c17afa83fd822c445ac2bb8af7830fa5216dde --- /dev/null +++ b/params_shard_196.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34123e6ce16669e1e49c9fd9a2bcdb85db3a2e0c9c6ec57423bd9514565b3f07 +size 93978624 diff --git a/params_shard_197.bin b/params_shard_197.bin new file mode 100644 index 0000000000000000000000000000000000000000..093acaa9ab8f3180d0f149dba4d70b6ff161426d --- /dev/null +++ b/params_shard_197.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be05efb3571df38928b38613053f1be97abee92e3447f3f1fdd8d39fc7d4b3b +size 31100928 diff --git a/params_shard_198.bin b/params_shard_198.bin new file mode 100644 index 0000000000000000000000000000000000000000..663b18f89eea15c7af742d86f155c5e5f102e3ac --- /dev/null +++ b/params_shard_198.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0875f4166c21dd56c61e51d87edae3e1b172025aae85517095576e7c5127c7 +size 188088320 diff --git a/params_shard_199.bin b/params_shard_199.bin new file mode 100644 index 0000000000000000000000000000000000000000..5d23400e357db4f5dd71393f97fc75b8887f6015 --- /dev/null +++ b/params_shard_199.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b87b17f380321b8c2e042289126adb84ef1fe86242c943181150d6e414dcb6d8 +size 23511040 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba7fd2eba01ba9a1b952554ba6e4380f19b42db7 --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86837b68753ac384a81cb4cc7578c57311e8fdcc5f50bef95daab7313e1526dd +size 188088320 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..ccb85640bfd09ff420158271d8c9c4b6c506aff6 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22cdba9ab398555c46416e08ba0330525f12d9357ceb2252f11019af183b90dc +size 31068160 diff --git a/params_shard_200.bin b/params_shard_200.bin new file mode 100644 index 0000000000000000000000000000000000000000..a546e6a7e4475b72d833bc47441ec000d2b9b881 --- /dev/null +++ b/params_shard_200.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65a05e58f2d081e68efe866b6c16b4fd9e17cadc110a955d9e6805d72ced9308 +size 33587200 diff --git a/params_shard_201.bin b/params_shard_201.bin new file mode 100644 index 0000000000000000000000000000000000000000..b77a9f741586ef1871de87bf16fb0b4ec2369c70 --- /dev/null +++ b/params_shard_201.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02eac780761ceda0035bdb30043e76a63aa53c424070361f3619d9afe69b52cf +size 26869760 diff --git a/params_shard_202.bin b/params_shard_202.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7620e35205aa73ad45087a15fd398f9003b3397 --- /dev/null +++ b/params_shard_202.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddbf606c92d7acfb6647a5e48164ff90f45b8ca22785f96c670a4192b468c6a0 +size 93978624 diff --git a/params_shard_203.bin b/params_shard_203.bin new file mode 100644 index 0000000000000000000000000000000000000000..b5cb30590379fb9609a82940958ae77948453d67 --- /dev/null +++ b/params_shard_203.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f556d4c32941d3cf4d89b4786395f4c8d0a363b0bbe21b82685d32c52890ac +size 188088320 diff --git a/params_shard_204.bin b/params_shard_204.bin new file mode 100644 index 0000000000000000000000000000000000000000..dbb2e15f667d8a47e7f6bb21eab840225b05c9ac --- /dev/null +++ b/params_shard_204.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80675e65630778c5322d6c1d41f9eff4e73e9e71dbcef1a662f75afd47add686 +size 23511040 diff --git a/params_shard_205.bin b/params_shard_205.bin new file mode 100644 index 0000000000000000000000000000000000000000..04b144884fa798a413264f827684b775a00c1e2d --- /dev/null +++ b/params_shard_205.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c7d3855a590a70e95ffd9edfc283624bef91c84756513faad876ad87bde324 +size 33587200 diff --git a/params_shard_206.bin b/params_shard_206.bin new file mode 100644 index 0000000000000000000000000000000000000000..32f20d5142222277806345e286cafd6a26a11b31 --- /dev/null +++ b/params_shard_206.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce74bc56a2dd49d412f78baa3c2826af9bba9e1bddb40525558dbc4946cdb25 +size 31117312 diff --git a/params_shard_207.bin b/params_shard_207.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf071d77cd38632cf7f0ee5f53d946ecf56bc138 --- /dev/null +++ b/params_shard_207.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39f9c947cb20618440eaa71586b37db47c98081984fd04c8686c5655429d6a1 +size 31068160 diff --git a/params_shard_208.bin b/params_shard_208.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c909b6182ae208d46d893d188d82cc17b438594 --- /dev/null +++ b/params_shard_208.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4926ea4581d7e88f431dd1da48340fefd99edf1bf121057f8b6eda88100204c8 +size 93978624 diff --git a/params_shard_209.bin b/params_shard_209.bin new file mode 100644 index 0000000000000000000000000000000000000000..36739631a93dce6b4156a3f8e395527bab35ddbc --- /dev/null +++ b/params_shard_209.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c56fe6a1a7ddab746484410847047905358c787e09fe8ebead861f254eef4f +size 188088320 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..ca022ec7e8913e79b5dee1692a6e337002626d9c --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f34a7253d25b4e91b98641272c396cc9bab14c3df1ddab19d652f0b454f7d66a +size 93978624 diff --git a/params_shard_210.bin b/params_shard_210.bin new file mode 100644 index 0000000000000000000000000000000000000000..4619ee8f21be87e7425a427ef6b25425d426895a --- /dev/null +++ b/params_shard_210.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f6748def9a07ac185686181cb53fdbadc106f933a9b97fb880f53efc4f367b +size 23511040 diff --git a/params_shard_211.bin b/params_shard_211.bin new file mode 100644 index 0000000000000000000000000000000000000000..dbb86b768f994a37f412dc52dcf60a2cf343dac4 --- /dev/null +++ b/params_shard_211.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db82f2f2c90c9d72b3fcbe23f4ea562cad50ebc3f9b1135d8aacb8ae15edbb90 +size 33587200 diff --git a/params_shard_212.bin b/params_shard_212.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e9fed1a285c7672d7296a3f06baf1b082d0e7b1 --- /dev/null +++ b/params_shard_212.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea5fd3db74031bee5e1de1c2a1436f8280d9b8b5dd45e485fd3e814a89e2a761 +size 26869760 diff --git a/params_shard_213.bin b/params_shard_213.bin new file mode 100644 index 0000000000000000000000000000000000000000..93a4c0db43f38e9f55b955aa89df98ad820a08d1 --- /dev/null +++ b/params_shard_213.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0d2486508b8547cd1f8f4357c2b6ad4e108fdf73288251a23e0e2aab454b9d0 +size 188088320 diff --git a/params_shard_214.bin b/params_shard_214.bin new file mode 100644 index 0000000000000000000000000000000000000000..3d3e4aa1e33e836dbf7a5955daf8fe5e0886dd5c --- /dev/null +++ b/params_shard_214.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a37b321b07e38a6899feb9f5bfaa80eaf4fa01ebda0f2ff13c8e37510dd38d5 +size 23511040 diff --git a/params_shard_215.bin b/params_shard_215.bin new file mode 100644 index 0000000000000000000000000000000000000000..222a61d400edd3abd54792c71773d1dc18faabc4 --- /dev/null +++ b/params_shard_215.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bff7d276f62d8c2b57f14c67dec0869d90e77d0e2401d81befefa3bbe35f951e +size 33587200 diff --git a/params_shard_216.bin b/params_shard_216.bin new file mode 100644 index 0000000000000000000000000000000000000000..31fbd10c45d38558a779a2db1a3ffb316c6f9550 --- /dev/null +++ b/params_shard_216.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e1c9d8b55e92c17837faabb62a804baf19b793f6625a322dabf4ff4bf74acd +size 26869760 diff --git a/params_shard_217.bin b/params_shard_217.bin new file mode 100644 index 0000000000000000000000000000000000000000..971d5389394495007083339efd1f769833687fed --- /dev/null +++ b/params_shard_217.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8ada6fc1464eaeb8047b59355c9f4f0d17b5300e8961c2c84edbce8490a7eb +size 93978624 diff --git a/params_shard_218.bin b/params_shard_218.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8ce00a7416ac58868451b9b62d8684ec0f4fa7b --- /dev/null +++ b/params_shard_218.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54a12c4e2b0a8780afb0b6e49b31b53d9776ed6ff32a11390890a5e403d4e67a +size 30269440 diff --git a/params_shard_219.bin b/params_shard_219.bin new file mode 100644 index 0000000000000000000000000000000000000000..aca76c2ed086ce1365cb9686fa837a34c40811f8 --- /dev/null +++ b/params_shard_219.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e9b2fe5cadc81b32ac178983e15558d4df7d799ef7d25f7bc8723594142576 +size 188088320 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..97eb0b21394655f0f7c86c1de475a2fcf7f5c113 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06ea97b4abbcea448909c513a588adfbc09061542ff72f76939ac068c33844ee +size 93978624 diff --git a/params_shard_220.bin b/params_shard_220.bin new file mode 100644 index 0000000000000000000000000000000000000000..d2bde4c2b31d65a60de1306c711cbe2f235ac1aa --- /dev/null +++ b/params_shard_220.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a35d2490a0b4a02de322182f9f30a569745c59ea47fb8cbf9eebfd3d3f6b70d4 +size 23511040 diff --git a/params_shard_221.bin b/params_shard_221.bin new file mode 100644 index 0000000000000000000000000000000000000000..b6a3c67b135fa188f7d286c5bfb3c0f300d654b2 --- /dev/null +++ b/params_shard_221.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:364b43e9857b59b4f24a1cf4a43adedc1e6845f8bf01cc8b47599d9bf49bdb99 +size 93978624 diff --git a/params_shard_222.bin b/params_shard_222.bin new file mode 100644 index 0000000000000000000000000000000000000000..9750e1f36a4f086389bdda96628bc776a0d609aa --- /dev/null +++ b/params_shard_222.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa53958255498bf8b1a6dc229f8c0cc6f432edee327b263af9447051833a4da6 +size 188088320 diff --git a/params_shard_223.bin b/params_shard_223.bin new file mode 100644 index 0000000000000000000000000000000000000000..2350ade96e2496c0c24e7ea7933b15eb90e299f5 --- /dev/null +++ b/params_shard_223.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a270192974cbd274ca84aa7a24acde35b76c6d98151c20b58d887dcb52ebf7b9 +size 23511040 diff --git a/params_shard_224.bin b/params_shard_224.bin new file mode 100644 index 0000000000000000000000000000000000000000..072560ce1962fa9fcc7a128e64fde95f5ce79987 --- /dev/null +++ b/params_shard_224.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e2bb318ebebb805804a911684a4c20c1cf6fcf9be52a91adfead6e6f749ddb2 +size 33587200 diff --git a/params_shard_225.bin b/params_shard_225.bin new file mode 100644 index 0000000000000000000000000000000000000000..456ce0551bdbe99b9c5d401113b7a907b1428580 --- /dev/null +++ b/params_shard_225.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f523cc1914e040d4b728056b4283983e3aa7e4a0666798e25a25b697a304902a +size 26869760 diff --git a/params_shard_226.bin b/params_shard_226.bin new file mode 100644 index 0000000000000000000000000000000000000000..b47c207d26752132d1d911720d570caeb1369a37 --- /dev/null +++ b/params_shard_226.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ee4442a7a721f44d4312f9cec65cfdfcbbce135a0f630b93bce1106680f8c6 +size 93978624 diff --git a/params_shard_227.bin b/params_shard_227.bin new file mode 100644 index 0000000000000000000000000000000000000000..81ca441b5d5944fab97ae007dfc736cef6a1f34d --- /dev/null +++ b/params_shard_227.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4d4c48dba687e095ff567a73ccc2e8dad241cc913268f45d583907a7968726 +size 31100928 diff --git a/params_shard_228.bin b/params_shard_228.bin new file mode 100644 index 0000000000000000000000000000000000000000..fcd17279d36a0a260b3035d00fa0a97c9822353a --- /dev/null +++ b/params_shard_228.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5704cfa5752b84fc59b7886d29f93d281feda443b2c723237717d4851235680e +size 188088320 diff --git a/params_shard_229.bin b/params_shard_229.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d0b26ec340fe964199bded191e31d0bd4d29465 --- /dev/null +++ b/params_shard_229.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5351d7cb62b02743d55a109cf0e6d7eb15584652401f3a031b86863bb67edfa5 +size 23511040 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d617f6e89891137872f7102ef92cf06c6422070 --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36fd9685d15c031e910c9a87b0c7ceb3dcbc5df9a83fc85ee09dc4e49d26b63c +size 188088320 diff --git a/params_shard_230.bin b/params_shard_230.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff033f18b98cd9f6360f2a5ee2ef92b1a701f715 --- /dev/null +++ b/params_shard_230.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c6079671d8caeb95bcdfcb34b92e684fdb095af1a8e471a036d80fd9e940dd4 +size 33587200 diff --git a/params_shard_231.bin b/params_shard_231.bin new file mode 100644 index 0000000000000000000000000000000000000000..188376d0fb110fcc9ce12cdb8c3b3700908d949c --- /dev/null +++ b/params_shard_231.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78cdcb52c1ff21df419809fbb3b5eb9b47ebbad9704f285309e9257323db9012 +size 26869760 diff --git a/params_shard_232.bin b/params_shard_232.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b61d01a87df39cd57742ac5b5ea2fe9a96091cd --- /dev/null +++ b/params_shard_232.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b755af7cc73d6981c6fb7c261456cf493301eaba30a091565c34e0ae940bf0e7 +size 93978624 diff --git a/params_shard_233.bin b/params_shard_233.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc8de38c651f11d7741948df3b0214fdda199f04 --- /dev/null +++ b/params_shard_233.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:626f8b8b5659a891e89ac15087885f1750dfed096f568d4bc2ce4f0fd3f9aecf +size 93978624 diff --git a/params_shard_234.bin b/params_shard_234.bin new file mode 100644 index 0000000000000000000000000000000000000000..8899330bdfd6bbe0bc000935621bb17eae6602c0 --- /dev/null +++ b/params_shard_234.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:524628462ca30fda6311215915a55da213c545421ec8c8ab275604cc9258aff8 +size 31100928 diff --git a/params_shard_235.bin b/params_shard_235.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2bbc3d8e7bf8b6b34f255759b0ed57802a02e2f --- /dev/null +++ b/params_shard_235.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be32e50cb0f9804f870b7eb68bb6f00655f426d58b9c96339c1285cac3290935 +size 188088320 diff --git a/params_shard_236.bin b/params_shard_236.bin new file mode 100644 index 0000000000000000000000000000000000000000..239bf6659ee3f6d642423be090981bcf16e59389 --- /dev/null +++ b/params_shard_236.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628b07d6182b74822d41f49ea814d0b2de0f126add31f6266bd9052428ab3eab +size 23511040 diff --git a/params_shard_237.bin b/params_shard_237.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc21c8248f4646b15d4cfbf45ac630a73096377d --- /dev/null +++ b/params_shard_237.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38bd7b29c0dd884343f2ec182619fba462482faab06ef46d3d1747dfd4d3dc6d +size 33587200 diff --git a/params_shard_238.bin b/params_shard_238.bin new file mode 100644 index 0000000000000000000000000000000000000000..5ffba97c23b8554b2a4e059fa7172faa5e7546cc --- /dev/null +++ b/params_shard_238.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51892af54961abcaadca6cb1d25feefabfaf989a5a9fdd844896f413afe5de71 +size 26869760 diff --git a/params_shard_239.bin b/params_shard_239.bin new file mode 100644 index 0000000000000000000000000000000000000000..2f64e2fd2febf30aea2d571211f87a52a5accd0f --- /dev/null +++ b/params_shard_239.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a591da7a3ccc661a4b69fb036db2a7772d6803d2953e3392df29c845d8414c7 +size 93978624 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..89b34fef3e50aabb6f563cc1b55166ee6fd2cdd8 --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c9a3397fc1d8757177bbd0724471f02ff4edd66388a4c0994f8e191b5e1dee3 +size 23511040 diff --git a/params_shard_240.bin b/params_shard_240.bin new file mode 100644 index 0000000000000000000000000000000000000000..49129490e25800a5c03d4cf3bcd1778472d2cfc6 --- /dev/null +++ b/params_shard_240.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d58f961513afd6fd6a035be6e10a3187742e077230357c22896466b1f2126664 +size 188088320 diff --git a/params_shard_241.bin b/params_shard_241.bin new file mode 100644 index 0000000000000000000000000000000000000000..52ecebd979761fafc999100d55497b065a0a9414 --- /dev/null +++ b/params_shard_241.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1232400b4758fe804eecc0a0c24819839858c16a13a5ef8b628b0a70665ee521 +size 23511040 diff --git a/params_shard_242.bin b/params_shard_242.bin new file mode 100644 index 0000000000000000000000000000000000000000..9642d03970454a026a71d99259fb6f01e01a932b --- /dev/null +++ b/params_shard_242.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c96c65e4281d9c96b6ed66db9ed4112b10938827a6fb3fb58f3c649ca935d246 +size 33587200 diff --git a/params_shard_243.bin b/params_shard_243.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4ea1bdbaf433d646350e86356bb4d04f1308f23 --- /dev/null +++ b/params_shard_243.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63625e164cd6959afe633ef554ee0af8ab7990671e6971c20fd58bc37eda4326 +size 31100928 diff --git a/params_shard_244.bin b/params_shard_244.bin new file mode 100644 index 0000000000000000000000000000000000000000..dd832b016055ce1a2ed2372fa2de3e932a5a12fa --- /dev/null +++ b/params_shard_244.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77718bb0adfe97883087f2e9db2d8097fad7ffe61fa4a75695219ab89f2dfd29 +size 31068160 diff --git a/params_shard_245.bin b/params_shard_245.bin new file mode 100644 index 0000000000000000000000000000000000000000..e484f98c58265277fab4ed85f9ab36306e2babed --- /dev/null +++ b/params_shard_245.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4309eecd13f3763c2d964b2b81e34ac76737f08519a005eaa8af9cdc4c706a9d +size 33587200 diff --git a/params_shard_246.bin b/params_shard_246.bin new file mode 100644 index 0000000000000000000000000000000000000000..ecde108416b9cda9804b1cbf23f62f540b1ee0e7 --- /dev/null +++ b/params_shard_246.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39aa0b29af0d29be0e2b6a195f49b5f542290adc432ffe2b45312f3a8f213dec +size 26869760 diff --git a/params_shard_247.bin b/params_shard_247.bin new file mode 100644 index 0000000000000000000000000000000000000000..d844dacd3b58578b564f64253eae6234c5e52ed3 --- /dev/null +++ b/params_shard_247.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5de76827be44418aeff140b4bf771b1d431c2b729accc50b43e984971d4d7da5 +size 93978624 diff --git a/params_shard_248.bin b/params_shard_248.bin new file mode 100644 index 0000000000000000000000000000000000000000..96aeb3a9554e327ca848b1e2c66a07bc0f28196e --- /dev/null +++ b/params_shard_248.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8230209ec6af1a2517593ba56028fcc31a86e98df514ca73275c04b2159ace5 +size 188088320 diff --git a/params_shard_249.bin b/params_shard_249.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f79609d4a891b7e44b45184724af97b9c655515 --- /dev/null +++ b/params_shard_249.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5006ec922ace822b2fb6f901c49ae26ec08e787c2df9553ffe6a9882529d07 +size 23511040 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..1fdac40ba8480669f76ca442272af6b525ce3b5c --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c17d8454aefbd4a9f1e649ddc5dfa6ffe7911a01ff250e45e25cd7d3e552eb8 +size 33587200 diff --git a/params_shard_250.bin b/params_shard_250.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4706e7f60503cfdc9a9012e854c3f570a44e005 --- /dev/null +++ b/params_shard_250.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a96659257fb5908d6cf0559244de888c4e436ee29bc56763d831401a96f6ade +size 93978624 diff --git a/params_shard_251.bin b/params_shard_251.bin new file mode 100644 index 0000000000000000000000000000000000000000..0ee2e0a87ddf234ddcfcfc959f8d498c6833e4b1 --- /dev/null +++ b/params_shard_251.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039ccc477c67fb436e47295afd469e9ea8c29913c99a36847e094f28fe6d5257 +size 22712320 diff --git a/params_shard_252.bin b/params_shard_252.bin new file mode 100644 index 0000000000000000000000000000000000000000..e908ba2e8ebfe3ace28f3b624cce4fb13aae58b5 --- /dev/null +++ b/params_shard_252.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4aacf5a21b4db21e20963e7cc353a8e9592b7a9f657f4ec45b3ce9bba48590e +size 188088320 diff --git a/params_shard_253.bin b/params_shard_253.bin new file mode 100644 index 0000000000000000000000000000000000000000..9bb6ed562b486a3bc6b4ba0c5fb84b4ca86da7d8 --- /dev/null +++ b/params_shard_253.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daaae5f36f8507abe1c5ba59c0d297e28d39fa8bdef95d43094d25fee3585dd8 +size 23511040 diff --git a/params_shard_254.bin b/params_shard_254.bin new file mode 100644 index 0000000000000000000000000000000000000000..73e9a901ddf18572cd828fda248c1969473073a7 --- /dev/null +++ b/params_shard_254.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b877f53b3cfd8cd82ffc271cf4ce9c5e1353f9ec4f055e32643c0ad83c899f8 +size 33587200 diff --git a/params_shard_255.bin b/params_shard_255.bin new file mode 100644 index 0000000000000000000000000000000000000000..91326b18585c6700ae90b4cf055290b6e0ff5e95 --- /dev/null +++ b/params_shard_255.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98ed68ef0c1c30ce512b798c4ffe6b62c9d615bdf39da824cdd1afc2b9ff2b10 +size 26869760 diff --git a/params_shard_256.bin b/params_shard_256.bin new file mode 100644 index 0000000000000000000000000000000000000000..a9480b63fda8ee43d9a838912294748c5ac33d20 --- /dev/null +++ b/params_shard_256.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:281f7d44af223c2b084a828b4c2e575b71d70a9b12cfb9d3918cce6c6fce2668 +size 93978624 diff --git a/params_shard_257.bin b/params_shard_257.bin new file mode 100644 index 0000000000000000000000000000000000000000..23ffd5d43d92fff21465f97bbdc9885a49349e85 --- /dev/null +++ b/params_shard_257.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e08ad33b95d607f8b5359c1f6932583b75c718931acd87183c108b100775480b +size 188088320 diff --git a/params_shard_258.bin b/params_shard_258.bin new file mode 100644 index 0000000000000000000000000000000000000000..ca1482d502828ffaa635fa223299bfeaac2500df --- /dev/null +++ b/params_shard_258.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921dc2fc70a8b2f61a23a168243ece9692c283d5a1e63244c57f255e4affa483 +size 23511040 diff --git a/params_shard_259.bin b/params_shard_259.bin new file mode 100644 index 0000000000000000000000000000000000000000..1b8c598a6bb64ebf3ae7d10657c7fd17a05fe941 --- /dev/null +++ b/params_shard_259.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28d3ef1fffd8586eedd2a347cf3e2a257d5e35c6aee6488703a91f22e5f4c7d8 +size 33587200 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..a49c4f950f79bf861fa21427b372d254a5c2bd9c --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ecd2504f06bd30a98b70f977bd8d77e00ca96e373a9914252fa5e41af758818 +size 26869760 diff --git a/params_shard_260.bin b/params_shard_260.bin new file mode 100644 index 0000000000000000000000000000000000000000..fdf53faa92ce363b961f73c0ecab8e2c20b179e7 --- /dev/null +++ b/params_shard_260.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec82e183aa31fa1b937bea973b5e2b5fc820d5142ae51e2cce3eb1d756fbc86 +size 31068160 diff --git a/params_shard_261.bin b/params_shard_261.bin new file mode 100644 index 0000000000000000000000000000000000000000..0fd47658f0eada60682dce9ab9174cecec97f9c7 --- /dev/null +++ b/params_shard_261.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebee31273a5560eedf5b8678570b5e446e8179a23aaeee504387dd0151330f32 +size 31068160 diff --git a/params_shard_262.bin b/params_shard_262.bin new file mode 100644 index 0000000000000000000000000000000000000000..35b85687ee21a2e796626dfe1bc5d79879631521 --- /dev/null +++ b/params_shard_262.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb27929a9892bc70182c15a020cf08da346fe58fa9e0e28a12277a6cb94b8e34 +size 93978624 diff --git a/params_shard_263.bin b/params_shard_263.bin new file mode 100644 index 0000000000000000000000000000000000000000..ced623b01f3cba2b20b107331e8cdb40f4c061a2 --- /dev/null +++ b/params_shard_263.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a23e08d503d3aa81db161ae075d9ed66d8abcb66d78531343c4ec5e90bddfba +size 188088320 diff --git a/params_shard_264.bin b/params_shard_264.bin new file mode 100644 index 0000000000000000000000000000000000000000..c3822d968bf96c06ab394ccf456e50be273043d2 --- /dev/null +++ b/params_shard_264.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a91d08728b9bc48c09392235b89bfbfebf1c8034fc4ea8cd1a17fa451bd6a34 +size 23511040 diff --git a/params_shard_265.bin b/params_shard_265.bin new file mode 100644 index 0000000000000000000000000000000000000000..92aac3db6ba62a33569d1deddbae0b7ff00f084a --- /dev/null +++ b/params_shard_265.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa27597542cd232918bcc39e15b1ea2797eddadff88f3a6255d31ca77bb602e2 +size 33587200 diff --git a/params_shard_266.bin b/params_shard_266.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e6cc8dadb5776fdb25af6019b204d1f58be8e7b --- /dev/null +++ b/params_shard_266.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26491aeabe34a36b78b38a169b5230115897832176de3a44666bca0618f38079 +size 26869760 diff --git a/params_shard_267.bin b/params_shard_267.bin new file mode 100644 index 0000000000000000000000000000000000000000..5ad2beddbd0aaab29c4a9c66bdeeff6ccb314635 --- /dev/null +++ b/params_shard_267.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2247bfc8b61ec9732af2d41fb6c58fc6abe4cfa1e93578fce614f4dde060110 +size 93978624 diff --git a/params_shard_268.bin b/params_shard_268.bin new file mode 100644 index 0000000000000000000000000000000000000000..b5c7764ef2195973439f8be05c9acad042980129 --- /dev/null +++ b/params_shard_268.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f63f37e69c503862844f391b671e870530042b0d91d1d324b300b49dd24196 +size 22745088 diff --git a/params_shard_269.bin b/params_shard_269.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e87bfefc7006c5103df6faad043cf6bd055d811 --- /dev/null +++ b/params_shard_269.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e68cb76baa5b74dd7ab39ef31e153efe204744e9a8081e553c8558e51b48dc +size 188088320 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..460136c2af9d8f57cfa9cca8fa062bd75de052f8 --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fa4267119d211b08130f3950cd5f92dfff7d33751c08d31156dca57eaae990f +size 31117312 diff --git a/params_shard_270.bin b/params_shard_270.bin new file mode 100644 index 0000000000000000000000000000000000000000..e134812f7cb2b067c860d900f747c8fbada49565 --- /dev/null +++ b/params_shard_270.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce05ce68eed37712b53d6a7c603e8041cedc9bc97b7cc5cb0c06733ea0bb7ab +size 23511040 diff --git a/params_shard_271.bin b/params_shard_271.bin new file mode 100644 index 0000000000000000000000000000000000000000..5a3bc3dcfb5fc5c125f95b05c63836f6fc2dbc07 --- /dev/null +++ b/params_shard_271.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97cd4b6c816ed04288510de7d34ed1e1b6203f73aa166d03a5390d76fab88174 +size 33587200 diff --git a/params_shard_272.bin b/params_shard_272.bin new file mode 100644 index 0000000000000000000000000000000000000000..907391649a0206072e1d4b0fff3d931afa0a5ccb --- /dev/null +++ b/params_shard_272.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:955b01186085becdf9439e57250bbe30699be45d69ee38a2a10ae1da48e67dc5 +size 26869760 diff --git a/params_shard_273.bin b/params_shard_273.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f23f29440587fca0603bf423d2c907d323fae2c --- /dev/null +++ b/params_shard_273.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f42435018b1e22163d603913b39f296b0fde1766ed7e63b31c3422907835ad +size 188088320 diff --git a/params_shard_274.bin b/params_shard_274.bin new file mode 100644 index 0000000000000000000000000000000000000000..11f8a6396f61d14e57fa5f2713e379f986eaf54e --- /dev/null +++ b/params_shard_274.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:091cda090af4c57829b10c0579518443696484c891d860e4ff9f5b8e30338033 +size 23511040 diff --git a/params_shard_275.bin b/params_shard_275.bin new file mode 100644 index 0000000000000000000000000000000000000000..35a689b0dc2ada67aab9901a3993463d0f9daa02 --- /dev/null +++ b/params_shard_275.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c340b1fb90af1b747d1a6360f5ebb47335adaf999f78ffdd3128ba828a4d86 +size 33587200 diff --git a/params_shard_276.bin b/params_shard_276.bin new file mode 100644 index 0000000000000000000000000000000000000000..61812e07420e017308503016b426ad88cab70742 --- /dev/null +++ b/params_shard_276.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0ee11360125675098ced00d5692bbb28b40dee131e09d5ded71b7cbd7a3845a +size 26869760 diff --git a/params_shard_277.bin b/params_shard_277.bin new file mode 100644 index 0000000000000000000000000000000000000000..9b8c99794ec89fa20ab7691d9ad604d21f195217 --- /dev/null +++ b/params_shard_277.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53520d393ee395c56ca81f5de7521a0836fa9a290f857bd6e3665ec714b5a1d +size 93978624 diff --git a/params_shard_278.bin b/params_shard_278.bin new file mode 100644 index 0000000000000000000000000000000000000000..b3386ea939b1066a6484546744caead6ebf89faa --- /dev/null +++ b/params_shard_278.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b8bd95d237b8574ca3d28d995777fa56da108d626c5f0eb340bdd63a2019653 +size 26894336 diff --git a/params_shard_279.bin b/params_shard_279.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e3fdad5556298a6daa69c4b3584aedb7d7704ba --- /dev/null +++ b/params_shard_279.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9a684403d292b284bdd017a482e05f560e6ba0969bc66b6fd9af65f341e89c4 +size 93978624 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..e4351919c19aa0ebf5b7829505a1aea9cd45a45a --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:544e00785f0777fb217c95765dc83073a0be416d6e26ab355dd856ed3e52374a +size 93978624 diff --git a/params_shard_280.bin b/params_shard_280.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c4273002d7c7b4920dd0ea99b45ea1457609bd0 --- /dev/null +++ b/params_shard_280.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42450dcc5c8b2e4aa8ea0c3d293544ba4855e6b1c97dbcc00fb84f0f9e4b515c +size 188088320 diff --git a/params_shard_281.bin b/params_shard_281.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b6f93328af63eeba6fd4567bc10b7b4eedc1fce --- /dev/null +++ b/params_shard_281.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7993e11e4653efddbc3d8b927cb8877908d61aaff4bc21bc4d2a5362af4c29 +size 23511040 diff --git a/params_shard_282.bin b/params_shard_282.bin new file mode 100644 index 0000000000000000000000000000000000000000..3e9a175e45f122cfa693e11899621a2cbc777af4 --- /dev/null +++ b/params_shard_282.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b7ad88737084cf2217520b2cb094d4c58767553410cb5001d3f4d503f36f13 +size 33587200 diff --git a/params_shard_283.bin b/params_shard_283.bin new file mode 100644 index 0000000000000000000000000000000000000000..2bf9225a7a8e52a5037c0047a596a03e2fa586e4 --- /dev/null +++ b/params_shard_283.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0f2e80f60ac6e2f1366a852452a7fadb97ea49681ab778b89da81b75c2771df +size 26869760 diff --git a/params_shard_284.bin b/params_shard_284.bin new file mode 100644 index 0000000000000000000000000000000000000000..aa2e1d0afa6f505e6c6134e6ec0590676e2f0d85 --- /dev/null +++ b/params_shard_284.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2248d4db9ec3bba1869a08ae1130db502c3dc88bfe50bcf7f875d32d6c19d90e +size 93978624 diff --git a/params_shard_285.bin b/params_shard_285.bin new file mode 100644 index 0000000000000000000000000000000000000000..803197f86274978512459cfdc7539114166b8f7f --- /dev/null +++ b/params_shard_285.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11a641b207c5bb64fcc595cbc51fbe7bcd45ddd4fd0447259ae14461ea331fa7 +size 31117312 diff --git a/params_shard_286.bin b/params_shard_286.bin new file mode 100644 index 0000000000000000000000000000000000000000..099418809e863ff0ce508bc00ac10d9f6fc393b7 --- /dev/null +++ b/params_shard_286.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9055de2638d8e95b69fd677ee897bf739b7bccfa69a21bf08fbd1c6a4b4496e1 +size 188088320 diff --git a/params_shard_287.bin b/params_shard_287.bin new file mode 100644 index 0000000000000000000000000000000000000000..3b69d64ca534081ea99c04a3897bb497ef35ae34 --- /dev/null +++ b/params_shard_287.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fb2247dac333b0e7e53ed73b57323d0c3d8d21fd314714ce23a158f4fb4eb7c +size 23511040 diff --git a/params_shard_288.bin b/params_shard_288.bin new file mode 100644 index 0000000000000000000000000000000000000000..b689cbd0dcd2b97f17e95514156a521bc0dd381b --- /dev/null +++ b/params_shard_288.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6303ea4fb10ae63c5b3af9a2a0afedf3a1a1ed886d9fe82daade08a09fb0896e +size 33587200 diff --git a/params_shard_289.bin b/params_shard_289.bin new file mode 100644 index 0000000000000000000000000000000000000000..77e6eb52c265762cb8d13eb16195cd7b78740e0d --- /dev/null +++ b/params_shard_289.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f3c9486c58e487f6c8d2aabb783fb8a6bcf4a24b15d05a33d0b4495b2f25ab +size 26869760 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..d9ceae5c8032cc45caae4c0e0c7e97bb9d139b18 --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4623c74101d6030860a82c3fb7e9d740cfc0130b6ca6c06e91b0b7384d4eae +size 188088320 diff --git a/params_shard_290.bin b/params_shard_290.bin new file mode 100644 index 0000000000000000000000000000000000000000..45c92c044fd2dd2318be0db1a67642676ef4a6c4 --- /dev/null +++ b/params_shard_290.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344e9ccb8e1f148d5fb1de2df7137b0528188ed7ef66b2bacfcdcfdf990a4f07 +size 33587200 diff --git a/params_shard_291.bin b/params_shard_291.bin new file mode 100644 index 0000000000000000000000000000000000000000..b4cacf42af87f238ac08881a5ca7be60ab4af263 --- /dev/null +++ b/params_shard_291.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec431460e5e38acae5555afd8a470ddcc0404f8292a816188252c26088bd2852 +size 26869760 diff --git a/params_shard_292.bin b/params_shard_292.bin new file mode 100644 index 0000000000000000000000000000000000000000..5abd5d9d892069ad11cf8c2b46fecfeecb24c9fa --- /dev/null +++ b/params_shard_292.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2a0e9bf532d40433ac273174151e33ddd54f1dcb31f947051116aac439ae72f +size 93978624 diff --git a/params_shard_293.bin b/params_shard_293.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a15f93db45ac2c724fcd35cdbe027957d416122 --- /dev/null +++ b/params_shard_293.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8243ad24cc681c56451ba5f5e4a7012ba3d2821c37120f04928a3adb62a7dae6 +size 26894336 diff --git a/params_shard_294.bin b/params_shard_294.bin new file mode 100644 index 0000000000000000000000000000000000000000..496a0ab33761cd24e2ab48f5ebbda5c461c281ac --- /dev/null +++ b/params_shard_294.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2dcc06d569dedfc6c8ca5fcdc05381be5b962fae0c278969a70aa5316c40c53 +size 188088320 diff --git a/params_shard_295.bin b/params_shard_295.bin new file mode 100644 index 0000000000000000000000000000000000000000..069768173223f1c6239cdba7305f1a2be82d2900 --- /dev/null +++ b/params_shard_295.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa4cc5d965701f427f0aac8cd3a33dec4795d15aec4dbc4df8c334c602d034cd +size 23511040 diff --git a/params_shard_296.bin b/params_shard_296.bin new file mode 100644 index 0000000000000000000000000000000000000000..1266ed6526290ed1111b10ea1941a6f700fd9388 --- /dev/null +++ b/params_shard_296.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9061f3897c7bf36b6f9a47b3a1da42b7168ff4e695043265f08626e1f4b2eef9 +size 93978624 diff --git a/params_shard_297.bin b/params_shard_297.bin new file mode 100644 index 0000000000000000000000000000000000000000..9ea9a8259aac68835cc42b72546744fab8535694 --- /dev/null +++ b/params_shard_297.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b256966d2dfdc3c1cadbbe0d61db1d66321745cb0f724d03af0394856c208b +size 188088320 diff --git a/params_shard_298.bin b/params_shard_298.bin new file mode 100644 index 0000000000000000000000000000000000000000..9090998c8b6cb70aba9081594b974927d94ee429 --- /dev/null +++ b/params_shard_298.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5df46c3431a7d733001eeccd56cfa382f024126382f21056bc41b3199eabc198 +size 23511040 diff --git a/params_shard_299.bin b/params_shard_299.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1434a3cc19aaa9cb0e83f1f1202d7e956dbb1f6 --- /dev/null +++ b/params_shard_299.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f473d64ee273e5ad0aeb9b6384d7d7a27a858e291ba4b9997b03326e17c2a91 +size 33587200 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c05bae5b29b2656df01f5fe098a11d4df9eccf7 --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb903802039c3d76c6ff3229e1a3365787523be3eb879c6d5b13b5c111eb60ef +size 93978624 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..6f5676d35fd32948bdebc4ea760e0ddc1513e5a0 --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7490098f9b9a373c6b69517cc9e1c1fa2ffae44d7488ebb91ab4806d8c0a0bc +size 23511040 diff --git a/params_shard_300.bin b/params_shard_300.bin new file mode 100644 index 0000000000000000000000000000000000000000..b611f5a187f2c063690cbda51db9e7a9267eaee3 --- /dev/null +++ b/params_shard_300.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8033e1aa530a8073ca64f38455f802d4c3939ac55724031b8b9d5c46b3b064fc +size 26869760 diff --git a/params_shard_301.bin b/params_shard_301.bin new file mode 100644 index 0000000000000000000000000000000000000000..d3fa2287752551a071758a079dc8f3b62966494f --- /dev/null +++ b/params_shard_301.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee10482868589f7f0de70cf7092049e09f6dd3498295eea50aa4bbdbcbf5eff +size 93978624 diff --git a/params_shard_302.bin b/params_shard_302.bin new file mode 100644 index 0000000000000000000000000000000000000000..0da43264bb69e8bdcf190b16942578cbb60c3736 --- /dev/null +++ b/params_shard_302.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baf92d0ab52ba5778a5cf2a86c15804eb728cda6524689cbbe4f8fd059738d85 +size 31100928 diff --git a/params_shard_303.bin b/params_shard_303.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c50db1bf332ef307d1c20f116bef4fdb15494b7 --- /dev/null +++ b/params_shard_303.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a25149ec17beb10f340ba35211e7dd24d9b6b80e2759c3f7f6fcbbf99ccdc14c +size 188088320 diff --git a/params_shard_304.bin b/params_shard_304.bin new file mode 100644 index 0000000000000000000000000000000000000000..1fcba844fd215103bc3da33d8fedb62ad3a0b9e1 --- /dev/null +++ b/params_shard_304.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:459638db3b5186a5822ddadb37bdefa9aff1575a0e2ac08be30f79c85ee96faa +size 23511040 diff --git a/params_shard_305.bin b/params_shard_305.bin new file mode 100644 index 0000000000000000000000000000000000000000..71c535bc899b730c7499fa3e702b40d28636611d --- /dev/null +++ b/params_shard_305.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654302e145388854c08aff3c3760f243bb3ac2a6f2c84b5ecccb9f5f30ccd7df +size 33587200 diff --git a/params_shard_306.bin b/params_shard_306.bin new file mode 100644 index 0000000000000000000000000000000000000000..a4ad7e7df99f4d0d26b76b4df3483aebd8a49912 --- /dev/null +++ b/params_shard_306.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f2f48ca179ab3a64066e287926b7905b43a11759043e83d67f7903abd8cd17 +size 26869760 diff --git a/params_shard_307.bin b/params_shard_307.bin new file mode 100644 index 0000000000000000000000000000000000000000..6b3f2c82f793f973b30f1d197d2be1186594e24d --- /dev/null +++ b/params_shard_307.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8afb4e0bd09adeaae3f001ecbd0846c49f2ec7dbde19be45e95ab7395e673b22 +size 93978624 diff --git a/params_shard_308.bin b/params_shard_308.bin new file mode 100644 index 0000000000000000000000000000000000000000..47584bd0d4f9755307978cc66e4d1c9a09708655 --- /dev/null +++ b/params_shard_308.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ecaa443b3fe8baa6ac97d0b40d53f331e1f03808cd43086f42067d4915053a +size 188088320 diff --git a/params_shard_309.bin b/params_shard_309.bin new file mode 100644 index 0000000000000000000000000000000000000000..507243d07b50218e303e8e272d5f769d7ce5805b --- /dev/null +++ b/params_shard_309.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60bb23ea2c9ca1490eb1b08b65cc28c4f0c90f0454adb93b1912cf4dcd07a853 +size 23511040 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d47f6b736c1e1e5ec77ce7941e6a4f2dddd6b19 --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421a9dc7a7f198abbc900cd04502d0811fcb5239bef6f21c87f61b670d6f9408 +size 33587200 diff --git a/params_shard_310.bin b/params_shard_310.bin new file mode 100644 index 0000000000000000000000000000000000000000..e711135fc4e386df00c0cbfa51da82ddb793f00e --- /dev/null +++ b/params_shard_310.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762256354568acfcab2d91b7193bf98192e80c45563c64e9dcd473716e31e7de +size 33587200 diff --git a/params_shard_311.bin b/params_shard_311.bin new file mode 100644 index 0000000000000000000000000000000000000000..db5406a53b91db9075dd8b62958fd13de967f20b --- /dev/null +++ b/params_shard_311.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21fa5ae2e0541e581c6cd61becd688e1244da37145b6282c8a7f28a627fb92d5 +size 31117312 diff --git a/params_shard_312.bin b/params_shard_312.bin new file mode 100644 index 0000000000000000000000000000000000000000..d129d8b5091e52afbc6ddde526592e21b1b14b60 --- /dev/null +++ b/params_shard_312.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7491b21073445d4f9ee79d3d9d63d21d8b65a99dc95331b5e50694bd95dabe3 +size 31068160 diff --git a/params_shard_313.bin b/params_shard_313.bin new file mode 100644 index 0000000000000000000000000000000000000000..96f41b8278545900972b50e2161687069419bf75 --- /dev/null +++ b/params_shard_313.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a034f38904e490878b65bc4c6be47c310ac21a7446f86d603cf1208a421e7330 +size 93978624 diff --git a/params_shard_314.bin b/params_shard_314.bin new file mode 100644 index 0000000000000000000000000000000000000000..50c1bcacc2923e72b8e926fa124abf9305fcb34c --- /dev/null +++ b/params_shard_314.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66aab5de186230c5c003448f9b1a20d0f6694069e69a69b81033bc06eb530c81 +size 188088320 diff --git a/params_shard_315.bin b/params_shard_315.bin new file mode 100644 index 0000000000000000000000000000000000000000..1e1eb2f4d5f6f9880b908da76ec7dd252f8dbf32 --- /dev/null +++ b/params_shard_315.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:449408a5df7b3253cc90001ba1e4fe02ecd3f9bbf2c8f98a425a5eb415ddfd5e +size 23511040 diff --git a/params_shard_316.bin b/params_shard_316.bin new file mode 100644 index 0000000000000000000000000000000000000000..55b65908a04d2dd5d609e2006f5e5609ebd0934f --- /dev/null +++ b/params_shard_316.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adada7639c4018f0bafcc57bf8cd43fc7e540020da0ffb7ba07d063a95488373 +size 33587200 diff --git a/params_shard_317.bin b/params_shard_317.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ea8a5823d15e78c2a586c3266fbaef80a0d8a42 --- /dev/null +++ b/params_shard_317.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7a5147917f6905899a4ed5b159fa0aa813f6ee708240d02c345c83cca4d50c3 +size 26869760 diff --git a/params_shard_318.bin b/params_shard_318.bin new file mode 100644 index 0000000000000000000000000000000000000000..310a6e42e1bc7c591f9b5972ba0cbf887cbfd357 --- /dev/null +++ b/params_shard_318.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f670a33efa7619890f0d16bf31b9e28edbcc78932ac6abf3524d371cc26b2be +size 188088320 diff --git a/params_shard_319.bin b/params_shard_319.bin new file mode 100644 index 0000000000000000000000000000000000000000..491a7e2a7f277f860cc43aa47938c9e0d7eec4e7 --- /dev/null +++ b/params_shard_319.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b530c900f74a0191121e2e0bc35767460f619b4749b52b1679fc1039736609b +size 23511040 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..2627d2260f0c4e84ba209fd7cad44556047e8090 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045a416c75db9a1d71895da54d1b5a13389027f723adf2ea2c011e68f95bf45b +size 26869760 diff --git a/params_shard_320.bin b/params_shard_320.bin new file mode 100644 index 0000000000000000000000000000000000000000..e317761222931ae14f213950492c0f796739f481 --- /dev/null +++ b/params_shard_320.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c12d5892a71b6de2b020a0b2b59a7e70c6ff9b06ff3b53c969a49976b91ccae2 +size 33587200 diff --git a/params_shard_321.bin b/params_shard_321.bin new file mode 100644 index 0000000000000000000000000000000000000000..6890b03a2aa710fb57239d3cfc2755a952d4b7e2 --- /dev/null +++ b/params_shard_321.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10e74dbb7d993c4ed156be1b6e52d76d3428c1492818f47d1c641ed8637bf5a +size 26869760 diff --git a/params_shard_322.bin b/params_shard_322.bin new file mode 100644 index 0000000000000000000000000000000000000000..fbda4c5d7c3fd2e2a75f02a2e1f8ef4de5efdce6 --- /dev/null +++ b/params_shard_322.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c68509c7c274b0a792be1ece7840e9d242e39aa86b5c0dcb3711ebf2399eeea +size 93978624 diff --git a/params_shard_323.bin b/params_shard_323.bin new file mode 100644 index 0000000000000000000000000000000000000000..05d44b1f9a27a14ab45da582eed3f45d9ec9e150 --- /dev/null +++ b/params_shard_323.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3e118cd5bbdec23344bb70c2aad87d4b987bdd378f829e8d0079f958e2310c +size 30269440 diff --git a/params_shard_324.bin b/params_shard_324.bin new file mode 100644 index 0000000000000000000000000000000000000000..97cd66aad6e5fff6bdf1c16276805da8b26abc3f --- /dev/null +++ b/params_shard_324.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef628ead4765e17bb3cb1168deedc0d9948b374740be9e61d0fe6cebce22928 +size 93978624 diff --git a/params_shard_325.bin b/params_shard_325.bin new file mode 100644 index 0000000000000000000000000000000000000000..95199559ac279fb4d51b8f544999f2653ae88de2 --- /dev/null +++ b/params_shard_325.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65578c43ca7a2ac2bca91c15c020098dca5244ea57f7d02ef2ab15b33f2117ed +size 188088320 diff --git a/params_shard_326.bin b/params_shard_326.bin new file mode 100644 index 0000000000000000000000000000000000000000..b05e0ca96b00eee0995ded8a81fac92783fa4e20 --- /dev/null +++ b/params_shard_326.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:395522fd7479e5965c91ea78b464046ae3c4b6f66c02a0ecef09353809eb562c +size 23511040 diff --git a/params_shard_327.bin b/params_shard_327.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a26ccdde681db15f4af099c49a3fd0f20461b7f --- /dev/null +++ b/params_shard_327.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f929f6e23341342e74c2dce6d4f5df69b31205b0d07a805bba5f002058e5ae1 +size 33587200 diff --git a/params_shard_328.bin b/params_shard_328.bin new file mode 100644 index 0000000000000000000000000000000000000000..5bff1964011204ad320013b507032e13b54d5c57 --- /dev/null +++ b/params_shard_328.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75cb6c5a85ab6906b31d791f552f6376036a0e94ba31644c6a3bcaaf4deabe9e +size 26869760 diff --git a/params_shard_329.bin b/params_shard_329.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b17caaf79081f9bb410c6cb565c57b498fe150d --- /dev/null +++ b/params_shard_329.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbf86a34ee5e38d4b047810600953bce83b6267cf2c6e93cfd922ff3821b7f8d +size 93978624 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..3eb8b2e043cce729c4feddca26c09c18093fb29b --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd0dcc11ecb5e7adfc327df4a832b4558e9529f9c0c6f658facb927853d14207 +size 33587200 diff --git a/params_shard_330.bin b/params_shard_330.bin new file mode 100644 index 0000000000000000000000000000000000000000..c07079f5f10842e2843db8bd61d2184230a3add3 --- /dev/null +++ b/params_shard_330.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49df0797922c249b477ab0ccf8379b57ea0b322d9529105f460b86ebd561d8ae +size 31117312 diff --git a/params_shard_331.bin b/params_shard_331.bin new file mode 100644 index 0000000000000000000000000000000000000000..355c03456b04b5fb4e1add9c89340beeea4c873c --- /dev/null +++ b/params_shard_331.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0e061b6a146d1511a67687af74989f61450d1dea7ab077b465a31cf3914d05 +size 188088320 diff --git a/params_shard_332.bin b/params_shard_332.bin new file mode 100644 index 0000000000000000000000000000000000000000..8a347100141651fbf10b7fb46d73e87cde5265fb --- /dev/null +++ b/params_shard_332.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff592f4f133dc89736364c6b0556e68cfbdd278221cf409563f7ee8bda124714 +size 23511040 diff --git a/params_shard_333.bin b/params_shard_333.bin new file mode 100644 index 0000000000000000000000000000000000000000..ada2ae22173ae673ccdb49841756fa1da95f5d9a --- /dev/null +++ b/params_shard_333.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd0de633a4d965cfec419c462b4355e3a6aaca8a131549f3f6f74e15400f6a2 +size 33587200 diff --git a/params_shard_334.bin b/params_shard_334.bin new file mode 100644 index 0000000000000000000000000000000000000000..580dacf970bd691e34d643d0d8c8372949f5ce8f --- /dev/null +++ b/params_shard_334.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89625b69974600c7a2f53df79ea20e9cfede8f286e9e444a2902ca5e43e5f4f9 +size 26869760 diff --git a/params_shard_335.bin b/params_shard_335.bin new file mode 100644 index 0000000000000000000000000000000000000000..c3b3c15e77fd22d6231f3a76db4650c501d39d65 --- /dev/null +++ b/params_shard_335.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01a84c732ca36e1f3a5a1cb2bb32785fd0aaa01cd35b6d1fe0c965f75f3f6af1 +size 33587200 diff --git a/params_shard_336.bin b/params_shard_336.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a990a50212cec2bcc042be1533dde027e3b73e5 --- /dev/null +++ b/params_shard_336.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b70dae8f86269f5012dc7e6f224a9f3b6553bbf26385fdf4284e7fb93cd9034 +size 26869760 diff --git a/params_shard_337.bin b/params_shard_337.bin new file mode 100644 index 0000000000000000000000000000000000000000..cba8b618c3f020001ee953bb6b874f8b4dac8280 --- /dev/null +++ b/params_shard_337.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5a5fcf25e11f808ef952ebc961c81d3f8c48b610c447143fe475121968dd52 +size 93978624 diff --git a/params_shard_338.bin b/params_shard_338.bin new file mode 100644 index 0000000000000000000000000000000000000000..b2e1d6fa2e39f902cfa5cb8843643001211678b8 --- /dev/null +++ b/params_shard_338.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b8bb719880c086926ccbceddd1dbc58fbef704fcd56873012e7bd4324ef6937 +size 26927104 diff --git a/params_shard_339.bin b/params_shard_339.bin new file mode 100644 index 0000000000000000000000000000000000000000..fdb03acf806041ac47582a566f7253a9197ff67f --- /dev/null +++ b/params_shard_339.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21cd112faf4271a318fde31df540ecebb0ef316bd50a2d1de5fac4ea7799a627 +size 188088320 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..1a4a2266c0d79d96e41a5b2fb79b7561cd167f82 --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f89f4529d7e173b01f9650251aa376abb89a077859dfc041d9c24c21eca3c26 +size 26869760 diff --git a/params_shard_340.bin b/params_shard_340.bin new file mode 100644 index 0000000000000000000000000000000000000000..8a05d8664a2736e82cad2429a3076008ac3e1f04 --- /dev/null +++ b/params_shard_340.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf09fed54c31359ed85b7cb518a927e9c560dc5e3e2726fb1a4a6a0839a75fc2 +size 23511040 diff --git a/params_shard_341.bin b/params_shard_341.bin new file mode 100644 index 0000000000000000000000000000000000000000..0c73a1b3985f35bfa20887bf2366882a6d845216 --- /dev/null +++ b/params_shard_341.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:252a1c9f4eb82ee3c86d0ca316084efb813364d23d8b9b081604936ce0f0bd3c +size 33587200 diff --git a/params_shard_342.bin b/params_shard_342.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a66ec29fb479ec812191e051e049574c8494330 --- /dev/null +++ b/params_shard_342.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60971b48ef59ff545f63363bd401e1463b4867d68e28133d06ca9c03850678b1 +size 26869760 diff --git a/params_shard_343.bin b/params_shard_343.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba14cdb8c657a6383e57fff8aa5bff08d740135d --- /dev/null +++ b/params_shard_343.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39fcff5feef1f4775aee7a2fff42db2d49fbdbc414a4c6ee826477f6b9a1f5e7 +size 93978624 diff --git a/params_shard_344.bin b/params_shard_344.bin new file mode 100644 index 0000000000000000000000000000000000000000..70417bf38fe80a1084775409d46e89fe06d5c475 --- /dev/null +++ b/params_shard_344.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d50920062373bee6de4b89ad25d065d138b1065e6bd0ea9a23234934f83b42a0 +size 188088320 diff --git a/params_shard_345.bin b/params_shard_345.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b0059650dd9691ee9c59b5971fd2832f7446f12 --- /dev/null +++ b/params_shard_345.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff2502900b914d4e5e4e147fe0feba976cf968d8341a478df4b5700c3ac11f2 +size 23511040 diff --git a/params_shard_346.bin b/params_shard_346.bin new file mode 100644 index 0000000000000000000000000000000000000000..632ffad3587504aa56e2ff66d99674e977d2e14c --- /dev/null +++ b/params_shard_346.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e01472d6d9d25100720fa72a2f5c6b0f8a4b198e8a60a13b57fea6141ab18f4 +size 33587200 diff --git a/params_shard_347.bin b/params_shard_347.bin new file mode 100644 index 0000000000000000000000000000000000000000..3d3df5961f1e16f116d24d470ab1efcc6756b7e0 --- /dev/null +++ b/params_shard_347.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81cc376e65fc5e90b0fd9886192b6109ddfc4dea813b7ce3aca522809ef18ca +size 31100928 diff --git a/params_shard_348.bin b/params_shard_348.bin new file mode 100644 index 0000000000000000000000000000000000000000..42f4083ca7a55686ed7091b8068a5bbf3a79889b --- /dev/null +++ b/params_shard_348.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc3506402a922f55447e9933f120237388b48bbe2a708de6caea42dd1290dba +size 31068160 diff --git a/params_shard_349.bin b/params_shard_349.bin new file mode 100644 index 0000000000000000000000000000000000000000..56448d3f5ab7f9ec9b1e6541486ae38fc47cda80 --- /dev/null +++ b/params_shard_349.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08b4636f93ee765c003685d3d1eab3b9c44654ce693bef34badcb273304591d9 +size 33587200 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..d425bb88aa3b30a46a82789a03cb452417e818c6 --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8420060514ed9530cd90647eb74af3a69864ca8184a4fcade01e5d8bb38c12 +size 93978624 diff --git a/params_shard_350.bin b/params_shard_350.bin new file mode 100644 index 0000000000000000000000000000000000000000..ae4af5d5560f4bd8cf9e1e04f3406d9fd3560328 --- /dev/null +++ b/params_shard_350.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa062548f1277e79ae52d0cb545f0c1881b1f51c3ae0d6ffcbe5e47e614d8309 +size 26869760 diff --git a/params_shard_351.bin b/params_shard_351.bin new file mode 100644 index 0000000000000000000000000000000000000000..de83288e0608d42088040e401d9f7693f78c8138 --- /dev/null +++ b/params_shard_351.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76279c1c0c2184971d5407d9a5ec676b18fe9dad10bf0a2911b7a130aa1a0ad0 +size 93978624 diff --git a/params_shard_352.bin b/params_shard_352.bin new file mode 100644 index 0000000000000000000000000000000000000000..41a9f40f47be6f18a5f51c352b8f4e7c665e97eb --- /dev/null +++ b/params_shard_352.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:237cecb95cd46a045968545c29f4326bbb54432a289c8b71e6be2cc4d2ebe577 +size 188088320 diff --git a/params_shard_353.bin b/params_shard_353.bin new file mode 100644 index 0000000000000000000000000000000000000000..988e5ae00d762a4880115077818798afd906c042 --- /dev/null +++ b/params_shard_353.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:047df59166fcd571d83751849d21658ca6cbf376fbbc4351f4bc0ef385310a37 +size 23511040 diff --git a/params_shard_354.bin b/params_shard_354.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e4703334f6cce8ad4f2dd03f89c5fa2629962e3 --- /dev/null +++ b/params_shard_354.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49f4c9edcc8b044b66641c03dbcbeb63023bb14d2b0fb2cee8bdfa7173e8b8c +size 93978624 diff --git a/params_shard_355.bin b/params_shard_355.bin new file mode 100644 index 0000000000000000000000000000000000000000..e822172543fd83f384096a6e9cc80cb879649712 --- /dev/null +++ b/params_shard_355.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f103564a6f8f7d7f7859cd1b67ad18a0692263368938c200791f34ca575593f1 +size 22712320 diff --git a/params_shard_356.bin b/params_shard_356.bin new file mode 100644 index 0000000000000000000000000000000000000000..56c43a443b16553f92d5f261add8eb4bfb819899 --- /dev/null +++ b/params_shard_356.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e3743892a9e3689c4bfc59e96fcef980e1acb15a2f0d2af2ea54b4c268550c +size 188088320 diff --git a/params_shard_357.bin b/params_shard_357.bin new file mode 100644 index 0000000000000000000000000000000000000000..ce963e6e71d420fc6bbd5b16208f40afba3ea05c --- /dev/null +++ b/params_shard_357.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd73e2a6052d16d9ff9076869302c9982a7bf237f6d22ddfa3f7c8eeae98483 +size 23511040 diff --git a/params_shard_358.bin b/params_shard_358.bin new file mode 100644 index 0000000000000000000000000000000000000000..11b9f35a29121b972ea45aa146ac8e6305becd3a --- /dev/null +++ b/params_shard_358.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d634cd227841e1a5b6d61406a1015e85a338eca9e3dc9753ed2ff859779e0ce2 +size 33587200 diff --git a/params_shard_359.bin b/params_shard_359.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ce4d0c3cbecf0c0ceaed14317bb519c6fdc0977 --- /dev/null +++ b/params_shard_359.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9276cd848ccf27fd97da26d50b6f5cd2ddbbda17bfedfa3a4848d8f52b201856 +size 26869760 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..c554ec943d1786bebd51d913bdc2bb709f79774f --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f0b6ec09143eac2acbd4d0b0544518188179f7cf827a0565e3aba2722514a0 +size 30269440 diff --git a/params_shard_360.bin b/params_shard_360.bin new file mode 100644 index 0000000000000000000000000000000000000000..1689488ad5fa3f55daac0cf368b487a2cb3c1b47 --- /dev/null +++ b/params_shard_360.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d194ca5703750cee9e82c5fbf534ac2b591e47f16824bd842a04146912061c9e +size 93978624 diff --git a/params_shard_361.bin b/params_shard_361.bin new file mode 100644 index 0000000000000000000000000000000000000000..1850d257bc42086bcac79dddc5f65af2ec4a9481 --- /dev/null +++ b/params_shard_361.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a781ff9bb418cd50c89b85c0724eebab1186da3245757e16ac0a17af51d31669 +size 188088320 diff --git a/params_shard_362.bin b/params_shard_362.bin new file mode 100644 index 0000000000000000000000000000000000000000..cbac45f0b2140a307a1450be7ea7f20e07b3d58c --- /dev/null +++ b/params_shard_362.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa2c50c35bd5855ad0cefcc794c76cf58bd099d1da8fb839965eddb43d756674 +size 23511040 diff --git a/params_shard_363.bin b/params_shard_363.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c42eb9618465491bf64021c5c713bd8fafaf7b2 --- /dev/null +++ b/params_shard_363.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e59ae3e1e498dfc031ffebccf9f5e9aaa9ed8066054771d5f7e7ff2ab7b0cea +size 33587200 diff --git a/params_shard_364.bin b/params_shard_364.bin new file mode 100644 index 0000000000000000000000000000000000000000..7642cceac7105373ca4c88cd6111c44847f85431 --- /dev/null +++ b/params_shard_364.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eade6386588cfa6caccfca72578213f7f6f2177e1abceb5ceeac9d6b78d8d377 +size 31068160 diff --git a/params_shard_365.bin b/params_shard_365.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a7f1b3676b3b042e43a99eefbf91abb01f81c81 --- /dev/null +++ b/params_shard_365.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90dc4296754f03a6ab6081cab59afe9ca16188ce106b00b01885797ea22bc0e4 +size 31068160 diff --git a/params_shard_366.bin b/params_shard_366.bin new file mode 100644 index 0000000000000000000000000000000000000000..a80fbd36605f51d05b9ec449a6726a846fe3fdd7 --- /dev/null +++ b/params_shard_366.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6066b02dee226425c4162a4e641d032f6beaec46fcb852af1530fc13214be1 +size 93978624 diff --git a/params_shard_367.bin b/params_shard_367.bin new file mode 100644 index 0000000000000000000000000000000000000000..8d5cd1a5d64cc6f0ebd1dd78c2c74f00db0d1de9 --- /dev/null +++ b/params_shard_367.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b501e4de25448e6cfe451a52d0a0172132a248a7759a6f0af7e9c85f4d8029 +size 188088320 diff --git a/params_shard_368.bin b/params_shard_368.bin new file mode 100644 index 0000000000000000000000000000000000000000..6861a3a07a03680e9fe347b378cf390ccf3f648c --- /dev/null +++ b/params_shard_368.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f06e715cedc78480026d8bcdf3f1ed158c2803e7f89d420aee674d28c3053e1 +size 23511040 diff --git a/params_shard_369.bin b/params_shard_369.bin new file mode 100644 index 0000000000000000000000000000000000000000..0536ecee6927f9ed4c7b3639f7b7c563e2f6380e --- /dev/null +++ b/params_shard_369.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b6db3e99325ed6bf41534908a57183fcb862631b938504311913a0ace9b572 +size 33587200 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..81a5278dfd4e6375053642bab751db2e46459171 --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e242ec39c9fd4eef831454ac2f3773cbf38a8c0ffac1d7ec2a2857c57b0056b7 +size 188088320 diff --git a/params_shard_370.bin b/params_shard_370.bin new file mode 100644 index 0000000000000000000000000000000000000000..55837cb4b1efb44b6f9caf0d436e0f2e2f7482a8 --- /dev/null +++ b/params_shard_370.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f256790992c80d8b0c1b737db98929828da573738e24efe8e5e6e080d960e26 +size 26869760 diff --git a/params_shard_371.bin b/params_shard_371.bin new file mode 100644 index 0000000000000000000000000000000000000000..422cc7dafff4f5a2d309f94b6e5ca40a6f060d2b --- /dev/null +++ b/params_shard_371.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:996b11084dd10c9a600c4113a4fd38bdbb229b09bace051eb54c69d57257dd11 +size 93978624 diff --git a/params_shard_372.bin b/params_shard_372.bin new file mode 100644 index 0000000000000000000000000000000000000000..b5ea526f8ca6e4dce0b7129f82d38fa7fd2e716c --- /dev/null +++ b/params_shard_372.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5792e843f3b474b60a6e25bc955c1cd422afc1a4328ce747593ca90c7cb0d97d +size 22745088 diff --git a/params_shard_373.bin b/params_shard_373.bin new file mode 100644 index 0000000000000000000000000000000000000000..da5a7e9160dd1b91cddf382c00465bc9a139cc5e --- /dev/null +++ b/params_shard_373.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a66d0fb66366e578584c840d3f3df9d815c1c2ab77490dc8b0ed964df9d7aeff +size 188088320 diff --git a/params_shard_374.bin b/params_shard_374.bin new file mode 100644 index 0000000000000000000000000000000000000000..3de289306687b2264f5564d7ac78cd3b85917b7a --- /dev/null +++ b/params_shard_374.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d615a694ad69a276ddcef72a62457d496977f89fcafe8fd90b9f9637f8da2e +size 23511040 diff --git a/params_shard_375.bin b/params_shard_375.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8e38758e031335fd0f6f03a761a2a3776ea2b1a --- /dev/null +++ b/params_shard_375.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eafb690756056f8cf43aba93344a36404d7a7ab11354138ab2cc254a0ee7baf +size 33587200 diff --git a/params_shard_376.bin b/params_shard_376.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb64a177ffc1193e45c2ee0158f8882b0a918512 --- /dev/null +++ b/params_shard_376.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1112df4556119d97ace317a8779340fba0b6324a05734ee1ff71af909be760bd +size 26869760 diff --git a/params_shard_377.bin b/params_shard_377.bin new file mode 100644 index 0000000000000000000000000000000000000000..17a8590ec1895df604510713739f1514d9582888 --- /dev/null +++ b/params_shard_377.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:459a2e75a1e8636c85e5c3502c36d973f824849ebf5cdf3f44104ddc68f24e82 +size 188088320 diff --git a/params_shard_378.bin b/params_shard_378.bin new file mode 100644 index 0000000000000000000000000000000000000000..48d6f340e5f6a123caf879234b204b0b52e5927e --- /dev/null +++ b/params_shard_378.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77cc43c18db0baec288efe07053353b2c74fe32ed47fbb489ab3439e3ab99761 +size 23511040 diff --git a/params_shard_379.bin b/params_shard_379.bin new file mode 100644 index 0000000000000000000000000000000000000000..2a01483de77ef2481d1939e5a4194fb1018d845b --- /dev/null +++ b/params_shard_379.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d03412b7c8306796d9db18a14608e151f240a4d6451dc5e6ab6046d4c8dfa585 +size 33587200 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..aa8cac738a0a5a8b738809ca4e7b197c8a34a7cf --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba30c54c5ff5a097f1674460df99a05dd83ad330c60768ee9a66d3016dda135e +size 23511040 diff --git a/params_shard_380.bin b/params_shard_380.bin new file mode 100644 index 0000000000000000000000000000000000000000..7f4e032e486260c6293a368ca6bdcecfc2ae1f50 --- /dev/null +++ b/params_shard_380.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69373aa48b727e1fb4716b49dc5373b82daa62030b9bff09cf7cbedd8b4a3c07 +size 26869760 diff --git a/params_shard_381.bin b/params_shard_381.bin new file mode 100644 index 0000000000000000000000000000000000000000..c11beb2c78d71294b0d8df20922802a2bbf2fa84 --- /dev/null +++ b/params_shard_381.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6521afd4346d07f76d47203f9161054562cd304f25dbb590b2f83114f01290 +size 93978624 diff --git a/params_shard_382.bin b/params_shard_382.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8acce2f0efe9dbfbeedf477ceb0aa02504d78aa --- /dev/null +++ b/params_shard_382.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c15c1dd1ffbb8d9147d9df7565b20b5faf9ca99d5d44752d13f96477a2f275 +size 26894336 diff --git a/params_shard_383.bin b/params_shard_383.bin new file mode 100644 index 0000000000000000000000000000000000000000..4c393c6afec390a6da8967fe91216d1c9cc7f0ed --- /dev/null +++ b/params_shard_383.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28ac4a302d41d45be93138c4db80a4110d0d65f7d87dab38346e9f71122e7848 +size 93978624 diff --git a/params_shard_384.bin b/params_shard_384.bin new file mode 100644 index 0000000000000000000000000000000000000000..18a92a1af2fddf931944d4a6c6de38c079ffb384 --- /dev/null +++ b/params_shard_384.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d78b6aaddda92ab9f591344cf237ca95c3d1ec7c191fe76c10d3c706e9effb +size 188088320 diff --git a/params_shard_385.bin b/params_shard_385.bin new file mode 100644 index 0000000000000000000000000000000000000000..aff2e89214fc89cecc918c73eec3cbe305dd335e --- /dev/null +++ b/params_shard_385.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d6aec5650d417a0731fa566c2fc88a66f99e0dc716bd9adaf7739a4f5302b7 +size 23511040 diff --git a/params_shard_386.bin b/params_shard_386.bin new file mode 100644 index 0000000000000000000000000000000000000000..8103cd160f9ddf146fa3f73d07bb732d133443f9 --- /dev/null +++ b/params_shard_386.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:639d4e17e351adb2cc933d598e556d2a3999c9be70b08f63d760e00d61e1bf61 +size 33587200 diff --git a/params_shard_387.bin b/params_shard_387.bin new file mode 100644 index 0000000000000000000000000000000000000000..bc72c235036e1f445ddd290e0bddee3ff7795a34 --- /dev/null +++ b/params_shard_387.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5683d0f5c62ca36f61424fa44ac11981d77954eaa8fd79e252bc7fc4721e7ed2 +size 26869760 diff --git a/params_shard_388.bin b/params_shard_388.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ea088114b22623c2585adeed584875fc67add3f --- /dev/null +++ b/params_shard_388.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2d207ac19bfbcde76887b870bb240b8e155d1e5a5193c6ad74e94a3c0cd9d7 +size 93978624 diff --git a/params_shard_389.bin b/params_shard_389.bin new file mode 100644 index 0000000000000000000000000000000000000000..05fbe0ff1f97a40d5285d53486751936c6761c9c --- /dev/null +++ b/params_shard_389.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b348a22d291945750057af75d3aa6eed2f42f19c3c53fccf485f1dcf9ee32fd2 +size 31117312 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..1efd4efac02f1771709fe18769125cba904c77cf --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e041ee2b3bbdb2b839f60eaa8332be8dab562d19e96cb2c590bb6f5c66c35482 +size 33587200 diff --git a/params_shard_390.bin b/params_shard_390.bin new file mode 100644 index 0000000000000000000000000000000000000000..69bc74ff537eaed2c01d58e07494aa3d5ffe1c46 --- /dev/null +++ b/params_shard_390.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8b89a65db524b1b1066597fee950a25f73ac9c1e7a2bcdd3c8a68cefc1035da +size 188088320 diff --git a/params_shard_391.bin b/params_shard_391.bin new file mode 100644 index 0000000000000000000000000000000000000000..46960e03c8b0c256c75d0c1da7bdde85c5c055ea --- /dev/null +++ b/params_shard_391.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f712ff93511d6d27fb21ca1582a2fbc18f9149c764e5d7e734786c2d2f8edb7c +size 23511040 diff --git a/params_shard_392.bin b/params_shard_392.bin new file mode 100644 index 0000000000000000000000000000000000000000..b14a5e7dc2a6efddd2c191abde1816a619471d83 --- /dev/null +++ b/params_shard_392.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa1a21a50272dc30ca433185f91fbfb3776891375ce51f671312e2bf9437b4c6 +size 33587200 diff --git a/params_shard_393.bin b/params_shard_393.bin new file mode 100644 index 0000000000000000000000000000000000000000..16f34710dda20da622cb88bac76f5ae7e8cffbd1 --- /dev/null +++ b/params_shard_393.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11ecd03527e500eb32c8d5f01d41d3c46908a5b21ee9a9b53c0e980b54bfa8db +size 26869760 diff --git a/params_shard_394.bin b/params_shard_394.bin new file mode 100644 index 0000000000000000000000000000000000000000..bbe298f756808382ec23ec292d88bdc8c89d5932 --- /dev/null +++ b/params_shard_394.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e3946faf2e07d58422baaa54218e63a54241618c3142e1ed29f0f4f84f1a68 +size 33587200 diff --git a/params_shard_395.bin b/params_shard_395.bin new file mode 100644 index 0000000000000000000000000000000000000000..e5651c46153538ff4e286272cdc68a8fb56da6ae --- /dev/null +++ b/params_shard_395.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:888a7aa66bf8e51608e634a4ca4b9facdeb752e165b9f7e67833c20e4bee5641 +size 26869760 diff --git a/params_shard_396.bin b/params_shard_396.bin new file mode 100644 index 0000000000000000000000000000000000000000..fb8909e54d9db91b0790011004ea18273c76ceef --- /dev/null +++ b/params_shard_396.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0febe6386ce3d745d2a9f1e1a6ecde1841989e786498fc952637a4de3663c7be +size 93978624 diff --git a/params_shard_397.bin b/params_shard_397.bin new file mode 100644 index 0000000000000000000000000000000000000000..2339bc8b2cdb01e4d1c464250fa4a74746494564 --- /dev/null +++ b/params_shard_397.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89cd76d55c0d4f53a5fd21a93e736869fa90064ec2226aeae332dd5f2a43e592 +size 26894336 diff --git a/params_shard_398.bin b/params_shard_398.bin new file mode 100644 index 0000000000000000000000000000000000000000..abba671891db332da121eff52840a3ced557e136 --- /dev/null +++ b/params_shard_398.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bde41b06960b66552624f5e9a16f012908867c61e4005a184a59b2c8682fe5c +size 188088320 diff --git a/params_shard_399.bin b/params_shard_399.bin new file mode 100644 index 0000000000000000000000000000000000000000..e082750a5a2aab23c060859ddb37c22454b52b76 --- /dev/null +++ b/params_shard_399.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b206851b4aa693ada625420cecfaa4817bb92f118a104eb05eb2d8ae22c788ab +size 23511040 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..3451df20ba6844475289f62110757c12915e8c0c --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69464da60af41403a10b3d366a81d45f73dc7d45b0d91ed2ac29ee156bf04c10 +size 23560192 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..8f6aefb70f60372890cf68b19d54a835be2fac4d --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec0798da0f18ff08a5927fcfc35539eab65d567c2780ae893cea49c49cf7f56 +size 26869760 diff --git a/params_shard_400.bin b/params_shard_400.bin new file mode 100644 index 0000000000000000000000000000000000000000..9219b3c46ca8e958561b316c52215c23cbdd6af1 --- /dev/null +++ b/params_shard_400.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e28beff8e9faae6b30707ee8ed8772021a0909c74c27563ea4976645ff5014d1 +size 93978624 diff --git a/params_shard_401.bin b/params_shard_401.bin new file mode 100644 index 0000000000000000000000000000000000000000..73bb48bc489d6f044fabd44c6ed73179263e433a --- /dev/null +++ b/params_shard_401.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6663bba9f35976cda3a7c7163a8f1f6482fe0bbef79dab4144387733cdc0572d +size 188088320 diff --git a/params_shard_402.bin b/params_shard_402.bin new file mode 100644 index 0000000000000000000000000000000000000000..72425789a75442041d134737cddd309f0d458aaf --- /dev/null +++ b/params_shard_402.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b05e71ab4d6afc6d1fd6447e5d8c0f9cd1e0ab88cf0f3ede722009ea4658bf +size 23511040 diff --git a/params_shard_403.bin b/params_shard_403.bin new file mode 100644 index 0000000000000000000000000000000000000000..58f607837e676a7ee425167db4d1086e0b654986 --- /dev/null +++ b/params_shard_403.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ff9208c5f973681901c11be984588d08fe03d1cfc7bb1eafa4d056fc3afc42 +size 33587200 diff --git a/params_shard_404.bin b/params_shard_404.bin new file mode 100644 index 0000000000000000000000000000000000000000..f84dbcee7bf57b1bfec6c9ecafa701b5e746494a --- /dev/null +++ b/params_shard_404.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6d5b303b3a99a4f8f4eb489a74c13e8b903b99310698c2cbb9f718dcfc81915 +size 26869760 diff --git a/params_shard_405.bin b/params_shard_405.bin new file mode 100644 index 0000000000000000000000000000000000000000..a5a00bcedf6ed5e9cf5e98b4f94b8713ebb22e22 --- /dev/null +++ b/params_shard_405.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:565585324ad569bc9010955aa14a7fe18261a4fe19d9cbff3e63819c8d4819e1 +size 93978624 diff --git a/params_shard_406.bin b/params_shard_406.bin new file mode 100644 index 0000000000000000000000000000000000000000..43c4a78b5d99a74ef7db67a8a437b4351b314875 --- /dev/null +++ b/params_shard_406.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c98da0f0c4b83658f868aacb494785e3fab53c439bc735d6864f46021035aec +size 31100928 diff --git a/params_shard_407.bin b/params_shard_407.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb225b9657198023e5b592d7e09b15d184f6cb95 --- /dev/null +++ b/params_shard_407.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cc88524a0231cff2dece5a7e6ab7e3ed95833a67306975525489ca13d1e3578 +size 188088320 diff --git a/params_shard_408.bin b/params_shard_408.bin new file mode 100644 index 0000000000000000000000000000000000000000..54c378bc56bd29269379f7795d267491eed17bee --- /dev/null +++ b/params_shard_408.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d67dbc14e9884aa95d8af00c43da036302c122fe85ec9c7e0e15ca625dffe436 +size 23511040 diff --git a/params_shard_409.bin b/params_shard_409.bin new file mode 100644 index 0000000000000000000000000000000000000000..b000d3ec4037c188028191f939b9380d489e35f5 --- /dev/null +++ b/params_shard_409.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c408f34d5a16a8111dad207efbcc0ead2364f02b30b0abd2007695ed7823ca6 +size 33587200 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..7af382ae053fb534aa32a7298b894fe95e18a403 --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f659884140a74a633e116922af9d49722b9cc5e7d6d0c20d93a4c125c3da560 +size 93978624 diff --git a/params_shard_410.bin b/params_shard_410.bin new file mode 100644 index 0000000000000000000000000000000000000000..713f77482c80a3da87fd0025c0f058f6600ba050 --- /dev/null +++ b/params_shard_410.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2892acd0a49b016732b93d65e978b560138e3cd19c3c0947e4f9f70392e30b2b +size 26869760 diff --git a/params_shard_411.bin b/params_shard_411.bin new file mode 100644 index 0000000000000000000000000000000000000000..6fc7d8cd988bac5a53a4cf101a93911421134e77 --- /dev/null +++ b/params_shard_411.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f55cf5ee050dd14ee6460fdabd0ac227a23ad7650768aa8c617c3f3266dcfcab +size 93978624 diff --git a/params_shard_412.bin b/params_shard_412.bin new file mode 100644 index 0000000000000000000000000000000000000000..bf67929a34a93e356a7a8b6d3b3186ab5f2215a8 --- /dev/null +++ b/params_shard_412.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd47109f0b703b04366560d42690514475314a3efac616b4fda05cf2e301c2b +size 188088320 diff --git a/params_shard_413.bin b/params_shard_413.bin new file mode 100644 index 0000000000000000000000000000000000000000..26870a08e819080231c2f36aefcfd7519d7d140d --- /dev/null +++ b/params_shard_413.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8b155b3eb5f2be5c2c15ce5fd038a948eef0e5b4ec002df2fa9b759b86f5229 +size 23511040 diff --git a/params_shard_414.bin b/params_shard_414.bin new file mode 100644 index 0000000000000000000000000000000000000000..b80414c238d092c5943fa500b231127b7d6280ea --- /dev/null +++ b/params_shard_414.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b529d321d75889f3ccdaa00ede3265f36fa9d39ba88e042793b31064e2eae3f +size 33587200 diff --git a/params_shard_415.bin b/params_shard_415.bin new file mode 100644 index 0000000000000000000000000000000000000000..d00e8cf6a529887ee8e7ec0eb3f58ff27ae0b7b5 --- /dev/null +++ b/params_shard_415.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5638609b7c850422c554ae006d018d17f817ce88b05267b136045acb4ac24f54 +size 31117312 diff --git a/params_shard_416.bin b/params_shard_416.bin new file mode 100644 index 0000000000000000000000000000000000000000..ceeb605bd6e07f592e62fe9cfb21546cdffa6c4d --- /dev/null +++ b/params_shard_416.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2dafe4ce0fe1e5963f844dee2f1f02d90bff6f5bb38f9d7f12774273f2d5c54 +size 31068160 diff --git a/params_shard_417.bin b/params_shard_417.bin new file mode 100644 index 0000000000000000000000000000000000000000..48689497cbb4aaa2267501e08b004955ea586368 --- /dev/null +++ b/params_shard_417.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30afd9ab0ae3d7ac4ba0e37b73427a273f0a506660a49ed5ad939d2dc84d58e4 +size 93978624 diff --git a/params_shard_418.bin b/params_shard_418.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5c5313f396f9ab5e8fadeeaed15de004811905b --- /dev/null +++ b/params_shard_418.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:853bc61e9a63b4b71ef014cc00e5ee15dab756134f4e8b72c2f144a51572dec9 +size 188088320 diff --git a/params_shard_419.bin b/params_shard_419.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5278f69f86ad126e4510daf45f2dd0572f8afc1 --- /dev/null +++ b/params_shard_419.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc3170c8b0875a487421f65cf2e90882749d02ef4d71db80a4b1e06391927091 +size 23511040 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..f60c2fcae04d4a7c4ffff262504de982fce7ce1f --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd7e8e3ca08ad2889f88c6fe275d24d3fa9fe961b309f1076866c923e61f5ea +size 188088320 diff --git a/params_shard_420.bin b/params_shard_420.bin new file mode 100644 index 0000000000000000000000000000000000000000..74be039773e82fc65d31582fdbfbb5dc2754ca37 --- /dev/null +++ b/params_shard_420.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a49f3433edc766c6b8bb110a53d96aa00136218b7f0d22092b7931dc012a6804 +size 33587200 diff --git a/params_shard_421.bin b/params_shard_421.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ed3f5c94b9545ff8474f93000ea7975a624fa97 --- /dev/null +++ b/params_shard_421.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0acdf3919212ac1ea707ca9bab5aff4cb3bf4e0cd0c5405c91b31d369d0826c +size 26869760 diff --git a/params_shard_422.bin b/params_shard_422.bin new file mode 100644 index 0000000000000000000000000000000000000000..7ae56e1ee7042a18e5fd463f37b86f752aa14784 --- /dev/null +++ b/params_shard_422.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3bb909d1fff27c8b02bb5eb26ecdf58f45b53de3f526b606d7cdbe1dac4a157 +size 188088320 diff --git a/params_shard_423.bin b/params_shard_423.bin new file mode 100644 index 0000000000000000000000000000000000000000..3bad3d96cab3b67dad9a5097b6b19c5f8b3ad0a2 --- /dev/null +++ b/params_shard_423.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2255c0c6642a63fa327b5f4cd51ab4966b1c214cee9955f7c4fa3ec38a910965 +size 23511040 diff --git a/params_shard_424.bin b/params_shard_424.bin new file mode 100644 index 0000000000000000000000000000000000000000..f4395cb4e4dbc0c96856ddc9cad80daffdff9e15 --- /dev/null +++ b/params_shard_424.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63395af714b1af9b4e64764011a5461e7e9221e7b0bfb65000858b1c25e9c261 +size 33587200 diff --git a/params_shard_425.bin b/params_shard_425.bin new file mode 100644 index 0000000000000000000000000000000000000000..6de5d1a408b070c78c1fa32348b2fcb37668932b --- /dev/null +++ b/params_shard_425.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08d613c9d98cae9c64eee71fe42b830d5285848addb89bcdd578274f0effdf9 +size 26869760 diff --git a/params_shard_426.bin b/params_shard_426.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab9a9984ff65e40b7f048f874e5517facc6844c3 --- /dev/null +++ b/params_shard_426.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f2348b094dbdda383dfa7bcd8ecec63575f696cfb500ffc48a2aca9125a5d9 +size 93978624 diff --git a/params_shard_427.bin b/params_shard_427.bin new file mode 100644 index 0000000000000000000000000000000000000000..688ee081e485b2b28c86858d7235a5cd68ec7c7b --- /dev/null +++ b/params_shard_427.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917844ed2ad7c725294c888875e82092558dbb789e5ebefe21059863a15a5f67 +size 30269440 diff --git a/params_shard_428.bin b/params_shard_428.bin new file mode 100644 index 0000000000000000000000000000000000000000..539c5fee7fd8f1b068efedea05ef8d94bdd089bd --- /dev/null +++ b/params_shard_428.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b7f454e1c0b84865b265768bcec5a4b678db440b5b1612044bcb4ef8945a17a +size 93978624 diff --git a/params_shard_429.bin b/params_shard_429.bin new file mode 100644 index 0000000000000000000000000000000000000000..4aac8ae6c4fceb867dedfb6b37a095035db3c992 --- /dev/null +++ b/params_shard_429.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e9a91434dfd254498295edb115189e529d45037ca3b22e74e19fa247126638 +size 188088320 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a8df5155b0a481eeeaf5c39d05ed0e8fec8cb83 --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59c283fe6d46961798db6035b00b917184d1bbe4c7fce3a7de74b2253a6beb41 +size 23511040 diff --git a/params_shard_430.bin b/params_shard_430.bin new file mode 100644 index 0000000000000000000000000000000000000000..39a2ab63db3771a4aa91b1badfb862f09847d0f5 --- /dev/null +++ b/params_shard_430.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68d51e586ccb08a33700e4a42693005431daee6b323a8be001d95202a9d9284b +size 23511040 diff --git a/params_shard_431.bin b/params_shard_431.bin new file mode 100644 index 0000000000000000000000000000000000000000..7dc115a430e484bacd138e25052fa69b6b0d5358 --- /dev/null +++ b/params_shard_431.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e434aebd982cb5aefee7c529689cd9c9cc08c41fff9d2649aaca3411c83a6d12 +size 33587200 diff --git a/params_shard_432.bin b/params_shard_432.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb01b7f8600a813196acb277b78a8cd72545b502 --- /dev/null +++ b/params_shard_432.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e793a229dd2642f33cb1c5d1278683da12fd54d8dbe8d9bd8d65eaffee8a8f +size 26869760 diff --git a/params_shard_433.bin b/params_shard_433.bin new file mode 100644 index 0000000000000000000000000000000000000000..2144939eda600982717ebc0871432a3bc5ed6f21 --- /dev/null +++ b/params_shard_433.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30bbe477610f0e4f8339837525e0ea409f0cb4ef0cc9bfe0701459917cb3e925 +size 93978624 diff --git a/params_shard_434.bin b/params_shard_434.bin new file mode 100644 index 0000000000000000000000000000000000000000..f248242c00bbea744fa6b14a4bc7ee286b92e516 --- /dev/null +++ b/params_shard_434.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80cfe19e45a580d8d7e33548b5257e192410f0eda1adf6d79a2055739e2a14fd +size 31117312 diff --git a/params_shard_435.bin b/params_shard_435.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c5fc3b459d8bc25fee7059c05523edf75ed5df1 --- /dev/null +++ b/params_shard_435.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ee514826a391ae9dad0aebc0bb5ddfd2ec0cfe3f86dc220a172a45c0ad257f3 +size 188088320 diff --git a/params_shard_436.bin b/params_shard_436.bin new file mode 100644 index 0000000000000000000000000000000000000000..7b17faf641a6c122a9c6ded44660dad34a6d0625 --- /dev/null +++ b/params_shard_436.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f68f979c356011e34420d5e185b02cbccd07e6271cf4578b667d820912171356 +size 23511040 diff --git a/params_shard_437.bin b/params_shard_437.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6775ecb773729877231044960d4e1b28569afc4 --- /dev/null +++ b/params_shard_437.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b47642128e9405fbe23eea5369d8cd328c880c12ad68006b6430e9e8e62d9097 +size 33587200 diff --git a/params_shard_438.bin b/params_shard_438.bin new file mode 100644 index 0000000000000000000000000000000000000000..75f502f470a5c7a6e819c8fc14872a9aec7cf9ba --- /dev/null +++ b/params_shard_438.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03cf971cc40bdbe6fbe91cd395950969e6072437b1181d4caa67c709195003da +size 26869760 diff --git a/params_shard_439.bin b/params_shard_439.bin new file mode 100644 index 0000000000000000000000000000000000000000..aa3c2936d0c772ba9ddc76aa7ac11db70d70c9d4 --- /dev/null +++ b/params_shard_439.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:752258531c39797c467ba6f3a9c61ebaf5b9ed641e60c925ea50a38650fd11e6 +size 33587200 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..d8d2c2f21974641d3e2db3958919e7c3323d16bb --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c35a0728e0def0a35f9e208f528f352ab509ac34497dfa9e0dc5a8dbed89866 +size 33587200 diff --git a/params_shard_440.bin b/params_shard_440.bin new file mode 100644 index 0000000000000000000000000000000000000000..f9343d9955e01e1050dcbeb766d8110900be9ab3 --- /dev/null +++ b/params_shard_440.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cac88a560cfc6c7e458a458a1ee044ac378d7435989653fd45a99abe58e066cb +size 26869760 diff --git a/params_shard_441.bin b/params_shard_441.bin new file mode 100644 index 0000000000000000000000000000000000000000..387c3b4a1093827fc4ed1ee63dbdca9b641a3013 --- /dev/null +++ b/params_shard_441.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fc12cbb43dd41e93ee1c4be793e0b74f45a1c85dcdddd052a2cad304436f62 +size 93978624 diff --git a/params_shard_442.bin b/params_shard_442.bin new file mode 100644 index 0000000000000000000000000000000000000000..e4d30956e57a520165f0c135886957f4a73f6c7e --- /dev/null +++ b/params_shard_442.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba659f96cd1e75b2f4373ad09b1503d444fbc945d71765449a96f9139468f71a +size 26894336 diff --git a/params_shard_443.bin b/params_shard_443.bin new file mode 100644 index 0000000000000000000000000000000000000000..bf811d2463a794b823a32dc9862f29cda1e754bf --- /dev/null +++ b/params_shard_443.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d2c61b097945d94e2bef0f2280580f604d954ee7d4bc21f46ee411c77cf146 +size 188088320 diff --git a/params_shard_444.bin b/params_shard_444.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d478599fb187a2323b608387095593b69a2be08 --- /dev/null +++ b/params_shard_444.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffab4ee3009fd6fb7178fa63d8e916af947d16f92301dcffb3ec8b288227044d +size 23511040 diff --git a/params_shard_445.bin b/params_shard_445.bin new file mode 100644 index 0000000000000000000000000000000000000000..f16d79f181e18e1008e45aaedd6730996a83b4c2 --- /dev/null +++ b/params_shard_445.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e1fbdcf93e414352e25abdec40de80e6c6406e8bc5c702fb0df3d2e5731a3a +size 93978624 diff --git a/params_shard_446.bin b/params_shard_446.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0bbec2fd1eb30046c5d5abce8c2846f545583a4 --- /dev/null +++ b/params_shard_446.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f8bbdcbf027fb938a2254ba01242a88ae2b69014bc18156c90466813b1c0293 +size 188088320 diff --git a/params_shard_447.bin b/params_shard_447.bin new file mode 100644 index 0000000000000000000000000000000000000000..85b3e6c2e116629029b9dc984b8e10835f5aa60b --- /dev/null +++ b/params_shard_447.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9aad7029e1fb86eddfff28ede35e96f1ca0965d605c0c4a467871810b035dc +size 23511040 diff --git a/params_shard_448.bin b/params_shard_448.bin new file mode 100644 index 0000000000000000000000000000000000000000..91f54768d47410dd2c0f4e02b35f55dfa2ba7294 --- /dev/null +++ b/params_shard_448.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd810723b907fa2ffb205a2a03bb844c70f5ce7386cc935eb5c3a0bf8b19c289 +size 33587200 diff --git a/params_shard_449.bin b/params_shard_449.bin new file mode 100644 index 0000000000000000000000000000000000000000..3214083c1992faa7347e7517018e855130a0f6f8 --- /dev/null +++ b/params_shard_449.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a12911aae01db778e5b4222af0eff6294d31775723d0cfbfdce877559c9e60c5 +size 26869760 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..358134fe127c5a44f987621e2f80e5819596c96e --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c1099ba3802aae36f3d97a86f64dcaf412c97eb9273b1c441849355e0265621 +size 31100928 diff --git a/params_shard_450.bin b/params_shard_450.bin new file mode 100644 index 0000000000000000000000000000000000000000..8c78cb6c7494d0f875eef3138564c801915abddd --- /dev/null +++ b/params_shard_450.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4883ba3be2dedf68d489ccef84e5abaa25c09a23da479e03e04080cc55f2a10 +size 93978624 diff --git a/params_shard_451.bin b/params_shard_451.bin new file mode 100644 index 0000000000000000000000000000000000000000..4cc0cd4d78444a3e20dcb59a4069b24629621132 --- /dev/null +++ b/params_shard_451.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86aad12305b901461ddccf03c8a0be5c61addcb5a6cb40486022c1dc39b9c3cd +size 31100928 diff --git a/params_shard_452.bin b/params_shard_452.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1d57839d0ece756428f0ad78cd32938fcdbed46 --- /dev/null +++ b/params_shard_452.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d0559e49fe9f51d57a8b5bd165ef6314d2899f891fc9fcdc76514541ce4e72c +size 33587200 diff --git a/params_shard_453.bin b/params_shard_453.bin new file mode 100644 index 0000000000000000000000000000000000000000..1e51618798dfc4704a062f1331955588d7e7a9d4 --- /dev/null +++ b/params_shard_453.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b54162f1a9b5bf96c5735173e49467657289b27e6f72a65958400f3f700a1403 +size 26869760 diff --git a/params_shard_454.bin b/params_shard_454.bin new file mode 100644 index 0000000000000000000000000000000000000000..7b0a2a06cf22116e1976ab3a8fc138158799005c --- /dev/null +++ b/params_shard_454.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dffbfab4871c03e73b2a12d03d5d51846c8deefe56c9d2fd2aefff658317840b +size 19304448 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..a353c7120ca6b7afe69a8cd58e132cd6bf61b5b3 --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e9c425629b73f04e7ec7fb2215a4a473a7ac4ad35cd48b3b1a06617578eb3e +size 31068160 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..907acefd157e41722d5e3c1a803032d10344414e --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:782d8c6c45f44579ed3d6aacc55635cda1565dc5ebf4b75592859af6acca753c +size 33587200 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..f9daa251ff093c9d394b3bf18d4ed13bce2d693d --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b55aa57b9c2707a35957d0973b902c734d3cc40436d64fbf3a7512f6a872ae +size 26869760 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..677cd3144e80454bb04598082ca9e373a26a5230 --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80364e9844b1fb1ddaad4e888c6db9edb4cc655e8fcf0b5581bd5bb9577ff6c1 +size 93978624 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..a2f3cb8e49a6193a33b0b7db5c8c2a84adcddc5b --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29faa8c2df217af0e9913ad9bbc72c63404579f38278acd5f8ccf5914ebdc04a +size 188088320 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..658895592bc2294eea40ea41bc801a02d66d4ff4 --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac57919f3061b72498fce1c0c4777198efa6f1f90c17cd2fb21e5e423cf973b6 +size 188088320 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..91a6784d5fa7c8343180a6ca7d3ce563c63c4102 --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c054c8a160d95049a51e01af8f5ae460e39acc3ec79a2cd03ea2eb1ea6fce2e +size 23511040 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7d5137ae4f7205186c80396749536a408292913 --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79de4e3a960f863510b64c9781de8dabb9fbf030711c1a8f5ef3cf918d0348ba +size 93978624 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..1996f1a277589134a7c86a9f697bf879cbb5c060 --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:450ba0f939b8d9df7325c21a3d06e50730d075e83aed6de797237bf2ecc7ae23 +size 22712320 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1ea64f7a604c1c25607e08e959ea439063b879b --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b29aa435edcabc66a1f11aa1f63973325c1b8952d9fbbe6c827c19c9c915d2ac +size 188088320 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..485e7ced5858abc87834d203ea2da79b6613c316 --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d61b81ea74091e7ca5ed73180b6bb745c6259764c6eb05282197ece70f13def +size 23511040 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..de72615adb290084f3ff4b9be4c122f21355d6ba --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b3fb0fa4b45ffe59d50cc46ca79959f8af914c42da10f61dcbdb8315358b1a1 +size 93978624 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..c571d4f6d7d3d36377b0f2c1449e7a2b5d35816d --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20558ba591d3ffdcb24910a7eea6996e93276c19c2676eb62b78c1b889c75c3e +size 188088320 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..06644fe980d4e9ebedee0925cac1789f4aa7ad28 --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b185bc7eac6fcc4471fc39c110ac14bc4f32f0b5fbf085e8f9182b5be4a230d5 +size 23511040 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..064160b955c76baf506a85cc40103d6d67ff28e1 --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ab21c159e7e275cf36ac7588c0b4c588ffc8597f2eb4fd7980dbce5a93c7a1 +size 33587200 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..8b30fcce8e907d488dd5e5ddd201cca2fdb0143a --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ef6a461095dbbcf54eefec46581da0ccd6af8a14e13c1be9a28d1e852392bb +size 23511040 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..0545707d39d61da93f8ac4524dd33d41d497239d --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659d0b334032812710695a18556095e354da639c749d562ec41c17fc83693571 +size 26869760 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..bda5b73c118a18c9a4409ae6281aba43ef98c53f --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:929be7bf92dcaca83d1bb32d8d8316feebe3818f2ced9bce960ccbcea502cad2 +size 93978624 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2fec696b7ebcb504863cf1244431efa18a612b5 --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d3d2134c8cef7e6cba9c418b0a21d38b0bd6b6041afd98e4c9a7cda7e9ba35a +size 31100928 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..435567c808de8ae3b0d914a51965aeeffffe8a9e --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f76f586ddddf6dd5f1f9c97b5059c0bfdbac0f53481a69663808373ef6677a7 +size 188088320 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..6b299dc8055fc395b606135bdd74ec5de073afd9 --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b812c71c14436b3335eac2ca9cc103996a1f2ff6eaf2708bef878fecb1d9bf1 +size 23511040 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..40b51a679031cf26e9c9f589b495ca0d823b53e2 --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29b58037febc6f8bca307ddef368d9a12bfb330d675b65ae1090871b9bbf2e7a +size 33587200 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c4d1ba52398b53cf961673e323830a2fd5c4ec4 --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5546fdd8b772290c897efefcfbac033df1e6ce0e6403d0c6f32facdf7f0406ce +size 26869760 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..52e3b8611a29121520ffd8404ef85ef7b7486185 --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:733e17b66d18a875f37a5b3b4ec6143862f997dbf9a297d4f253fe9615104f74 +size 93978624 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..51a7693cea7a22a738980a54799b69a47f84fea4 --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:512d633518c9200222a414ed8136357a11153da57ca723226d559d48abcbddba +size 188088320 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..dbf19f85484f6117f7a519547f1bb100317a2517 --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb3ab22089fa8bc1f7e7bd3123633370d8e40c45a1574824fb10fe41d18f834 +size 23511040 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..5e5f5d72e89fe50e8d82dec4b3aa4e4f9f56708e --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc117939de738722dc6ba5777362c8345ef9fcb183de10da108cda79080344c +size 33587200 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb953e72d8134ec1e9d587fd2c022da0851098e6 --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eafc72f100708e683c1bb0e6959b0c764c3cedc2bd5f9a804716d088d131178f +size 33587200 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..43e681ec6067bf39fc4c446faf143b477798a427 --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ef2b36910d7ba6dc142272dc02895dfa3b4c4d5a41a583ce73d0036f246cfc +size 31117312 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..05dfa7c07556f92b586358f751f8533e176f8481 --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ac96b3aa9fa058e39eff046274f88e63df967ca1270f92ce82f531a0b9ca02 +size 31068160 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea2a2fd606c0fcba89d1c744a0e763042de50eee --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d59d6b16f6fd4afe5d50e53e0e3dfe89ebd07a23e5e43113ebfe10642b197b01 +size 93978624 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..c52f696387a1ede23fddb7858b32544e596d0ab1 --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b00d46d3e27293527424729b70a60b2b1cc91160c190468d1064da05acd6ad +size 188088320 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..06ecdf7f6b363450c9adcb6c4aa3e405cde51f29 --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7054995619a9c8fd7cf569fc28d454f6e0b5929688139dd103e30af249cb890f +size 23511040 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..4bb9aea3d8f3971c2970a337525f9acb8d45966d --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02a8a3646a134ba3e3b200fa6acbe54f51a2a5eee0815af5b9961f4877d9c762 +size 33587200 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..90bda01f9d707633691b7a663c0d1973190fbc0c --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba8502349dec8e1fe3315326ae2cafe98e59b08f264842c38a2ca515cad358a5 +size 26869760 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..7f3955bad0018a165d5fb83737779b1042f47bd0 --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:863254c0becf521e355f30da6a6c3938f21e88d097fb1f6e84aa8bd361d8a5c3 +size 188088320 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..defd63455e1bffce03d576d08d8d0b0e13c25fcb --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:829f2c3b3fc0195af1e3e56f698a87e39011c399a4402bcbc6a16880dbafccdd +size 23511040 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..db74eb08d80393e14b40091d43a95dbc86daca60 --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998ad1ff71c0e5a044de82a50d00685c391eb1f6a0595562f00807e36db6d93c +size 26869760 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..9ef4d7f46dfb6032ff7b67862ecf406961cd5d56 --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b078f5de1659d88dd746a85d15858d2a63b91cd931af24c423d71975f2d120d1 +size 33587200 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..897e508aab1a0937e154d0e2b9b606d999a8beea --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:222715cca0cdf263461bf388d197c981bcab7655d410b1d9adbc3457dd85a73c +size 26869760 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..8aa3c2d314dd5958ae214bf705cc3e8955b7543f --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c52ce3f4fbcf94499462ac56482f12f54ae02b38c7ff1e47089cb16835a9626 +size 93978624 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..301b15a487585b84442a2ab03481f76d4e21ee46 --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c77c2472011de569993bd83ee0b3cb648a53f13ad62b2d96f821238cc71bf916 +size 30269440 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..652a992ec3873b06ec4430b28aadd6f162a40c87 --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cfc6a9f6533b09bf418827b2191c5585b0f4d3644e79cf9121b8390a08b3432 +size 93978624 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..5ae65b1ea74f0707b9af08b329500438b7341750 --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cba112ecf90c65e97a9348ec17de74f8f39b18b066175b5746d80a29ad2389f +size 188088320 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa304c617f2bff0fd77b0aa4195e4b06d21ee5a1 --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:826eda17857a7c1af97358e85aee3170ea386405e614cea74f91b077b1785f82 +size 23511040 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..9404c0775223adf8ee6c1e9928c4e8f7136d4e91 --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba228d0dcc7dce6286954744ae33ef62b3a88795eb3a2999b110a139bf42cb8e +size 33587200 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..a52a027c1aed50e6fa3a288e692675bb38a1a322 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e181cbbf60dfcb47a38fc18f71f1b9892f11d154246897a05a280f58e0a53df +size 26869760 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..724a606b07877fe036c1f0f359e9d2d92c376d1b --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f76aa661600a0283048e80fed7dd13ebae91382a3ee50aa517a687e017a0fc4b +size 93978624 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..7694800e5f45d2e81f147248ea148d8e4a952934 --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df518524036de3579371783d2f82625dc04d9238cc17f0e3ee8b63b18d7b3542 +size 420679680 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..936dd65e238d17cc7d0ea500ae79c33065360cb1 --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80ce01aa68f421228b3c2d02f02487fe26aaf28c6e15d98499b4f17940c1171f +size 31117312 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..aac8f0178828220b47e6010a03a44b3a805e0b0c --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cecb1cc41405be7a5be6d0355d64884b73d749e724d6d6dede88997f5434c132 +size 188088320 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..9897b402688aab615b5bc2f6e989651be300942f --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14a6ced6ead6fddb3e11f3c2cb44b880aad593846069143de53443bb616189d2 +size 23511040 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..b23c619bc82c0deda9d180a276b570b8d6642d9d --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630962f027cb223a307b7e1ff0f0ed2b8c4c6c0cf8c1ccbe5db3253a8451ed14 +size 33587200 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..4977fa8c6abd84be935e937e57b2f07a9c7fa996 --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd50f7d86b4edc34a7e06be78cb0822e30d7b8cc41feabff0e43bf75b2a9fe79 +size 26869760 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..bf89e5bae5cbfdc9e546e3f43e05172c1a8e14b8 --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a810137299d1cbb8da5d177115c75e4799380d8ca2afc616a993566c132d274 +size 33587200 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c8d850d1f5a7b77349252598cff06ab0892c8f7 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34974af1bf5193660361eb572bd76df12d342fe85c4ee12f144ccc3e8b5e391f +size 26869760 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..924af971d8252ec57084dbf58d80e990b0bb4831 --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82cd44d88cdb9f61476e63dddb87fdca6fd1f0d8467f6eaf468085e299cab348 +size 93978624 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..8be18fe9f345b954b99ed48ef3e0385b405e87c7 --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1163f183cf671fb7a6566a0dea05101411027d1270e9f1659ae9ada3182345f +size 26894336 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..629c553cb47f39da6ef8332d2b44fe57b169f33c --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57f8e3f25b37e81f2bf837a8ab6f5819b7c8aee9d2af5105f3146be5c29e9d6e +size 188088320 diff --git a/private-llm-config.json b/private-llm-config.json new file mode 100644 index 0000000000000000000000000000000000000000..912f09278d4a22102bdde44099f198993b85289b --- /dev/null +++ b/private-llm-config.json @@ -0,0 +1,55 @@ +{ + "model_type": "llama", + "quantization": "w3a16g40sym", + "model_config": { + "hidden_size": 8192, + "intermediate_size": 28672, + "num_attention_heads": 64, + "num_hidden_layers": 80, + "rms_norm_eps": 1e-05, + "vocab_size": 128256, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "context_window_size": 4096, + "prefill_chunk_size": 128, + "num_key_value_heads": 8, + "head_dim": 128, + "tensor_parallel_shards": 1, + "pipeline_parallel_stages": 1, + "max_batch_size": 80 + }, + "vocab_size": 128256, + "context_window_size": 4096, + "sliding_window_size": -1, + "prefill_chunk_size": 128, + "attention_sink_size": -1, + "tensor_parallel_shards": 1, + "mean_gen_len": 128, + "max_gen_len": 512, + "shift_fill_factor": 0.3, + "temperature": 0.6, + "presence_penalty": 0.0, + "frequency_penalty": 0.0, + "repetition_penalty": 1.0, + "top_p": 0.9, + "conv_template": "llama-3", + "pad_token_id": 0, + "bos_token_id": 128000, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "tokenizer_files": [ + "tokenizer.json", + "tokenizer_config.json" + ], + "version": "0.1.0" +} \ No newline at end of file diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..1c1d8d5c9024994f1d3b00f9662b8dd89ca13cf2 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9e4e7fb171f92fd137b777cc2714bf87d11576700a1dcd7a399e7bbe39537b +size 17209920 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4fd26877f22f3a80ec2f4f83f941857317c6f43b --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2065 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "bos_token": "<|begin_of_text|>", + "chat_template": "{{- bos_token }}\n{%- if custom_tools is defined %}\n {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n {%- set date_string = \"26 Jul 2024\" %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n{%- else %}\n {%- set system_message = \"\" %}\n{%- endif %}\n\n{#- System message + builtin tools #}\n{{- \"<|start_header_id|>system<|end_header_id|>\\n\\n\" }}\n{%- if builtin_tools is defined or tools is not none %}\n {{- \"Environment: ipython\\n\" }}\n{%- endif %}\n{%- if builtin_tools is defined %}\n {{- \"Tools: \" + builtin_tools | reject('equalto', 'code_interpreter') | join(\", \") + \"\\n\\n\"}}\n{%- endif %}\n{{- \"Cutting Knowledge Date: December 2023\\n\" }}\n{{- \"Today Date: \" + date_string + \"\\n\\n\" }}\n{%- if tools is not none and not tools_in_user_message %}\n {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' }}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n{%- endif %}\n{{- system_message }}\n{{- \"<|eot_id|>\" }}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n {#- Extract the first user message so we can plug it in here #}\n {%- if messages | length != 0 %}\n {%- set first_user_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n {%- else %}\n {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n {{- '<|start_header_id|>user<|end_header_id|>\\n\\n' -}}\n {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n {{- \"with its proper arguments that best answers the given prompt.\\n\\n\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' }}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n {{- first_user_message + \"<|eot_id|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\\n\\n'+ message['content'] | trim + '<|eot_id|>' }}\n {%- elif 'tool_calls' in message %}\n {%- if not message.tool_calls|length == 1 %}\n {{- raise_exception(\"This model only supports single tool-calls at once!\") }}\n {%- endif %}\n {%- set tool_call = message.tool_calls[0].function %}\n {%- if builtin_tools is defined and tool_call.name in builtin_tools %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' -}}\n {{- \"<|python_tag|>\" + tool_call.name + \".call(\" }}\n {%- for arg_name, arg_val in tool_call.arguments | items %}\n {{- arg_name + '=\"' + arg_val + '\"' }}\n {%- if not loop.last %}\n {{- \", \" }}\n {%- endif %}\n {%- endfor %}\n {{- \")\" }}\n {%- else %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' -}}\n {{- '{\"name\": \"' + tool_call.name + '\", ' }}\n {{- '\"parameters\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- \"}\" }}\n {%- endif %}\n {%- if builtin_tools is defined %}\n {#- This means we're in ipython mode #}\n {{- \"<|eom_id|>\" }}\n {%- else %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n {{- \"<|start_header_id|>ipython<|end_header_id|>\\n\\n\" }}\n {%- if message.content is mapping or message.content is iterable %}\n {{- message.content | tojson }}\n {%- else %}\n {{- message.content }}\n {%- endif %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' }}\n{%- endif %}\n", + "clean_up_tokenization_spaces": true, + "eos_token": "<|eot_id|>", + "extra_special_tokens": {}, + "legacy": false, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 131072, + "pad_token": "<|finetune_right_pad_id|>", + "tokenizer_class": "PreTrainedTokenizerFast" +}