diff --git a/mlc-chat-config.json b/mlc-chat-config.json new file mode 100644 index 0000000000000000000000000000000000000000..88b92694abb994e61e7694161e96e1b0c4bf668f --- /dev/null +++ b/mlc-chat-config.json @@ -0,0 +1,74 @@ +{ + "model_type": "llama", + "quantization": "q0f16", + "model_config": { + "hidden_size": 4096, + "intermediate_size": 11008, + "num_attention_heads": 32, + "num_hidden_layers": 32, + "rms_norm_eps": 1e-06, + "vocab_size": 32000, + "position_embedding_base": 10000, + "context_window_size": 2048, + "prefill_chunk_size": 2048, + "num_key_value_heads": 32, + "head_dim": 128, + "tensor_parallel_shards": 1, + "max_batch_size": 80 + }, + "vocab_size": 32000, + "context_window_size": 2048, + "sliding_window_size": -1, + "prefill_chunk_size": 2048, + "attention_sink_size": -1, + "tensor_parallel_shards": 1, + "mean_gen_len": 128, + "max_gen_len": 512, + "shift_fill_factor": 0.3, + "temperature": 0.7, + "presence_penalty": 0.0, + "frequency_penalty": 0.0, + "repetition_penalty": 1.0, + "top_p": 0.95, + "conv_template": { + "name": "llama-2", + "system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n", + "system_message": "You are a helpful, respectful and honest assistant.", + "system_prefix_token_ids": [ + 1 + ], + "add_role_after_system_message": false, + "roles": { + "user": "[INST]", + "assistant": "[/INST]", + "tool": "[INST]" + }, + "role_templates": { + "user": "{user_message}", + "assistant": "{assistant_message}", + "tool": "{tool_message}" + }, + "messages": [], + "seps": [ + " " + ], + "role_content_sep": " ", + "role_empty_sep": " ", + "stop_str": [ + "[INST]" + ], + "stop_token_ids": [ + 2 + ], + "function_string": "", + "use_function_calling": false + }, + "pad_token_id": 0, + "bos_token_id": 0, + "eos_token_id": 1, + "tokenizer_files": [ + "tokenizer.model", + "tokenizer_config.json" + ], + "version": "0.1.0" +} \ No newline at end of file diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index
0000000000000000000000000000000000000000..2043f809369d7d2296bb62ec168af7131032d4f7 --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,3137 @@ +{ + "metadata": { + "ParamSize": 195, + "ParamBytes": 13476831232.0, + "BitsPerParam": 16.0 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 262144000, + "records": [ + { + "name": "lm_head.weight", + "shape": [ + 32000, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 262144000, + "byteOffset": 0 + } + ], + "md5sum": "186b2dde3a9eff8b8c633031ec403339" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.24.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "9f5702372678f645c083f14ca4ab8b95" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.24.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "b25a40b92df2f91c8dab2b518d912483" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.24.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "b8059a4c1032e3f08b639911c8d1bcaf" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.24.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "00ca5cc5d7f19a572ad06577dea72aa1" + }, + { + "dataPath": "params_shard_5.bin", + "format": 
"raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.25.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "f2e3c0b8ecf774e3ab6bb93e9718ea5e" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.25.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "dd7fc43f91c71b5146a1e6bdfc2e3a5e" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.25.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "33f0e7a6adc631cf94e4e437f69f6112" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.25.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "dcea29c22fcd157154d2b4079de93688" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.26.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "b77fbe54dab9017a04fe1f78b4d4f6c7" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.26.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": 
"1e2af700acc5afbc2189c76b8ebfdfc8" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.26.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "800f8575ef1f2f4930836ad11efeba49" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.26.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "ff6f73dd5579654b2989d5c37a1339ef" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.27.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "937434cf707eb9cd73fd922f0f325cf2" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.27.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "928a2b739bb6b01cf2313511ee148341" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.27.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "050e8141aa544a2040c48259965afc7d" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.27.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": 
"f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "5eb6304dfb4140e682858feeccdfabdb" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.28.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "ce3b6112d41ab8bf1c3a5e4ace0e6352" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.28.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "377a997d33ac2896f81dc5d5a964b977" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.28.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "688588e6a832ea7b3097204742647115" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.28.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "4c83d99bddc657f4d0e44e3a898dedf1" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.29.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "03d1ee0d8374573cdb9376274fa7ad7f" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.29.mlp.gate_up_proj.weight", + 
"shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "d087b6d2478ff0e32935e8773e96fba2" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.29.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "f0ab56d3e1578029f045ad11421401cd" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.29.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "3b05d4831d3f8530701b60ec41566987" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.30.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "bd353da6a1d684d3cc55c604b81cd110" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.30.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "f471f02f08878938fa0c64b6e5915c21" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.30.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "b5aae30cf84eb26a1c1d20f46ec6a463" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 33554432, + 
"records": [ + { + "name": "model.layers.30.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "b8eab0a2c266c964b3b81ec108cef7e1" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.31.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "02c6ef4c11a83509a9172dd3c1c99e0b" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.31.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "23320f0b33062d540805ece08838b5c5" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.31.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "2a31b3425ffb0032f858a98776b06e46" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.31.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "586254277890d975e948864f90646e73" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 262144000, + "records": [ + { + "name": "model.embed_tokens.weight", + "shape": [ + 32000, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 262144000, + "byteOffset": 0 + } + ], + "md5sum": "925c0893977c37bb2a47e5223c82a187" + }, + { + "dataPath": 
"params_shard_34.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.0.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "139abb4fee646c9313daf0db69c5721a" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.0.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "cd07340ca2d9fb4796a774ed34b5cc48" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.0.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "74b49f4390e004ee9d7c96cc5593f9c6" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.0.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "5aedbdc23b2f98d088284c36c611382c" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.1.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "6246e903531b99cd8730c79a46bdcd61" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.1.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + 
"md5sum": "19518905955bf449e2642a1bd7282ceb" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.1.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "4ce82b7923d147b25b6d2b8eb8d76bae" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.1.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "6ac57c5cfe0769f22c9811f80be81d9d" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.10.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "e70b26b97ec1ceef8bcffe60ff400e35" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.10.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "acb899f6f0bc5b6532f2da5d64c5d5ac" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.10.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "6f32cf82c9943851974657da42c8f1dc" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.10.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + 
"format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "9639fc721ba2501512f15e10d920c57b" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.11.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "73a18b4973e43be3e7a58f9374d5b812" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.11.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "54d17d861248ed4951c43401389d98b7" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.11.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "7519b35896097839bb43aff4d8404792" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.11.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "4be8dbbe84262ee508eb4e3a9bbea15c" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.12.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "5dc410d19e52d5c90de98de55d672140" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": 
"model.layers.12.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "d8c9075d8ec92e790e5eff01f99b274c" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.12.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "76b04d7c3f00d3c00e9dcc390e2815e0" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.12.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c3d2a2854ad6b775b5c8eba072717d92" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.13.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "42b9d322d2e610fbef9d4368f60101d5" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.13.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "2e7ce52fdf2b9e0e18256cdd373a6699" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.13.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "0f2898024c308b6dde39aa2d9a4764b7" + }, + { + "dataPath": "params_shard_57.bin", + 
"format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.13.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "26574c3a8a2e2deaf6bb32bd355db8a1" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.14.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "3fc5a2fba13eb841fc2717a875b1d4fe" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.14.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "051621f8886973f9f34771c3a0e16107" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.14.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "05f75b303c38eaf4ba979ed82da80ecf" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.14.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "53d18374a4be61951af774622b5ae892" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.15.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": 
"effa2712df3c219b3ab276f9e9f036d1" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.15.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "ccb4114f69b23b7ae6e4e4f554aa7fc1" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.15.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "9e1262a0d185e5b4c1ee9d677a818da2" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.15.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "e5e169ce7384d6c7fc41b794509aad6d" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.16.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "6edf9342b24e466210ea739e26f97417" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.16.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "39585337bfd8c9aec33483a972b31e00" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.16.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": 
"f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "28d2bbc4c89576cb4a98bcf2d53e9316" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.16.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "49d6915c712251c5b5cb1f3ddd48cbdb" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.17.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "7f80f02ac990f82a5e8ed162f247963b" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.17.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "0cfddbcc68a932dbc336a932c8873ef5" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.17.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "7fcec4f1a425a90f7ca05f9d068a61d5" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.17.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "73994554e4e2f4113ed3a7a1164d16fb" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.18.mlp.down_proj.weight", + 
"shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "8734ab45e088f6b8e3e765e1da038775" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.18.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "438a3c7505a9074757c96eb88ab89213" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.18.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "d8b2aed10b4be15c4093cdd97de636dd" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.18.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "f82a26ad8b7e22bcd538bb864703b406" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.19.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "ecf514b12a5a9ddc230dc548ffdaa603" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.19.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "acd549fcfc786e53d24afc8b4e5a6d4d" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 100663296, + 
"records": [ + { + "name": "model.layers.19.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "eef00277b6bd5876efadf044e56d0118" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.19.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a3ed124ae0badee2a25716ab14e5ed5f" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.2.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "3fdab346029dc00d91c89ee966ada7ac" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.2.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "0c3ad6da8b1939f1a219721cf3021075" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.2.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "64518fd75c3d937345ac903702590e5e" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.2.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a5175c66fc31221d48f8bed7e1f4120a" + }, + { + "dataPath": 
"params_shard_86.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.20.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "03be79df00498e93947bff1c23aa8cff" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.20.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "6586b260e80d765a9389eef4a6941276" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.20.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "994d22374218d153683a2029f136a986" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.20.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "60ddc9931ebde1a12219700024491604" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.21.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "00388e537d60a1fb821f6841bc8b5639" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.21.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + 
"md5sum": "d871fb17b4a3200a4593c40ab8d782ca" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.21.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "393740e9576977f027df7ce907ccfe05" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.21.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0d3b3dfc843f5fbb09033c2081e525a0" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.22.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "0d8c8a054c5692aad1643b85c2629507" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.22.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "5143da8850d2cb0eadde68dc8cb7e0bb" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.22.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "d06fcb20449271a615715fe33757bd6f" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.22.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + 
"format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "1ade4b5c58afa1328382e99a42f5eeb6" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.23.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "6ba0523f841f07024ec1b646bef0eede" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.23.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "d949c1ea9831bec47865102f294f8619" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.23.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "c5c1c4b773ae666c69ec38b953ee5818" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.23.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "a0ab8dcc94dd030b543865a18fd3bc57" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.3.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "210032bc66a9e7a0c37f8b91552de3d1" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": 
"model.layers.3.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "284e8bb0dc3b1d72c4afdcd67f3107f8" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.3.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "5db9ac1f94df3e1c18a1bdcdac66aca1" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.3.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "0eb9891df107199167b848676d683396" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.4.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "7e280ece8b9c816b37e7c1bf1c120653" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.4.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "953ed357ad9bd6bc8919dd43171c63f9" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.4.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "7a0311823dd93aabcde107b3ca2e9f92" + }, + { + "dataPath": "params_shard_109.bin", + 
"format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.4.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "f5c6c5ef3f38c57470f08d0d16f1254d" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.5.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "c121142ea0d944c240fea1e403536131" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.5.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "2c32c4951a08f99c2817d65c210225cb" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.5.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "95f29d86f877c14b1e8f0da88a7752c4" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.5.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "9defcc877964c34610caecbebc740d9a" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.6.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": 
"cd0969d69201c60bacbea5fe4e78aa80" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.6.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "151d80607eac81f28cd68615568e541d" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.6.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "8fc5408952cbbb3489c54aeffe0fb6bb" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.6.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "43d47223abe837632cd80c5c452ed28e" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.7.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "9b0f0b8d7db7cbf5b55da3c91e771980" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.7.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "a4e4832fb8a91948687e8e25b49e02f7" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.7.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": 
"f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "d9b461527be7736fb9bfda51be7fc111" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.7.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c3cb30016490db46d59200a79a2d08c1" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.8.mlp.down_proj.weight", + "shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "36ac74c4772f93f4470a2d3d4d52d2f2" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.8.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "540c6b7bf2a00f9f779b90b9baa4d2a0" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.8.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "6329b273e5e36d567239ea537c04038b" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.8.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "e46625a1270db315a78356a6db71641b" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 90177536, + "records": [ + { + "name": "model.layers.9.mlp.down_proj.weight", + 
"shape": [ + 4096, + 11008 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 90177536, + "byteOffset": 0 + } + ], + "md5sum": "11ceb698e222607ff0748fc38962e2ea" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 180355072, + "records": [ + { + "name": "model.layers.9.mlp.gate_up_proj.weight", + "shape": [ + 22016, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 180355072, + "byteOffset": 0 + } + ], + "md5sum": "af80ab267c90cf546b6c4d933b633a40" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.9.self_attn.qkv_proj.weight", + "shape": [ + 12288, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "2114932a725f6e253a45ea3afdc0df6e" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 33554432, + "records": [ + { + "name": "model.layers.9.self_attn.o_proj.weight", + "shape": [ + 4096, + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 33554432, + "byteOffset": 0 + } + ], + "md5sum": "c2c9460d521a25c3972a3fa060015b03" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 532480, + "records": [ + { + "name": "model.layers.24.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 0 + }, + { + "name": "model.layers.24.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 8192 + }, + { + "name": "model.layers.25.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 16384 + }, + { + "name": "model.layers.25.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + 
"nbytes": 8192, + "byteOffset": 24576 + }, + { + "name": "model.layers.26.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 32768 + }, + { + "name": "model.layers.26.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 40960 + }, + { + "name": "model.layers.27.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 49152 + }, + { + "name": "model.layers.27.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 57344 + }, + { + "name": "model.layers.28.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 65536 + }, + { + "name": "model.layers.28.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 73728 + }, + { + "name": "model.layers.29.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 81920 + }, + { + "name": "model.layers.29.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 90112 + }, + { + "name": "model.layers.30.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 98304 + }, + { + "name": "model.layers.30.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 106496 + }, + { + "name": "model.layers.31.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + 
"byteOffset": 114688 + }, + { + "name": "model.layers.31.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 122880 + }, + { + "name": "model.norm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 131072 + }, + { + "name": "model.layers.0.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 139264 + }, + { + "name": "model.layers.0.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 147456 + }, + { + "name": "model.layers.1.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 155648 + }, + { + "name": "model.layers.1.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 163840 + }, + { + "name": "model.layers.10.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 172032 + }, + { + "name": "model.layers.10.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 180224 + }, + { + "name": "model.layers.11.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 188416 + }, + { + "name": "model.layers.11.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 196608 + }, + { + "name": "model.layers.12.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 204800 + }, + { + "name": 
"model.layers.12.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 212992 + }, + { + "name": "model.layers.13.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 221184 + }, + { + "name": "model.layers.13.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 229376 + }, + { + "name": "model.layers.14.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 237568 + }, + { + "name": "model.layers.14.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 245760 + }, + { + "name": "model.layers.15.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 253952 + }, + { + "name": "model.layers.15.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 262144 + }, + { + "name": "model.layers.16.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 270336 + }, + { + "name": "model.layers.16.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 278528 + }, + { + "name": "model.layers.17.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 286720 + }, + { + "name": "model.layers.17.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 294912 + }, + { + "name": 
"model.layers.18.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 303104 + }, + { + "name": "model.layers.18.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 311296 + }, + { + "name": "model.layers.19.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 319488 + }, + { + "name": "model.layers.19.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 327680 + }, + { + "name": "model.layers.2.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 335872 + }, + { + "name": "model.layers.2.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 344064 + }, + { + "name": "model.layers.20.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 352256 + }, + { + "name": "model.layers.20.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 360448 + }, + { + "name": "model.layers.21.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 368640 + }, + { + "name": "model.layers.21.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 376832 + }, + { + "name": "model.layers.22.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 385024 + }, + { + "name": 
"model.layers.22.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 393216 + }, + { + "name": "model.layers.23.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 401408 + }, + { + "name": "model.layers.23.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 409600 + }, + { + "name": "model.layers.3.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 417792 + }, + { + "name": "model.layers.3.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 425984 + }, + { + "name": "model.layers.4.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 434176 + }, + { + "name": "model.layers.4.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 442368 + }, + { + "name": "model.layers.5.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 450560 + }, + { + "name": "model.layers.5.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 458752 + }, + { + "name": "model.layers.6.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 466944 + }, + { + "name": "model.layers.6.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 475136 + }, + { + "name": 
"model.layers.7.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 483328 + }, + { + "name": "model.layers.7.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 491520 + }, + { + "name": "model.layers.8.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 499712 + }, + { + "name": "model.layers.8.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 507904 + }, + { + "name": "model.layers.9.input_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 516096 + }, + { + "name": "model.layers.9.post_attention_layernorm.weight", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 8192, + "byteOffset": 524288 + } + ], + "md5sum": "faeba979734e080f140a8e908a9a22a6" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..cbc94889c5297ecbbe2911a3a682136f32a409fb --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d13962db64db769549f99cf45c5988e630bd63071278f098a9be194507580cfe +size 262144000 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0be1f6c1a00646c450ec42f442809a3d8b836cc --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43e4ed4c3a6777aa8ba9dc916044f2c9c38a8c7501dca4f0d54d453b51c7ab65 +size 90177536 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 
0000000000000000000000000000000000000000..e82fcd83f9ea6cc13388e13e7d72472ea98c4c1c --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8752d52430e5d242001d6a301af243d18fc3e3b2c23cc8a32474ceecbffb9d3 +size 180355072 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..05de7c3b8605af0253675d083c952cce153fb808 --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43a3ccc4cba56cfd5d1de75dbf4e018bdbca3351cc27b79aee1ac56b68d15983 +size 100663296 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..4f7916227ab8d12dfa618370bbb40ea62a9eff06 --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c0e59eda1df4a7907a15402efc99878b037d51b7163b20ad912a3fc273605e5 +size 33554432 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..fae4ca70aabe13d3bcbdb76f7903b7ddf691d7ab --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f34f3467fe1d3d5393b159437fabef51f74afe0ba29caff9c2a84b1744a98e +size 90177536 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..0eb8461e5df48d01d2aa04c329dd4af37214ac5b --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22c6376ba54b3c3bcf743d55154c75ecd59a74dcdf9ee544f1c1155d180aeec9 +size 180355072 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc0170494fa797f369dc9871fffb6e3ff9ffd0ac --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:42aa6012643bc3cc0a27516f71c5730157444ba1cdf49cfa202ed425b17da8f9 +size 100663296 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..21ff6fff482e39bcd2d8f0f916f1c28c95475ebb --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b336e2fbafad57bac4c999b1d534fdc4e228a75618ae6b41c8fd8b403cd0bacb +size 33554432 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..cebb13d39218904bec07e36a9c928f53ab394e76 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d496d68a285dd3f9569cb5d81e137819276db189890730f810efecb79575c1f9 +size 90177536 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ec272d02d2dc309070b0edc281a8d019ee434ae --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec6cc57b5a13cd7058670c9ea29d277dad0fa62d72f9e8eeb93c6aeaecaa67e3 +size 180355072 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..f91f689384be259de11a60af5f81851d8a152b50 --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29215e9e146e64134082a01fbc4ae2ccfceb3ffdcc7fcf24a8b8d0dfd8c1e964 +size 100663296 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..5999e591c2745d5e29af4f29e64b68edf0a26338 --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae055ed8aa3c23191eae4091b4679ea29c940681d63c4884e56ce3dca283b566 +size 33554432 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 
0000000000000000000000000000000000000000..b8b06c0a1fb912fea263492f1820b2e67a4cf91f --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f3542d15afb4edb332ddec009b7be33facadc4078a4a861b30ccba034b574aa +size 100663296 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..7fb967ca83dadd8e61cba319f573c6fc4a2346a0 --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5b00ca10fe0d4563e0e11f98af567aafa8a814670e15b075d1670690e126e80 +size 90177536 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..228ff79060948accf38e9a348b1c8a5173e98805 --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134fdadc4fbd62fe3fc93b5a5f4ea1975120a0f5896638b2a9787b347abcbc0a +size 180355072 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..88c82ebf8a6a0746c57dbb4b1e49103756e2cb4e --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2bddc5b9527f6feab0b53e6975d7c277bfe6a2fa5c8d14692f6945a58ed779 +size 100663296 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7d15bab2c53bd60e130cc261f1a1cdf28813168 --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45eadd93163344f38cd8cdd1d3768786fe2d059adb5d7aa8426c7c3682cd055f +size 33554432 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..1f7ccc6f4bce3bfce02a9a55e6217ec783178730 --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:662a9c23e68bda14171266050b6ab59acc953ee3abcf34bceb19665b3ce45f71 +size 90177536 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..a2b69765067fcdc902acc4b243ed80f28191c13c --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f33e60c9fbd912adfb28f59ef6ba4fa9565bcf023b9e5be81a08d9b68cee9bd +size 180355072 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..b90d7ccd46d8a07c857ccd9e88f0f3c68a80a2e7 --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef1f6d1a9961ea1534ff0c901da3aebf6ca4e4678d5860376731c8a5f4dbc27 +size 100663296 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..0072c821280416d7b187f66eafc8a71847744e2d --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b91c08613c0ccd5c2d43d1d997dd6604d572fc73d47d1436855517da643c07b4 +size 33554432 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb2ded71a20e6aa0e4bf4fe6b14db3eb9694b5d8 --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2c24eeef7aab801e7cb4ebe3f9cf6ebee0eeb6fab741ce2cd7daec726c38ea +size 90177536 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..b370fcfecf12091cdf5126b8f721a646a3b40d3a --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab52d9c222c82a68d0ffb32c6ef50d0e1e7c0597574b6860234ca9b82c1f083c +size 180355072 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 
0000000000000000000000000000000000000000..9e8f29003b8d6d68e188b3c49312fcaf971f53ae --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7673111bcadd43011a25bf9dad68fcce7412f325d60fbdb7b5449b364e1724 +size 33554432 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..39abc1c67a06215456274182d9cd5beded5f6195 --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a432aba02636d59b31a788197944647c9017f4095bdf345ae55ed2724d2da77b +size 100663296 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..dc65ceca1842e1ce662bc14266d9fbe78556687f --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de08809bdcbee5ce1b593c4bd0972881eaf9f49e7bcb21f20d9354dbb4a1ea78 +size 33554432 diff --git a/params_shard_122.bin b/params_shard_122.bin new file mode 100644 index 0000000000000000000000000000000000000000..f395e35b951df76cd4813403f04860aa56f58dd3 --- /dev/null +++ b/params_shard_122.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1c64e26a1ef86fe0d1cfa0c71bd1ee52c1c9faf1d50f47e61c4353b34f38302 +size 90177536 diff --git a/params_shard_123.bin b/params_shard_123.bin new file mode 100644 index 0000000000000000000000000000000000000000..3fe4fc374f8e768c6136b9c6a198aa3b88b5521b --- /dev/null +++ b/params_shard_123.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba0174cf1d66e874b4d6bbf1269204264194aa3a91d220a02f95ddaf50a57cdc +size 180355072 diff --git a/params_shard_124.bin b/params_shard_124.bin new file mode 100644 index 0000000000000000000000000000000000000000..da7e34ed3ed31ab98505362840cbcc1e0ce1f72e --- /dev/null +++ b/params_shard_124.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:0a179a52c95d559659fa739ffff9285d903dad4226986fb6c97ef3c5cbefe36b +size 100663296 diff --git a/params_shard_125.bin b/params_shard_125.bin new file mode 100644 index 0000000000000000000000000000000000000000..f92124c395f800b0f7a6247a3822216212feeafb --- /dev/null +++ b/params_shard_125.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b3bc8a296b61991d9cbd38c3cbd73a9c4487f0a5ea79d80ca2e76099b18995a +size 33554432 diff --git a/params_shard_126.bin b/params_shard_126.bin new file mode 100644 index 0000000000000000000000000000000000000000..793223af41ba062205fbe932d38862aae62bc34c --- /dev/null +++ b/params_shard_126.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:101df9f32bda1183e231bbf3c66cbb75c9cabab026b1f5b70b838e11ba61bbe7 +size 90177536 diff --git a/params_shard_127.bin b/params_shard_127.bin new file mode 100644 index 0000000000000000000000000000000000000000..e6c325db402f977bac54367c3a5c036627343594 --- /dev/null +++ b/params_shard_127.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1b2cf3bc18b1b3b10ed38dbd63b96dc69642bb2c818e7ecf1b3adef965ef14 +size 180355072 diff --git a/params_shard_128.bin b/params_shard_128.bin new file mode 100644 index 0000000000000000000000000000000000000000..951ec6b5b5a0afd77cd1634ddf41e1f148f2fb6f --- /dev/null +++ b/params_shard_128.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a8c449ef64969cdff5b227b094453cdd89bf072d4558cc50bc02262de6269b1 +size 100663296 diff --git a/params_shard_129.bin b/params_shard_129.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7b7bf0b3df9b6e326015700d187bb2397095e72 --- /dev/null +++ b/params_shard_129.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:233859329abb82b91b2d136ada6408b3457c68be8738ce897fb28dde177d75c0 +size 33554432 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 
0000000000000000000000000000000000000000..56a27a0d75a8e9b4d9d605530090161bf9333d51 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c30f55b23c35339909a05e84e81d647349745699548e5398cddf5c1e78b44018 +size 90177536 diff --git a/params_shard_130.bin b/params_shard_130.bin new file mode 100644 index 0000000000000000000000000000000000000000..0c7a9b472e61df6246516d3845dbc8af21c11203 --- /dev/null +++ b/params_shard_130.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e72badbb388ddc64bcc3a01953c31a1cecd94b935d2e81af91ba6f3004d100 +size 532480 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..d2cc8fdf9f4e64c77b781c6324d1f47109f10787 --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f8e97361225cb7eef75abc3b5aa2b1448a7abb251b4e8ffdacb629c586019b3 +size 180355072 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ddbf3c1ec16433d8c988e97811eec752626d0ee --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b19b556335a9da15a2a162612a0fe2cead7de5b362757c9940206e9f657c6477 +size 100663296 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..5aaa492126e78906059525871b44622a68c0b0f1 --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:504b454188d9c8cbac43fd987bb4dcf34822a9597e88448773a98088c721b16a +size 33554432 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..844ea5cca57c6e55b7e42f0468c8cb243c4bae63 --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:fd17b844c66a49236004655ae05ed05c3473eaa54bdd2b2d5ce185b889d5a5af +size 90177536 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..5ac94e4c4625c141e29bd961c42abc57a1c5522d --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c359e0a679d5ac0729ff253ebc1429e2547bcff87d36f4665f3d9e23172e41 +size 180355072 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7e49ee182798607e55bd544b64ec9c9ffd33e7f --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8d53d0bd1f0616121e098b867a37564493f81435c07b5e4f86366c5642b0223 +size 100663296 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..afa1e40b9d8b03b6c45066bb1170fa776be4b2ab --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:011839723c3b711375f8e2be1be966e1d3d9548033113accb939e725dfbdebf9 +size 180355072 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a8720132ebb93880376f0c589dcc13709a51749 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf5ff1652f4deefe490d74518621ab0a9b57da3509a72b2afd3a759f29b4048e +size 33554432 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3949bcc0f4881b8cc118948956c6340c217c6af --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3927aba0e4ed33a4133a439c05bd9788d38f032199731337e8a20994e6280a9d +size 90177536 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 
0000000000000000000000000000000000000000..47e965eb001982e6170a63cd9bc108f80dc79ad6 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d08019da622618a2072689daf303b32cd9a276e86439f2df8817881bda18ebe3 +size 180355072 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..21760641a6dfb14d4d6b0eb9eb225e5d15d70723 --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d200a143cab80206dd9c6bca547f470022a7f2bcf90f9622fe80802b65eafc +size 100663296 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..c293cf2d85e7c66f6ede49edba0fdc398e621814 --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b68e7f1a584112bda4a5da607dea1c54f3d2f18bffaa223a23c144175d57603 +size 33554432 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..3e817b3dea8be3d01db413e87939b9794dea7609 --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4369ed4f605997d48d6e5418b054e0b98e92d1b96ad651612cd15b9fdedfe7e6 +size 90177536 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..5ec3c1b8bcf597ec844c187d3f4d1d25c2a22221 --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dff91789cc937d9b99271b9983f03a7ae8eb4945271658a017ca87ad0952019 +size 180355072 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..c3faf4dc9303d0f86d6ed120a21234f2491cc9ac --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:c39938cf0cb27c37569be749f720fd745a139722280c6ecef24e52349cce9d5d +size 100663296 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e40935e8e9fe3d3b864fdb3f1f83be57a84b80f --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef661785f31466265e36f35c999deec753dface919e5d9e42b31dea7d5d3c652 +size 33554432 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..bb4495da05ad153271d8713a9aa9b55fa13c4a0a --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a23a1bc7a4dec27105c6854db068d33a3bcd1aab0e8dc2e0aa3fb2df017602ed +size 90177536 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..46efc0ff20022c29405850d207bff1481a9de5be --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c4d3363e83ce7ab7d57e15e77c89dfe0bd307edd3592e622e088550d880c58 +size 100663296 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..135bcce3ece0e3bb608194e816dab6404787daab --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7c078e3019a8eefde4d547c5463193961969fc0baffadf994b06ed24975f27 +size 180355072 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..ebb632e2af1134ec907003ba7593a7b12153a058 --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99ab52720b2b374dae63007ad968787e6a1640916067b3540414c8f93e8344a +size 100663296 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 
0000000000000000000000000000000000000000..5faa9d0080da0c8bb188b1091dcc8a3dd935cfb0 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f702700ef450834d224bd891422298ba91dfa60fe325a1b34f0b381002b8ccc +size 33554432 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7af39a8549d3d36047f9b6cb77d80c0ab651db3 --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c3c19840933934181f202dc7e0aeedd397feb36a08eed3a5684c4bf6d82562 +size 262144000 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..43452951952d67c300fac72a66c459af9bcdbfdd --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1555499abf7b07920d76a6b2ac9dd0ec04ee7c3ff88a51477152e828d58f4b5 +size 90177536 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..737b627372d47ce5d637fcf5a7d84ec2baba319b --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbc2915844584c516262769d3ef1a0bc18c0933b1cba602ac34a0ccb8b0eabbd +size 180355072 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..d2f6ba0651b451c3d3b4528309dfcee06c771b13 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c6b9ef3cad97fd537528885a757ae5524a9891d9e7f61e3d8c408e2e8aeaaa9 +size 100663296 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..7ab3e4f32af61b074157f0912bec9784c0b564ac --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:14681ef3f712684900e49606bda9f8cf6ac8a1cbe5f612aebca05ab36dff11ad +size 33554432 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..a07780c6adde7a7228779e584efd03ed628436e5 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58791439e4c49ac4675bff9aed3b733097e88f8bead6abd5ea352de14b0a5134 +size 90177536 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..52edd9442c73f426eafb791985a7dc7882cca083 --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5256ca1b91a0a02ba19301ba41d64aadccd1485209ae02109398cbb4c448a5dd +size 180355072 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..f67e980e7288a80ecadde38927ced96dfd3bcd4d --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53565ea3bff3c13f7495e2b69f7c475702f2cfea494055a1ed8b0768808a971 +size 33554432 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..c15c09c252cb71f829bce31b191cd6748f79cde9 --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34cb66ebf18e02f328e454a8c30616ebb3e1c0e60869c7158d7b6865b3d169e +size 100663296 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..5bf6950ac66a052a4ac2bd6271508f0a7bbfedfe --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13ec0fddcf2d91d0cb9908deac1fc9561c56cbc4d78b75e197e2ca8852465a3c +size 33554432 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 
0000000000000000000000000000000000000000..0eb660bd7015fd2f74132b5dbb58c9182806bab3 --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370b6caf6e8329d4f1aaff753c458d47ad551abeecd0e4a581644d36b69fc5e1 +size 90177536 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..03cde5d85a2ec5e00f54a8dd57688af9b6018480 --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba89aca00e34546698a55774ab3e6a6ba4dacc1ac59270fbc762151b1847f0c +size 180355072 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..a9f992327155e5eb3bfe0477e47352d791a6aa75 --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:666130f78c2f600a9617af77fad3ca631dcfc78c57ced4b344c42612573e48fc +size 100663296 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..09269e57d9cb4b7035abb2b0ed48ab4849a53b2f --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f1d811a4ffa98a3701e98ec35c8db90c84e0854fb7e28000869d2e061a31e5 +size 33554432 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..69c121376b8808ca06e5eb3f8aea1b37949334e3 --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71c26fb80efa531f97881e31961882dd666b607decf0b53d91aca369413cd47 +size 90177536 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..34873e5b7f1797710b7748bc033c58be57236632 --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:f8537957583fc02c75a6b5b1dc9c14f292e24558fe5b501695fa10938962caa6 +size 180355072 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..a808b8e7d3b73821dbc8d84082609b50b2d7abf9 --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8671e1b45f3750dd60d78a2be9f2261f4f81d624b2d2809d5f291c8299f34b88 +size 100663296 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..1d25c22420e4e6877bc025c54032a8b35eedf8d3 --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb99aa47692d7da7a4aa775c3cd0716c301bb2094c17f98c04c126c4592fee7 +size 33554432 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..d19ec87e8eb8b28a385a4740e94613f243901e4b --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fe8953c099d75eeb99877724a30490650a074b445f9f74b0971a846fc33cbd5 +size 90177536 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..fbcc1d1ef46cc39c57916eb35928e8e327a03a2c --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cf530a405332880a731877e2f524f3eb206465cb62af6dc1542582d669bcaf5 +size 90177536 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..f82e3d488cf079f06fab0ba49c97311bf4759121 --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b8981aa870605639d051ce196d0fc140efffd68da208ca06c9346b7b9fd3a1 +size 180355072 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 
0000000000000000000000000000000000000000..7e7e1ad5cdc423b6577d983ba0608a6b46b6f229 --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8f4beb7bc076a080d48168b9d33b85c01bb9714c7347672286a298f2d3630d +size 100663296 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..30c6533cb6bdd82d5d7d5c15dcb7f58cb90b8add --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f5445f63c0185da6e5e274df0bb1ba3bf7a5104a4f8db18a69cf448f32a24f +size 33554432 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..769607e9463ac5ad213a06c8e90f660affe8a5de --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e2d9fd4018f903c62c7ebae7da29289a9696a77cfad191d1e7082a635af53b5 +size 90177536 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..3178df0c736459d391388b1d461b0821ab92ab79 --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ab7ae37755f9b7853d18cd073b69fa6d19e654d9e41816df715ef6e64c9f272 +size 180355072 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c7c7cba1b3725f4031ad5cc00b712743a1f16c1 --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9598aa83007d6ad89be0b2c34841b376b46a5f8f3f52159f1d15572f33b19fc6 +size 100663296 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..d81333ac57121ea284a4344a756008e8da68ab12 --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:fb5d47e54d30c4851972aca94630dc7adedc2d0334bed52ed21b54af01732560 +size 33554432 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..a61cbbe5ab60d3bfb8978016493b9133f067ca0b --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:633e9cde1d9a29d0fb56f54d7a16e603e39e244f2de3e7c13710b41cab4a5b49 +size 90177536 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..f5a1961fc1594d1716780bb50763edbb07e87d19 --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb12f574a0df906222b32453f791ca5647b10dca3d67efe71a2b0e6b778ed18 +size 180355072 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..11bd5969c910b7c29df4fb9649f926db4e676f2e --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcf1e5cf9396d2caecadda839e0cf0b449216e1784790d20a2e3dc5460a7e327 +size 180355072 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a81c3b9250c4ae38a718baeae7d5f75f8e08999 --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b6c3164f2c740a5255c1c9e87855f638d284826b84d832fadc3b205f2620a4d +size 100663296 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed2758795448a58651f2da7c5609f005d2c69fb9 --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff57fe3496b809a19d7070c3deb750a245d57188e301c1b0fb4a7c25397e5ce8 +size 33554432 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 
0000000000000000000000000000000000000000..38f702f14674300a28b511c090989d39b51421a5 --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed54fe0555efc09f721ae25e59f9b0a21d59e9ffda9fafede4cf145cebb6b022 +size 90177536 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..168dcf376fc732892906bf4dda3bf821271f2916 --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d163971d9704ef96fff10866dd65c8ac8b9a7a6d1cede83de89848323af36c +size 180355072 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b6262157adfa42fa7d9243e4997bf10154c1a7f --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e87bc5a93fd8a92419d1349181fbdc5d51ac870a04aec741c32fccb28efd7f9 +size 100663296 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..dad6358f04fe0fb8b57b9fd5c6f7761d5d1f80e3 --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3bcd24d4fdf2d7f4a4c4c55d2aefee354b7b30978aedae7a60676302c08af6 +size 33554432 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..4396ad81778d241a1053df4487c27d2dfbe09e16 --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e5cf19202057e547c811d7d52e98247c1139ec0533a24f145f83e02650b6f50 +size 90177536 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e1e1c5b71f523f9abac3fb8af0863ce74c300a9 --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:aaa34eabcc857b3aeb13ad5f6e5eec459a71b34b9e62aa52cd8f77617a9b1b3e +size 180355072 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..4f54f32126376a3f5b5cd1a9e408d62d9bce93e5 --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fbed30b5713a94278a45184621bdc339e693a8fd844912e2aa3ff34077451e0 +size 100663296 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8b4b9d561e926334563604627de15a0634714f3 --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118a63f95e5357b18d76f263082ffbf03ab84e749c37fa7bba46c5470d96d9bd +size 33554432 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..94077b857d6a8469cd782fffb0ead31ea4fc8067 --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cea9ab81368a4ba7ecb0061617ca557e53a13b6d06203c6a3aae04e83dc7da5 +size 100663296 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..46f4436f0c0671353012aaaf6f0fe13c996bcdb1 --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92890a3d5521936ef88d0eaac96de27dd6fe3205cf2504cab033ecbf16d08043 +size 90177536 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..d5414a0ad3fa8b51cbe6aa6267d8d3730fabaffe --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd0497c565ac84390f6e4a8973e8a6033851e0bfae19684cc4c23544b96379c6 +size 180355072 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 
0000000000000000000000000000000000000000..99a4363711e7e121e717556b63a2569d5378979c --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c292afcdb0751863f9e96c155a551b203105b839b9014c20706307361ba1a8 +size 100663296 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..a49bda4e9894cb87f0cb21926f4915d15ada9714 --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16403312775190bb6c3527bc00f6856c9092a913872575aafde096b5e8d0d791 +size 33554432 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..1532b803fd96bc3e7c9ad236f0af3c66f35785bd --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c16fb5baceb31462c4582fb51c7cf7121659512ca94f555949d281de1d2b48 +size 90177536 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..62decd5a9edc6fb9f222b31ffb6cb246c94506af --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9075f2442f7c876b236412734f960a1596300a07a35163f7aef1f375a1eccc37 +size 180355072 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..7c645aa68764526a8258ed056fedba6097c88e27 --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:603b28c35d8265cfdc904463e855d0fe8c1130bd122fd00c20225c60d3ea493b +size 100663296 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..d3c158637e0c1cd6e90054fbf0c629aa7fe3a77f --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:737ee65f606830f33615b02e5b03432126cf212d02a015e0159d2c8aa98e4b05 +size 33554432 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..314415435e0ce2cf64b890ff51e132fb07bb28b6 --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ccbe1ca3ed0fc96a16c6c2ff0d8fab951e5bfc416a2fb79ef81b1c0a0b22930 +size 90177536 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..41aead5c81b822d401fcee52df13a7efff5016f9 --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b836c548be0c33d13cfffcd2c5de392e576aab6fec8f201ef3e935b3c8580dd1 +size 180355072 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..56bb086f23ca01b40bd7f7675e055f5da0ed7bf4 --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf88bb2a5d221ab5920ee65c1f2b637e7e27b017631cbad64447578429adc1c +size 33554432 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..53607cce27491e614d81ede84ab64ab17eed6932 --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbdee7ab1fa860156222e272bd7e6c7800552dc0228806a05d4e82e3df4b358 +size 100663296 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..c668bd8f36f910e92036a17c57f4477a3f083e9b --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb6a0373d293de4e612e2f1be0fd76d7f05d1bcfd5c88ef76bafaf9b59b6b442 +size 33554432 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 
0000000000000000000000000000000000000000..62fe1cf6ebe1a0bbdfce892e638847c2f3ade366 --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b2aee72b43b73a1732d13245013364fb756b2543176a1e4f3ad25cdbca15861 +size 90177536 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..e9cd02e2a32b4e5b044816535a1c6801681c623c --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dd763e14d356fb6c7bb7396efaca3a3ffb9837523dad9fbcaaa9906bb4c664e +size 180355072 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..aecca46937646643eb3e2ec8647156098bd47952 --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61ead0fc1b16ba4aa2efd1556da2b3e4d846277b3450d1f9f7c9d15fb186d63 +size 100663296 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..bf3ec5f86c4343914e82b3d9779d6a04a822be2a --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40b7dd4389193610ede390c5fe1855f743e591fd8deea7a71bed5848cc3cf812 +size 33554432 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb536a749d6fec1c2fde425a9c88e15842638c58 --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd735190110f7e58b4545e4fbe1766db557ed3dd46899966b7772cef9313d66 +size 90177536 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..2f46ecba27a8357d905b2053de7022a745366e3a --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:f68defa085297e3f2e9ad35770bc80eb86395ece21d4e1e743cd6ab52d2b358c +size 180355072 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..e4bea01261ba54b6bf15ddf5bd1a2996418a81b1 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd380cd3f1b6aa989da8c8e6074bc8faa6ab19c5bc52f047790644bfbdb6c660 +size 100663296 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0a03b5b045284a5f20df47803c5888c7f57c4ff --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d5d6c8c0c6329080a53f636c0368dd3ef8f739f1f5cc4310466047954893eeb +size 33554432 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..10b51132d7f119dd1c83cd115ce202256a6a5099 --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35745c928a375d0da0e755c006ca5e06013856c478ea8172f0cdbf4f683a6db9 +size 90177536 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..0fdf2d90ff7c7041f60c71f84e927b493f8ff2bd --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c4fd07f9b2de463da7c2177d65426a7523e4befc69324d5173adc7c46f00d9c +size 90177536 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..3615d52f97def6f4b1e29ec4ee3358af37e263fb --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18c99688656a8f9c4a443f97efca4da5ab9564131e2fef1b056bb31bda68162c +size 180355072 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 
0000000000000000000000000000000000000000..b255ca9e140bb212aaac719775724ae85c940aec --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:488620c26440685157a28c5e57e6d9082ac42bde65c5fd7f66071820457170e4 +size 100663296 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..9f41baaf8cc338caa2bcdc5d816916131e42cbb7 --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d1daec2fede3e67fdcb036d9861411263e2c47da94b2edc9f4db912275f7d42 +size 33554432 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..88ab72c6d8c18f1bea7ca53cf37b9c1df0511e7b --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02c338ae0311972fcf3b04fb529efed4b749de1dc8ced9a616034fe6c7305a49 +size 90177536 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..00bf489bae7d1d7e5f088c812a5f3985f884924c --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f89344d8c894239a6706a397a2305c80c41016a2b6f47eddd83c7e6b00f3b77 +size 180355072 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..650d04274286c6f8c2810d6c7ecde73d29bf0663 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:858aeee814fcdf94d0ef6c41dcae0850a01ae75e2bd8107104f36f537b2ab861 +size 100663296 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..c030a9188b84bd8172ed5095afbd95b50595b132 --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:0de2921c59ec3be9c323f915f7356e2ede360747506ca0eea6edf1f2e6b0d1dd +size 33554432 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..328f7d4bc3bf052be488e6c8dae10fe391dd0cff --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e5c955aa5b0f5236fcd0d66676bd6d8f7340198e79314100d7a6e3b5422314 +size 90177536 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..3297069e86ea4e28cc041a799d197f00cd0f559e --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:245f9b4c2177e5db97c96fcbc139940bde2fbdbe08a4cc1892eed543976b33f2 +size 180355072 diff --git a/tokenizer.model b/tokenizer.model new file mode 100644 index 0000000000000000000000000000000000000000..6c00c742ce03c627d6cd5b795984876fa49fa899 --- /dev/null +++ b/tokenizer.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347 +size 499723 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3723b3a4b003856238795c1d3b29f10fd21114e8 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,34 @@ +{ + "add_bos_token": true, + "add_eos_token": false, + "bos_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "clean_up_tokenization_spaces": false, + "eos_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "model_max_length": 512, + "pad_token": null, + "padding_side": "right", + "sp_model_kwargs": {}, + "tokenizer_class": "LlamaTokenizer", + "unk_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": 
true, + "rstrip": false, + "single_word": false + } +}