Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- checkpoint-3089/added_tokens.json +16 -0
- checkpoint-3089/chat_template.json +3 -0
- checkpoint-3089/config.json +48 -0
- checkpoint-3089/generation_config.json +13 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
- checkpoint-3089/global_step3089/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
checkpoint-3089/added_tokens.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|box_end|>": 151649,
|
3 |
+
"<|box_start|>": 151648,
|
4 |
+
"<|endoftext|>": 151643,
|
5 |
+
"<|im_end|>": 151645,
|
6 |
+
"<|im_start|>": 151644,
|
7 |
+
"<|image_pad|>": 151655,
|
8 |
+
"<|object_ref_end|>": 151647,
|
9 |
+
"<|object_ref_start|>": 151646,
|
10 |
+
"<|quad_end|>": 151651,
|
11 |
+
"<|quad_start|>": 151650,
|
12 |
+
"<|video_pad|>": 151656,
|
13 |
+
"<|vision_end|>": 151653,
|
14 |
+
"<|vision_pad|>": 151654,
|
15 |
+
"<|vision_start|>": 151652
|
16 |
+
}
|
checkpoint-3089/chat_template.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}"
|
3 |
+
}
|
checkpoint-3089/config.json
ADDED
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/mnt/zhangh/sicong/vl3_data/checkpoints/Qwen/Qwen2-VL-72B-Instruct",
|
3 |
+
"architectures": [
|
4 |
+
"Qwen2VLForConditionalGeneration"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"eos_token_id": 151645,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 8192,
|
11 |
+
"image_token_id": 151655,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 29568,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"max_window_layers": 80,
|
16 |
+
"model_type": "qwen2_vl",
|
17 |
+
"num_attention_heads": 64,
|
18 |
+
"num_hidden_layers": 80,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"rms_norm_eps": 1e-06,
|
21 |
+
"rope_scaling": {
|
22 |
+
"mrope_section": [
|
23 |
+
16,
|
24 |
+
24,
|
25 |
+
24
|
26 |
+
],
|
27 |
+
"rope_type": "default",
|
28 |
+
"type": "default"
|
29 |
+
},
|
30 |
+
"rope_theta": 1000000.0,
|
31 |
+
"sliding_window": 32768,
|
32 |
+
"tie_word_embeddings": false,
|
33 |
+
"torch_dtype": "bfloat16",
|
34 |
+
"transformers_version": "4.46.0",
|
35 |
+
"use_cache": false,
|
36 |
+
"use_sliding_window": false,
|
37 |
+
"video_token_id": 151656,
|
38 |
+
"vision_config": {
|
39 |
+
"hidden_size": 8192,
|
40 |
+
"in_chans": 3,
|
41 |
+
"model_type": "qwen2_vl",
|
42 |
+
"spatial_patch_size": 14
|
43 |
+
},
|
44 |
+
"vision_end_token_id": 151653,
|
45 |
+
"vision_start_token_id": 151652,
|
46 |
+
"vision_token_id": 151654,
|
47 |
+
"vocab_size": 152064
|
48 |
+
}
|
checkpoint-3089/generation_config.json
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 151643,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
151645,
|
6 |
+
151643
|
7 |
+
],
|
8 |
+
"pad_token_id": 151643,
|
9 |
+
"repetition_penalty": 1.05,
|
10 |
+
"top_k": 1,
|
11 |
+
"top_p": 0.001,
|
12 |
+
"transformers_version": "4.46.0"
|
13 |
+
}
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b74c42e7ea4b6175a9cacb2af02d490f21c0d6a4ef917fbdb498207cd242c17f
|
3 |
+
size 27264836613
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94b1c06bc39ee68cdfd447860c5447517e7ed3ce3ffda02f376dc7ed86cd903d
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:182c60968bc63cbc2f4e556c094ea8ebdb3787c0985fbf32bba64158dfabc315
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:602212bb21ec0a6e3985e22f1eb677d81dc2832a5bb5196c064e93fb3839737c
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8150d2c767c89a508c0d1437fa16a3b793fab45a094c20e2b7cb3b992eba1fce
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c94d37843bd35fa32dd0b6a665c8ba02f9b0b2601c53f020418b1b8c0a6d024
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afde019ed997233283ad9fa58c49c1b98dcf9226a84abb98db1c98e87455d4e9
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2eb4feab6c7de8c02204018fe7165c1f49304c5fda2597a5a6fdd8e0b1cb7a4
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8deea3483e3f2915524c7fd560f2ccd0dd5e99888cc3913b9f237d333a6c9477
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23dc44fd91db4b4eda35a39c182d36cd6906990710a1fa49b66aeafe25a477e1
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2be661dc9b2f52311f5160ba46c22065f2f1d7cea2f2711f772fd32e4b16e197
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce85374e7f0ad09e0edeef2cd799910403a43713a875754bf9df1a9229525db2
|
3 |
+
size 27264836613
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0916a4c275b848b60cd1e2a5e707070e8f6d02d84d34d7b095a3fefa254d155b
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47a05db28f09c2c9b906f87204a134b5c122530d86b66a28b9a26ea7ac9a5586
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dce80fe8ead43f369cc44a6a2da7ae34b20d1238f6c459b28275141b3138468
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3fc9427958978403e1eee704f3f457166bd590ac09c3eee222957fc335739b3
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec4c0adf86323727cef8a6b5abb7a900729468d923a2d02bc3ffb1ce6c4f83db
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f8505eea21182353881ecb725bf3443f6d8277cee487e0e41a86875dc705730
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9eae8cbd49907270a5318fb835a05aae09200cbd010e995e74401731e08f0100
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af11bc8b1fef1735cc54e7663027c60f1a84f2498ee87fd2613f0660caf8113e
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d50e5beaae6db356a582001017de453042971cf742326d8991b66185478009ac
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea2ce6b6fe2bacd2eb297e3bdeb8458ccfd99451d81af3c28636b5de655a618c
|
3 |
+
size 27264836613
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60c80fec92595cc2cbb01addf68d1410e5030f9fadf63e1a93010d039dab1f56
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32ad50265818b99b1650cf20aa996667865eafa5679ce02d715bcd903b19f427
|
3 |
+
size 27264836627
|
checkpoint-3089/global_step3089/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f67e73100a501e744816dedd91363c7ef3a91e8a63926a1718a934509426ec2a
|
3 |
+
size 44479125
|
checkpoint-3089/global_step3089/zero_pp_rank_10_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4949cb36da9de6730c2963d265bb269a7300fdedf3fe0eca0e679ec0a5842fe
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_11_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:205cfc80c041e320fc10114a1864b46073ec5169bc55fc445105fa8ac56b8b42
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_12_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3e88b556feb2e14a40e17d67aee1bb21627cdd6503f7c3796f0f1fd165026fd
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_13_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfc447884899fc790409fee53f929270a80b7e5cb41d2613d5830ef1a42a8503
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_14_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75548c107a86947223f47bb79905593b78af37f5b1f26cbb8e8091b623f68986
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_15_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35beeb31e51e25c92750a50a58e7e4efa3c918b88352a43799103c78aa9741a2
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_16_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d029525775db18eef57ba621c53c9371302ae5af44dd2a0623da19cb0e56b67e
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_17_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d1eda5dda07e43dc88ba7d3708c5b15c5a67fa852c0672e1f91c20854d653b7
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_18_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd3d9abd1d2bdbef38268477f97ae20e67ba7745924869d2dab99a59f6167044
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_19_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1e129bf09995bbccdc1f17d0a36e6213fd21cecb83caa7a9185dfe2b8e3786f
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:401934dc0b03259d660d4ffbcbd24ba315f5d64dcb129e53eb4740c1812c253d
|
3 |
+
size 44479125
|
checkpoint-3089/global_step3089/zero_pp_rank_20_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:042e7168cb438ae5e8aae33df28bd3885dc606cc0add51c46ef26f2a1f14c08b
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_21_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3fadba113c5bc3612f6012e58a80c191b62494cb2f55eb524bb4f6c367e3896
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_22_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:734c830b3d8a2ebe32a5bdb46058d832115f207d98b1301424770a8da417d904
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_23_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58564cf279f7cafce29fb27c296d354367c170124de1f441b41e3df12a752b7d
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_24_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9b0579ef1c1ff0be1570182ba2688ec97b5490c1d8c8edd3a7a050bf87c131a
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_25_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5eeb1f340faf3d94c96b5580620a4edd201f1fbd90c0c0c1d6f1c052fa633870
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_26_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3d26192abde532484ccda2438bbcf7beb88c942713ead91c7d8c8ace237587c
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_27_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d4f4ac01bd15d27b5a89396bedb9fd0b388d2e5504375244bcb5aaa20834ad3
|
3 |
+
size 44480936
|
checkpoint-3089/global_step3089/zero_pp_rank_28_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd84b6d2aa70b74ba35e0c25576a7f6fc51c77ac95b01b5a1bb9bcdbfd9f902e
|
3 |
+
size 44480936
|