Sicong committed on
Commit
0286882
1 Parent(s): fdd2807

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. checkpoint-3089/added_tokens.json +16 -0
  3. checkpoint-3089/chat_template.json +3 -0
  4. checkpoint-3089/config.json +48 -0
  5. checkpoint-3089/generation_config.json +13 -0
  6. checkpoint-3089/global_step3089/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  7. checkpoint-3089/global_step3089/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  8. checkpoint-3089/global_step3089/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  9. checkpoint-3089/global_step3089/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  10. checkpoint-3089/global_step3089/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  11. checkpoint-3089/global_step3089/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  12. checkpoint-3089/global_step3089/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  13. checkpoint-3089/global_step3089/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  14. checkpoint-3089/global_step3089/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  15. checkpoint-3089/global_step3089/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  16. checkpoint-3089/global_step3089/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  17. checkpoint-3089/global_step3089/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  18. checkpoint-3089/global_step3089/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  19. checkpoint-3089/global_step3089/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  20. checkpoint-3089/global_step3089/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  21. checkpoint-3089/global_step3089/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  22. checkpoint-3089/global_step3089/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  23. checkpoint-3089/global_step3089/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  24. checkpoint-3089/global_step3089/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  25. checkpoint-3089/global_step3089/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  26. checkpoint-3089/global_step3089/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  27. checkpoint-3089/global_step3089/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  28. checkpoint-3089/global_step3089/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  29. checkpoint-3089/global_step3089/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
  30. checkpoint-3089/global_step3089/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
  31. checkpoint-3089/global_step3089/zero_pp_rank_10_mp_rank_00_model_states.pt +3 -0
  32. checkpoint-3089/global_step3089/zero_pp_rank_11_mp_rank_00_model_states.pt +3 -0
  33. checkpoint-3089/global_step3089/zero_pp_rank_12_mp_rank_00_model_states.pt +3 -0
  34. checkpoint-3089/global_step3089/zero_pp_rank_13_mp_rank_00_model_states.pt +3 -0
  35. checkpoint-3089/global_step3089/zero_pp_rank_14_mp_rank_00_model_states.pt +3 -0
  36. checkpoint-3089/global_step3089/zero_pp_rank_15_mp_rank_00_model_states.pt +3 -0
  37. checkpoint-3089/global_step3089/zero_pp_rank_16_mp_rank_00_model_states.pt +3 -0
  38. checkpoint-3089/global_step3089/zero_pp_rank_17_mp_rank_00_model_states.pt +3 -0
  39. checkpoint-3089/global_step3089/zero_pp_rank_18_mp_rank_00_model_states.pt +3 -0
  40. checkpoint-3089/global_step3089/zero_pp_rank_19_mp_rank_00_model_states.pt +3 -0
  41. checkpoint-3089/global_step3089/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
  42. checkpoint-3089/global_step3089/zero_pp_rank_20_mp_rank_00_model_states.pt +3 -0
  43. checkpoint-3089/global_step3089/zero_pp_rank_21_mp_rank_00_model_states.pt +3 -0
  44. checkpoint-3089/global_step3089/zero_pp_rank_22_mp_rank_00_model_states.pt +3 -0
  45. checkpoint-3089/global_step3089/zero_pp_rank_23_mp_rank_00_model_states.pt +3 -0
  46. checkpoint-3089/global_step3089/zero_pp_rank_24_mp_rank_00_model_states.pt +3 -0
  47. checkpoint-3089/global_step3089/zero_pp_rank_25_mp_rank_00_model_states.pt +3 -0
  48. checkpoint-3089/global_step3089/zero_pp_rank_26_mp_rank_00_model_states.pt +3 -0
  49. checkpoint-3089/global_step3089/zero_pp_rank_27_mp_rank_00_model_states.pt +3 -0
  50. checkpoint-3089/global_step3089/zero_pp_rank_28_mp_rank_00_model_states.pt +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
checkpoint-3089/added_tokens.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<|box_end|>": 151649,
3
+ "<|box_start|>": 151648,
4
+ "<|endoftext|>": 151643,
5
+ "<|im_end|>": 151645,
6
+ "<|im_start|>": 151644,
7
+ "<|image_pad|>": 151655,
8
+ "<|object_ref_end|>": 151647,
9
+ "<|object_ref_start|>": 151646,
10
+ "<|quad_end|>": 151651,
11
+ "<|quad_start|>": 151650,
12
+ "<|video_pad|>": 151656,
13
+ "<|vision_end|>": 151653,
14
+ "<|vision_pad|>": 151654,
15
+ "<|vision_start|>": 151652
16
+ }
checkpoint-3089/chat_template.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}"
3
+ }
checkpoint-3089/config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/mnt/zhangh/sicong/vl3_data/checkpoints/Qwen/Qwen2-VL-72B-Instruct",
3
+ "architectures": [
4
+ "Qwen2VLForConditionalGeneration"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 151643,
8
+ "eos_token_id": 151645,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 8192,
11
+ "image_token_id": 151655,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 29568,
14
+ "max_position_embeddings": 32768,
15
+ "max_window_layers": 80,
16
+ "model_type": "qwen2_vl",
17
+ "num_attention_heads": 64,
18
+ "num_hidden_layers": 80,
19
+ "num_key_value_heads": 8,
20
+ "rms_norm_eps": 1e-06,
21
+ "rope_scaling": {
22
+ "mrope_section": [
23
+ 16,
24
+ 24,
25
+ 24
26
+ ],
27
+ "rope_type": "default",
28
+ "type": "default"
29
+ },
30
+ "rope_theta": 1000000.0,
31
+ "sliding_window": 32768,
32
+ "tie_word_embeddings": false,
33
+ "torch_dtype": "bfloat16",
34
+ "transformers_version": "4.46.0",
35
+ "use_cache": false,
36
+ "use_sliding_window": false,
37
+ "video_token_id": 151656,
38
+ "vision_config": {
39
+ "hidden_size": 8192,
40
+ "in_chans": 3,
41
+ "model_type": "qwen2_vl",
42
+ "spatial_patch_size": 14
43
+ },
44
+ "vision_end_token_id": 151653,
45
+ "vision_start_token_id": 151652,
46
+ "vision_token_id": 151654,
47
+ "vocab_size": 152064
48
+ }
checkpoint-3089/generation_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 151643,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "pad_token_id": 151643,
9
+ "repetition_penalty": 1.05,
10
+ "top_k": 1,
11
+ "top_p": 0.001,
12
+ "transformers_version": "4.46.0"
13
+ }
checkpoint-3089/global_step3089/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b74c42e7ea4b6175a9cacb2af02d490f21c0d6a4ef917fbdb498207cd242c17f
3
+ size 27264836613
checkpoint-3089/global_step3089/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94b1c06bc39ee68cdfd447860c5447517e7ed3ce3ffda02f376dc7ed86cd903d
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:182c60968bc63cbc2f4e556c094ea8ebdb3787c0985fbf32bba64158dfabc315
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:602212bb21ec0a6e3985e22f1eb677d81dc2832a5bb5196c064e93fb3839737c
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8150d2c767c89a508c0d1437fa16a3b793fab45a094c20e2b7cb3b992eba1fce
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c94d37843bd35fa32dd0b6a665c8ba02f9b0b2601c53f020418b1b8c0a6d024
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afde019ed997233283ad9fa58c49c1b98dcf9226a84abb98db1c98e87455d4e9
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2eb4feab6c7de8c02204018fe7165c1f49304c5fda2597a5a6fdd8e0b1cb7a4
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8deea3483e3f2915524c7fd560f2ccd0dd5e99888cc3913b9f237d333a6c9477
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23dc44fd91db4b4eda35a39c182d36cd6906990710a1fa49b66aeafe25a477e1
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2be661dc9b2f52311f5160ba46c22065f2f1d7cea2f2711f772fd32e4b16e197
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce85374e7f0ad09e0edeef2cd799910403a43713a875754bf9df1a9229525db2
3
+ size 27264836613
checkpoint-3089/global_step3089/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0916a4c275b848b60cd1e2a5e707070e8f6d02d84d34d7b095a3fefa254d155b
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47a05db28f09c2c9b906f87204a134b5c122530d86b66a28b9a26ea7ac9a5586
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dce80fe8ead43f369cc44a6a2da7ae34b20d1238f6c459b28275141b3138468
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3fc9427958978403e1eee704f3f457166bd590ac09c3eee222957fc335739b3
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec4c0adf86323727cef8a6b5abb7a900729468d923a2d02bc3ffb1ce6c4f83db
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f8505eea21182353881ecb725bf3443f6d8277cee487e0e41a86875dc705730
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9eae8cbd49907270a5318fb835a05aae09200cbd010e995e74401731e08f0100
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af11bc8b1fef1735cc54e7663027c60f1a84f2498ee87fd2613f0660caf8113e
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d50e5beaae6db356a582001017de453042971cf742326d8991b66185478009ac
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea2ce6b6fe2bacd2eb297e3bdeb8458ccfd99451d81af3c28636b5de655a618c
3
+ size 27264836613
checkpoint-3089/global_step3089/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60c80fec92595cc2cbb01addf68d1410e5030f9fadf63e1a93010d039dab1f56
3
+ size 27264836627
checkpoint-3089/global_step3089/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32ad50265818b99b1650cf20aa996667865eafa5679ce02d715bcd903b19f427
3
+ size 27264836627
checkpoint-3089/global_step3089/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f67e73100a501e744816dedd91363c7ef3a91e8a63926a1718a934509426ec2a
3
+ size 44479125
checkpoint-3089/global_step3089/zero_pp_rank_10_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4949cb36da9de6730c2963d265bb269a7300fdedf3fe0eca0e679ec0a5842fe
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_11_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:205cfc80c041e320fc10114a1864b46073ec5169bc55fc445105fa8ac56b8b42
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_12_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3e88b556feb2e14a40e17d67aee1bb21627cdd6503f7c3796f0f1fd165026fd
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_13_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfc447884899fc790409fee53f929270a80b7e5cb41d2613d5830ef1a42a8503
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_14_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75548c107a86947223f47bb79905593b78af37f5b1f26cbb8e8091b623f68986
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_15_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35beeb31e51e25c92750a50a58e7e4efa3c918b88352a43799103c78aa9741a2
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_16_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d029525775db18eef57ba621c53c9371302ae5af44dd2a0623da19cb0e56b67e
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_17_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d1eda5dda07e43dc88ba7d3708c5b15c5a67fa852c0672e1f91c20854d653b7
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_18_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd3d9abd1d2bdbef38268477f97ae20e67ba7745924869d2dab99a59f6167044
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_19_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1e129bf09995bbccdc1f17d0a36e6213fd21cecb83caa7a9185dfe2b8e3786f
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:401934dc0b03259d660d4ffbcbd24ba315f5d64dcb129e53eb4740c1812c253d
3
+ size 44479125
checkpoint-3089/global_step3089/zero_pp_rank_20_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:042e7168cb438ae5e8aae33df28bd3885dc606cc0add51c46ef26f2a1f14c08b
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_21_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3fadba113c5bc3612f6012e58a80c191b62494cb2f55eb524bb4f6c367e3896
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_22_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:734c830b3d8a2ebe32a5bdb46058d832115f207d98b1301424770a8da417d904
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_23_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58564cf279f7cafce29fb27c296d354367c170124de1f441b41e3df12a752b7d
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_24_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9b0579ef1c1ff0be1570182ba2688ec97b5490c1d8c8edd3a7a050bf87c131a
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_25_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eeb1f340faf3d94c96b5580620a4edd201f1fbd90c0c0c1d6f1c052fa633870
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_26_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3d26192abde532484ccda2438bbcf7beb88c942713ead91c7d8c8ace237587c
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_27_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d4f4ac01bd15d27b5a89396bedb9fd0b388d2e5504375244bcb5aaa20834ad3
3
+ size 44480936
checkpoint-3089/global_step3089/zero_pp_rank_28_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd84b6d2aa70b74ba35e0c25576a7f6fc51c77ac95b01b5a1bb9bcdbfd9f902e
3
+ size 44480936