Add checkpoint files
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- added_tokens.json +6 -0
- config.json +221 -0
- generation_config.json +14 -0
- global_step65000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt +3 -0
- global_step65000/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt +3 -0
added_tokens.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<image>": 151646,
|
3 |
+
"<|endoftext|>": 151643,
|
4 |
+
"<|im_end|>": 151645,
|
5 |
+
"<|im_start|>": 151644
|
6 |
+
}
|
config.json
ADDED
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "lmms-lab/llava-onevision-qwen2-7b-ov",
|
3 |
+
"add_faster_video": false,
|
4 |
+
"add_time_instruction": false,
|
5 |
+
"architectures": [
|
6 |
+
"LlavaQwenForCausalLM"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"bos_token_id": 151643,
|
10 |
+
"eos_token_id": 151645,
|
11 |
+
"faster_token_stride": 10,
|
12 |
+
"force_sample": false,
|
13 |
+
"hidden_act": "silu",
|
14 |
+
"hidden_size": 3584,
|
15 |
+
"ignore_index": -100,
|
16 |
+
"image_aspect_ratio": "anyres_max_9",
|
17 |
+
"image_crop_resolution": null,
|
18 |
+
"image_grid_pinpoints": [
|
19 |
+
[
|
20 |
+
384,
|
21 |
+
384
|
22 |
+
],
|
23 |
+
[
|
24 |
+
384,
|
25 |
+
768
|
26 |
+
],
|
27 |
+
[
|
28 |
+
384,
|
29 |
+
1152
|
30 |
+
],
|
31 |
+
[
|
32 |
+
384,
|
33 |
+
1536
|
34 |
+
],
|
35 |
+
[
|
36 |
+
384,
|
37 |
+
1920
|
38 |
+
],
|
39 |
+
[
|
40 |
+
384,
|
41 |
+
2304
|
42 |
+
],
|
43 |
+
[
|
44 |
+
768,
|
45 |
+
384
|
46 |
+
],
|
47 |
+
[
|
48 |
+
768,
|
49 |
+
768
|
50 |
+
],
|
51 |
+
[
|
52 |
+
768,
|
53 |
+
1152
|
54 |
+
],
|
55 |
+
[
|
56 |
+
768,
|
57 |
+
1536
|
58 |
+
],
|
59 |
+
[
|
60 |
+
768,
|
61 |
+
1920
|
62 |
+
],
|
63 |
+
[
|
64 |
+
768,
|
65 |
+
2304
|
66 |
+
],
|
67 |
+
[
|
68 |
+
1152,
|
69 |
+
384
|
70 |
+
],
|
71 |
+
[
|
72 |
+
1152,
|
73 |
+
768
|
74 |
+
],
|
75 |
+
[
|
76 |
+
1152,
|
77 |
+
1152
|
78 |
+
],
|
79 |
+
[
|
80 |
+
1152,
|
81 |
+
1536
|
82 |
+
],
|
83 |
+
[
|
84 |
+
1152,
|
85 |
+
1920
|
86 |
+
],
|
87 |
+
[
|
88 |
+
1152,
|
89 |
+
2304
|
90 |
+
],
|
91 |
+
[
|
92 |
+
1536,
|
93 |
+
384
|
94 |
+
],
|
95 |
+
[
|
96 |
+
1536,
|
97 |
+
768
|
98 |
+
],
|
99 |
+
[
|
100 |
+
1536,
|
101 |
+
1152
|
102 |
+
],
|
103 |
+
[
|
104 |
+
1536,
|
105 |
+
1536
|
106 |
+
],
|
107 |
+
[
|
108 |
+
1536,
|
109 |
+
1920
|
110 |
+
],
|
111 |
+
[
|
112 |
+
1536,
|
113 |
+
2304
|
114 |
+
],
|
115 |
+
[
|
116 |
+
1920,
|
117 |
+
384
|
118 |
+
],
|
119 |
+
[
|
120 |
+
1920,
|
121 |
+
768
|
122 |
+
],
|
123 |
+
[
|
124 |
+
1920,
|
125 |
+
1152
|
126 |
+
],
|
127 |
+
[
|
128 |
+
1920,
|
129 |
+
1536
|
130 |
+
],
|
131 |
+
[
|
132 |
+
1920,
|
133 |
+
1920
|
134 |
+
],
|
135 |
+
[
|
136 |
+
1920,
|
137 |
+
2304
|
138 |
+
],
|
139 |
+
[
|
140 |
+
2304,
|
141 |
+
384
|
142 |
+
],
|
143 |
+
[
|
144 |
+
2304,
|
145 |
+
768
|
146 |
+
],
|
147 |
+
[
|
148 |
+
2304,
|
149 |
+
1152
|
150 |
+
],
|
151 |
+
[
|
152 |
+
2304,
|
153 |
+
1536
|
154 |
+
],
|
155 |
+
[
|
156 |
+
2304,
|
157 |
+
1920
|
158 |
+
],
|
159 |
+
[
|
160 |
+
2304,
|
161 |
+
2304
|
162 |
+
]
|
163 |
+
],
|
164 |
+
"image_split_resolution": null,
|
165 |
+
"image_token_index": 151646,
|
166 |
+
"initializer_range": 0.02,
|
167 |
+
"intermediate_size": 18944,
|
168 |
+
"max_position_embeddings": 32768,
|
169 |
+
"max_window_layers": 28,
|
170 |
+
"mm_hidden_size": 1152,
|
171 |
+
"mm_newline_position": "grid",
|
172 |
+
"mm_patch_merge_type": "spatial_unpad",
|
173 |
+
"mm_projector_lr": null,
|
174 |
+
"mm_projector_type": "mlp2x_gelu",
|
175 |
+
"mm_resampler_type": null,
|
176 |
+
"mm_spatial_pool_mode": "bilinear",
|
177 |
+
"mm_spatial_pool_stride": null,
|
178 |
+
"mm_tunable_parts": "mm_vision_tower,mm_mlp_adapter,mm_language_model",
|
179 |
+
"mm_use_im_patch_token": false,
|
180 |
+
"mm_use_im_start_end": false,
|
181 |
+
"mm_vision_select_feature": "patch",
|
182 |
+
"mm_vision_select_layer": -2,
|
183 |
+
"mm_vision_tower": "google/siglip-so400m-patch14-384",
|
184 |
+
"mm_vision_tower_lr": 2e-06,
|
185 |
+
"model_type": "llava",
|
186 |
+
"num_attention_heads": 28,
|
187 |
+
"num_hidden_layers": 28,
|
188 |
+
"num_key_value_heads": 4,
|
189 |
+
"pos_skipping_range": 4096,
|
190 |
+
"projector_hidden_act": "gelu",
|
191 |
+
"rms_norm_eps": 1e-06,
|
192 |
+
"rope_scaling": null,
|
193 |
+
"rope_theta": 1000000.0,
|
194 |
+
"sliding_window": 131072,
|
195 |
+
"text_config": {
|
196 |
+
"model_type": "llama"
|
197 |
+
},
|
198 |
+
"tie_word_embeddings": false,
|
199 |
+
"tokenizer_model_max_length": 32768,
|
200 |
+
"tokenizer_padding_side": "right",
|
201 |
+
"torch_dtype": "bfloat16",
|
202 |
+
"transformers_version": "4.40.0.dev0",
|
203 |
+
"use_cache": false,
|
204 |
+
"use_mm_proj": true,
|
205 |
+
"use_pos_skipping": false,
|
206 |
+
"use_sliding_window": false,
|
207 |
+
"vision_config": {
|
208 |
+
"hidden_size": 1024,
|
209 |
+
"image_size": 336,
|
210 |
+
"intermediate_size": 4096,
|
211 |
+
"model_type": "clip_vision_model",
|
212 |
+
"num_attention_heads": 16,
|
213 |
+
"num_hidden_layers": 24,
|
214 |
+
"patch_size": 14,
|
215 |
+
"projection_dim": 768,
|
216 |
+
"vocab_size": 32000
|
217 |
+
},
|
218 |
+
"vision_feature_layer": -2,
|
219 |
+
"vision_feature_select_strategy": "default",
|
220 |
+
"vision_tower_pretrained": null
|
221 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 151643,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
151645,
|
6 |
+
151643
|
7 |
+
],
|
8 |
+
"pad_token_id": 151643,
|
9 |
+
"repetition_penalty": 1.05,
|
10 |
+
"temperature": 0.7,
|
11 |
+
"top_k": 20,
|
12 |
+
"top_p": 0.8,
|
13 |
+
"transformers_version": "4.40.0.dev0"
|
14 |
+
}
|
global_step65000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ef15ab84cba861b84dd32cf0f3447560f4d0521f87c7049095ee772bd7773da
|
3 |
+
size 1003797456
|
global_step65000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee2d499050b7d42935db74523b95bfdeb8505887330a705912ef907ca7e17902
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f39c19fa07f0462a0a2a634d21c18f272d1f42b98e279f0b2486c1fdf517ebc
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2200217a27e3cc19fe821db196100cbcd863e247e42044a7bd8c23fc014e38f2
|
3 |
+
size 1003798103
|
global_step65000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e1bcbbcd53bdfaf20879904e08c6da87adec2d89b718728e283c9dd389675bf
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a687875aef692ef9f39047e1e9ecaf4dcb8d607d65261935287fb5bdb36c44b
|
3 |
+
size 1003797719
|
global_step65000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93e61ea6336dfa48bae0f9bdb224adeecc653c3c51a16e830fdb120b8bcb8d56
|
3 |
+
size 1003797911
|
global_step65000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7647ad46212f0836d2d70bbe26476ed151de13114f9f97967162fdeee2c06f6
|
3 |
+
size 1003797527
|
global_step65000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac7a17cb115dee35d5ec3668989d8b7b65e384c1a4f756aa05ae0fd80075ad64
|
3 |
+
size 1003798039
|
global_step65000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dee4c1ee72574fcbef7907fefba77f1962e9f902aa9f263b90f061114a27307e
|
3 |
+
size 1003797527
|
global_step65000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0de39c3cd213abd7b9b10f1a8ca3af4fe91f03451b4f702c97a08036d926e68f
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae23d16ed5b8d73518ec8a77cebb9d1c0f9912df253b9c0251061021a78832eb
|
3 |
+
size 1003797392
|
global_step65000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72377f9e3de31c366c9dfe6e12f6b18fa0f0e8b5cb079a099d7aceb3856ae7ab
|
3 |
+
size 1003798103
|
global_step65000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d4d137e232c6c6c6b6cdf775966924b8632b6e545ebacd3af0ee00ab47acf02
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61d20a16ff86a885969fa7e719180da66d92d47e0c8b52a2019e95f0412d01e1
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6379dae105b17425fbb6cac97cf4918ece809ab6ac96be075b4ecd79909ae3e0
|
3 |
+
size 1003798103
|
global_step65000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af3f51b4f40b4b2209587f025ba6de088859398b0fa7e47878d93f0f40428f56
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:407bd87f0d60d76caf4f0c46e04c20944c5711ec02c64dd047e84132abd76735
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79647543d92b5936b708f4244418100a47a7aaa9b47403b7737c72d81b476d7f
|
3 |
+
size 1003798103
|
global_step65000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7bee22a8eb810bd6d336d9f572df05f5c423010c873a29ae248c98a442d5af2
|
3 |
+
size 1003797527
|
global_step65000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b36597ab56f9bf25ceb523db6184aba6cc04f3c60f07e02efdde8b4c5acd5a9a
|
3 |
+
size 1003797911
|
global_step65000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25b172d9168d127fdabfeba0e805b159b67291fc67a5c19f5c3a1cbe8fe7c584
|
3 |
+
size 1003797719
|
global_step65000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c3216181421a0fad60dcb36e558ba35da24e2c75c7ecfd131c4aa1e2eb23d2b
|
3 |
+
size 1003797392
|
global_step65000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:418389660921c57a6cebfb94f57f044fde0748b89fb24306a2283970d1615d19
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5baf446505c43e5fbd00f54d983c7eb4bf76fc4a87a06b6baf3fb9e876513c7
|
3 |
+
size 1003798103
|
global_step65000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d93c3e9b51a1c5f48a36643cfe90d2f467a936a089a80800266b4e839d4cef95
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da91299d61947d96eddee6241d70d175a484fee9cb28e463345a6d33575d7953
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35aedf3b71502d3cda999cd41f52a5f99a95e72a3f2c7cb1235a86dbd40fb3df
|
3 |
+
size 1003798103
|
global_step65000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4bce51d9e6c658d7b6b33b3556cfb8c5e5e70a600caf6c50d706704ebea2eb1
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e250db1fdeb6bd2a5ad5e7e8e82010e3169f8abb5732aa3e8416c405be47480e
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bdeb2891a0762d35507e094c4d2ae9c908cdc6703931591a193a3b31883eb29
|
3 |
+
size 1003798103
|
global_step65000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8c17f61666952cc9eac023b88b7d7dd053895f7955137f9a4a14a3088ce9173
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:750ed6a93d7da22a8ce52f4e789e88bace0f95fbed92c112680c5a5078f6c0b2
|
3 |
+
size 1003797719
|
global_step65000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5bf9d5ac4ee1450e9b6d89573915d9e96d8ed2ab7f42693a3340d4d0237d321
|
3 |
+
size 1003797392
|
global_step65000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:807b8e3ef278355bb33be5eaeda85ad05edb0a091cc205b46a1d9f26aa68d6a4
|
3 |
+
size 1003797911
|
global_step65000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2403da7ca6a15c4f007ab19f4d7d727129be37296e4ad70a164bf8569dbb2dfb
|
3 |
+
size 1003797527
|
global_step65000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2907bcee62fd8a43a24665a876cb7b9f9c0be21cf8f55ee7608da2f72ec8b9f
|
3 |
+
size 1003798039
|
global_step65000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68e590633e5dab5cf936e73cf3a7128f0724496f72fc754499b09e94346dedd1
|
3 |
+
size 1003797527
|
global_step65000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:968e7cb6b1fff83c2eed4c732c23534e163e24e1e908970d0f7a135aacc931b6
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1ee25217510505786e2d31f1ddb9302bafe2d81421ad41bb212f6a51832891e
|
3 |
+
size 1003798103
|
global_step65000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e0430d5f03a4c125a74e805faaad4bf54e7b817615ff7a5a576ea08977884bd
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bc39094ebc4eacae8d59f15a724f5d6a10e6e0dd0117686114b4cf9ed8e9eae
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8d10faf42748c1e2e004061eb9eca9ad8682daa58c19a611feb055b3ca3f056
|
3 |
+
size 1003798103
|
global_step65000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d17c6bf5165f65e51c13b54713a248b2d4a9f6fc62427f8f0019af7ecae90e32
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4549d50b28a4a94932e28ad731274808d329fad8d71642d7fe3d34123e2e3900
|
3 |
+
size 1003797392
|
global_step65000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a92a122aa484f63282b12230bc247cbdcdf953859f4a74c2d9486cb4312cd5c3
|
3 |
+
size 1003797463
|
global_step65000/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0a3043f1b84ca39b9c4b43ecbc9b0681e3779b99f18fd9ca33e4032a1e51c2c
|
3 |
+
size 1003798103
|