Add checkpoint files
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- added_tokens.json +6 -0
- config.json +221 -0
- generation_config.json +14 -0
- global_step85000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- global_step85000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
added_tokens.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<image>": 151646,
|
3 |
+
"<|endoftext|>": 151643,
|
4 |
+
"<|im_end|>": 151645,
|
5 |
+
"<|im_start|>": 151644
|
6 |
+
}
|
config.json
ADDED
@@ -0,0 +1,221 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "lmms-lab/llava-onevision-qwen2-7b-ov",
|
3 |
+
"add_faster_video": false,
|
4 |
+
"add_time_instruction": false,
|
5 |
+
"architectures": [
|
6 |
+
"LlavaQwenForCausalLM"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"bos_token_id": 151643,
|
10 |
+
"eos_token_id": 151645,
|
11 |
+
"faster_token_stride": 10,
|
12 |
+
"force_sample": false,
|
13 |
+
"hidden_act": "silu",
|
14 |
+
"hidden_size": 3584,
|
15 |
+
"ignore_index": -100,
|
16 |
+
"image_aspect_ratio": "anyres_max_9",
|
17 |
+
"image_crop_resolution": null,
|
18 |
+
"image_grid_pinpoints": [
|
19 |
+
[
|
20 |
+
384,
|
21 |
+
384
|
22 |
+
],
|
23 |
+
[
|
24 |
+
384,
|
25 |
+
768
|
26 |
+
],
|
27 |
+
[
|
28 |
+
384,
|
29 |
+
1152
|
30 |
+
],
|
31 |
+
[
|
32 |
+
384,
|
33 |
+
1536
|
34 |
+
],
|
35 |
+
[
|
36 |
+
384,
|
37 |
+
1920
|
38 |
+
],
|
39 |
+
[
|
40 |
+
384,
|
41 |
+
2304
|
42 |
+
],
|
43 |
+
[
|
44 |
+
768,
|
45 |
+
384
|
46 |
+
],
|
47 |
+
[
|
48 |
+
768,
|
49 |
+
768
|
50 |
+
],
|
51 |
+
[
|
52 |
+
768,
|
53 |
+
1152
|
54 |
+
],
|
55 |
+
[
|
56 |
+
768,
|
57 |
+
1536
|
58 |
+
],
|
59 |
+
[
|
60 |
+
768,
|
61 |
+
1920
|
62 |
+
],
|
63 |
+
[
|
64 |
+
768,
|
65 |
+
2304
|
66 |
+
],
|
67 |
+
[
|
68 |
+
1152,
|
69 |
+
384
|
70 |
+
],
|
71 |
+
[
|
72 |
+
1152,
|
73 |
+
768
|
74 |
+
],
|
75 |
+
[
|
76 |
+
1152,
|
77 |
+
1152
|
78 |
+
],
|
79 |
+
[
|
80 |
+
1152,
|
81 |
+
1536
|
82 |
+
],
|
83 |
+
[
|
84 |
+
1152,
|
85 |
+
1920
|
86 |
+
],
|
87 |
+
[
|
88 |
+
1152,
|
89 |
+
2304
|
90 |
+
],
|
91 |
+
[
|
92 |
+
1536,
|
93 |
+
384
|
94 |
+
],
|
95 |
+
[
|
96 |
+
1536,
|
97 |
+
768
|
98 |
+
],
|
99 |
+
[
|
100 |
+
1536,
|
101 |
+
1152
|
102 |
+
],
|
103 |
+
[
|
104 |
+
1536,
|
105 |
+
1536
|
106 |
+
],
|
107 |
+
[
|
108 |
+
1536,
|
109 |
+
1920
|
110 |
+
],
|
111 |
+
[
|
112 |
+
1536,
|
113 |
+
2304
|
114 |
+
],
|
115 |
+
[
|
116 |
+
1920,
|
117 |
+
384
|
118 |
+
],
|
119 |
+
[
|
120 |
+
1920,
|
121 |
+
768
|
122 |
+
],
|
123 |
+
[
|
124 |
+
1920,
|
125 |
+
1152
|
126 |
+
],
|
127 |
+
[
|
128 |
+
1920,
|
129 |
+
1536
|
130 |
+
],
|
131 |
+
[
|
132 |
+
1920,
|
133 |
+
1920
|
134 |
+
],
|
135 |
+
[
|
136 |
+
1920,
|
137 |
+
2304
|
138 |
+
],
|
139 |
+
[
|
140 |
+
2304,
|
141 |
+
384
|
142 |
+
],
|
143 |
+
[
|
144 |
+
2304,
|
145 |
+
768
|
146 |
+
],
|
147 |
+
[
|
148 |
+
2304,
|
149 |
+
1152
|
150 |
+
],
|
151 |
+
[
|
152 |
+
2304,
|
153 |
+
1536
|
154 |
+
],
|
155 |
+
[
|
156 |
+
2304,
|
157 |
+
1920
|
158 |
+
],
|
159 |
+
[
|
160 |
+
2304,
|
161 |
+
2304
|
162 |
+
]
|
163 |
+
],
|
164 |
+
"image_split_resolution": null,
|
165 |
+
"image_token_index": 151646,
|
166 |
+
"initializer_range": 0.02,
|
167 |
+
"intermediate_size": 18944,
|
168 |
+
"max_position_embeddings": 32768,
|
169 |
+
"max_window_layers": 28,
|
170 |
+
"mm_hidden_size": 1152,
|
171 |
+
"mm_newline_position": "grid",
|
172 |
+
"mm_patch_merge_type": "spatial_unpad",
|
173 |
+
"mm_projector_lr": null,
|
174 |
+
"mm_projector_type": "mlp2x_gelu",
|
175 |
+
"mm_resampler_type": null,
|
176 |
+
"mm_spatial_pool_mode": "bilinear",
|
177 |
+
"mm_spatial_pool_stride": null,
|
178 |
+
"mm_tunable_parts": "mm_vision_tower,mm_mlp_adapter,mm_language_model",
|
179 |
+
"mm_use_im_patch_token": false,
|
180 |
+
"mm_use_im_start_end": false,
|
181 |
+
"mm_vision_select_feature": "patch",
|
182 |
+
"mm_vision_select_layer": -2,
|
183 |
+
"mm_vision_tower": "google/siglip-so400m-patch14-384",
|
184 |
+
"mm_vision_tower_lr": 2e-06,
|
185 |
+
"model_type": "llava",
|
186 |
+
"num_attention_heads": 28,
|
187 |
+
"num_hidden_layers": 28,
|
188 |
+
"num_key_value_heads": 4,
|
189 |
+
"pos_skipping_range": 4096,
|
190 |
+
"projector_hidden_act": "gelu",
|
191 |
+
"rms_norm_eps": 1e-06,
|
192 |
+
"rope_scaling": null,
|
193 |
+
"rope_theta": 1000000.0,
|
194 |
+
"sliding_window": 131072,
|
195 |
+
"text_config": {
|
196 |
+
"model_type": "llama"
|
197 |
+
},
|
198 |
+
"tie_word_embeddings": false,
|
199 |
+
"tokenizer_model_max_length": 32768,
|
200 |
+
"tokenizer_padding_side": "right",
|
201 |
+
"torch_dtype": "bfloat16",
|
202 |
+
"transformers_version": "4.40.0.dev0",
|
203 |
+
"use_cache": false,
|
204 |
+
"use_mm_proj": true,
|
205 |
+
"use_pos_skipping": false,
|
206 |
+
"use_sliding_window": false,
|
207 |
+
"vision_config": {
|
208 |
+
"hidden_size": 1024,
|
209 |
+
"image_size": 336,
|
210 |
+
"intermediate_size": 4096,
|
211 |
+
"model_type": "clip_vision_model",
|
212 |
+
"num_attention_heads": 16,
|
213 |
+
"num_hidden_layers": 24,
|
214 |
+
"patch_size": 14,
|
215 |
+
"projection_dim": 768,
|
216 |
+
"vocab_size": 32000
|
217 |
+
},
|
218 |
+
"vision_feature_layer": -2,
|
219 |
+
"vision_feature_select_strategy": "default",
|
220 |
+
"vision_tower_pretrained": null
|
221 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 151643,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
151645,
|
6 |
+
151643
|
7 |
+
],
|
8 |
+
"pad_token_id": 151643,
|
9 |
+
"repetition_penalty": 1.05,
|
10 |
+
"temperature": 0.7,
|
11 |
+
"top_k": 20,
|
12 |
+
"top_p": 0.8,
|
13 |
+
"transformers_version": "4.40.0.dev0"
|
14 |
+
}
|
global_step85000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d4315b8e686d7778f6da90b9ea318f9c59b144aaded0f17e729c848b42c0882
|
3 |
+
size 1204556112
|
global_step85000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c2212fcfba3be90d6ea4d89280823799a2ee28e3b9b207a7fddd290493ba826
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b9e24560c4bd6d1c6c3b5a513895746eee501f264d333e9c2100e1a65224338
|
3 |
+
size 1204556183
|
global_step85000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ec426e40fea77ab8feebb9ce70bef81da85b42353e3c20a27f04887e28b3d4c
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e31d28ddfda03a7bf12b611cd1f08330232c97cf5ff2c1cce5d837aae6480325
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0233cc9d23590d3b19817c52d6de251e7375ed89d4fa4f4b39c7578580d3af1
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ce9b53e78722273ee4aece5243b5ff8f9c235911cfd3c59576b4a668f04d958
|
3 |
+
size 1204556183
|
global_step85000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6608a170b12cdec16a422415ece07a82cbdef8fee13abac9d1a3552a21c95125
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5478ef14511e799bc62374e01709ac2274310a7bd8a3df0f924fade61c84750
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:731e11a594019f47782298ddc6ae1bd4d1a0a952f10c11c355daa6ccaa047e1b
|
3 |
+
size 1204556183
|
global_step85000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7f28b267c9bec03b17a09373820bd9b409be366b5d629ff66c9e8d34e7afa74
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c42d33c690b83c921156de1467df1288c9367c103951caf6351678c109eb8ede
|
3 |
+
size 1204556048
|
global_step85000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba9f1971d849ebb35d63feb2ba8724881620a016a6023ea50dd318eef42a2914
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:816a4ae68bbfdb1bd003bc2d2bfa0fca2e24d68d20cd7a859a15be767131783b
|
3 |
+
size 1204556823
|
global_step85000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c470b7683ee8fcf26b124c6839793211923fabf3ad10b1dbabec179c695601e8
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea6fabb1f1c6b6c926e420495d75a16d3b87e0bc1b71a2a76dae53c63718ef46
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a57a1fc8f1a6a50317292c3e78f6115c63c2cece23cd117ce9469c4d615d6dde
|
3 |
+
size 1204556823
|
global_step85000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18fcda0c8bead72e7c23fb726057377133e357c2be978f5b5fa9cd561d597874
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8cd7003440bb9475b36bddd46666b4bc2b9e0dc78d439c3fd55adb24a9dd486
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71d575be4223bca52a91da33c89942d80a2608cb8478aa591ba75fc50a4beab9
|
3 |
+
size 1204556183
|
global_step85000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fe6ce16a04c36159eef57296ca8571faa2797da196a2ef5b44df63427325357
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8fee847f5b99770a049e3139cb8e466f551b94ce2ce74e59e0c1c6f800a54e5
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f0ed63d7530677c09635e94eb02dfe3e8477957d099d9317c26fc196728b2f5
|
3 |
+
size 1204556048
|
global_step85000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:328f176b0693740932c3f14000d7babae975e9c870219f5e4387d1404ea2512c
|
3 |
+
size 1204556375
|
global_step85000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e6ac3123f02f2a55baf269f3b99a4e619cd65fd46025ff6f5f1d261f8f54e07
|
3 |
+
size 1204556631
|
global_step85000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cbbde05b6374dd5cb8afb32522f459a362c0ac0aa6d205ad1528f1efbe1a4bd
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf39acbc93abb32b0bf460bcd26e58626f21e1b9c0ba80ce67c241ca8f2beffd
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7582417c21a9b02af024515f20ac4b65a1cfc1bdd14fca415dd2758dc53dfd6
|
3 |
+
size 1204556183
|
global_step85000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cce3c171d3c50fa85b4b0fa7b5cbdfa0adda28a647502f1b8b399cb24f04870
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b6aae772cd519c97ef0f028d16fb4f51f5e64ff2d2a351ba8f680af257e545d
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e7f31db856de72ef7292bb5642af4bf23d4a618db2ad801260ca22570e3a4ce
|
3 |
+
size 1204556375
|
global_step85000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d5212d48dd8a8d63d7f1ecbd6c6c7d97cdba98b6b2b05cadbab63c74e763439
|
3 |
+
size 1204556631
|
global_step85000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c0df4d71be772a64442b855e52f50f752d5ebc4531652bc68ee05aa3b2a385a
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9bf142d662b87484f6c4907da85c5d24a544caec29474a9aea4823f99c3986f
|
3 |
+
size 1204556048
|
global_step85000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd8aa5fa486c40f2bf9e5b6fcdf325494f3387be48133b3164293155910fcce7
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cfc769afce9f80734d92bfee30a346bb077b482991fe27d440e4a41e07c1ee8
|
3 |
+
size 1204556183
|
global_step85000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:214ada9c2db8c94ee8313661926b5de74afdb3220a4ded997011cf755ddf990c
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd0bc71db5d3657ab7e1b9b93e4475ea0f530bcfa5e9c0de518668e6091fc9f2
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9fbd1ef1c3fac3e3d211299ccb7cceca3250560b3a8defec85ffd70d2076197
|
3 |
+
size 1204556375
|
global_step85000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02edd2f7736705da4239b6046bfc1ff4cbc5fd5c39bcdd96ed735d3e667ebe8e
|
3 |
+
size 1204556631
|
global_step85000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cc8b97ee8be12aca11ba09a74d5a637cac9f6f8f1c2f9cade40ab4172d3d980
|
3 |
+
size 1204556119
|
global_step85000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37fddf7fabaf17ac62678fa074bc7549bdb83f4b7a070af93e0a1d2964896ed9
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5af2253e2a4ab78fe36d262bae77cad39c9dc061ff9e6151d516d1e95944a839
|
3 |
+
size 1204556183
|
global_step85000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:defa79229912244a21145958576b20f7f6c0a7c94c7ad629f675eece9bb7f669
|
3 |
+
size 1204556759
|
global_step85000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81666f8bce5cbdae4c5bd84bfa0b4877208ba9280c2e8827e7b62e0210202374
|
3 |
+
size 1204556048
|
global_step85000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d80c5d5dc8fd2608166926b2d859a7a260441fc983d6f00fbac20f55f646b32
|
3 |
+
size 1204556119
|