jaslee20 committed on
Commit
ff9fa11
·
verified ·
1 Parent(s): b8fd2ea

Add checkpoint files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. added_tokens.json +6 -0
  3. config.json +221 -0
  4. generation_config.json +14 -0
  5. global_step85000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  6. global_step85000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
  7. global_step85000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
  8. global_step85000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
  9. global_step85000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
  10. global_step85000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
  11. global_step85000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
  12. global_step85000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
  13. global_step85000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
  14. global_step85000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
  15. global_step85000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
  16. global_step85000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  17. global_step85000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
  18. global_step85000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
  19. global_step85000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
  20. global_step85000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
  21. global_step85000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
  22. global_step85000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
  23. global_step85000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
  24. global_step85000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
  25. global_step85000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
  26. global_step85000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
  27. global_step85000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  28. global_step85000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
  29. global_step85000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
  30. global_step85000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +3 -0
  31. global_step85000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +3 -0
  32. global_step85000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +3 -0
  33. global_step85000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +3 -0
  34. global_step85000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +3 -0
  35. global_step85000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +3 -0
  36. global_step85000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +3 -0
  37. global_step85000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +3 -0
  38. global_step85000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  39. global_step85000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +3 -0
  40. global_step85000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +3 -0
  41. global_step85000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +3 -0
  42. global_step85000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +3 -0
  43. global_step85000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +3 -0
  44. global_step85000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +3 -0
  45. global_step85000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +3 -0
  46. global_step85000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt +3 -0
  47. global_step85000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt +3 -0
  48. global_step85000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt +3 -0
  49. global_step85000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
  50. global_step85000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ trainer_state.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "<image>": 151646,
3
+ "<|endoftext|>": 151643,
4
+ "<|im_end|>": 151645,
5
+ "<|im_start|>": 151644
6
+ }
config.json ADDED
@@ -0,0 +1,221 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "lmms-lab/llava-onevision-qwen2-7b-ov",
3
+ "add_faster_video": false,
4
+ "add_time_instruction": false,
5
+ "architectures": [
6
+ "LlavaQwenForCausalLM"
7
+ ],
8
+ "attention_dropout": 0.0,
9
+ "bos_token_id": 151643,
10
+ "eos_token_id": 151645,
11
+ "faster_token_stride": 10,
12
+ "force_sample": false,
13
+ "hidden_act": "silu",
14
+ "hidden_size": 3584,
15
+ "ignore_index": -100,
16
+ "image_aspect_ratio": "anyres_max_9",
17
+ "image_crop_resolution": null,
18
+ "image_grid_pinpoints": [
19
+ [
20
+ 384,
21
+ 384
22
+ ],
23
+ [
24
+ 384,
25
+ 768
26
+ ],
27
+ [
28
+ 384,
29
+ 1152
30
+ ],
31
+ [
32
+ 384,
33
+ 1536
34
+ ],
35
+ [
36
+ 384,
37
+ 1920
38
+ ],
39
+ [
40
+ 384,
41
+ 2304
42
+ ],
43
+ [
44
+ 768,
45
+ 384
46
+ ],
47
+ [
48
+ 768,
49
+ 768
50
+ ],
51
+ [
52
+ 768,
53
+ 1152
54
+ ],
55
+ [
56
+ 768,
57
+ 1536
58
+ ],
59
+ [
60
+ 768,
61
+ 1920
62
+ ],
63
+ [
64
+ 768,
65
+ 2304
66
+ ],
67
+ [
68
+ 1152,
69
+ 384
70
+ ],
71
+ [
72
+ 1152,
73
+ 768
74
+ ],
75
+ [
76
+ 1152,
77
+ 1152
78
+ ],
79
+ [
80
+ 1152,
81
+ 1536
82
+ ],
83
+ [
84
+ 1152,
85
+ 1920
86
+ ],
87
+ [
88
+ 1152,
89
+ 2304
90
+ ],
91
+ [
92
+ 1536,
93
+ 384
94
+ ],
95
+ [
96
+ 1536,
97
+ 768
98
+ ],
99
+ [
100
+ 1536,
101
+ 1152
102
+ ],
103
+ [
104
+ 1536,
105
+ 1536
106
+ ],
107
+ [
108
+ 1536,
109
+ 1920
110
+ ],
111
+ [
112
+ 1536,
113
+ 2304
114
+ ],
115
+ [
116
+ 1920,
117
+ 384
118
+ ],
119
+ [
120
+ 1920,
121
+ 768
122
+ ],
123
+ [
124
+ 1920,
125
+ 1152
126
+ ],
127
+ [
128
+ 1920,
129
+ 1536
130
+ ],
131
+ [
132
+ 1920,
133
+ 1920
134
+ ],
135
+ [
136
+ 1920,
137
+ 2304
138
+ ],
139
+ [
140
+ 2304,
141
+ 384
142
+ ],
143
+ [
144
+ 2304,
145
+ 768
146
+ ],
147
+ [
148
+ 2304,
149
+ 1152
150
+ ],
151
+ [
152
+ 2304,
153
+ 1536
154
+ ],
155
+ [
156
+ 2304,
157
+ 1920
158
+ ],
159
+ [
160
+ 2304,
161
+ 2304
162
+ ]
163
+ ],
164
+ "image_split_resolution": null,
165
+ "image_token_index": 151646,
166
+ "initializer_range": 0.02,
167
+ "intermediate_size": 18944,
168
+ "max_position_embeddings": 32768,
169
+ "max_window_layers": 28,
170
+ "mm_hidden_size": 1152,
171
+ "mm_newline_position": "grid",
172
+ "mm_patch_merge_type": "spatial_unpad",
173
+ "mm_projector_lr": null,
174
+ "mm_projector_type": "mlp2x_gelu",
175
+ "mm_resampler_type": null,
176
+ "mm_spatial_pool_mode": "bilinear",
177
+ "mm_spatial_pool_stride": null,
178
+ "mm_tunable_parts": "mm_vision_tower,mm_mlp_adapter,mm_language_model",
179
+ "mm_use_im_patch_token": false,
180
+ "mm_use_im_start_end": false,
181
+ "mm_vision_select_feature": "patch",
182
+ "mm_vision_select_layer": -2,
183
+ "mm_vision_tower": "google/siglip-so400m-patch14-384",
184
+ "mm_vision_tower_lr": 2e-06,
185
+ "model_type": "llava",
186
+ "num_attention_heads": 28,
187
+ "num_hidden_layers": 28,
188
+ "num_key_value_heads": 4,
189
+ "pos_skipping_range": 4096,
190
+ "projector_hidden_act": "gelu",
191
+ "rms_norm_eps": 1e-06,
192
+ "rope_scaling": null,
193
+ "rope_theta": 1000000.0,
194
+ "sliding_window": 131072,
195
+ "text_config": {
196
+ "model_type": "llama"
197
+ },
198
+ "tie_word_embeddings": false,
199
+ "tokenizer_model_max_length": 32768,
200
+ "tokenizer_padding_side": "right",
201
+ "torch_dtype": "bfloat16",
202
+ "transformers_version": "4.40.0.dev0",
203
+ "use_cache": false,
204
+ "use_mm_proj": true,
205
+ "use_pos_skipping": false,
206
+ "use_sliding_window": false,
207
+ "vision_config": {
208
+ "hidden_size": 1024,
209
+ "image_size": 336,
210
+ "intermediate_size": 4096,
211
+ "model_type": "clip_vision_model",
212
+ "num_attention_heads": 16,
213
+ "num_hidden_layers": 24,
214
+ "patch_size": 14,
215
+ "projection_dim": 768,
216
+ "vocab_size": 32000
217
+ },
218
+ "vision_feature_layer": -2,
219
+ "vision_feature_select_strategy": "default",
220
+ "vision_tower_pretrained": null
221
+ }
generation_config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 151643,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 151645,
6
+ 151643
7
+ ],
8
+ "pad_token_id": 151643,
9
+ "repetition_penalty": 1.05,
10
+ "temperature": 0.7,
11
+ "top_k": 20,
12
+ "top_p": 0.8,
13
+ "transformers_version": "4.40.0.dev0"
14
+ }
global_step85000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d4315b8e686d7778f6da90b9ea318f9c59b144aaded0f17e729c848b42c0882
3
+ size 1204556112
global_step85000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c2212fcfba3be90d6ea4d89280823799a2ee28e3b9b207a7fddd290493ba826
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b9e24560c4bd6d1c6c3b5a513895746eee501f264d333e9c2100e1a65224338
3
+ size 1204556183
global_step85000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ec426e40fea77ab8feebb9ce70bef81da85b42353e3c20a27f04887e28b3d4c
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e31d28ddfda03a7bf12b611cd1f08330232c97cf5ff2c1cce5d837aae6480325
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0233cc9d23590d3b19817c52d6de251e7375ed89d4fa4f4b39c7578580d3af1
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ce9b53e78722273ee4aece5243b5ff8f9c235911cfd3c59576b4a668f04d958
3
+ size 1204556183
global_step85000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6608a170b12cdec16a422415ece07a82cbdef8fee13abac9d1a3552a21c95125
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5478ef14511e799bc62374e01709ac2274310a7bd8a3df0f924fade61c84750
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:731e11a594019f47782298ddc6ae1bd4d1a0a952f10c11c355daa6ccaa047e1b
3
+ size 1204556183
global_step85000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7f28b267c9bec03b17a09373820bd9b409be366b5d629ff66c9e8d34e7afa74
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c42d33c690b83c921156de1467df1288c9367c103951caf6351678c109eb8ede
3
+ size 1204556048
global_step85000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba9f1971d849ebb35d63feb2ba8724881620a016a6023ea50dd318eef42a2914
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:816a4ae68bbfdb1bd003bc2d2bfa0fca2e24d68d20cd7a859a15be767131783b
3
+ size 1204556823
global_step85000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c470b7683ee8fcf26b124c6839793211923fabf3ad10b1dbabec179c695601e8
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea6fabb1f1c6b6c926e420495d75a16d3b87e0bc1b71a2a76dae53c63718ef46
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a57a1fc8f1a6a50317292c3e78f6115c63c2cece23cd117ce9469c4d615d6dde
3
+ size 1204556823
global_step85000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18fcda0c8bead72e7c23fb726057377133e357c2be978f5b5fa9cd561d597874
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8cd7003440bb9475b36bddd46666b4bc2b9e0dc78d439c3fd55adb24a9dd486
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71d575be4223bca52a91da33c89942d80a2608cb8478aa591ba75fc50a4beab9
3
+ size 1204556183
global_step85000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fe6ce16a04c36159eef57296ca8571faa2797da196a2ef5b44df63427325357
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8fee847f5b99770a049e3139cb8e466f551b94ce2ce74e59e0c1c6f800a54e5
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f0ed63d7530677c09635e94eb02dfe3e8477957d099d9317c26fc196728b2f5
3
+ size 1204556048
global_step85000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:328f176b0693740932c3f14000d7babae975e9c870219f5e4387d1404ea2512c
3
+ size 1204556375
global_step85000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e6ac3123f02f2a55baf269f3b99a4e619cd65fd46025ff6f5f1d261f8f54e07
3
+ size 1204556631
global_step85000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cbbde05b6374dd5cb8afb32522f459a362c0ac0aa6d205ad1528f1efbe1a4bd
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf39acbc93abb32b0bf460bcd26e58626f21e1b9c0ba80ce67c241ca8f2beffd
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7582417c21a9b02af024515f20ac4b65a1cfc1bdd14fca415dd2758dc53dfd6
3
+ size 1204556183
global_step85000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cce3c171d3c50fa85b4b0fa7b5cbdfa0adda28a647502f1b8b399cb24f04870
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b6aae772cd519c97ef0f028d16fb4f51f5e64ff2d2a351ba8f680af257e545d
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e7f31db856de72ef7292bb5642af4bf23d4a618db2ad801260ca22570e3a4ce
3
+ size 1204556375
global_step85000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d5212d48dd8a8d63d7f1ecbd6c6c7d97cdba98b6b2b05cadbab63c74e763439
3
+ size 1204556631
global_step85000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c0df4d71be772a64442b855e52f50f752d5ebc4531652bc68ee05aa3b2a385a
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9bf142d662b87484f6c4907da85c5d24a544caec29474a9aea4823f99c3986f
3
+ size 1204556048
global_step85000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd8aa5fa486c40f2bf9e5b6fcdf325494f3387be48133b3164293155910fcce7
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cfc769afce9f80734d92bfee30a346bb077b482991fe27d440e4a41e07c1ee8
3
+ size 1204556183
global_step85000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:214ada9c2db8c94ee8313661926b5de74afdb3220a4ded997011cf755ddf990c
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd0bc71db5d3657ab7e1b9b93e4475ea0f530bcfa5e9c0de518668e6091fc9f2
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9fbd1ef1c3fac3e3d211299ccb7cceca3250560b3a8defec85ffd70d2076197
3
+ size 1204556375
global_step85000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02edd2f7736705da4239b6046bfc1ff4cbc5fd5c39bcdd96ed735d3e667ebe8e
3
+ size 1204556631
global_step85000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cc8b97ee8be12aca11ba09a74d5a637cac9f6f8f1c2f9cade40ab4172d3d980
3
+ size 1204556119
global_step85000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37fddf7fabaf17ac62678fa074bc7549bdb83f4b7a070af93e0a1d2964896ed9
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5af2253e2a4ab78fe36d262bae77cad39c9dc061ff9e6151d516d1e95944a839
3
+ size 1204556183
global_step85000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:defa79229912244a21145958576b20f7f6c0a7c94c7ad629f675eece9bb7f669
3
+ size 1204556759
global_step85000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81666f8bce5cbdae4c5bd84bfa0b4877208ba9280c2e8827e7b62e0210202374
3
+ size 1204556048
global_step85000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d80c5d5dc8fd2608166926b2d859a7a260441fc983d6f00fbac20f55f646b32
3
+ size 1204556119