kmfoda committed on
Commit
fafa71c
·
verified ·
1 Parent(s): 2fae9af

Run 2. Outer Step 2. Inner Step 861. Peers 21.

Browse files
Files changed (4) hide show
  1. config.json +14 -14
  2. inner_optimizer.pt +2 -2
  3. model.safetensors +1 -1
  4. outer_optimizer.pt +1 -1
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "distributed/optimized-gpt2-1b",
3
  "activation_function": "gelu_new",
4
  "all_reduce_scores": {
5
  "0": "NON_PARTICIPATING",
@@ -85,7 +85,7 @@
85
  "170": "NON_PARTICIPATING",
86
  "171": "NON_PARTICIPATING",
87
  "172": "NON_PARTICIPATING",
88
- "173": "NON_PARTICIPATING",
89
  "174": "NON_PARTICIPATING",
90
  "175": "NON_PARTICIPATING",
91
  "176": "NON_PARTICIPATING",
@@ -97,7 +97,7 @@
97
  "181": "SUCCESS",
98
  "182": "NON_PARTICIPATING",
99
  "183": "NON_PARTICIPATING",
100
- "184": "SUCCESS",
101
  "185": "NON_PARTICIPATING",
102
  "186": "NON_PARTICIPATING",
103
  "187": "NON_PARTICIPATING",
@@ -106,7 +106,7 @@
106
  "19": "NON_PARTICIPATING",
107
  "190": "NON_PARTICIPATING",
108
  "191": "NON_PARTICIPATING",
109
- "192": "NON_PARTICIPATING",
110
  "193": "NON_PARTICIPATING",
111
  "194": "NON_PARTICIPATING",
112
  "195": "NON_PARTICIPATING",
@@ -141,12 +141,12 @@
141
  "220": "NON_PARTICIPATING",
142
  "221": "NON_PARTICIPATING",
143
  "222": "NON_PARTICIPATING",
144
- "223": "NON_PARTICIPATING",
145
  "224": "NON_PARTICIPATING",
146
  "225": "NON_PARTICIPATING",
147
  "226": "NON_PARTICIPATING",
148
  "227": "NON_PARTICIPATING",
149
- "228": "NON_PARTICIPATING",
150
  "229": "NON_PARTICIPATING",
151
  "23": "SUCCESS",
152
  "230": "NON_PARTICIPATING",
@@ -171,7 +171,7 @@
171
  "248": "NON_PARTICIPATING",
172
  "249": "SUCCESS",
173
  "25": "SUCCESS",
174
- "250": "NON_PARTICIPATING",
175
  "251": "NON_PARTICIPATING",
176
  "252": "NON_PARTICIPATING",
177
  "253": "NON_PARTICIPATING",
@@ -188,17 +188,17 @@
188
  "33": "NON_PARTICIPATING",
189
  "34": "NON_PARTICIPATING",
190
  "35": "NON_PARTICIPATING",
191
- "36": "NON_PARTICIPATING",
192
  "37": "NON_PARTICIPATING",
193
  "38": "NON_PARTICIPATING",
194
- "39": "NON_PARTICIPATING",
195
  "4": "NON_PARTICIPATING",
196
  "40": "NON_PARTICIPATING",
197
  "41": "NON_PARTICIPATING",
198
  "42": "NON_PARTICIPATING",
199
  "43": "NON_PARTICIPATING",
200
  "44": "NON_PARTICIPATING",
201
- "45": "NON_PARTICIPATING",
202
  "46": "NON_PARTICIPATING",
203
  "47": "NON_PARTICIPATING",
204
  "48": "NON_PARTICIPATING",
@@ -212,12 +212,12 @@
212
  "55": "NON_PARTICIPATING",
213
  "56": "NON_PARTICIPATING",
214
  "57": "NON_PARTICIPATING",
215
- "58": "NON_PARTICIPATING",
216
  "59": "NON_PARTICIPATING",
217
  "6": "NON_PARTICIPATING",
218
  "60": "NON_PARTICIPATING",
219
  "61": "NON_PARTICIPATING",
220
- "62": "SUCCESS",
221
  "63": "NON_PARTICIPATING",
222
  "64": "NON_PARTICIPATING",
223
  "65": "NON_PARTICIPATING",
@@ -234,7 +234,7 @@
234
  "75": "NON_PARTICIPATING",
235
  "76": "NON_PARTICIPATING",
236
  "77": "NON_PARTICIPATING",
237
- "78": "SUCCESS",
238
  "79": "NON_PARTICIPATING",
239
  "8": "NON_PARTICIPATING",
240
  "80": "NON_PARTICIPATING",
@@ -275,7 +275,7 @@
275
  "initializer_range": 0.02,
276
  "inner_step": 0,
277
  "inner_steps": 0,
278
- "last_allreduce_block": 5323221,
279
  "layer_norm_epsilon": 1e-05,
280
  "model_type": "gpt_optimized",
281
  "n_embd": 1280,
 
1
  {
2
+ "_name_or_path": "crypt0trading/c66-h14",
3
  "activation_function": "gelu_new",
4
  "all_reduce_scores": {
5
  "0": "NON_PARTICIPATING",
 
85
  "170": "NON_PARTICIPATING",
86
  "171": "NON_PARTICIPATING",
87
  "172": "NON_PARTICIPATING",
88
+ "173": "SUCCESS",
89
  "174": "NON_PARTICIPATING",
90
  "175": "NON_PARTICIPATING",
91
  "176": "NON_PARTICIPATING",
 
97
  "181": "SUCCESS",
98
  "182": "NON_PARTICIPATING",
99
  "183": "NON_PARTICIPATING",
100
+ "184": "NON_PARTICIPATING",
101
  "185": "NON_PARTICIPATING",
102
  "186": "NON_PARTICIPATING",
103
  "187": "NON_PARTICIPATING",
 
106
  "19": "NON_PARTICIPATING",
107
  "190": "NON_PARTICIPATING",
108
  "191": "NON_PARTICIPATING",
109
+ "192": "SUCCESS",
110
  "193": "NON_PARTICIPATING",
111
  "194": "NON_PARTICIPATING",
112
  "195": "NON_PARTICIPATING",
 
141
  "220": "NON_PARTICIPATING",
142
  "221": "NON_PARTICIPATING",
143
  "222": "NON_PARTICIPATING",
144
+ "223": "SUCCESS",
145
  "224": "NON_PARTICIPATING",
146
  "225": "NON_PARTICIPATING",
147
  "226": "NON_PARTICIPATING",
148
  "227": "NON_PARTICIPATING",
149
+ "228": "SUCCESS",
150
  "229": "NON_PARTICIPATING",
151
  "23": "SUCCESS",
152
  "230": "NON_PARTICIPATING",
 
171
  "248": "NON_PARTICIPATING",
172
  "249": "SUCCESS",
173
  "25": "SUCCESS",
174
+ "250": "SUCCESS",
175
  "251": "NON_PARTICIPATING",
176
  "252": "NON_PARTICIPATING",
177
  "253": "NON_PARTICIPATING",
 
188
  "33": "NON_PARTICIPATING",
189
  "34": "NON_PARTICIPATING",
190
  "35": "NON_PARTICIPATING",
191
+ "36": "SUCCESS",
192
  "37": "NON_PARTICIPATING",
193
  "38": "NON_PARTICIPATING",
194
+ "39": "SUCCESS",
195
  "4": "NON_PARTICIPATING",
196
  "40": "NON_PARTICIPATING",
197
  "41": "NON_PARTICIPATING",
198
  "42": "NON_PARTICIPATING",
199
  "43": "NON_PARTICIPATING",
200
  "44": "NON_PARTICIPATING",
201
+ "45": "SUCCESS",
202
  "46": "NON_PARTICIPATING",
203
  "47": "NON_PARTICIPATING",
204
  "48": "NON_PARTICIPATING",
 
212
  "55": "NON_PARTICIPATING",
213
  "56": "NON_PARTICIPATING",
214
  "57": "NON_PARTICIPATING",
215
+ "58": "SUCCESS",
216
  "59": "NON_PARTICIPATING",
217
  "6": "NON_PARTICIPATING",
218
  "60": "NON_PARTICIPATING",
219
  "61": "NON_PARTICIPATING",
220
+ "62": "NON_PARTICIPATING",
221
  "63": "NON_PARTICIPATING",
222
  "64": "NON_PARTICIPATING",
223
  "65": "NON_PARTICIPATING",
 
234
  "75": "NON_PARTICIPATING",
235
  "76": "NON_PARTICIPATING",
236
  "77": "NON_PARTICIPATING",
237
+ "78": "NON_PARTICIPATING",
238
  "79": "NON_PARTICIPATING",
239
  "8": "NON_PARTICIPATING",
240
  "80": "NON_PARTICIPATING",
 
275
  "initializer_range": 0.02,
276
  "inner_step": 0,
277
  "inner_steps": 0,
278
+ "last_allreduce_block": 5329444,
279
  "layer_norm_epsilon": 1e-05,
280
  "model_type": "gpt_optimized",
281
  "n_embd": 1280,
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df2588b940f0bab6c967f7abc2a6ff9cd6bad6ed15bd3c1f94527dfc94cc3805
3
- size 2752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:421a24b266c83dbc38cf0889f35724e45d2eb609e4bc5bacbf90b235a7cb9650
3
+ size 8081781770
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72d1f4054db89ccac14b1f1280d753c2392383a6cf8af7ff098a570ffafd3cb9
3
  size 4040701744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a10ab74b86db1f83774990e60783ed06c53ea3b3259355082cd444f7f7cf58a0
3
  size 4040701744
outer_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d5f2a8d84f90b6b8ea8f1d13a2aa194614eac91db3c7f307719b7f5a2b485cc
3
  size 4040805354
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffa342e9371b9849c771ef9795ed5b0118e9cf43baa9de2731d81d8d17a7815d
3
  size 4040805354