tensor-tech committed on
Commit
2c30632
·
verified ·
1 Parent(s): 2b2698f

Run 4. Outer Step 22. Inner Step 1.

Browse files
Files changed (3) hide show
  1. config.json +6 -6
  2. inner_optimizer.pt +1 -1
  3. model.safetensors +1 -1
config.json CHANGED
@@ -268,18 +268,18 @@
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
  "block_list": [
271
- 5526587,
272
- 5526593,
273
- 5526599,
274
- 5526605,
275
- 5526611
276
  ],
277
  "block_size": 1024,
278
  "bos_token_id": 50256,
279
  "embd_pdrop": 0.1,
280
  "eos_token_id": 50256,
281
  "initializer_range": 0.02,
282
- "inner_step": 0,
283
  "inner_steps": 0,
284
  "last_allreduce_block": 5523943,
285
  "layer_norm_epsilon": 1e-05,
 
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
  "block_list": [
271
+ 5526619,
272
+ 5526625,
273
+ 5526631,
274
+ 5526637,
275
+ 5526643
276
  ],
277
  "block_size": 1024,
278
  "bos_token_id": 50256,
279
  "embd_pdrop": 0.1,
280
  "eos_token_id": 50256,
281
  "initializer_range": 0.02,
282
+ "inner_step": 1,
283
  "inner_steps": 0,
284
  "last_allreduce_block": 5523943,
285
  "layer_norm_epsilon": 1e-05,
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c412d65eba16719a66111cf96dd0bf1478d32ad7a40ae215f4017780d5d3f9d4
3
  size 8081782026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa69caa212a603da36a69c385fa10faf326c685381091e750277828390145eb1
3
  size 8081782026
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1964fdb7b09b6ac06f7b069a8a010e6834d8b8a75d5c795ef7b89855e3c2e0f4
3
  size 4040701744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8c12e60d34386084908ebb5fa848a12d90df84a3656717f85b9bb4089c664ee
3
  size 4040701744