rootxhacker commited on
Commit
fe0beb5
·
verified ·
1 Parent(s): d1032e6

Training in progress, step 38000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23dcc181cec0e10d847e208901d6626875ec6b62c6c0f26d433995f3783e85d0
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a045cd1651964484e35a7ee4cc80f394400bcf32d399ca366f907f0dafb8b29
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7432e9c2d93150abfd716acce42331362afc030b8c095403869cbf1291225746
3
  size 1544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47093e48c8dcb6ad57ae3eda9ce7141b8c756fad2f39a70827cbbb9ed49f5649
3
  size 1544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b8434a82bb738c0cecb4adf19f6cc16b50060235313456c478572cc44126b33
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b60bdca21a24c4c9f76b11b903c37c4127fc1f54a299af327f2fe260c58ff720
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c5a317d14f0c4fea42d2b4ca5f020a67142d647545709c1c9006f254a7d7349
3
- size 14308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0df6fc486b7517363afca4fd7698726ecbf63a16d3ce84e06ce60f5376cd9b7e
3
+ size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4d13c8e281c1623531d4d497478b975ea082917bb2c61878d98cb5fb27c6af9
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97243af249b903bf91950a8fcb37e9bd58551a34f032c66a6b68e32bc4197313
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23ce717bb1ff7d19ce8b39673c5e006d14b3fec124190d834c88a63ab05da6d0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:541cb6dea9c80e2359e5134078f161ec83a5de3af8e29b3e9b6b880e5dd9058f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 36750,
3
- "best_metric": 0.9847651720046997,
4
- "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-34000",
5
- "epoch": 2.8843935081916774,
6
  "eval_steps": 250,
7
- "global_step": 37500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6458,6 +6458,92 @@
6458
  "eval_samples_per_second": 58.059,
6459
  "eval_steps_per_second": 14.515,
6460
  "step": 37500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6461
  }
6462
  ],
6463
  "logging_steps": 50,
 
1
  {
2
+ "best_global_step": 38000,
3
+ "best_metric": 0.98431396484375,
4
+ "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-38000",
5
+ "epoch": 2.9228520883008997,
6
  "eval_steps": 250,
7
+ "global_step": 38000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6458
  "eval_samples_per_second": 58.059,
6459
  "eval_steps_per_second": 14.515,
6460
  "step": 37500
6461
+ },
6462
+ {
6463
+ "epoch": 2.8882393662026,
6464
+ "grad_norm": 0.6800574660301208,
6465
+ "learning_rate": 7.630574240968237e-06,
6466
+ "loss": 0.983,
6467
+ "step": 37550
6468
+ },
6469
+ {
6470
+ "epoch": 2.892085224213522,
6471
+ "grad_norm": 0.9417561292648315,
6472
+ "learning_rate": 7.3708542191517545e-06,
6473
+ "loss": 0.973,
6474
+ "step": 37600
6475
+ },
6476
+ {
6477
+ "epoch": 2.895931082224444,
6478
+ "grad_norm": 0.6454310417175293,
6479
+ "learning_rate": 7.111134197335273e-06,
6480
+ "loss": 1.0493,
6481
+ "step": 37650
6482
+ },
6483
+ {
6484
+ "epoch": 2.8997769402353666,
6485
+ "grad_norm": 1.0287562608718872,
6486
+ "learning_rate": 6.851414175518792e-06,
6487
+ "loss": 0.9821,
6488
+ "step": 37700
6489
+ },
6490
+ {
6491
+ "epoch": 2.903622798246289,
6492
+ "grad_norm": 1.6874816417694092,
6493
+ "learning_rate": 6.591694153702309e-06,
6494
+ "loss": 0.9761,
6495
+ "step": 37750
6496
+ },
6497
+ {
6498
+ "epoch": 2.903622798246289,
6499
+ "eval_loss": 0.9886119961738586,
6500
+ "eval_runtime": 17.2542,
6501
+ "eval_samples_per_second": 57.957,
6502
+ "eval_steps_per_second": 14.489,
6503
+ "step": 37750
6504
+ },
6505
+ {
6506
+ "epoch": 2.907468656257211,
6507
+ "grad_norm": 0.7677489519119263,
6508
+ "learning_rate": 6.331974131885828e-06,
6509
+ "loss": 1.0421,
6510
+ "step": 37800
6511
+ },
6512
+ {
6513
+ "epoch": 2.9113145142681334,
6514
+ "grad_norm": 0.9784395098686218,
6515
+ "learning_rate": 6.072254110069346e-06,
6516
+ "loss": 0.9288,
6517
+ "step": 37850
6518
+ },
6519
+ {
6520
+ "epoch": 2.9151603722790553,
6521
+ "grad_norm": 0.6236763000488281,
6522
+ "learning_rate": 5.812534088252864e-06,
6523
+ "loss": 0.9777,
6524
+ "step": 37900
6525
+ },
6526
+ {
6527
+ "epoch": 2.9190062302899777,
6528
+ "grad_norm": 1.0675079822540283,
6529
+ "learning_rate": 5.552814066436382e-06,
6530
+ "loss": 0.9659,
6531
+ "step": 37950
6532
+ },
6533
+ {
6534
+ "epoch": 2.9228520883008997,
6535
+ "grad_norm": 0.9310262203216553,
6536
+ "learning_rate": 5.2930940446198996e-06,
6537
+ "loss": 0.9334,
6538
+ "step": 38000
6539
+ },
6540
+ {
6541
+ "epoch": 2.9228520883008997,
6542
+ "eval_loss": 0.98431396484375,
6543
+ "eval_runtime": 17.3967,
6544
+ "eval_samples_per_second": 57.482,
6545
+ "eval_steps_per_second": 14.371,
6546
+ "step": 38000
6547
  }
6548
  ],
6549
  "logging_steps": 50,