rootxhacker commited on
Commit
e869878
·
verified ·
1 Parent(s): 5d555b9

Training in progress, step 38500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6fd57c393f47a10fedc0eeb53eea073bec9f5d74a93432c74ef773c66fc48524
3
  size 36730224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f4e59779ae5268c858ada9fe05772a37f9613020d8b9f7340783b2a16c0e383
3
  size 36730224
last-checkpoint/ar_diffusion_info.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9bd9ca616ae823c9a3f8ca31216995734a05d8ab02efa11d199d90e7767f414c
3
  size 1736
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:376da5b0e7144c1b91117f5526417311ed45b536f61dd6ac0ef8b19051f1dc33
3
  size 1736
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7db25f3289aeb2b9363ef193bde6f97fc98f831d0d2faf2aba478e02c7461eb7
3
  size 73588346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9de512a7acdea4434e0675f44f1896eab7a4c3fe6cc967e9cd2360783b35758f
3
  size 73588346
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6fe094da8ad1e1bf555c74dca2c7341b574c5a3cf7d8c3a98ff15eda79c695fe
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8c00195221e523ee69e83979891848166b78d5b2c3da6d54545d0f1c8a050c4
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:da55266e7e44775541aba7dfea6ddb4ce98b63d56ca8b7cf213a395f32135776
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:274528fb9458ad54ab5973b2752fc7f6c9483a2a721e4d0ba19183ca440bc21c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82bb4fe5bf3e8542933d8cb52c350875b68d38b60b96f875a9ab6b9538329c08
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bcb038f6702a5ed9cf6a7787eb82f2807063a89d7bbe28d73008f47570ae171
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": 31000,
3
  "best_metric": 0.7226839661598206,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-31000",
5
- "epoch": 2.9228520883008997,
6
  "eval_steps": 250,
7
- "global_step": 38000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6544,6 +6544,92 @@
6544
  "eval_samples_per_second": 56.128,
6545
  "eval_steps_per_second": 14.032,
6546
  "step": 38000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6547
  }
6548
  ],
6549
  "logging_steps": 50,
 
2
  "best_global_step": 31000,
3
  "best_metric": 0.7226839661598206,
4
  "best_model_checkpoint": "./ar-diffusion-checkpoints-fixed/checkpoint-31000",
5
+ "epoch": 2.961310668410122,
6
  "eval_steps": 250,
7
+ "global_step": 38500,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6544
  "eval_samples_per_second": 56.128,
6545
  "eval_steps_per_second": 14.032,
6546
  "step": 38000
6547
+ },
6548
+ {
6549
+ "epoch": 2.926697946311822,
6550
+ "grad_norm": 0.8798107504844666,
6551
+ "learning_rate": 5.0229852219307584e-06,
6552
+ "loss": 0.7084,
6553
+ "step": 38050
6554
+ },
6555
+ {
6556
+ "epoch": 2.9305438043227445,
6557
+ "grad_norm": 0.3845706284046173,
6558
+ "learning_rate": 4.763265200114277e-06,
6559
+ "loss": 0.6764,
6560
+ "step": 38100
6561
+ },
6562
+ {
6563
+ "epoch": 2.9343896623336665,
6564
+ "grad_norm": 0.6847463846206665,
6565
+ "learning_rate": 4.503545178297795e-06,
6566
+ "loss": 0.7165,
6567
+ "step": 38150
6568
+ },
6569
+ {
6570
+ "epoch": 2.938235520344589,
6571
+ "grad_norm": 0.7632951736450195,
6572
+ "learning_rate": 4.243825156481313e-06,
6573
+ "loss": 0.7311,
6574
+ "step": 38200
6575
+ },
6576
+ {
6577
+ "epoch": 2.9420813783555113,
6578
+ "grad_norm": 1.3314287662506104,
6579
+ "learning_rate": 3.984105134664832e-06,
6580
+ "loss": 0.6852,
6581
+ "step": 38250
6582
+ },
6583
+ {
6584
+ "epoch": 2.9420813783555113,
6585
+ "eval_loss": 0.7683274149894714,
6586
+ "eval_runtime": 17.9706,
6587
+ "eval_samples_per_second": 55.646,
6588
+ "eval_steps_per_second": 13.912,
6589
+ "step": 38250
6590
+ },
6591
+ {
6592
+ "epoch": 2.9459272363664333,
6593
+ "grad_norm": 1.0179448127746582,
6594
+ "learning_rate": 3.7243851128483497e-06,
6595
+ "loss": 0.759,
6596
+ "step": 38300
6597
+ },
6598
+ {
6599
+ "epoch": 2.9497730943773557,
6600
+ "grad_norm": 1.4116487503051758,
6601
+ "learning_rate": 3.4646650910318677e-06,
6602
+ "loss": 0.7773,
6603
+ "step": 38350
6604
+ },
6605
+ {
6606
+ "epoch": 2.953618952388278,
6607
+ "grad_norm": 0.6251114010810852,
6608
+ "learning_rate": 3.2049450692153856e-06,
6609
+ "loss": 0.7016,
6610
+ "step": 38400
6611
+ },
6612
+ {
6613
+ "epoch": 2.9574648103992,
6614
+ "grad_norm": 0.9810579419136047,
6615
+ "learning_rate": 2.945225047398904e-06,
6616
+ "loss": 0.6909,
6617
+ "step": 38450
6618
+ },
6619
+ {
6620
+ "epoch": 2.961310668410122,
6621
+ "grad_norm": 0.7243860363960266,
6622
+ "learning_rate": 2.6855050255824223e-06,
6623
+ "loss": 0.7305,
6624
+ "step": 38500
6625
+ },
6626
+ {
6627
+ "epoch": 2.961310668410122,
6628
+ "eval_loss": 0.7680486440658569,
6629
+ "eval_runtime": 17.9145,
6630
+ "eval_samples_per_second": 55.821,
6631
+ "eval_steps_per_second": 13.955,
6632
+ "step": 38500
6633
  }
6634
  ],
6635
  "logging_steps": 50,