OsamaMo committed on
Commit
89e6d1d
·
verified ·
1 Parent(s): 9864f98

Training in progress, step 500, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,12 +20,12 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "o_proj",
24
- "k_proj",
25
- "down_proj",
26
- "gate_proj",
27
  "q_proj",
28
  "v_proj",
 
 
 
 
29
  "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
 
 
23
  "q_proj",
24
  "v_proj",
25
+ "gate_proj",
26
+ "k_proj",
27
+ "down_proj",
28
+ "o_proj",
29
  "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
last-checkpoint/trainer_state.json CHANGED
@@ -81,9 +81,9 @@
81
  {
82
  "epoch": 0.07145409074669525,
83
  "eval_news_finetune_val_loss": 0.48679304122924805,
84
- "eval_news_finetune_val_runtime": 1002.7224,
85
- "eval_news_finetune_val_samples_per_second": 1.396,
86
- "eval_news_finetune_val_steps_per_second": 1.396,
87
  "step": 100
88
  },
89
  {
@@ -159,9 +159,9 @@
159
  {
160
  "epoch": 0.1429081814933905,
161
  "eval_news_finetune_val_loss": 0.4338369369506836,
162
- "eval_news_finetune_val_runtime": 1003.2801,
163
- "eval_news_finetune_val_samples_per_second": 1.395,
164
- "eval_news_finetune_val_steps_per_second": 1.395,
165
  "step": 200
166
  },
167
  {
@@ -237,9 +237,9 @@
237
  {
238
  "epoch": 0.21436227224008575,
239
  "eval_news_finetune_val_loss": 0.40391305088996887,
240
- "eval_news_finetune_val_runtime": 1003.2872,
241
- "eval_news_finetune_val_samples_per_second": 1.395,
242
- "eval_news_finetune_val_steps_per_second": 1.395,
243
  "step": 300
244
  },
245
  {
@@ -315,9 +315,9 @@
315
  {
316
  "epoch": 0.285816362986781,
317
  "eval_news_finetune_val_loss": 0.39322975277900696,
318
- "eval_news_finetune_val_runtime": 1003.4166,
319
- "eval_news_finetune_val_samples_per_second": 1.395,
320
- "eval_news_finetune_val_steps_per_second": 1.395,
321
  "step": 400
322
  },
323
  {
@@ -393,9 +393,9 @@
393
  {
394
  "epoch": 0.35727045373347627,
395
  "eval_news_finetune_val_loss": 0.3787713646888733,
396
- "eval_news_finetune_val_runtime": 1003.589,
397
- "eval_news_finetune_val_samples_per_second": 1.395,
398
- "eval_news_finetune_val_steps_per_second": 1.395,
399
  "step": 500
400
  }
401
  ],
 
81
  {
82
  "epoch": 0.07145409074669525,
83
  "eval_news_finetune_val_loss": 0.48679304122924805,
84
+ "eval_news_finetune_val_runtime": 1001.9158,
85
+ "eval_news_finetune_val_samples_per_second": 1.397,
86
+ "eval_news_finetune_val_steps_per_second": 1.397,
87
  "step": 100
88
  },
89
  {
 
159
  {
160
  "epoch": 0.1429081814933905,
161
  "eval_news_finetune_val_loss": 0.4338369369506836,
162
+ "eval_news_finetune_val_runtime": 1002.1695,
163
+ "eval_news_finetune_val_samples_per_second": 1.397,
164
+ "eval_news_finetune_val_steps_per_second": 1.397,
165
  "step": 200
166
  },
167
  {
 
237
  {
238
  "epoch": 0.21436227224008575,
239
  "eval_news_finetune_val_loss": 0.40391305088996887,
240
+ "eval_news_finetune_val_runtime": 1002.5797,
241
+ "eval_news_finetune_val_samples_per_second": 1.396,
242
+ "eval_news_finetune_val_steps_per_second": 1.396,
243
  "step": 300
244
  },
245
  {
 
315
  {
316
  "epoch": 0.285816362986781,
317
  "eval_news_finetune_val_loss": 0.39322975277900696,
318
+ "eval_news_finetune_val_runtime": 1002.8865,
319
+ "eval_news_finetune_val_samples_per_second": 1.396,
320
+ "eval_news_finetune_val_steps_per_second": 1.396,
321
  "step": 400
322
  },
323
  {
 
393
  {
394
  "epoch": 0.35727045373347627,
395
  "eval_news_finetune_val_loss": 0.3787713646888733,
396
+ "eval_news_finetune_val_runtime": 1002.8588,
397
+ "eval_news_finetune_val_samples_per_second": 1.396,
398
+ "eval_news_finetune_val_steps_per_second": 1.396,
399
  "step": 500
400
  }
401
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2782bf8a609c154eefb42753d138dafcba3aa0ea92b9d87f5184a3cbc4f0f0be
3
  size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:367406c6dccce148fee91e86e6fa08ac415e3c6a88231b8f42f8d49575bf98f6
3
  size 5624