File size: 17,965 Bytes
14bd98c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 |
07/03/2023 01:07:03 - WARNING - __main__ - Process rank: -1, device: cuda:0, n_gpu: 1distributed training: False, 16-bits training: True
07/03/2023 01:07:03 - INFO - __main__ - Training/evaluation parameters TrainingArguments(
_n_gpu=1,
adafactor=False,
adam_beta1=0.9,
adam_beta2=0.999,
adam_epsilon=1e-08,
auto_find_batch_size=False,
bf16=False,
bf16_full_eval=False,
data_seed=None,
dataloader_drop_last=False,
dataloader_num_workers=0,
dataloader_pin_memory=True,
ddp_bucket_cap_mb=None,
ddp_find_unused_parameters=None,
ddp_timeout=1800,
debug=[],
deepspeed=None,
disable_tqdm=False,
do_eval=True,
do_predict=False,
do_train=True,
eval_accumulation_steps=None,
eval_delay=0,
eval_steps=391,
evaluation_strategy=steps,
fp16=True,
fp16_backend=auto,
fp16_full_eval=False,
fp16_opt_level=O1,
fsdp=[],
fsdp_config={'fsdp_min_num_params': 0, 'xla': False, 'xla_fsdp_grad_ckpt': False},
fsdp_min_num_params=0,
fsdp_transformer_layer_cls_to_wrap=None,
full_determinism=False,
gradient_accumulation_steps=1,
gradient_checkpointing=False,
greater_is_better=True,
group_by_length=False,
half_precision_backend=auto,
hub_model_id=None,
hub_private_repo=False,
hub_strategy=every_save,
hub_token=<HUB_TOKEN>,
ignore_data_skip=False,
include_inputs_for_metrics=False,
jit_mode_eval=False,
label_names=None,
label_smoothing_factor=0.0,
learning_rate=5e-05,
length_column_name=length,
load_best_model_at_end=True,
local_rank=-1,
log_level=passive,
log_level_replica=warning,
log_on_each_node=True,
logging_dir=/nvme1/yujiepan/token-dropping-logs/logs-final/train-imdb-baseline/0703-lr5e-05_warm0.1_epoch6/runs/Jul03_01-06-59_csr-dgx1-01,
logging_first_step=False,
logging_nan_inf_filter=True,
logging_steps=500,
logging_strategy=steps,
lr_scheduler_type=linear,
max_grad_norm=1.0,
max_steps=-1,
metric_for_best_model=accuracy,
mp_parameters=,
no_cuda=False,
num_train_epochs=6.0,
optim=adamw_torch,
optim_args=None,
output_dir=/nvme1/yujiepan/token-dropping-logs/logs-final/train-imdb-baseline/0703-lr5e-05_warm0.1_epoch6,
overwrite_output_dir=True,
past_index=-1,
per_device_eval_batch_size=64,
per_device_train_batch_size=32,
prediction_loss_only=False,
push_to_hub=False,
push_to_hub_model_id=None,
push_to_hub_organization=None,
push_to_hub_token=<PUSH_TO_HUB_TOKEN>,
ray_scope=last,
remove_unused_columns=True,
report_to=[],
resume_from_checkpoint=None,
run_name=/nvme1/yujiepan/token-dropping-logs/logs-final/train-imdb-baseline/0703-lr5e-05_warm0.1_epoch6,
save_on_each_node=False,
save_steps=391,
save_strategy=steps,
save_total_limit=1,
seed=42,
sharded_ddp=[],
skip_memory_metrics=True,
tf32=None,
torch_compile=False,
torch_compile_backend=None,
torch_compile_mode=None,
torchdynamo=None,
tpu_metrics_debug=False,
tpu_num_cores=None,
use_ipex=False,
use_legacy_prediction_loop=False,
use_mps_device=False,
warmup_ratio=0.1,
warmup_steps=0,
weight_decay=0.0,
xpu_backend=None,
)
07/03/2023 01:07:03 - INFO - datasets.builder - No config specified, defaulting to the single config: imdb/plain_text
07/03/2023 01:07:03 - INFO - datasets.info - Loading Dataset Infos from /home/yujiepan/.cache/huggingface/modules/datasets_modules/datasets/imdb/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0
07/03/2023 01:07:03 - INFO - datasets.builder - Overwrite dataset info from restored data version if exists.
07/03/2023 01:07:03 - INFO - datasets.info - Loading Dataset info from /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0
07/03/2023 01:07:03 - WARNING - datasets.builder - Found cached dataset imdb (/dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0)
07/03/2023 01:07:03 - INFO - datasets.info - Loading Dataset info from /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0
07/03/2023 01:07:05 - INFO - datasets.arrow_dataset - Caching processed dataset at /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0/cache-449826aec475610d.arrow
07/03/2023 01:07:11 - INFO - datasets.arrow_dataset - Caching processed dataset at /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0/cache-ee7d3591a7ef8a71.arrow
07/03/2023 01:07:19 - INFO - datasets.arrow_dataset - Caching processed dataset at /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0/cache-74a80ed80f1f2db9.arrow
07/03/2023 01:07:34 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/yujiepan/imdb-long/cache-13f54ac8f7bff8cf.arrow
07/03/2023 01:07:34 - INFO - __main__ - Sample 20952 of the training set: {'text': 'Arguably this is a very good "sequel", better than the first live action film 101 Dalmatians. It has good dogs, good actors, good jokes and all right slapstick! <br /><br />Cruella DeVil, who has had some rather major therapy, is now a lover of dogs and very kind to them. Many, including Chloe Simon, owner of one of the dogs that Cruella once tried to kill, do not believe this. Others, like Kevin Shepherd (owner of 2nd Chance Dog Shelter) believe that she has changed. <br /><br />Meanwhile, Dipstick, with his mate, have given birth to three cute dalmatian puppies! Little Dipper, Domino and Oddball...<br /><br />Starring Eric Idle as Waddlesworth (the hilarious macaw), Glenn Close as Cruella herself and Gerard Depardieu as Le Pelt (another baddie, the name should give a clue), this is a good family film with excitement and lots more!! One downfall of this film is that is has a lot of painful slapstick, but not quite as excessive as the last film. This is also funnier than the last film.<br /><br />Enjoy "102 Dalmatians"! :-)', 'label': 1, 'input_ids': [101, 15835, 2023, 2003, 1037, 2200, 2204, 1000, 8297, 1000, 1010, 2488, 2084, 1996, 2034, 2444, 2895, 2143, 7886, 17488, 18900, 7066, 1012, 2009, 2038, 2204, 6077, 1010, 2204, 5889, 1010, 2204, 13198, 1998, 2035, 2157, 14308, 21354, 999, 1026, 7987, 1013, 1028, 1026, 7987, 1013, 1028, 10311, 2721, 6548, 1010, 2040, 2038, 2018, 2070, 2738, 2350, 7242, 1010, 2003, 2085, 1037, 7089, 1997, 6077, 1998, 2200, 2785, 2000, 2068, 1012, 2116, 1010, 2164, 9318, 4079, 1010, 3954, 1997, 2028, 1997, 1996, 6077, 2008, 10311, 2721, 2320, 2699, 2000, 3102, 1010, 2079, 2025, 2903, 2023, 1012, 2500, 1010, 2066, 4901, 11133, 1006, 3954, 1997, 3416, 3382, 3899, 7713, 1007, 2903, 2008, 2016, 2038, 2904, 1012, 1026, 7987, 1013, 1028, 1026, 7987, 1013, 1028, 5564, 1010, 16510, 21354, 1010, 2007, 2010, 6775, 1010, 2031, 2445, 4182, 2000, 2093, 10140, 17488, 18900, 2937, 26781, 13046, 999, 2210, 16510, 4842, 1010, 23968, 1998, 5976, 7384, 1012, 1012, 1012, 1026, 7987, 1013, 1028, 1026, 7987, 1013, 1028, 4626, 4388, 18373, 2004, 11333, 20338, 12255, 1006, 1996, 26316, 6097, 10376, 1007, 1010, 9465, 2485, 2004, 10311, 2721, 2841, 1998, 11063, 2139, 19362, 10265, 2226, 2004, 3393, 21877, 7096, 1006, 2178, 2919, 10265, 1010, 1996, 2171, 2323, 2507, 1037, 9789, 1007, 1010, 2023, 2003, 1037, 2204, 2155, 2143, 2007, 8277, 1998, 7167, 2062, 999, 999, 2028, 22252, 1997, 2023, 2143, 2003, 2008, 2003, 2038, 1037, 2843, 1997, 9145, 14308, 21354, 1010, 2021, 2025, 3243, 2004, 11664, 2004, 1996, 2197, 2143, 1012, 2023, 2003, 2036, 4569, 14862, 2084, 1996, 2197, 2143, 1012, 1026, 7987, 1013, 1028, 1026, 7987, 1013, 1028, 5959, 1000, 9402, 17488, 18900, 7066, 1000, 999, 1024, 1011, 1007, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]}.
07/03/2023 01:07:34 - INFO - __main__ - Sample 3648 of the training set: {'text': "It's a good thing I didn't watch this while i was pregnant.I definitely would have cried my eyes out and/or vomit. It was Kind of gruesome mainly disturbing. I personally thought the baby was adorable in its own twisted little way.However as a mom I cringed when Beth stabbed herself in the stomach and when Virgina aborted the child during her 3rd trimester with rusty utensils no less.Also,as an animal lover i almost cried when she scratched the cat to a bloody pulp.However,As creepy and sinister as the baby was I was rooting for it to live.And as twisted as the movie was I am extremely intrigued to see the sequel...... ......... ....... ......... ......... ....... ...... .....", 'label': 0, 'input_ids': [101, 2009, 1005, 1055, 1037, 2204, 2518, 1045, 2134, 1005, 1056, 3422, 2023, 2096, 1045, 2001, 6875, 1012, 1045, 5791, 2052, 2031, 6639, 2026, 2159, 2041, 1998, 1013, 2030, 23251, 1012, 2009, 2001, 2785, 1997, 24665, 15808, 8462, 3701, 14888, 1012, 1045, 7714, 2245, 1996, 3336, 2001, 23677, 1999, 2049, 2219, 6389, 2210, 2126, 1012, 2174, 2004, 1037, 3566, 1045, 23952, 2043, 7014, 13263, 2841, 1999, 1996, 4308, 1998, 2043, 6261, 2050, 11113, 15613, 1996, 2775, 2076, 2014, 3822, 12241, 20367, 2007, 13174, 21183, 6132, 12146, 2053, 2625, 1012, 2036, 1010, 2004, 2019, 4111, 7089, 1045, 2471, 6639, 2043, 2016, 15047, 1996, 4937, 2000, 1037, 6703, 16016, 1012, 2174, 1010, 2004, 17109, 1998, 16491, 2004, 1996, 3336, 2001, 1045, 2001, 7117, 2075, 2005, 2009, 2000, 2444, 1012, 1998, 2004, 6389, 2004, 1996, 3185, 2001, 1045, 2572, 5186, 18896, 2000, 2156, 1996, 8297, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]}.
07/03/2023 01:07:34 - INFO - __main__ - Sample 819 of the training set: {'text': "This has to be the worst movie I have seen. Madsen fans don't be drawn into this like I was. He is only in it for a maximum of five minutes. This movie is so bad that the only reason why you would watch it is if all the rest of the movies on earth as well as t.v. had been destroyed.", 'label': 0, 'input_ids': [101, 2023, 2038, 2000, 2022, 1996, 5409, 3185, 1045, 2031, 2464, 1012, 5506, 5054, 4599, 2123, 1005, 1056, 2022, 4567, 2046, 2023, 2066, 1045, 2001, 1012, 2002, 2003, 2069, 1999, 2009, 2005, 1037, 4555, 1997, 2274, 2781, 1012, 2023, 3185, 2003, 2061, 2919, 2008, 1996, 2069, 3114, 2339, 2017, 2052, 3422, 2009, 2003, 2065, 2035, 1996, 2717, 1997, 1996, 5691, 2006, 3011, 2004, 2092, 2004, 1056, 1012, 1058, 1012, 2018, 2042, 3908, 1012, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]}.
07/03/2023 01:07:34 - WARNING - evaluate.loading - Using the latest cached version of the module from /home/yujiepan/.cache/huggingface/modules/evaluate_modules/metrics/evaluate-metric--accuracy/f887c0aab52c2d38e1f8a215681126379eca617f96c447638f751434e8e65b14 (last modified on Wed Sep 28 14:58:53 2022) since it couldn't be found locally at evaluate-metric--accuracy, or remotely on the Hugging Face Hub.
{'eval_loss': 0.4330781102180481, 'eval_accuracy': 0.91216, 'eval_runtime': 65.4808, 'eval_samples_per_second': 381.791, 'eval_steps_per_second': 5.971, 'epoch': 0.5}
{'loss': 0.0385, 'learning_rate': 4.9680246328754146e-05, 'epoch': 0.64}
{'eval_loss': 0.3079942464828491, 'eval_accuracy': 0.91504, 'eval_runtime': 64.589, 'eval_samples_per_second': 387.063, 'eval_steps_per_second': 6.054, 'epoch': 1.0}
{'loss': 0.0654, 'learning_rate': 4.37588820464235e-05, 'epoch': 1.28}
{'eval_loss': 0.3285704255104065, 'eval_accuracy': 0.91636, 'eval_runtime': 64.8695, 'eval_samples_per_second': 385.389, 'eval_steps_per_second': 6.027, 'epoch': 1.5}
{'loss': 0.0636, 'learning_rate': 3.783751776409285e-05, 'epoch': 1.92}
{'eval_loss': 0.42962637543678284, 'eval_accuracy': 0.9184, 'eval_runtime': 130.3196, 'eval_samples_per_second': 191.836, 'eval_steps_per_second': 3.0, 'epoch': 2.0}
{'eval_loss': 0.5365941524505615, 'eval_accuracy': 0.91704, 'eval_runtime': 133.611, 'eval_samples_per_second': 187.11, 'eval_steps_per_second': 2.926, 'epoch': 2.5}
{'loss': 0.0344, 'learning_rate': 3.19161534817622e-05, 'epoch': 2.56}
{'eval_loss': 0.45805788040161133, 'eval_accuracy': 0.91724, 'eval_runtime': 130.2627, 'eval_samples_per_second': 191.92, 'eval_steps_per_second': 3.002, 'epoch': 3.0}
{'loss': 0.0285, 'learning_rate': 2.5994789199431553e-05, 'epoch': 3.2}
{'eval_loss': 0.5552997589111328, 'eval_accuracy': 0.91644, 'eval_runtime': 130.5012, 'eval_samples_per_second': 191.569, 'eval_steps_per_second': 2.996, 'epoch': 3.5}
{'loss': 0.0163, 'learning_rate': 2.008526764566556e-05, 'epoch': 3.84}
{'eval_loss': 0.5054952502250671, 'eval_accuracy': 0.91936, 'eval_runtime': 132.4835, 'eval_samples_per_second': 188.703, 'eval_steps_per_second': 2.951, 'epoch': 4.0}
{'loss': 0.0104, 'learning_rate': 1.4163903363334913e-05, 'epoch': 4.48}
{'eval_loss': 0.5432029366493225, 'eval_accuracy': 0.92644, 'eval_runtime': 130.5202, 'eval_samples_per_second': 191.541, 'eval_steps_per_second': 2.996, 'epoch': 4.5}
{'eval_loss': 0.5357362627983093, 'eval_accuracy': 0.92684, 'eval_runtime': 130.5356, 'eval_samples_per_second': 191.519, 'eval_steps_per_second': 2.995, 'epoch': 5.0}
{'loss': 0.0034, 'learning_rate': 8.242539081004264e-06, 'epoch': 5.12}
{'eval_loss': 0.5456807613372803, 'eval_accuracy': 0.92488, 'eval_runtime': 132.2657, 'eval_samples_per_second': 189.014, 'eval_steps_per_second': 2.956, 'epoch': 5.5}
{'loss': 0.0046, 'learning_rate': 2.3211747986736146e-06, 'epoch': 5.75}
{'eval_loss': 0.5325844883918762, 'eval_accuracy': 0.92816, 'eval_runtime': 130.2637, 'eval_samples_per_second': 191.918, 'eval_steps_per_second': 3.002, 'epoch': 6.0}
{'train_runtime': 3645.2659, 'train_samples_per_second': 41.149, 'train_steps_per_second': 1.287, 'train_loss': 0.02827812901810002, 'epoch': 6.0}
***** train metrics *****
epoch = 6.0
train_loss = 0.0283
train_runtime = 1:00:45.26
train_samples = 25000
train_samples_per_second = 41.149
train_steps_per_second = 1.287
07/03/2023 02:08:22 - INFO - __main__ - *** Evaluate ***
***** eval metrics *****
epoch = 6.0
eval_accuracy = 0.9282
eval_loss = 0.5326
eval_runtime = 0:02:10.43
eval_samples = 25000
eval_samples_per_second = 191.674
eval_steps_per_second = 2.998
***** eval metrics *****
epoch = 6.0
eval_accuracy = 0.8909
eval_loss = 0.7935
eval_runtime = 0:00:32.16
eval_samples = 5958
eval_samples_per_second = 185.204
eval_steps_per_second = 2.922
|