|
07/03/2023 01:07:03 - WARNING - __main__ - Process rank: -1, device: cuda:0, n_gpu: 1distributed training: False, 16-bits training: True |
|
07/03/2023 01:07:03 - INFO - __main__ - Training/evaluation parameters TrainingArguments( |
|
_n_gpu=1, |
|
adafactor=False, |
|
adam_beta1=0.9, |
|
adam_beta2=0.999, |
|
adam_epsilon=1e-08, |
|
auto_find_batch_size=False, |
|
bf16=False, |
|
bf16_full_eval=False, |
|
data_seed=None, |
|
dataloader_drop_last=False, |
|
dataloader_num_workers=0, |
|
dataloader_pin_memory=True, |
|
ddp_bucket_cap_mb=None, |
|
ddp_find_unused_parameters=None, |
|
ddp_timeout=1800, |
|
debug=[], |
|
deepspeed=None, |
|
disable_tqdm=False, |
|
do_eval=True, |
|
do_predict=False, |
|
do_train=True, |
|
eval_accumulation_steps=None, |
|
eval_delay=0, |
|
eval_steps=391, |
|
evaluation_strategy=steps, |
|
fp16=True, |
|
fp16_backend=auto, |
|
fp16_full_eval=False, |
|
fp16_opt_level=O1, |
|
fsdp=[], |
|
fsdp_config={'fsdp_min_num_params': 0, 'xla': False, 'xla_fsdp_grad_ckpt': False}, |
|
fsdp_min_num_params=0, |
|
fsdp_transformer_layer_cls_to_wrap=None, |
|
full_determinism=False, |
|
gradient_accumulation_steps=1, |
|
gradient_checkpointing=False, |
|
greater_is_better=True, |
|
group_by_length=False, |
|
half_precision_backend=auto, |
|
hub_model_id=None, |
|
hub_private_repo=False, |
|
hub_strategy=every_save, |
|
hub_token=<HUB_TOKEN>, |
|
ignore_data_skip=False, |
|
include_inputs_for_metrics=False, |
|
jit_mode_eval=False, |
|
label_names=None, |
|
label_smoothing_factor=0.0, |
|
learning_rate=5e-05, |
|
length_column_name=length, |
|
load_best_model_at_end=True, |
|
local_rank=-1, |
|
log_level=passive, |
|
log_level_replica=warning, |
|
log_on_each_node=True, |
|
logging_dir=/nvme1/yujiepan/token-dropping-logs/logs-final/train-imdb-baseline/0703-lr5e-05_warm0.1_epoch6/runs/Jul03_01-06-59_csr-dgx1-01, |
|
logging_first_step=False, |
|
logging_nan_inf_filter=True, |
|
logging_steps=500, |
|
logging_strategy=steps, |
|
lr_scheduler_type=linear, |
|
max_grad_norm=1.0, |
|
max_steps=-1, |
|
metric_for_best_model=accuracy, |
|
mp_parameters=, |
|
no_cuda=False, |
|
num_train_epochs=6.0, |
|
optim=adamw_torch, |
|
optim_args=None, |
|
output_dir=/nvme1/yujiepan/token-dropping-logs/logs-final/train-imdb-baseline/0703-lr5e-05_warm0.1_epoch6, |
|
overwrite_output_dir=True, |
|
past_index=-1, |
|
per_device_eval_batch_size=64, |
|
per_device_train_batch_size=32, |
|
prediction_loss_only=False, |
|
push_to_hub=False, |
|
push_to_hub_model_id=None, |
|
push_to_hub_organization=None, |
|
push_to_hub_token=<PUSH_TO_HUB_TOKEN>, |
|
ray_scope=last, |
|
remove_unused_columns=True, |
|
report_to=[], |
|
resume_from_checkpoint=None, |
|
run_name=/nvme1/yujiepan/token-dropping-logs/logs-final/train-imdb-baseline/0703-lr5e-05_warm0.1_epoch6, |
|
save_on_each_node=False, |
|
save_steps=391, |
|
save_strategy=steps, |
|
save_total_limit=1, |
|
seed=42, |
|
sharded_ddp=[], |
|
skip_memory_metrics=True, |
|
tf32=None, |
|
torch_compile=False, |
|
torch_compile_backend=None, |
|
torch_compile_mode=None, |
|
torchdynamo=None, |
|
tpu_metrics_debug=False, |
|
tpu_num_cores=None, |
|
use_ipex=False, |
|
use_legacy_prediction_loop=False, |
|
use_mps_device=False, |
|
warmup_ratio=0.1, |
|
warmup_steps=0, |
|
weight_decay=0.0, |
|
xpu_backend=None, |
|
) |
|
07/03/2023 01:07:03 - INFO - datasets.builder - No config specified, defaulting to the single config: imdb/plain_text |
|
07/03/2023 01:07:03 - INFO - datasets.info - Loading Dataset Infos from /home/yujiepan/.cache/huggingface/modules/datasets_modules/datasets/imdb/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0 |
|
07/03/2023 01:07:03 - INFO - datasets.builder - Overwrite dataset info from restored data version if exists. |
|
07/03/2023 01:07:03 - INFO - datasets.info - Loading Dataset info from /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0 |
|
07/03/2023 01:07:03 - WARNING - datasets.builder - Found cached dataset imdb (/dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0) |
|
07/03/2023 01:07:03 - INFO - datasets.info - Loading Dataset info from /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0 |
|
07/03/2023 01:07:05 - INFO - datasets.arrow_dataset - Caching processed dataset at /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0/cache-449826aec475610d.arrow |
|
07/03/2023 01:07:11 - INFO - datasets.arrow_dataset - Caching processed dataset at /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0/cache-ee7d3591a7ef8a71.arrow |
|
07/03/2023 01:07:19 - INFO - datasets.arrow_dataset - Caching processed dataset at /dev/shm/huggingface/datasets/imdb/plain_text/1.0.0/d613c88cf8fa3bab83b4ded3713f1f74830d1100e171db75bbddb80b3345c9c0/cache-74a80ed80f1f2db9.arrow |
|
07/03/2023 01:07:34 - WARNING - datasets.arrow_dataset - Loading cached processed dataset at /home/yujiepan/imdb-long/cache-13f54ac8f7bff8cf.arrow |
|
07/03/2023 01:07:34 - INFO - __main__ - Sample 20952 of the training set: {'text': 'Arguably this is a very good "sequel", better than the first live action film 101 Dalmatians. It has good dogs, good actors, good jokes and all right slapstick! <br /><br />Cruella DeVil, who has had some rather major therapy, is now a lover of dogs and very kind to them. Many, including Chloe Simon, owner of one of the dogs that Cruella once tried to kill, do not believe this. Others, like Kevin Shepherd (owner of 2nd Chance Dog Shelter) believe that she has changed. <br /><br />Meanwhile, Dipstick, with his mate, have given birth to three cute dalmatian puppies! Little Dipper, Domino and Oddball...<br /><br />Starring Eric Idle as Waddlesworth (the hilarious macaw), Glenn Close as Cruella herself and Gerard Depardieu as Le Pelt (another baddie, the name should give a clue), this is a good family film with excitement and lots more!! One downfall of this film is that is has a lot of painful slapstick, but not quite as excessive as the last film. This is also funnier than the last film.<br /><br />Enjoy "102 Dalmatians"! :-)', 'label': 1, 'input_ids': [101, 15835, 2023, 2003, 1037, 2200, 2204, 1000, 8297, 1000, 1010, 2488, 2084, 1996, 2034, 2444, 2895, 2143, 7886, 17488, 18900, 7066, 1012, 2009, 2038, 2204, 6077, 1010, 2204, 5889, 1010, 2204, 13198, 1998, 2035, 2157, 14308, 21354, 999, 1026, 7987, 1013, 1028, 1026, 7987, 1013, 1028, 10311, 2721, 6548, 1010, 2040, 2038, 2018, 2070, 2738, 2350, 7242, 1010, 2003, 2085, 1037, 7089, 1997, 6077, 1998, 2200, 2785, 2000, 2068, 1012, 2116, 1010, 2164, 9318, 4079, 1010, 3954, 1997, 2028, 1997, 1996, 6077, 2008, 10311, 2721, 2320, 2699, 2000, 3102, 1010, 2079, 2025, 2903, 2023, 1012, 2500, 1010, 2066, 4901, 11133, 1006, 3954, 1997, 3416, 3382, 3899, 7713, 1007, 2903, 2008, 2016, 2038, 2904, 1012, 1026, 7987, 1013, 1028, 1026, 7987, 1013, 1028, 5564, 1010, 16510, 21354, 1010, 2007, 2010, 6775, 1010, 2031, 2445, 4182, 2000, 2093, 10140, 17488, 18900, 2937, 26781, 13046, 999, 2210, 16510, 4842, 1010, 23968, 1998, 5976, 7384, 1012, 1012, 1012, 1026, 7987, 1013, 1028, 1026, 7987, 1013, 1028, 4626, 4388, 18373, 2004, 11333, 20338, 12255, 1006, 1996, 26316, 6097, 10376, 1007, 1010, 9465, 2485, 2004, 10311, 2721, 2841, 1998, 11063, 2139, 19362, 10265, 2226, 2004, 3393, 21877, 7096, 1006, 2178, 2919, 10265, 1010, 1996, 2171, 2323, 2507, 1037, 9789, 1007, 1010, 2023, 2003, 1037, 2204, 2155, 2143, 2007, 8277, 1998, 7167, 2062, 999, 999, 2028, 22252, 1997, 2023, 2143, 2003, 2008, 2003, 2038, 1037, 2843, 1997, 9145, 14308, 21354, 1010, 2021, 2025, 3243, 2004, 11664, 2004, 1996, 2197, 2143, 1012, 2023, 2003, 2036, 4569, 14862, 2084, 1996, 2197, 2143, 1012, 1026, 7987, 1013, 1028, 1026, 7987, 1013, 1028, 5959, 1000, 9402, 17488, 18900, 7066, 1000, 999, 1024, 1011, 1007, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]}. |
|
07/03/2023 01:07:34 - INFO - __main__ - Sample 3648 of the training set: {'text': "It's a good thing I didn't watch this while i was pregnant.I definitely would have cried my eyes out and/or vomit. It was Kind of gruesome mainly disturbing. I personally thought the baby was adorable in its own twisted little way.However as a mom I cringed when Beth stabbed herself in the stomach and when Virgina aborted the child during her 3rd trimester with rusty utensils no less.Also,as an animal lover i almost cried when she scratched the cat to a bloody pulp.However,As creepy and sinister as the baby was I was rooting for it to live.And as twisted as the movie was I am extremely intrigued to see the sequel...... ......... ....... ......... ......... ....... ...... .....", 'label': 0, 'input_ids': [101, 2009, 1005, 1055, 1037, 2204, 2518, 1045, 2134, 1005, 1056, 3422, 2023, 2096, 1045, 2001, 6875, 1012, 1045, 5791, 2052, 2031, 6639, 2026, 2159, 2041, 1998, 1013, 2030, 23251, 1012, 2009, 2001, 2785, 1997, 24665, 15808, 8462, 3701, 14888, 1012, 1045, 7714, 2245, 1996, 3336, 2001, 23677, 1999, 2049, 2219, 6389, 2210, 2126, 1012, 2174, 2004, 1037, 3566, 1045, 23952, 2043, 7014, 13263, 2841, 1999, 1996, 4308, 1998, 2043, 6261, 2050, 11113, 15613, 1996, 2775, 2076, 2014, 3822, 12241, 20367, 2007, 13174, 21183, 6132, 12146, 2053, 2625, 1012, 2036, 1010, 2004, 2019, 4111, 7089, 1045, 2471, 6639, 2043, 2016, 15047, 1996, 4937, 2000, 1037, 6703, 16016, 1012, 2174, 1010, 2004, 17109, 1998, 16491, 2004, 1996, 3336, 2001, 1045, 2001, 7117, 2075, 2005, 2009, 2000, 2444, 1012, 1998, 2004, 6389, 2004, 1996, 3185, 2001, 1045, 2572, 5186, 18896, 2000, 2156, 1996, 8297, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 1012, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]}. |
|
07/03/2023 01:07:34 - INFO - __main__ - Sample 819 of the training set: {'text': "This has to be the worst movie I have seen. Madsen fans don't be drawn into this like I was. He is only in it for a maximum of five minutes. This movie is so bad that the only reason why you would watch it is if all the rest of the movies on earth as well as t.v. had been destroyed.", 'label': 0, 'input_ids': [101, 2023, 2038, 2000, 2022, 1996, 5409, 3185, 1045, 2031, 2464, 1012, 5506, 5054, 4599, 2123, 1005, 1056, 2022, 4567, 2046, 2023, 2066, 1045, 2001, 1012, 2002, 2003, 2069, 1999, 2009, 2005, 1037, 4555, 1997, 2274, 2781, 1012, 2023, 3185, 2003, 2061, 2919, 2008, 1996, 2069, 3114, 2339, 2017, 2052, 3422, 2009, 2003, 2065, 2035, 1996, 2717, 1997, 1996, 5691, 2006, 3011, 2004, 2092, 2004, 1056, 1012, 1058, 1012, 2018, 2042, 3908, 1012, 102], 'token_type_ids': [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]}. |
|
07/03/2023 01:07:34 - WARNING - evaluate.loading - Using the latest cached version of the module from /home/yujiepan/.cache/huggingface/modules/evaluate_modules/metrics/evaluate-metric--accuracy/f887c0aab52c2d38e1f8a215681126379eca617f96c447638f751434e8e65b14 (last modified on Wed Sep 28 14:58:53 2022) since it couldn't be found locally at evaluate-metric--accuracy, or remotely on the Hugging Face Hub. |
|
{'eval_loss': 0.4330781102180481, 'eval_accuracy': 0.91216, 'eval_runtime': 65.4808, 'eval_samples_per_second': 381.791, 'eval_steps_per_second': 5.971, 'epoch': 0.5} |
|
{'loss': 0.0385, 'learning_rate': 4.9680246328754146e-05, 'epoch': 0.64} |
|
{'eval_loss': 0.3079942464828491, 'eval_accuracy': 0.91504, 'eval_runtime': 64.589, 'eval_samples_per_second': 387.063, 'eval_steps_per_second': 6.054, 'epoch': 1.0} |
|
{'loss': 0.0654, 'learning_rate': 4.37588820464235e-05, 'epoch': 1.28} |
|
{'eval_loss': 0.3285704255104065, 'eval_accuracy': 0.91636, 'eval_runtime': 64.8695, 'eval_samples_per_second': 385.389, 'eval_steps_per_second': 6.027, 'epoch': 1.5} |
|
{'loss': 0.0636, 'learning_rate': 3.783751776409285e-05, 'epoch': 1.92} |
|
{'eval_loss': 0.42962637543678284, 'eval_accuracy': 0.9184, 'eval_runtime': 130.3196, 'eval_samples_per_second': 191.836, 'eval_steps_per_second': 3.0, 'epoch': 2.0} |
|
{'eval_loss': 0.5365941524505615, 'eval_accuracy': 0.91704, 'eval_runtime': 133.611, 'eval_samples_per_second': 187.11, 'eval_steps_per_second': 2.926, 'epoch': 2.5} |
|
{'loss': 0.0344, 'learning_rate': 3.19161534817622e-05, 'epoch': 2.56} |
|
{'eval_loss': 0.45805788040161133, 'eval_accuracy': 0.91724, 'eval_runtime': 130.2627, 'eval_samples_per_second': 191.92, 'eval_steps_per_second': 3.002, 'epoch': 3.0} |
|
{'loss': 0.0285, 'learning_rate': 2.5994789199431553e-05, 'epoch': 3.2} |
|
{'eval_loss': 0.5552997589111328, 'eval_accuracy': 0.91644, 'eval_runtime': 130.5012, 'eval_samples_per_second': 191.569, 'eval_steps_per_second': 2.996, 'epoch': 3.5} |
|
{'loss': 0.0163, 'learning_rate': 2.008526764566556e-05, 'epoch': 3.84} |
|
{'eval_loss': 0.5054952502250671, 'eval_accuracy': 0.91936, 'eval_runtime': 132.4835, 'eval_samples_per_second': 188.703, 'eval_steps_per_second': 2.951, 'epoch': 4.0} |
|
{'loss': 0.0104, 'learning_rate': 1.4163903363334913e-05, 'epoch': 4.48} |
|
{'eval_loss': 0.5432029366493225, 'eval_accuracy': 0.92644, 'eval_runtime': 130.5202, 'eval_samples_per_second': 191.541, 'eval_steps_per_second': 2.996, 'epoch': 4.5} |
|
{'eval_loss': 0.5357362627983093, 'eval_accuracy': 0.92684, 'eval_runtime': 130.5356, 'eval_samples_per_second': 191.519, 'eval_steps_per_second': 2.995, 'epoch': 5.0} |
|
{'loss': 0.0034, 'learning_rate': 8.242539081004264e-06, 'epoch': 5.12} |
|
{'eval_loss': 0.5456807613372803, 'eval_accuracy': 0.92488, 'eval_runtime': 132.2657, 'eval_samples_per_second': 189.014, 'eval_steps_per_second': 2.956, 'epoch': 5.5} |
|
{'loss': 0.0046, 'learning_rate': 2.3211747986736146e-06, 'epoch': 5.75} |
|
{'eval_loss': 0.5325844883918762, 'eval_accuracy': 0.92816, 'eval_runtime': 130.2637, 'eval_samples_per_second': 191.918, 'eval_steps_per_second': 3.002, 'epoch': 6.0} |
|
{'train_runtime': 3645.2659, 'train_samples_per_second': 41.149, 'train_steps_per_second': 1.287, 'train_loss': 0.02827812901810002, 'epoch': 6.0} |
|
***** train metrics ***** |
|
epoch = 6.0 |
|
train_loss = 0.0283 |
|
train_runtime = 1:00:45.26 |
|
train_samples = 25000 |
|
train_samples_per_second = 41.149 |
|
train_steps_per_second = 1.287 |
|
07/03/2023 02:08:22 - INFO - __main__ - *** Evaluate *** |
|
***** eval metrics ***** |
|
epoch = 6.0 |
|
eval_accuracy = 0.9282 |
|
eval_loss = 0.5326 |
|
eval_runtime = 0:02:10.43 |
|
eval_samples = 25000 |
|
eval_samples_per_second = 191.674 |
|
eval_steps_per_second = 2.998 |
|
***** eval metrics ***** |
|
epoch = 6.0 |
|
eval_accuracy = 0.8909 |
|
eval_loss = 0.7935 |
|
eval_runtime = 0:00:32.16 |
|
eval_samples = 5958 |
|
eval_samples_per_second = 185.204 |
|
eval_steps_per_second = 2.922 |
|
|