|
epoch 0: avg Loss = 3.722 / dev BLEU = 0.0583 |
|
/home/xinyue/.conda/envs/myenv/lib/python3.10/site-packages/transformers/modeling_utils.py:2758: UserWarning: Moving the following attributes in the config to the generation config: {'max_length': 200}. You are seeing this warning because you've set generation parameters in the model config, as opposed to in the generation config. |
|
warnings.warn( |
|
epoch 1: avg Loss = 3.492 / dev BLEU = 0.0532 |
|
epoch 2: avg Loss = 3.798 / dev BLEU = 0.0522 |
|
epoch 3: avg Loss = 3.751 / dev BLEU = 0.0502 |
|
epoch 4: avg Loss = 3.736 / dev BLEU = 0.0489 |
|
epoch 5: avg Loss = 3.689 / dev BLEU = 0.0482 |
|
epoch 6: avg Loss = 3.700 / dev BLEU = 0.0527 |
|
epoch 7: avg Loss = 3.683 / dev BLEU = 0.0485 |
|
epoch 8: avg Loss = 3.662 / dev BLEU = 0.0551 |
|
epoch 9: avg Loss = 3.641 / dev BLEU = 0.0542 |
|
epoch 10: avg Loss = 3.598 / dev BLEU = 0.0539 |
|
epoch 11: avg Loss = 3.613 / dev BLEU = 0.0528 |
|
epoch 12: avg Loss = 3.612 / dev BLEU = 0.0466 |
|
epoch 13: avg Loss = 3.586 / dev BLEU = 0.0489 |
|
epoch 14: avg Loss = 3.592 / dev BLEU = 0.0527 |
|
epoch 15: avg Loss = 3.566 / dev BLEU = 0.0536 |
|
epoch 16: avg Loss = 3.540 / dev BLEU = 0.0542 |
|
epoch 17: avg Loss = 3.496 / dev BLEU = 0.0552 |
|
epoch 18: avg Loss = 3.480 / dev BLEU = 0.0585 |
|
epoch 19: avg Loss = 3.485 / dev BLEU = 0.0608 |
|
epoch 20: avg Loss = 3.459 / dev BLEU = 0.0588 |
|
epoch 21: avg Loss = 3.438 / dev BLEU = 0.0617 |
|
epoch 22: avg Loss = 3.441 / dev BLEU = 0.0609 |
|
epoch 23: avg Loss = 3.431 / dev BLEU = 0.0601 |
|
epoch 24: avg Loss = 3.418 / dev BLEU = 0.0616 |
|
epoch 25: avg Loss = 3.422 / dev BLEU = 0.0602 |
|
epoch 26: avg Loss = 3.413 / dev BLEU = 0.0624 |
|
epoch 27: avg Loss = 3.399 / dev BLEU = 0.0553 |
|
epoch 28: avg Loss = 3.380 / dev BLEU = 0.0605 |
|
epoch 29: avg Loss = 3.365 / dev BLEU = 0.0601 |
|
epoch 30: avg Loss = 3.354 / dev BLEU = 0.0596 |
|
epoch 31: avg Loss = 3.349 / dev BLEU = 0.0599 |
|
epoch 32: avg Loss = 3.350 / dev BLEU = 0.0559 |
|
epoch 33: avg Loss = 3.360 / dev BLEU = 0.0552 |
|
epoch 34: avg Loss = 3.344 / dev BLEU = 0.0505 |
|
epoch 35: avg Loss = 3.349 / dev BLEU = 0.0519 |
|
epoch 36: avg Loss = 3.358 / dev BLEU = 0.0495 |
|
epoch 37: avg Loss = 3.349 / dev BLEU = 0.0429 |
|
epoch 38: avg Loss = 3.337 / dev BLEU = 0.0589 |
|
epoch 39: avg Loss = 3.332 / dev BLEU = 0.0606 |
|
epoch 40: avg Loss = 3.318 / dev BLEU = 0.0598 |
|
epoch 41: avg Loss = 3.317 / dev BLEU = 0.0517 |
|
epoch 42: avg Loss = 3.303 / dev BLEU = 0.0537 |
|
epoch 43: avg Loss = 3.290 / dev BLEU = 0.0605 |
|
epoch 44: avg Loss = 3.286 / dev BLEU = 0.0621 |
|
epoch 45: avg Loss = 3.277 / dev BLEU = 0.0690 |
|
epoch 46: avg Loss = 3.263 / dev BLEU = 0.0694 |
|
epoch 47: avg Loss = 3.256 / dev BLEU = 0.0677 |
|
epoch 48: avg Loss = 3.249 / dev BLEU = 0.0722 |
|
epoch 49: avg Loss = 3.239 / dev BLEU = 0.0717 |
|
epoch 50: avg Loss = 3.232 / dev BLEU = 0.0689 |
|
epoch 51: avg Loss = 3.228 / dev BLEU = 0.0709 |
|
epoch 52: avg Loss = 3.217 / dev BLEU = 0.0699 |
|
epoch 53: avg Loss = 3.213 / dev BLEU = 0.0690 |
|
epoch 54: avg Loss = 3.208 / dev BLEU = 0.0719 |
|
epoch 55: avg Loss = 3.196 / dev BLEU = 0.0729 |
|
epoch 56: avg Loss = 3.179 / dev BLEU = 0.0708 |
|
epoch 57: avg Loss = 3.171 / dev BLEU = 0.0731 |
|
epoch 58: avg Loss = 3.172 / dev BLEU = 0.0706 |
|
epoch 59: avg Loss = 3.173 / dev BLEU = 0.0692 |
|
epoch 60: avg Loss = 3.168 / dev BLEU = 0.0693 |
|
epoch 61: avg Loss = 3.156 / dev BLEU = 0.0733 |
|
epoch 62: avg Loss = 3.153 / dev BLEU = 0.0575 |
|
epoch 63: avg Loss = 3.143 / dev BLEU = 0.0690 |
|
epoch 64: avg Loss = 3.130 / dev BLEU = 0.0707 |
|
epoch 65: avg Loss = 3.128 / dev BLEU = 0.0717 |
|
epoch 66: avg Loss = 3.124 / dev BLEU = 0.0674 |
|
epoch 67: avg Loss = 3.120 / dev BLEU = 0.0596 |
|
epoch 68: avg Loss = 3.111 / dev BLEU = 0.0634 |
|
epoch 69: avg Loss = 3.101 / dev BLEU = 0.0651 |
|
epoch 70: avg Loss = 3.093 / dev BLEU = 0.0683 |
|
epoch 71: avg Loss = 3.088 / dev BLEU = 0.0730 |
|
epoch 72: avg Loss = 3.084 / dev BLEU = 0.0697 |
|
epoch 73: avg Loss = 3.083 / dev BLEU = 0.0684 |
|
epoch 74: avg Loss = 3.075 / dev BLEU = 0.0710 |
|
epoch 75: avg Loss = 3.070 / dev BLEU = 0.0673 |
|
epoch 76: avg Loss = 3.068 / dev BLEU = 0.0619 |
|
epoch 77: avg Loss = 3.066 / dev BLEU = 0.0605 |
|
epoch 78: avg Loss = 3.065 / dev BLEU = 0.0697 |
|
epoch 79: avg Loss = 3.064 / dev BLEU = 0.0605 |
|
epoch 80: avg Loss = 3.064 / dev BLEU = 0.0658 |
|
epoch 81: avg Loss = 3.059 / dev BLEU = 0.0678 |
|
epoch 82: avg Loss = 3.053 / dev BLEU = 0.0720 |
|
epoch 83: avg Loss = 3.052 / dev BLEU = 0.0707 |
|
epoch 84: avg Loss = 3.049 / dev BLEU = 0.0712 |
|
epoch 85: avg Loss = 3.043 / dev BLEU = 0.0712 |
|
epoch 86: avg Loss = 3.039 / dev BLEU = 0.0706 |
|
epoch 87: avg Loss = 3.033 / dev BLEU = 0.0747 |
|
epoch 88: avg Loss = 3.032 / dev BLEU = 0.0706 |
|
epoch 89: avg Loss = 3.023 / dev BLEU = 0.0736 |
|
epoch 90: avg Loss = 3.019 / dev BLEU = 0.0737 |
|
epoch 91: avg Loss = 3.012 / dev BLEU = 0.0682 |
|
epoch 92: avg Loss = 3.006 / dev BLEU = 0.0672 |
|
epoch 93: avg Loss = 3.004 / dev BLEU = 0.0744 |
|
epoch 94: avg Loss = 3.002 / dev BLEU = 0.0646 |
|
epoch 95: avg Loss = 2.999 / dev BLEU = 0.0683 |
|
epoch 96: avg Loss = 2.995 / dev BLEU = 0.0628 |
|
epoch 97: avg Loss = 2.990 / dev BLEU = 0.0643 |
|
epoch 98: avg Loss = 2.985 / dev BLEU = 0.0665 |
|
epoch 99: avg Loss = 2.980 / dev BLEU = 0.0678 |
|
epoch 100: avg Loss = 2.972 / dev BLEU = 0.0662 |
|
|
|
 |
|
|
|
 |
|
|