from transformers import TrainingArguments

# Hyperparameters and bookkeeping settings for a Hugging Face training run.
# Keyword arguments are grouped by concern; their order carries no meaning.
training_args = TrainingArguments(
    # --- Output locations -------------------------------------------------
    output_dir="./results",
    logging_dir="./logs",
    # --- Optimisation schedule --------------------------------------------
    num_train_epochs=3,
    learning_rate=5e-5,
    weight_decay=0.01,
    warmup_steps=500,
    # --- Batch sizes ------------------------------------------------------
    # 8 samples per device; the original author tuned this for a T4 GPU.
    per_device_train_batch_size=8,
    per_device_eval_batch_size=8,
    # --- Logging, evaluation and checkpointing ----------------------------
    logging_steps=50,
    # Evaluation and checkpointing both run every 500 steps, so each saved
    # checkpoint has a matching evaluation result; load_best_model_at_end
    # relies on the two schedules lining up.
    # NOTE(review): newer transformers releases appear to rename
    # `evaluation_strategy` to `eval_strategy` -- confirm against the
    # installed version before upgrading.
    evaluation_strategy="steps",
    eval_steps=500,
    save_strategy="steps",
    save_steps=500,
    save_total_limit=3,
    load_best_model_at_end=True,
    # --- Memory / throughput ----------------------------------------------
    # Mixed-precision (fp16) training; presumably requires a GPU that
    # supports it -- verify on the target hardware.
    fp16=True,
    # Recompute activations in the backward pass to lower memory use at the
    # cost of extra compute.
    gradient_checkpointing=True,
)