{ | |
"run": { | |
"task": "image_text_pretrain", | |
"lr_sched": "linear_warmup_cosine_lr", | |
"init_lr": 0.0001, | |
"min_lr": 8e-05, | |
"warmup_lr": 1e-06, | |
"weight_decay": 0.05, | |
"max_epoch": 50, | |
"batch_size_train": 120, | |
"batch_size_eval": 3, | |
"num_workers": 4, | |
"warmup_steps": 500, | |
"iters_per_epoch": 500, | |
"seed": 42, | |
"output_dir": "output/xraygpt_mimic_pretrain", | |
"amp": true, | |
"resume_ckpt_path": "xraygpt/output/xraygpt_mimic_pretrain/20241020174/checkpoint_18.pth", | |
"evaluate": false, | |
"train_splits": [ | |
"train" | |
], | |
"device": "cuda", | |
"world_size": 4, | |
"dist_url": "env://", | |
"distributed": true, | |
"rank": 0, | |
"gpu": 0, | |
"dist_backend": "nccl" | |
}, | |
"model": { | |
"arch": "mini_gpt4", | |
"image_size": 224, | |
"drop_path_rate": 0, | |
"use_grad_checkpoint": false, | |
"vit_precision": "fp16", | |
"freeze_vit": true, | |
"freeze_qformer": true, | |
"num_query_token": 32, | |
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational", | |
"prompt": "", | |
"model_type": "pretrain_vicuna" | |
}, | |
"preprocess": { | |
"vis_processor": { | |
"train": { | |
"name": "blip2_image_train", | |
"image_size": 224 | |
}, | |
"eval": { | |
"name": "blip2_image_eval", | |
"image_size": 224 | |
} | |
}, | |
"text_processor": { | |
"train": { | |
"name": "blip_caption" | |
}, | |
"eval": { | |
"name": "blip_caption" | |
} | |
} | |
}, | |
"datasets": { | |
"mimic": { | |
"data_type": "images", | |
"build_info": { | |
"storage": "dataset/mimic" | |
}, | |
"vis_processor": { | |
"train": { | |
"name": "blip2_image_train", | |
"image_size": 224 | |
} | |
}, | |
"text_processor": { | |
"train": { | |
"name": "blip_caption" | |
} | |
} | |
} | |
} | |
} | |
{"train_lr": "0.000", "train_loss": "1.248"} | |
{"train_lr": "0.000", "train_loss": "1.246"} | |
{"train_lr": "0.000", "train_loss": "1.245"} | |
{"train_lr": "0.000", "train_loss": "1.241"} | |