|
{ |
|
"run": { |
|
"task": "image_text_pretrain", |
|
"lr_sched": "linear_warmup_cosine_lr", |
|
"init_lr": 3e-05, |
|
"min_lr": 1e-05, |
|
"warmup_lr": 1e-06, |
|
"weight_decay": 0.05, |
|
"max_epoch": 40, |
|
"iters_per_epoch": 100, |
|
"batch_size_train": 8, |
|
"batch_size_eval": 1, |
|
"num_workers": 4, |
|
"warmup_steps": 10, |
|
"seed": 42, |
|
"output_dir": "output/xraygpt_vqa_finetune", |
|
"amp": true, |
|
"resume_ckpt_path": "24_10_30_17_10_39_epoch20.pth", |
|
"evaluate": false, |
|
"train_splits": [ |
|
"train" |
|
], |
|
"device": "cuda", |
|
"world_size": 8, |
|
"dist_url": "env://", |
|
"distributed": true, |
|
"rank": 0, |
|
"gpu": 0, |
|
"dist_backend": "nccl" |
|
}, |
|
"model": { |
|
"arch": "mini_gpt4", |
|
"image_size": 224, |
|
"drop_path_rate": 0, |
|
"use_grad_checkpoint": false, |
|
"vit_precision": "fp16", |
|
"freeze_vit": true, |
|
"freeze_qformer": true, |
|
"num_query_token": 32, |
|
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational", |
|
"prompt": "", |
|
"lora_r": 16, |
|
"lora_alpha": 16, |
|
"lora_target_modules": [ |
|
"q_proj", |
|
"k_proj", |
|
"v_proj", |
|
"o_proj", |
|
"gate_proj", |
|
"up_proj", |
|
"down_proj" |
|
], |
|
"lora_dropout": 0.1, |
|
"lora_bias": "none", |
|
"model_type": "pretrain_vicuna", |
|
"max_txt_len": 160, |
|
"end_sym": "<|eot_id|>", |
|
"ckpt": "24_10_29_14_43_38_epoch24.pth" |
|
}, |
|
"preprocess": { |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
}, |
|
"eval": { |
|
"name": "blip2_image_eval", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
}, |
|
"eval": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
}, |
|
"datasets": { |
|
"vqa": { |
|
"data_type": "images", |
|
"build_info": { |
|
"storage": "dataset/mimic_finetune" |
|
}, |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
} |
|
} |
|
} |
|
{"train_lr": "0.000019", "train_loss": "0.656437"} |
|
|