|
{ |
|
"run": { |
|
"task": "image_text_pretrain", |
|
"lr_sched": "linear_warmup_cosine_lr", |
|
"init_lr": 3e-05, |
|
"min_lr": 1e-05, |
|
"warmup_lr": 1e-06, |
|
"weight_decay": 0.05, |
|
"max_epoch": 100, |
|
"iters_per_epoch": 500, |
|
"batch_size_train": 8, |
|
"batch_size_eval": 1, |
|
"num_workers": 4, |
|
"warmup_steps": 200, |
|
"seed": 42, |
|
"output_dir": "output/xraygpt_vqa_finetune", |
|
"amp": true, |
|
"resume_ckpt_path": "24_10_30_17_10_39_epoch20.pth", |
|
"evaluate": false, |
|
"train_splits": [ |
|
"train" |
|
], |
|
"device": "cuda", |
|
"world_size": 8, |
|
"dist_url": "env://", |
|
"distributed": true, |
|
"rank": 0, |
|
"gpu": 0, |
|
"dist_backend": "nccl" |
|
}, |
|
"model": { |
|
"arch": "mini_gpt4", |
|
"image_size": 224, |
|
"drop_path_rate": 0, |
|
"use_grad_checkpoint": false, |
|
"vit_precision": "fp16", |
|
"freeze_vit": true, |
|
"freeze_qformer": true, |
|
"num_query_token": 32, |
|
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational", |
|
"prompt": "", |
|
"lora_r": 16, |
|
"lora_alpha": 16, |
|
"lora_target_modules": [ |
|
"q_proj", |
|
"k_proj", |
|
"v_proj", |
|
"o_proj", |
|
"gate_proj", |
|
"up_proj", |
|
"down_proj" |
|
], |
|
"lora_dropout": 0.1, |
|
"lora_bias": "none", |
|
"model_type": "pretrain_vicuna", |
|
"max_txt_len": 160, |
|
"end_sym": "<|eot_id|>", |
|
"ckpt": "24_10_29_03_29_41_epoch160.pth" |
|
}, |
|
"preprocess": { |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
}, |
|
"eval": { |
|
"name": "blip2_image_eval", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
}, |
|
"eval": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
}, |
|
"datasets": { |
|
"vqa": { |
|
"data_type": "images", |
|
"build_info": { |
|
"storage": "dataset/mimic_finetune" |
|
}, |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
} |
|
} |
|
} |
|
{ |
|
"run": { |
|
"task": "image_text_pretrain", |
|
"lr_sched": "linear_warmup_cosine_lr", |
|
"init_lr": 3e-05, |
|
"min_lr": 1e-05, |
|
"warmup_lr": 1e-06, |
|
"weight_decay": 0.05, |
|
"max_epoch": 100, |
|
"iters_per_epoch": 500, |
|
"batch_size_train": 10, |
|
"batch_size_eval": 1, |
|
"num_workers": 4, |
|
"warmup_steps": 200, |
|
"seed": 42, |
|
"output_dir": "output/xraygpt_vqa_finetune", |
|
"amp": true, |
|
"resume_ckpt_path": "24_10_30_17_10_39_epoch20.pth", |
|
"evaluate": false, |
|
"train_splits": [ |
|
"train" |
|
], |
|
"device": "cuda", |
|
"world_size": 8, |
|
"dist_url": "env://", |
|
"distributed": true, |
|
"rank": 0, |
|
"gpu": 0, |
|
"dist_backend": "nccl" |
|
}, |
|
"model": { |
|
"arch": "mini_gpt4", |
|
"image_size": 224, |
|
"drop_path_rate": 0, |
|
"use_grad_checkpoint": false, |
|
"vit_precision": "fp16", |
|
"freeze_vit": true, |
|
"freeze_qformer": true, |
|
"num_query_token": 32, |
|
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational", |
|
"prompt": "", |
|
"lora_r": 16, |
|
"lora_alpha": 16, |
|
"lora_target_modules": [ |
|
"q_proj", |
|
"k_proj", |
|
"v_proj", |
|
"o_proj", |
|
"gate_proj", |
|
"up_proj", |
|
"down_proj" |
|
], |
|
"lora_dropout": 0.1, |
|
"lora_bias": "none", |
|
"model_type": "pretrain_vicuna", |
|
"max_txt_len": 160, |
|
"end_sym": "<|eot_id|>", |
|
"ckpt": "24_10_29_03_29_41_epoch160.pth" |
|
}, |
|
"preprocess": { |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
}, |
|
"eval": { |
|
"name": "blip2_image_eval", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
}, |
|
"eval": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
}, |
|
"datasets": { |
|
"vqa": { |
|
"data_type": "images", |
|
"build_info": { |
|
"storage": "dataset/mimic_finetune" |
|
}, |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
} |
|
} |
|
} |
|
{ |
|
"run": { |
|
"task": "image_text_pretrain", |
|
"lr_sched": "linear_warmup_cosine_lr", |
|
"init_lr": 3e-05, |
|
"min_lr": 1e-05, |
|
"warmup_lr": 1e-06, |
|
"weight_decay": 0.05, |
|
"max_epoch": 100, |
|
"iters_per_epoch": 1050, |
|
"batch_size_train": 8, |
|
"batch_size_eval": 1, |
|
"num_workers": 4, |
|
"warmup_steps": 200, |
|
"seed": 42, |
|
"output_dir": "output/xraygpt_vqa_finetune", |
|
"amp": true, |
|
"resume_ckpt_path": "24_10_30_17_10_39_epoch20.pth", |
|
"evaluate": false, |
|
"train_splits": [ |
|
"train" |
|
], |
|
"device": "cuda", |
|
"world_size": 8, |
|
"dist_url": "env://", |
|
"distributed": true, |
|
"rank": 0, |
|
"gpu": 0, |
|
"dist_backend": "nccl" |
|
}, |
|
"model": { |
|
"arch": "mini_gpt4", |
|
"image_size": 224, |
|
"drop_path_rate": 0, |
|
"use_grad_checkpoint": false, |
|
"vit_precision": "fp16", |
|
"freeze_vit": true, |
|
"freeze_qformer": true, |
|
"num_query_token": 32, |
|
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational", |
|
"prompt": "", |
|
"lora_r": 16, |
|
"lora_alpha": 16, |
|
"lora_target_modules": [ |
|
"q_proj", |
|
"k_proj", |
|
"v_proj", |
|
"o_proj", |
|
"gate_proj", |
|
"up_proj", |
|
"down_proj" |
|
], |
|
"lora_dropout": 0.1, |
|
"lora_bias": "none", |
|
"model_type": "pretrain_vicuna", |
|
"max_txt_len": 160, |
|
"end_sym": "<|eot_id|>", |
|
"ckpt": "24_10_29_03_29_41_epoch160.pth" |
|
}, |
|
"preprocess": { |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
}, |
|
"eval": { |
|
"name": "blip2_image_eval", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
}, |
|
"eval": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
}, |
|
"datasets": { |
|
"vqa": { |
|
"data_type": "images", |
|
"build_info": { |
|
"storage": "dataset/mimic_finetune" |
|
}, |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
} |
|
} |
|
} |
|
{ |
|
"run": { |
|
"task": "image_text_pretrain", |
|
"lr_sched": "linear_warmup_cosine_lr", |
|
"init_lr": 3e-05, |
|
"min_lr": 1e-05, |
|
"warmup_lr": 1e-06, |
|
"weight_decay": 0.05, |
|
"max_epoch": 40, |
|
"iters_per_epoch": 1300, |
|
"batch_size_train": 8, |
|
"batch_size_eval": 1, |
|
"num_workers": 4, |
|
"warmup_steps": 200, |
|
"seed": 42, |
|
"output_dir": "output/xraygpt_vqa_finetune", |
|
"amp": true, |
|
"resume_ckpt_path": "24_10_30_17_10_39_epoch20.pth", |
|
"evaluate": false, |
|
"train_splits": [ |
|
"train" |
|
], |
|
"device": "cuda", |
|
"world_size": 8, |
|
"dist_url": "env://", |
|
"distributed": true, |
|
"rank": 0, |
|
"gpu": 0, |
|
"dist_backend": "nccl" |
|
}, |
|
"model": { |
|
"arch": "mini_gpt4", |
|
"image_size": 224, |
|
"drop_path_rate": 0, |
|
"use_grad_checkpoint": false, |
|
"vit_precision": "fp16", |
|
"freeze_vit": true, |
|
"freeze_qformer": true, |
|
"num_query_token": 32, |
|
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational", |
|
"prompt": "", |
|
"lora_r": 16, |
|
"lora_alpha": 16, |
|
"lora_target_modules": [ |
|
"q_proj", |
|
"k_proj", |
|
"v_proj", |
|
"o_proj", |
|
"gate_proj", |
|
"up_proj", |
|
"down_proj" |
|
], |
|
"lora_dropout": 0.1, |
|
"lora_bias": "none", |
|
"model_type": "pretrain_vicuna", |
|
"max_txt_len": 160, |
|
"end_sym": "<|eot_id|>", |
|
"ckpt": "24_10_29_03_29_41_epoch160.pth" |
|
}, |
|
"preprocess": { |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
}, |
|
"eval": { |
|
"name": "blip2_image_eval", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
}, |
|
"eval": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
}, |
|
"datasets": { |
|
"vqa": { |
|
"data_type": "images", |
|
"build_info": { |
|
"storage": "dataset/mimic_finetune" |
|
}, |
|
"vis_processor": { |
|
"train": { |
|
"name": "blip2_image_train", |
|
"image_size": 224 |
|
} |
|
}, |
|
"text_processor": { |
|
"train": { |
|
"name": "blip_caption" |
|
} |
|
} |
|
} |
|
} |
|
} |
|
{"train_lr": "0.000019", "train_loss": "0.684137"} |
|
{"train_lr": "0.000018", "train_loss": "0.654648"} |
|
{"train_lr": "0.000017", "train_loss": "0.626471"} |
|
{"train_lr": "0.000017", "train_loss": "0.601327"} |
|
{"train_lr": "0.000016", "train_loss": "0.576456"} |
|
{"train_lr": "0.000015", "train_loss": "0.553397"} |
|
{"train_lr": "0.000014", "train_loss": "0.530701"} |
|
{"train_lr": "0.000014", "train_loss": "0.510915"} |
|
{"train_lr": "0.000013", "train_loss": "0.490313"} |
|
{"train_lr": "0.000013", "train_loss": "0.472298"} |
|
{"train_lr": "0.000012", "train_loss": "0.453687"} |
|
{"train_lr": "0.000012", "train_loss": "0.436265"} |
|
{"train_lr": "0.000011", "train_loss": "0.421915"} |
|
{"train_lr": "0.000011", "train_loss": "0.406703"} |
|
{"train_lr": "0.000011", "train_loss": "0.392106"} |
|
{"train_lr": "0.000010", "train_loss": "0.379085"} |
|
{"train_lr": "0.000010", "train_loss": "0.367431"} |
|
{"train_lr": "0.000010", "train_loss": "0.357473"} |
|
{"train_lr": "0.000010", "train_loss": "0.345610"} |
|
|