khanhduong's picture
add
0e0661d
{
"run": {
"task": "image_text_pretrain",
"lr_sched": "linear_warmup_cosine_lr",
"init_lr": 3e-05,
"min_lr": 1e-05,
"warmup_lr": 1e-06,
"weight_decay": 0.05,
"max_epoch": 100,
"iters_per_epoch": 500,
"batch_size_train": 8,
"batch_size_eval": 1,
"num_workers": 4,
"warmup_steps": 200,
"seed": 42,
"output_dir": "output/xraygpt_vqa_finetune",
"amp": true,
"resume_ckpt_path": "24_10_30_17_10_39_epoch20.pth",
"evaluate": false,
"train_splits": [
"train"
],
"device": "cuda",
"world_size": 8,
"dist_url": "env://",
"distributed": true,
"rank": 0,
"gpu": 0,
"dist_backend": "nccl"
},
"model": {
"arch": "mini_gpt4",
"image_size": 224,
"drop_path_rate": 0,
"use_grad_checkpoint": false,
"vit_precision": "fp16",
"freeze_vit": true,
"freeze_qformer": true,
"num_query_token": 32,
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational",
"prompt": "",
"lora_r": 16,
"lora_alpha": 16,
"lora_target_modules": [
"q_proj",
"k_proj",
"v_proj",
"o_proj",
"gate_proj",
"up_proj",
"down_proj"
],
"lora_dropout": 0.1,
"lora_bias": "none",
"model_type": "pretrain_vicuna",
"max_txt_len": 160,
"end_sym": "<|eot_id|>",
"ckpt": "24_10_29_03_29_41_epoch160.pth"
},
"preprocess": {
"vis_processor": {
"train": {
"name": "blip2_image_train",
"image_size": 224
},
"eval": {
"name": "blip2_image_eval",
"image_size": 224
}
},
"text_processor": {
"train": {
"name": "blip_caption"
},
"eval": {
"name": "blip_caption"
}
}
},
"datasets": {
"vqa": {
"data_type": "images",
"build_info": {
"storage": "dataset/mimic_finetune"
},
"vis_processor": {
"train": {
"name": "blip2_image_train",
"image_size": 224
}
},
"text_processor": {
"train": {
"name": "blip_caption"
}
}
}
}
}
{
"run": {
"task": "image_text_pretrain",
"lr_sched": "linear_warmup_cosine_lr",
"init_lr": 3e-05,
"min_lr": 1e-05,
"warmup_lr": 1e-06,
"weight_decay": 0.05,
"max_epoch": 100,
"iters_per_epoch": 500,
"batch_size_train": 10,
"batch_size_eval": 1,
"num_workers": 4,
"warmup_steps": 200,
"seed": 42,
"output_dir": "output/xraygpt_vqa_finetune",
"amp": true,
"resume_ckpt_path": "24_10_30_17_10_39_epoch20.pth",
"evaluate": false,
"train_splits": [
"train"
],
"device": "cuda",
"world_size": 8,
"dist_url": "env://",
"distributed": true,
"rank": 0,
"gpu": 0,
"dist_backend": "nccl"
},
"model": {
"arch": "mini_gpt4",
"image_size": 224,
"drop_path_rate": 0,
"use_grad_checkpoint": false,
"vit_precision": "fp16",
"freeze_vit": true,
"freeze_qformer": true,
"num_query_token": 32,
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational",
"prompt": "",
"lora_r": 16,
"lora_alpha": 16,
"lora_target_modules": [
"q_proj",
"k_proj",
"v_proj",
"o_proj",
"gate_proj",
"up_proj",
"down_proj"
],
"lora_dropout": 0.1,
"lora_bias": "none",
"model_type": "pretrain_vicuna",
"max_txt_len": 160,
"end_sym": "<|eot_id|>",
"ckpt": "24_10_29_03_29_41_epoch160.pth"
},
"preprocess": {
"vis_processor": {
"train": {
"name": "blip2_image_train",
"image_size": 224
},
"eval": {
"name": "blip2_image_eval",
"image_size": 224
}
},
"text_processor": {
"train": {
"name": "blip_caption"
},
"eval": {
"name": "blip_caption"
}
}
},
"datasets": {
"vqa": {
"data_type": "images",
"build_info": {
"storage": "dataset/mimic_finetune"
},
"vis_processor": {
"train": {
"name": "blip2_image_train",
"image_size": 224
}
},
"text_processor": {
"train": {
"name": "blip_caption"
}
}
}
}
}
{
"run": {
"task": "image_text_pretrain",
"lr_sched": "linear_warmup_cosine_lr",
"init_lr": 3e-05,
"min_lr": 1e-05,
"warmup_lr": 1e-06,
"weight_decay": 0.05,
"max_epoch": 100,
"iters_per_epoch": 1050,
"batch_size_train": 8,
"batch_size_eval": 1,
"num_workers": 4,
"warmup_steps": 200,
"seed": 42,
"output_dir": "output/xraygpt_vqa_finetune",
"amp": true,
"resume_ckpt_path": "24_10_30_17_10_39_epoch20.pth",
"evaluate": false,
"train_splits": [
"train"
],
"device": "cuda",
"world_size": 8,
"dist_url": "env://",
"distributed": true,
"rank": 0,
"gpu": 0,
"dist_backend": "nccl"
},
"model": {
"arch": "mini_gpt4",
"image_size": 224,
"drop_path_rate": 0,
"use_grad_checkpoint": false,
"vit_precision": "fp16",
"freeze_vit": true,
"freeze_qformer": true,
"num_query_token": 32,
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational",
"prompt": "",
"lora_r": 16,
"lora_alpha": 16,
"lora_target_modules": [
"q_proj",
"k_proj",
"v_proj",
"o_proj",
"gate_proj",
"up_proj",
"down_proj"
],
"lora_dropout": 0.1,
"lora_bias": "none",
"model_type": "pretrain_vicuna",
"max_txt_len": 160,
"end_sym": "<|eot_id|>",
"ckpt": "24_10_29_03_29_41_epoch160.pth"
},
"preprocess": {
"vis_processor": {
"train": {
"name": "blip2_image_train",
"image_size": 224
},
"eval": {
"name": "blip2_image_eval",
"image_size": 224
}
},
"text_processor": {
"train": {
"name": "blip_caption"
},
"eval": {
"name": "blip_caption"
}
}
},
"datasets": {
"vqa": {
"data_type": "images",
"build_info": {
"storage": "dataset/mimic_finetune"
},
"vis_processor": {
"train": {
"name": "blip2_image_train",
"image_size": 224
}
},
"text_processor": {
"train": {
"name": "blip_caption"
}
}
}
}
}
{
"run": {
"task": "image_text_pretrain",
"lr_sched": "linear_warmup_cosine_lr",
"init_lr": 3e-05,
"min_lr": 1e-05,
"warmup_lr": 1e-06,
"weight_decay": 0.05,
"max_epoch": 40,
"iters_per_epoch": 1300,
"batch_size_train": 8,
"batch_size_eval": 1,
"num_workers": 4,
"warmup_steps": 200,
"seed": 42,
"output_dir": "output/xraygpt_vqa_finetune",
"amp": true,
"resume_ckpt_path": "24_10_30_17_10_39_epoch20.pth",
"evaluate": false,
"train_splits": [
"train"
],
"device": "cuda",
"world_size": 8,
"dist_url": "env://",
"distributed": true,
"rank": 0,
"gpu": 0,
"dist_backend": "nccl"
},
"model": {
"arch": "mini_gpt4",
"image_size": 224,
"drop_path_rate": 0,
"use_grad_checkpoint": false,
"vit_precision": "fp16",
"freeze_vit": true,
"freeze_qformer": true,
"num_query_token": 32,
"llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational",
"prompt": "",
"lora_r": 16,
"lora_alpha": 16,
"lora_target_modules": [
"q_proj",
"k_proj",
"v_proj",
"o_proj",
"gate_proj",
"up_proj",
"down_proj"
],
"lora_dropout": 0.1,
"lora_bias": "none",
"model_type": "pretrain_vicuna",
"max_txt_len": 160,
"end_sym": "<|eot_id|>",
"ckpt": "24_10_29_03_29_41_epoch160.pth"
},
"preprocess": {
"vis_processor": {
"train": {
"name": "blip2_image_train",
"image_size": 224
},
"eval": {
"name": "blip2_image_eval",
"image_size": 224
}
},
"text_processor": {
"train": {
"name": "blip_caption"
},
"eval": {
"name": "blip_caption"
}
}
},
"datasets": {
"vqa": {
"data_type": "images",
"build_info": {
"storage": "dataset/mimic_finetune"
},
"vis_processor": {
"train": {
"name": "blip2_image_train",
"image_size": 224
}
},
"text_processor": {
"train": {
"name": "blip_caption"
}
}
}
}
}
{"train_lr": "0.000019", "train_loss": "0.684137"}
{"train_lr": "0.000018", "train_loss": "0.654648"}
{"train_lr": "0.000017", "train_loss": "0.626471"}
{"train_lr": "0.000017", "train_loss": "0.601327"}
{"train_lr": "0.000016", "train_loss": "0.576456"}
{"train_lr": "0.000015", "train_loss": "0.553397"}
{"train_lr": "0.000014", "train_loss": "0.530701"}
{"train_lr": "0.000014", "train_loss": "0.510915"}
{"train_lr": "0.000013", "train_loss": "0.490313"}
{"train_lr": "0.000013", "train_loss": "0.472298"}
{"train_lr": "0.000012", "train_loss": "0.453687"}
{"train_lr": "0.000012", "train_loss": "0.436265"}
{"train_lr": "0.000011", "train_loss": "0.421915"}
{"train_lr": "0.000011", "train_loss": "0.406703"}
{"train_lr": "0.000011", "train_loss": "0.392106"}
{"train_lr": "0.000010", "train_loss": "0.379085"}
{"train_lr": "0.000010", "train_loss": "0.367431"}
{"train_lr": "0.000010", "train_loss": "0.357473"}
{"train_lr": "0.000010", "train_loss": "0.345610"}