khanhduong committed on
Commit
a928ef0
·
verified ·
1 Parent(s): 9dcc1b0

Upload log.txt with huggingface_hub

Browse files
Files changed (1) hide show
  1. log.txt +3 -122
log.txt CHANGED
@@ -6,7 +6,7 @@
6
  "min_lr": 8e-05,
7
  "warmup_lr": 1e-06,
8
  "weight_decay": 0.05,
9
- "max_epoch": 150,
10
  "batch_size_train": 120,
11
  "batch_size_eval": 3,
12
  "num_workers": 4,
@@ -15,7 +15,7 @@
15
  "seed": 42,
16
  "output_dir": "output/xraygpt_mimic_pretrain",
17
  "amp": true,
18
- "resume_ckpt_path": "24_10_22_08_14_39_epoch99.pth",
19
  "evaluate": false,
20
  "train_splits": [
21
  "train"
@@ -81,123 +81,4 @@
81
  }
82
  }
83
  }
84
- {
85
- "run": {
86
- "task": "image_text_pretrain",
87
- "lr_sched": "linear_warmup_cosine_lr",
88
- "init_lr": 0.0001,
89
- "min_lr": 8e-05,
90
- "warmup_lr": 1e-06,
91
- "weight_decay": 0.05,
92
- "max_epoch": 150,
93
- "batch_size_train": 120,
94
- "batch_size_eval": 3,
95
- "num_workers": 4,
96
- "warmup_steps": 500,
97
- "iters_per_epoch": 500,
98
- "seed": 42,
99
- "output_dir": "output/xraygpt_mimic_pretrain",
100
- "amp": true,
101
- "resume_ckpt_path": "24_10_22_08_14_39_epoch99.pth",
102
- "evaluate": false,
103
- "train_splits": [
104
- "train"
105
- ],
106
- "device": "cuda",
107
- "world_size": 4,
108
- "dist_url": "env://",
109
- "distributed": true,
110
- "rank": 0,
111
- "gpu": 0,
112
- "dist_backend": "nccl"
113
- },
114
- "model": {
115
- "arch": "mini_gpt4",
116
- "image_size": 224,
117
- "drop_path_rate": 0,
118
- "use_grad_checkpoint": false,
119
- "vit_precision": "fp16",
120
- "freeze_vit": true,
121
- "freeze_qformer": true,
122
- "num_query_token": 32,
123
- "llama_model": "Joycean0301/Llama-3.2-3B-Instruct-Medical-Conversational",
124
- "prompt": "",
125
- "model_type": "pretrain_vicuna"
126
- },
127
- "preprocess": {
128
- "vis_processor": {
129
- "train": {
130
- "name": "blip2_image_train",
131
- "image_size": 224
132
- },
133
- "eval": {
134
- "name": "blip2_image_eval",
135
- "image_size": 224
136
- }
137
- },
138
- "text_processor": {
139
- "train": {
140
- "name": "blip_caption"
141
- },
142
- "eval": {
143
- "name": "blip_caption"
144
- }
145
- }
146
- },
147
- "datasets": {
148
- "mimic": {
149
- "data_type": "images",
150
- "build_info": {
151
- "storage": "dataset/mimic"
152
- },
153
- "vis_processor": {
154
- "train": {
155
- "name": "blip2_image_train",
156
- "image_size": 224
157
- }
158
- },
159
- "text_processor": {
160
- "train": {
161
- "name": "blip_caption"
162
- }
163
- }
164
- }
165
- }
166
- }
167
- {"train_lr": "0.000085", "train_loss": "1.176420"}
168
- {"train_lr": "0.000085", "train_loss": "1.175911"}
169
- {"train_lr": "0.000085", "train_loss": "1.177007"}
170
- {"train_lr": "0.000084", "train_loss": "1.174899"}
171
- {"train_lr": "0.000084", "train_loss": "1.176167"}
172
- {"train_lr": "0.000084", "train_loss": "1.175371"}
173
- {"train_lr": "0.000084", "train_loss": "1.175089"}
174
- {"train_lr": "0.000084", "train_loss": "1.174685"}
175
- {"train_lr": "0.000084", "train_loss": "1.173965"}
176
- {"train_lr": "0.000083", "train_loss": "1.173050"}
177
- {"train_lr": "0.000083", "train_loss": "1.174454"}
178
- {"train_lr": "0.000083", "train_loss": "1.174522"}
179
- {"train_lr": "0.000083", "train_loss": "1.171317"}
180
- {"train_lr": "0.000083", "train_loss": "1.173012"}
181
- {"train_lr": "0.000083", "train_loss": "1.173456"}
182
- {"train_lr": "0.000082", "train_loss": "1.172261"}
183
- {"train_lr": "0.000082", "train_loss": "1.171457"}
184
- {"train_lr": "0.000082", "train_loss": "1.172554"}
185
- {"train_lr": "0.000082", "train_loss": "1.169906"}
186
- {"train_lr": "0.000082", "train_loss": "1.171817"}
187
- {"train_lr": "0.000082", "train_loss": "1.170531"}
188
- {"train_lr": "0.000082", "train_loss": "1.170232"}
189
- {"train_lr": "0.000082", "train_loss": "1.171015"}
190
- {"train_lr": "0.000082", "train_loss": "1.169610"}
191
- {"train_lr": "0.000081", "train_loss": "1.170178"}
192
- {"train_lr": "0.000081", "train_loss": "1.169042"}
193
- {"train_lr": "0.000081", "train_loss": "1.170149"}
194
- {"train_lr": "0.000081", "train_loss": "1.168049"}
195
- {"train_lr": "0.000081", "train_loss": "1.169198"}
196
- {"train_lr": "0.000081", "train_loss": "1.169054"}
197
- {"train_lr": "0.000081", "train_loss": "1.168359"}
198
- {"train_lr": "0.000081", "train_loss": "1.168657"}
199
- {"train_lr": "0.000081", "train_loss": "1.168694"}
200
- {"train_lr": "0.000081", "train_loss": "1.168019"}
201
- {"train_lr": "0.000081", "train_loss": "1.167548"}
202
- {"train_lr": "0.000080", "train_loss": "1.165927"}
203
- {"train_lr": "0.000080", "train_loss": "1.168800"}
 
6
  "min_lr": 8e-05,
7
  "warmup_lr": 1e-06,
8
  "weight_decay": 0.05,
9
+ "max_epoch": 200,
10
  "batch_size_train": 120,
11
  "batch_size_eval": 3,
12
  "num_workers": 4,
 
15
  "seed": 42,
16
  "output_dir": "output/xraygpt_mimic_pretrain",
17
  "amp": true,
18
+ "resume_ckpt_path": "xraygpt/output/xraygpt_mimic_pretrain/20241028035/checkpoint_136.pth",
19
  "evaluate": false,
20
  "train_splits": [
21
  "train"
 
81
  }
82
  }
83
  }
84
+ {"train_lr": "0.000084", "train_loss": "1.166641"}