hyeongjin99 committed on
Commit
b9a1d80
·
verified ·
1 Parent(s): 71a93e7

End of training

Browse files
README.md CHANGED
@@ -14,6 +14,8 @@ should probably proofread and complete it, then remove this comment. -->
14
  # pt
15
 
16
  This model is a fine-tuned version of [openai/clip-vit-large-patch14](https://huggingface.co/openai/clip-vit-large-patch14) on an unknown dataset.
 
 
17
 
18
  ## Model description
19
 
 
14
  # pt
15
 
16
  This model is a fine-tuned version of [openai/clip-vit-large-patch14](https://huggingface.co/openai/clip-vit-large-patch14) on an unknown dataset.
17
+ It achieves the following results on the evaluation set:
18
+ - Loss: 0.0905
19
 
20
  ## Model description
21
 
all_results.json CHANGED
@@ -1,8 +1,12 @@
1
  {
2
  "epoch": 30.0,
 
 
 
 
3
  "total_flos": 1305922815073800.0,
4
- "train_loss": 1.2748958587646484,
5
- "train_runtime": 114.0949,
6
- "train_samples_per_second": 63.631,
7
- "train_steps_per_second": 1.052
8
  }
 
1
  {
2
  "epoch": 30.0,
3
+ "eval_loss": 0.0905422493815422,
4
+ "eval_runtime": 0.5259,
5
+ "eval_samples_per_second": 115.992,
6
+ "eval_steps_per_second": 7.606,
7
  "total_flos": 1305922815073800.0,
8
+ "train_loss": 1.105910873413086,
9
+ "train_runtime": 168.9398,
10
+ "train_samples_per_second": 42.974,
11
+ "train_steps_per_second": 1.421
12
  }
eval_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_loss": 0.0905422493815422,
4
+ "eval_runtime": 0.5259,
5
+ "eval_samples_per_second": 115.992,
6
+ "eval_steps_per_second": 7.606
7
+ }
tokenizer.json CHANGED
@@ -1,7 +1,21 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
4
- "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 49406,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 77,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
+ "padding": {
10
+ "strategy": {
11
+ "Fixed": 77
12
+ },
13
+ "direction": "Right",
14
+ "pad_to_multiple_of": null,
15
+ "pad_id": 49407,
16
+ "pad_type_id": 0,
17
+ "pad_token": "<|endoftext|>"
18
+ },
19
  "added_tokens": [
20
  {
21
  "id": 49406,
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 30.0,
3
  "total_flos": 1305922815073800.0,
4
- "train_loss": 1.2748958587646484,
5
- "train_runtime": 114.0949,
6
- "train_samples_per_second": 63.631,
7
- "train_steps_per_second": 1.052
8
  }
 
1
  {
2
  "epoch": 30.0,
3
  "total_flos": 1305922815073800.0,
4
+ "train_loss": 1.105910873413086,
5
+ "train_runtime": 168.9398,
6
+ "train_samples_per_second": 42.974,
7
+ "train_steps_per_second": 1.421
8
  }
trainer_state.json CHANGED
@@ -3,23 +3,23 @@
3
  "best_model_checkpoint": null,
4
  "epoch": 30.0,
5
  "eval_steps": 500,
6
- "global_step": 120,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 30.0,
13
- "step": 120,
14
  "total_flos": 1305922815073800.0,
15
- "train_loss": 1.2748958587646484,
16
- "train_runtime": 114.0949,
17
- "train_samples_per_second": 63.631,
18
- "train_steps_per_second": 1.052
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 120,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 30,
25
  "save_steps": 500,
@@ -36,7 +36,7 @@
36
  }
37
  },
38
  "total_flos": 1305922815073800.0,
39
- "train_batch_size": 64,
40
  "trial_name": null,
41
  "trial_params": null
42
  }
 
3
  "best_model_checkpoint": null,
4
  "epoch": 30.0,
5
  "eval_steps": 500,
6
+ "global_step": 240,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 30.0,
13
+ "step": 240,
14
  "total_flos": 1305922815073800.0,
15
+ "train_loss": 1.105910873413086,
16
+ "train_runtime": 168.9398,
17
+ "train_samples_per_second": 42.974,
18
+ "train_steps_per_second": 1.421
19
  }
20
  ],
21
  "logging_steps": 500,
22
+ "max_steps": 240,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 30,
25
  "save_steps": 500,
 
36
  }
37
  },
38
  "total_flos": 1305922815073800.0,
39
+ "train_batch_size": 32,
40
  "trial_name": null,
41
  "trial_params": null
42
  }