HaiderK committed on
Commit
1ce79f4
·
1 Parent(s): 38b5a9c

End of training

Browse files
README.md CHANGED
@@ -1,6 +1,4 @@
1
  ---
2
- license: mit
3
- base_model: naver-clova-ix/donut-base
4
  tags:
5
  - generated_from_trainer
6
  datasets:
@@ -15,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # Assignment
17
 
18
- This model is a fine-tuned version of [naver-clova-ix/donut-base](https://huggingface.co/naver-clova-ix/donut-base) on the imagefolder dataset.
19
 
20
  ## Model description
21
 
@@ -34,13 +32,13 @@ More information needed
34
  ### Training hyperparameters
35
 
36
  The following hyperparameters were used during training:
37
- - learning_rate: 2e-05
38
  - train_batch_size: 2
39
  - eval_batch_size: 8
40
  - seed: 42
41
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
  - lr_scheduler_type: linear
43
- - num_epochs: 25
44
 
45
  ### Training results
46
 
 
1
  ---
 
 
2
  tags:
3
  - generated_from_trainer
4
  datasets:
 
13
 
14
  # Assignment
15
 
16
+ This model was trained from scratch on the imagefolder dataset.
17
 
18
  ## Model description
19
 
 
32
  ### Training hyperparameters
33
 
34
  The following hyperparameters were used during training:
35
+ - learning_rate: 0.0002
36
  - train_batch_size: 2
37
  - eval_batch_size: 8
38
  - seed: 42
39
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
40
  - lr_scheduler_type: linear
41
+ - num_epochs: 10
42
 
43
  ### Training results
44
 
generation_config.json CHANGED
@@ -1,8 +1,10 @@
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
 
4
  "eos_token_id": 2,
5
  "forced_eos_token_id": 2,
 
6
  "pad_token_id": 1,
7
  "transformers_version": "4.32.0.dev0"
8
  }
 
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 0,
4
+ "decoder_start_token_id": 0,
5
  "eos_token_id": 2,
6
  "forced_eos_token_id": 2,
7
+ "max_length": 512,
8
  "pad_token_id": 1,
9
  "transformers_version": "4.32.0.dev0"
10
  }
preprocessor_config.json CHANGED
@@ -19,8 +19,8 @@
19
  "processor_class": "DonutProcessor",
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
- "size": [
23
- 720,
24
- 960
25
- ]
26
  }
 
19
  "processor_class": "DonutProcessor",
20
  "resample": 2,
21
  "rescale_factor": 0.00392156862745098,
22
+ "size": {
23
+ "height": 960,
24
+ "width": 720
25
+ }
26
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -11,11 +11,18 @@
11
  "rstrip": false,
12
  "single_word": false
13
  },
 
14
  "model_max_length": 1000000000000000019884624838656,
 
15
  "pad_token": "<pad>",
 
 
16
  "processor_class": "DonutProcessor",
17
  "sep_token": "</s>",
18
  "sp_model_kwargs": {},
 
19
  "tokenizer_class": "XLMRobertaTokenizer",
 
 
20
  "unk_token": "<unk>"
21
  }
 
11
  "rstrip": false,
12
  "single_word": false
13
  },
14
+ "max_length": 512,
15
  "model_max_length": 1000000000000000019884624838656,
16
+ "pad_to_multiple_of": null,
17
  "pad_token": "<pad>",
18
+ "pad_token_type_id": 0,
19
+ "padding_side": "right",
20
  "processor_class": "DonutProcessor",
21
  "sep_token": "</s>",
22
  "sp_model_kwargs": {},
23
+ "stride": 0,
24
  "tokenizer_class": "XLMRobertaTokenizer",
25
+ "truncation_side": "right",
26
+ "truncation_strategy": "longest_first",
27
  "unk_token": "<unk>"
28
  }