HaiderK committed
Commit 028292c · 1 Parent(s): 16f9109

End of training

README.md CHANGED
@@ -1,4 +1,6 @@
 ---
+license: mit
+base_model: naver-clova-ix/donut-base
 tags:
 - generated_from_trainer
 datasets:
@@ -13,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
 
 # Assignment
 
-This model was trained from scratch on the imagefolder dataset.
+This model is a fine-tuned version of [naver-clova-ix/donut-base](https://huggingface.co/naver-clova-ix/donut-base) on the imagefolder dataset.
 
 ## Model description
 
@@ -32,17 +34,13 @@ More information needed
 ### Training hyperparameters
 
 The following hyperparameters were used during training:
-- learning_rate: 0.0002
+- learning_rate: 0.002
 - train_batch_size: 2
 - eval_batch_size: 8
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- num_epochs: 10
-
-### Training results
-
-
+- num_epochs: 20
 
 ### Framework versions
 
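The hyperparameter edits above (learning_rate 0.0002 -> 0.002, num_epochs 10 -> 20) map directly onto `transformers.TrainingArguments`. A minimal sketch, not the actual training script from this commit; the output directory is a placeholder, and the Adam betas/epsilon and linear scheduler listed in the card are the library defaults:

```python
# Minimal sketch, not the commit's actual training script:
# the updated model-card hyperparameters expressed as TrainingArguments.
from transformers import TrainingArguments

training_args = TrainingArguments(
    output_dir="donut-assignment",  # hypothetical output path
    learning_rate=2e-3,             # raised from 2e-4 in this commit
    per_device_train_batch_size=2,
    per_device_eval_batch_size=8,
    seed=42,
    lr_scheduler_type="linear",     # Adam betas=(0.9, 0.999), eps=1e-8 are the defaults
    num_train_epochs=20,            # raised from 10 in this commit
)
```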
generation_config.json CHANGED
@@ -1,10 +1,8 @@
 {
   "_from_model_config": true,
   "bos_token_id": 0,
-  "decoder_start_token_id": 0,
   "eos_token_id": 2,
   "forced_eos_token_id": 2,
-  "max_length": 512,
   "pad_token_id": 1,
   "transformers_version": "4.32.0.dev0"
 }
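With `decoder_start_token_id` and `max_length` removed from `generation_config.json`, those values are no longer pinned at the repo level: `max_length` falls back to the library default, and the decoder start token is resolved from the model config at generation time. A quick sketch, assuming a hypothetical repo id:

```python
# Sketch: inspect the trimmed generation config.
# "HaiderK/Assignment" is a placeholder repo id, not confirmed by this commit.
from transformers import GenerationConfig

gen_config = GenerationConfig.from_pretrained("HaiderK/Assignment")
print(gen_config.max_length)              # library default (20), no longer 512
print(gen_config.decoder_start_token_id)  # None; resolved from the model config when generating
```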
preprocessor_config.json CHANGED
@@ -19,8 +19,8 @@
   "processor_class": "DonutProcessor",
   "resample": 2,
   "rescale_factor": 0.00392156862745098,
-  "size": {
-    "height": 960,
-    "width": 720
-  }
+  "size": [
+    720,
+    960
+  ]
 }
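The `size` edit is a change of format, not of resolution: `DonutImageProcessor` reads a list-valued `size` as `(width, height)`, so `[720, 960]` describes the same 720x960 input as the old `{"height": 960, "width": 720}` dict. A small sketch, assuming a recent `transformers` release:

```python
# Sketch: DonutImageProcessor normalizes a (width, height) list into
# the dict form internally, so both spellings are equivalent.
from transformers import DonutImageProcessor

image_processor = DonutImageProcessor(size=[720, 960])
print(image_processor.size)  # {'height': 960, 'width': 720}
```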
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3c24157433ea031a75fb7f33a6fc0e590fcea94b9ce2b1985092ef16b18eedab
-size 809211673
+oid sha256:bb895880ee972a822d657a3d8695503a6a6be7de4798f7ef4dcb866dc3e669dc
+size 809204953
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -11,18 +11,11 @@
     "rstrip": false,
     "single_word": false
   },
-  "max_length": 512,
   "model_max_length": 1000000000000000019884624838656,
-  "pad_to_multiple_of": null,
   "pad_token": "<pad>",
-  "pad_token_type_id": 0,
-  "padding_side": "right",
   "processor_class": "DonutProcessor",
   "sep_token": "</s>",
   "sp_model_kwargs": {},
-  "stride": 0,
   "tokenizer_class": "XLMRobertaTokenizer",
-  "truncation_side": "right",
-  "truncation_strategy": "longest_first",
   "unk_token": "<unk>"
 }
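Since `max_length`, padding, and truncation settings are gone from `tokenizer_config.json`, callers now choose them per call rather than inheriting repo-level defaults. A hedged sketch, again with a placeholder repo id:

```python
# Sketch: pass length/padding/truncation explicitly now that the tokenizer
# config no longer pins them. "HaiderK/Assignment" is a hypothetical repo id.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("HaiderK/Assignment")
encoded = tokenizer(
    "example document text",
    max_length=512,    # formerly baked into tokenizer_config.json
    truncation=True,   # formerly truncation_strategy: longest_first
    padding="max_length",
)
```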
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e9ba146e626400a8e4789df56ef2e2b8bd62ed50ad757462e60c97141c5dc7e0
+oid sha256:9ac18023fe270be166ba776454ae51201e768bcba29a652fa04e70e5a1618ebb
 size 4219