Image-to-Text
Transformers
PyTorch
donut
vision
Eval Results
File size: 720 Bytes
4d03da9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
# Training run configuration: a single flat mapping of settings.
# NOTE(review): the key names look like those of a Donut-style fine-tuning
# script; confirm each key's exact meaning against the code that loads this.

# --- Checkpoint, output and data locations ---
# No checkpoint to resume from. Written as a real YAML null: the bare word
# `None` is not a null in YAML and loads as the string "None".
resume_from_checkpoint_path: null
result_path: 'trainer/result'
pretrained_model_name_or_path: 'marzanconsulting/donut-dr-matriculas-ocr'
dataset_name_or_paths:
  - 'trainer/dataset'
# presumably one start token per entry in dataset_name_or_paths; verify
# against the consumer.
task_start_tokens:
  - '<s_matricula>'
sort_json_key: false

# --- Batching and input geometry ---
# presumably one batch size per entry in dataset_name_or_paths; verify
# against the consumer.
train_batch_sizes:
  - 5
val_batch_sizes:
  - 1
# NOTE(review): whether this pair is (height, width) or (width, height) is
# decided by the consumer; confirm before changing.
input_size:
  - 960
  - 1280
# max_length and max_position_embeddings carry the same value here.
# NOTE(review): confirm whether the consumer requires them to match.
max_length: 868
max_position_embeddings: 868
align_long_axis: false

# --- Optimisation and schedule ---
num_nodes: 1
seed: 2022
# The mantissa has a decimal point so that YAML 1.1 loaders (e.g. PyYAML)
# also resolve this as a float; `3e-05` is loaded as a string by them.
lr: 3.0e-05
warmup_steps: 300
num_training_samples_per_epoch: 800
max_epochs: 50
# NOTE(review): -1 is presumably a "no step limit" sentinel; confirm.
max_steps: -1
num_workers: 12
val_check_interval: 1.0
check_val_every_n_epoch: 3
gradient_clip_val: 1.0
verbose: true

# --- Logging and experiment naming ---
model_dir: ''
tensorboard_dir: ''
# Explicit null. The original bare `checkpoint_dir:` already loaded as null;
# spelling it out keeps it from being mistaken for an empty string like the
# two keys above.
checkpoint_dir: null
exp_name: 'train_cord_matriculas'
exp_version: 'mmc_v1'