Image-to-Text
Transformers
PyTorch
donut
vision
Eval Results
File size: 404 Bytes
4d03da9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
{
  "_name_or_path": "naver-clova-ix/donut-base",
  "align_long_axis": false,
  "architectures": [
    "DonutModel"
  ],
  "decoder_layer": 4,
  "encoder_layer": [
    2,
    2,
    14,
    2
  ],
  "input_size": [
    960,
    1280
  ],
  "max_length": 868,
  "max_position_embeddings": 868,
  "model_type": "donut",
  "torch_dtype": "float32",
  "transformers_version": "4.25.1",
  "window_size": 10
}