File size: 2,923 Bytes
9bf4bd7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
# Collections: shared metadata (training setup, paper, README) that the
# entries under "Models" refer to through their "In Collection" key.
# The sequence is indented under its key, matching every other list in this file.
Collections:
  # Architecture lists ResNetABI and ABIVisionModel only; the "ABINet"
  # collection below additionally lists ABILanguageDecoder and ABIFuser.
  - Name: ABINet-vision
    Metadata:
      Training Data: OCRDataset
      Training Techniques:
        - Adam
      Epochs: 20
      # NOTE(review): Batch Size is 1536 in both collections although the GPU
      # counts differ (2 vs 8) - presumably the total batch size; confirm.
      Batch Size: 1536
      Training Resources: 2 x NVIDIA A100-SXM4-80GB
      Architecture:
        - ResNetABI
        - ABIVisionModel
    Paper:
      URL: https://arxiv.org/pdf/2103.06495.pdf
      # Quoted because the title contains ": ", which a plain scalar cannot hold.
      Title: 'Read Like Humans: Autonomous, Bidirectional and Iterative Language Modeling for Scene Text Recognition'
    README: configs/textrecog/abinet/README.md
  # Same paper, README, epochs and batch size as "ABINet-vision"; differs in
  # Training Resources and in the two extra Architecture entries.
  - Name: ABINet
    Metadata:
      Training Data: OCRDataset
      Training Techniques:
        - Adam
      Epochs: 20
      Batch Size: 1536
      Training Resources: 8 x NVIDIA A100-SXM4-80GB
      Architecture:
        - ResNetABI
        - ABIVisionModel
        - ABILanguageDecoder
        - ABIFuser
    Paper:
      URL: https://arxiv.org/pdf/2103.06495.pdf
      # Quoted because the title contains ": ", which a plain scalar cannot hold.
      Title: 'Read Like Humans: Autonomous, Bidirectional and Iterative Language Modeling for Scene Text Recognition'
    README: configs/textrecog/abinet/README.md

# Models: one entry per released checkpoint. Each "In Collection" value equals
# the "Name" of an entry under "Collections".
# Leaf collections (the Training Data list and the single-key Metrics maps) are
# written in flow style; they parse to the same values as block style.
Models:
  # Checkpoint belonging to the "ABINet-vision" collection.
  - Name: abinet-vision_20e_st-an_mj
    Alias: ABINet_Vision
    In Collection: ABINet-vision
    Config: configs/textrecog/abinet/abinet-vision_20e_st-an_mj.py
    Metadata:
      Training Data: [SynthText, Syn90k]
    # One result per evaluation dataset; word_acc values all lie in [0, 1]
    # (presumably word accuracy as a fraction - confirm against the README).
    Results:
      - Task: Text Recognition
        Dataset: IIIT5K
        Metrics: {word_acc: 0.9523}
      - Task: Text Recognition
        Dataset: SVT
        Metrics: {word_acc: 0.9057}
      - Task: Text Recognition
        Dataset: ICDAR2013
        Metrics: {word_acc: 0.9369}
      - Task: Text Recognition
        Dataset: ICDAR2015
        Metrics: {word_acc: 0.7886}
      - Task: Text Recognition
        Dataset: SVTP
        Metrics: {word_acc: 0.8403}
      - Task: Text Recognition
        Dataset: CT80
        Metrics: {word_acc: 0.8437}
    Weights: https://download.openmmlab.com/mmocr/textrecog/abinet/abinet-vision_20e_st-an_mj/abinet-vision_20e_st-an_mj_20220915_152445-85cfb03d.pth
  # Checkpoint belonging to the "ABINet" collection; evaluated on the same six
  # datasets, in the same order, as the entry above.
  - Name: abinet_20e_st-an_mj
    Alias: ABINet
    In Collection: ABINet
    Config: configs/textrecog/abinet/abinet_20e_st-an_mj.py
    Metadata:
      Training Data: [SynthText, Syn90k]
    Results:
      - Task: Text Recognition
        Dataset: IIIT5K
        Metrics: {word_acc: 0.9603}
      - Task: Text Recognition
        Dataset: SVT
        Metrics: {word_acc: 0.9382}
      - Task: Text Recognition
        Dataset: ICDAR2013
        Metrics: {word_acc: 0.9547}
      - Task: Text Recognition
        Dataset: ICDAR2015
        Metrics: {word_acc: 0.8122}
      - Task: Text Recognition
        Dataset: SVTP
        Metrics: {word_acc: 0.8868}
      - Task: Text Recognition
        Dataset: CT80
        Metrics: {word_acc: 0.8785}
    Weights: https://download.openmmlab.com/mmocr/textrecog/abinet/abinet_20e_st-an_mj/abinet_20e_st-an_mj_20221005_012617-ead8c139.pth