LOGO | 50.60% | 74.79% | 64.11% | 30 | 18 | 28 | 1007 | 14 | 122 | 728 |
GoMatching++ | 48.83% | 78.70% | 61.84% | 36 | 15 | 25 | 1016 | 26 | 162 | 707 |
GoMatching | 48.31% | 79.23% | 62.94% | 32 | 16 | 28 | 986 | 19 | 141 | 744 |
SVRepV2(Kuaishou-MMU) | 45.91% | 74.90% | 63.31% | 30 | 22 | 24 | 1006 | 24 | 203 | 719 |
GOCR | 44.71% | 74.45% | 65.23% | 37 | 9 | 30 | 1016 | 9 | 234 | 724 |
GOCR Offline | 42.82% | 74.85% | 62.19% | 29 | 8 | 39 | 913 | 4 | 164 | 832 |
TransDETR | 40.65% | 77.24% | 58.78% | 21 | 20 | 35 | 829 | 9 | 118 | 911 |
HIK_OCR | 33.85% | 77.38% | 47.80% | 21 | 11 | 44 | 682 | 6 | 90 | 1061 |
h&h_lab | 33.33% | 78.40% | 53.40% | 19 | 24 | 33 | 824 | 21 | 241 | 904 |
TransVTSpotter | 33.16% | 76.03% | 51.26% | 14 | 29 | 33 | 710 | 21 | 130 | 1018 |
VideoTextSCM | 33.10% | 76.18% | 53.83% | 23 | 28 | 25 | 888 | 30 | 309 | 831 |
TA-VTT | 32.59% | 78.97% | 46.82% | 13 | 27 | 36 | 749 | 14 | 179 | 986 |
Semantic-Aware Video Text Detection | 26.93% | 79.14% | 42.73% | 8 | 27 | 41 | 611 | 9 | 140 | 1129 |
SRC-B-TextProcessingLab | 14.69% | 69.02% | 30.47% | 0 | 16 | 60 | 348 | 4 | 91 | 1397 |
Megvii-Image++ | 10.58% | 68.05% | 35.07% | 7 | 18 | 51 | 484 | 6 | 299 | 1259 |
AJOU | 8.40% | 71.19% | 22.21% | 3 | 9 | 64 | 295 | 14 | 148 | 1440 |
USTB_TexVideo | 7.43% | 67.24% | 18.98% | 1 | 13 | 62 | 231 | 5 | 101 | 1513 |
StradVision-1 | 5.49% | 69.12% | 21.39% | 1 | 16 | 59 | 290 | 20 | 194 | 1439 |
USTB_TexVideo II-2 | 5.20% | 68.92% | 11.71% | 1 | 7 | 68 | 126 | 3 | 35 | 1620 |
RTST Lucas-Kanade-2 (RealTimeSceneText_LucasKanade_v2) | -53.29% | 66.37% | 5.45% | 0 | 10 | 66 | 136 | 56 | 1068 | 1557 |
USTB_TexVideo II-1 | -38.99% | 65.92% | 10.47% | 0 | 10 | 66 | 172 | 13 | 854 | 1564 |