LOGO | 67.96% | 77.34% | 75.17% | 38 | 14 | 12 | 616 | 18 | 56 | 190 |
TA-VTT | 62.38% | 77.35% | 71.86% | 46 | 7 | 11 | 614 | 40 | 100 | 170 |
Semantic-Aware Video Text Detection | 62.26% | 78.06% | 71.56% | 40 | 11 | 13 | 582 | 23 | 69 | 219 |
GOCR Offline | 61.77% | 75.68% | 78.80% | 43 | 5 | 16 | 626 | 4 | 117 | 194 |
SVRepV2(Kuaishou-MMU) | 60.92% | 74.72% | 76.77% | 40 | 13 | 11 | 609 | 31 | 107 | 184 |
GoMatching++ | 59.22% | 80.22% | 70.05% | 43 | 6 | 15 | 585 | 30 | 97 | 209 |
GOCR | 57.52% | 75.64% | 76.89% | 45 | 6 | 13 | 636 | 9 | 162 | 179 |
TransVTSpotter | 54.73% | 79.45% | 61.78% | 34 | 19 | 11 | 506 | 75 | 55 | 243 |
GoMatching | 54.61% | 80.83% | 66.94% | 34 | 13 | 17 | 540 | 25 | 90 | 259 |
TransDETR | 52.18% | 80.61% | 69.22% | 39 | 13 | 12 | 568 | 39 | 138 | 217 |
h&h_lab | 51.21% | 79.13% | 69.09% | 36 | 19 | 9 | 544 | 24 | 122 | 256 |
HIK_OCR | 48.30% | 78.72% | 64.35% | 24 | 18 | 22 | 440 | 15 | 42 | 369 |
VideoTextSCM | 47.57% | 75.43% | 61.01% | 36 | 16 | 12 | 508 | 73 | 116 | 243 |
SRC-B-TextProcessingLab | 20.02% | 64.12% | 47.91% | 10 | 22 | 32 | 303 | 0 | 138 | 521 |
USTB_TexVideo | 18.93% | 68.31% | 34.93% | 3 | 24 | 37 | 207 | 6 | 51 | 611 |
USTB_TexVideo II-2 | 18.33% | 71.25% | 30.57% | 3 | 20 | 41 | 174 | 6 | 23 | 644 |
Megvii-Image++ | 14.32% | 70.57% | 33.36% | 3 | 15 | 46 | 190 | 5 | 72 | 629 |
AJOU | 6.67% | 72.77% | 25.73% | 3 | 17 | 44 | 153 | 52 | 98 | 619 |
USTB_TexVideo II-1 | 3.03% | 69.07% | 7.55% | 0 | 4 | 60 | 35 | 5 | 10 | 784 |
StradVision-1 | 0.00% | 67.89% | 25.52% | 3 | 18 | 43 | 171 | 33 | 171 | 620 |
RTST Lucas-Kanade-2 (RealTimeSceneText_LucasKanade_v2) | -203.40% | 72.91% | 6.92% | 6 | 12 | 46 | 112 | 78 | 1788 | 634 |