GoMatching++ | 81.48% | 79.30% | 86.84% | 23 | 6 | 5 | 1886 | 5 | 113 | 285 |
GoMatching | 77.30% | 77.12% | 83.02% | 23 | 6 | 5 | 1790 | 7 | 108 | 379 |
h&h_lab | 76.70% | 78.83% | 84.08% | 24 | 8 | 2 | 1913 | 15 | 244 | 248 |
VideoTextSCM | 75.37% | 74.35% | 79.34% | 21 | 9 | 4 | 1722 | 28 | 82 | 426 |
LOGO | 74.72% | 74.69% | 80.63% | 23 | 6 | 5 | 1818 | 6 | 192 | 352 |
TransDETR | 73.71% | 75.00% | 83.77% | 23 | 7 | 4 | 1854 | 3 | 250 | 319 |
TransVTSpotter | 71.51% | 74.01% | 80.46% | 20 | 8 | 6 | 1729 | 6 | 173 | 441 |
GOCR | 71.09% | 74.20% | 80.04% | 20 | 11 | 3 | 1792 | 30 | 245 | 354 |
GOCR Offline | 70.27% | 74.75% | 81.55% | 19 | 8 | 7 | 1662 | 7 | 133 | 507 |
SVRepV2(Kuaishou-MMU) | 58.64% | 75.34% | 74.18% | 17 | 10 | 7 | 1422 | 9 | 146 | 745 |
HIK_OCR | 57.81% | 79.11% | 69.32% | 15 | 7 | 12 | 1342 | 22 | 84 | 812 |
TA-VTT | 53.13% | 78.07% | 69.09% | 15 | 11 | 8 | 1382 | 14 | 226 | 780 |
Semantic-Aware Video Text Detection | 51.19% | 78.60% | 67.28% | 11 | 13 | 10 | 1311 | 14 | 197 | 851 |
SRC-B-TextProcessingLab | 27.76% | 69.53% | 43.40% | 4 | 14 | 16 | 781 | 32 | 177 | 1363 |
AJOU | 20.36% | 72.04% | 40.62% | 4 | 10 | 20 | 636 | 13 | 193 | 1527 |
StradVision-1 | 17.69% | 71.14% | 34.58% | 3 | 10 | 21 | 629 | 34 | 244 | 1513 |
USTB_TexVideo | 10.16% | 69.83% | 26.25% | 0 | 13 | 21 | 535 | 23 | 314 | 1618 |
USTB_TexVideo II-2 | 6.34% | 70.45% | 19.59% | 1 | 7 | 26 | 347 | 14 | 209 | 1815 |
Megvii-Image++ | 5.84% | 64.64% | 36.01% | 1 | 17 | 16 | 810 | 13 | 683 | 1353 |
RTST Lucas-Kanade-2 (RealTimeSceneText_LucasKanade_v2) | -107.40% | 62.07% | 4.39% | 1 | 5 | 28 | 113 | 180 | 2450 | 1883 |
USTB_TexVideo II-1 | -24.49% | 65.84% | 21.36% | 1 | 12 | 21 | 379 | 7 | 912 | 1790 |