h&h_lab | 67.40% | 72.18% | 79.03% | 11 | 5 | 1 | 389 | 7 | 50 | 107 |
GOCR Offline | 67.00% | 70.68% | 74.07% | 14 | 1 | 2 | 387 | 5 | 50 | 111 |
TransDETR | 64.81% | 68.44% | 74.68% | 12 | 3 | 2 | 384 | 3 | 58 | 116 |
GOCR | 64.02% | 70.68% | 70.76% | 14 | 2 | 1 | 406 | 16 | 84 | 81 |
GoMatching++ | 61.63% | 74.30% | 65.96% | 11 | 4 | 2 | 370 | 13 | 60 | 120 |
SVRepV2(Kuaishou-MMU) | 59.24% | 77.04% | 77.64% | 11 | 3 | 3 | 376 | 9 | 78 | 118 |
VideoTextSCM | 58.65% | 75.67% | 65.83% | 12 | 2 | 3 | 366 | 20 | 71 | 117 |
GoMatching | 58.65% | 73.76% | 63.60% | 11 | 3 | 3 | 349 | 6 | 54 | 148 |
TA-VTT | 58.05% | 72.27% | 70.89% | 8 | 6 | 3 | 328 | 2 | 36 | 173 |
LOGO | 54.67% | 65.75% | 62.74% | 12 | 3 | 2 | 357 | 8 | 82 | 138 |
Semantic-Aware Video Text Detection | 54.47% | 70.11% | 70.17% | 5 | 9 | 3 | 293 | 3 | 19 | 207 |
TransVTSpotter | 48.51% | 68.31% | 65.23% | 9 | 7 | 1 | 328 | 11 | 84 | 164 |
HIK_OCR | 44.14% | 74.49% | 54.92% | 8 | 2 | 7 | 265 | 12 | 43 | 226 |
Megvii-Image++ | 40.16% | 71.07% | 51.04% | 1 | 8 | 8 | 234 | 3 | 32 | 266 |
AJOU | 37.97% | 68.51% | 39.17% | 3 | 9 | 5 | 231 | 43 | 40 | 229 |
SRC-B-TextProcessingLab | 28.03% | 78.55% | 44.81% | 2 | 4 | 11 | 151 | 1 | 10 | 351 |
USTB_TexVideo | 16.10% | 80.64% | 32.75% | 0 | 10 | 7 | 128 | 6 | 47 | 369 |
StradVision-1 | 12.33% | 82.47% | 37.59% | 0 | 8 | 9 | 134 | 4 | 72 | 365 |
USTB_TexVideo II-2 | 7.75% | 81.09% | 13.14% | 0 | 2 | 15 | 47 | 5 | 8 | 451 |
RTST Lucas-Kanade-2 (RealTimeSceneText_LucasKanade_v2) | -115.31% | 65.25% | 8.32% | 0 | 3 | 14 | 53 | 13 | 633 | 437 |
USTB_TexVideo II-1 | -33.00% | 79.18% | 17.56% | 0 | 5 | 12 | 84 | 6 | 250 | 413 |