├── .gitignore ├── LICENSE.md ├── README.md ├── augmentation ├── blur.py ├── camera.py ├── frost │ ├── frost1.png │ ├── frost2.png │ ├── frost3.png │ ├── frost4.jpg │ ├── frost5.jpg │ └── frost6.jpg ├── geometry.py ├── images │ ├── delivery.png │ ├── education.png │ ├── manila.png │ ├── nokia.png │ └── telekom.png ├── noise.py ├── ops.py ├── pattern.py ├── process.py ├── test.py ├── warp.py └── weather.py ├── create_lmdb_dataset.py ├── dataset.py ├── demo.ipynb ├── demo.py ├── demo_image ├── demo_1.png ├── demo_10.jpg ├── demo_2.jpg ├── demo_3.png ├── demo_4.png ├── demo_5.png ├── demo_6.png ├── demo_7.png ├── demo_8.jpg └── demo_9.jpg ├── figures ├── failure-case.jpg ├── trade-off.png └── vitstr_model.png ├── infer.py ├── infer_utils.py ├── model.py ├── modules ├── feature_extraction.py ├── prediction.py ├── sequence_modeling.py ├── transformation.py └── vitstr.py ├── requirements.txt ├── scripts └── paper │ ├── Accuracy_vs_GFLOPS.png │ ├── Accuracy_vs_Msec_per_Image.png │ ├── Accuracy_vs_Number_of_Parameters.png │ ├── plot_accuracy.py │ └── plot_error.py ├── test.py ├── train.py └── utils.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/LICENSE.md -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/README.md -------------------------------------------------------------------------------- /augmentation/blur.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/blur.py -------------------------------------------------------------------------------- /augmentation/camera.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/camera.py -------------------------------------------------------------------------------- /augmentation/frost/frost1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/frost/frost1.png -------------------------------------------------------------------------------- /augmentation/frost/frost2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/frost/frost2.png -------------------------------------------------------------------------------- /augmentation/frost/frost3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/frost/frost3.png -------------------------------------------------------------------------------- /augmentation/frost/frost4.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/frost/frost4.jpg -------------------------------------------------------------------------------- /augmentation/frost/frost5.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/frost/frost5.jpg -------------------------------------------------------------------------------- /augmentation/frost/frost6.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/frost/frost6.jpg -------------------------------------------------------------------------------- /augmentation/geometry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/geometry.py -------------------------------------------------------------------------------- /augmentation/images/delivery.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/images/delivery.png -------------------------------------------------------------------------------- /augmentation/images/education.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/images/education.png -------------------------------------------------------------------------------- /augmentation/images/manila.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/images/manila.png -------------------------------------------------------------------------------- /augmentation/images/nokia.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/images/nokia.png -------------------------------------------------------------------------------- /augmentation/images/telekom.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/images/telekom.png -------------------------------------------------------------------------------- /augmentation/noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/noise.py -------------------------------------------------------------------------------- /augmentation/ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/ops.py -------------------------------------------------------------------------------- /augmentation/pattern.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/pattern.py -------------------------------------------------------------------------------- /augmentation/process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/process.py -------------------------------------------------------------------------------- /augmentation/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/test.py -------------------------------------------------------------------------------- /augmentation/warp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/warp.py -------------------------------------------------------------------------------- /augmentation/weather.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/augmentation/weather.py -------------------------------------------------------------------------------- /create_lmdb_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/create_lmdb_dataset.py -------------------------------------------------------------------------------- /dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/dataset.py -------------------------------------------------------------------------------- /demo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo.ipynb -------------------------------------------------------------------------------- /demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo.py -------------------------------------------------------------------------------- /demo_image/demo_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_1.png -------------------------------------------------------------------------------- /demo_image/demo_10.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_10.jpg -------------------------------------------------------------------------------- /demo_image/demo_2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_2.jpg -------------------------------------------------------------------------------- /demo_image/demo_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_3.png -------------------------------------------------------------------------------- /demo_image/demo_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_4.png -------------------------------------------------------------------------------- /demo_image/demo_5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_5.png -------------------------------------------------------------------------------- /demo_image/demo_6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_6.png -------------------------------------------------------------------------------- /demo_image/demo_7.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_7.png -------------------------------------------------------------------------------- /demo_image/demo_8.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_8.jpg -------------------------------------------------------------------------------- /demo_image/demo_9.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/demo_image/demo_9.jpg -------------------------------------------------------------------------------- /figures/failure-case.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/figures/failure-case.jpg -------------------------------------------------------------------------------- /figures/trade-off.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/figures/trade-off.png -------------------------------------------------------------------------------- /figures/vitstr_model.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/figures/vitstr_model.png -------------------------------------------------------------------------------- /infer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/infer.py -------------------------------------------------------------------------------- /infer_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/infer_utils.py -------------------------------------------------------------------------------- /model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/model.py -------------------------------------------------------------------------------- /modules/feature_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/modules/feature_extraction.py -------------------------------------------------------------------------------- /modules/prediction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/modules/prediction.py -------------------------------------------------------------------------------- /modules/sequence_modeling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/modules/sequence_modeling.py -------------------------------------------------------------------------------- /modules/transformation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/modules/transformation.py -------------------------------------------------------------------------------- /modules/vitstr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/modules/vitstr.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/paper/Accuracy_vs_GFLOPS.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/scripts/paper/Accuracy_vs_GFLOPS.png -------------------------------------------------------------------------------- /scripts/paper/Accuracy_vs_Msec_per_Image.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/scripts/paper/Accuracy_vs_Msec_per_Image.png -------------------------------------------------------------------------------- /scripts/paper/Accuracy_vs_Number_of_Parameters.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/scripts/paper/Accuracy_vs_Number_of_Parameters.png -------------------------------------------------------------------------------- /scripts/paper/plot_accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/scripts/paper/plot_accuracy.py -------------------------------------------------------------------------------- /scripts/paper/plot_error.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/scripts/paper/plot_error.py -------------------------------------------------------------------------------- /test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/test.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/train.py -------------------------------------------------------------------------------- /utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/roatienza/deep-text-recognition-benchmark/HEAD/utils.py --------------------------------------------------------------------------------