├── .gitignore ├── CONTRIBUTING.md ├── LICENSE ├── README.md ├── pix2struct ├── __init__.py ├── configs │ ├── __init__.py │ ├── init │ │ ├── __init__.py │ │ ├── pix2struct_base_init.gin │ │ ├── pix2struct_large_init.gin │ │ ├── random_init.gin │ │ ├── warmup_base_init.gin │ │ └── warmup_large_init.gin │ ├── models │ │ ├── __init__.py │ │ ├── pix2struct.gin │ │ └── t5_1_1_flaxformer.gin │ ├── optimizers │ │ ├── __init__.py │ │ └── adafactor.gin │ ├── runs │ │ ├── __init__.py │ │ ├── eval.gin │ │ ├── inference.gin │ │ └── train.gin │ ├── schedules │ │ ├── __init__.py │ │ ├── ai2d.gin │ │ ├── chartqa.gin │ │ ├── docvqa.gin │ │ ├── infographicvqa.gin │ │ ├── ocrvqa.gin │ │ ├── refexp.gin │ │ ├── screen2words.gin │ │ ├── textcaps.gin │ │ └── widget_captioning.gin │ └── sizes │ │ ├── __init__.py │ │ ├── base.gin │ │ ├── large.gin │ │ └── tiny.gin ├── demo.py ├── demo_utils.py ├── example_inference.py ├── inference_utils.py ├── metrics.py ├── metrics_test.py ├── models.py ├── models_test.py ├── postprocessors.py ├── preprocessing │ ├── __init__.py │ ├── convert_ai2d.py │ ├── convert_chartqa.py │ ├── convert_docvqa.py │ ├── convert_ocrvqa.py │ ├── convert_refexp.py │ ├── convert_screen2words.py │ ├── convert_textcaps.py │ ├── convert_widget_captioning.py │ └── preprocessing_utils.py ├── preprocessors.py ├── preprocessors_test.py ├── tasks.py ├── transfer_utils.py └── web │ ├── static │ └── style.css │ └── templates │ └── demo_screenshot.html └── setup.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/.gitignore -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- 1 | External contributions are not accepted, sorry! 2 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/README.md -------------------------------------------------------------------------------- /pix2struct/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/__init__.py -------------------------------------------------------------------------------- /pix2struct/configs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/__init__.py -------------------------------------------------------------------------------- /pix2struct/configs/init/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/init/__init__.py -------------------------------------------------------------------------------- /pix2struct/configs/init/pix2struct_base_init.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/init/pix2struct_base_init.gin -------------------------------------------------------------------------------- /pix2struct/configs/init/pix2struct_large_init.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/init/pix2struct_large_init.gin -------------------------------------------------------------------------------- /pix2struct/configs/init/random_init.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/init/random_init.gin -------------------------------------------------------------------------------- /pix2struct/configs/init/warmup_base_init.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/init/warmup_base_init.gin -------------------------------------------------------------------------------- /pix2struct/configs/init/warmup_large_init.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/init/warmup_large_init.gin -------------------------------------------------------------------------------- /pix2struct/configs/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/models/__init__.py -------------------------------------------------------------------------------- /pix2struct/configs/models/pix2struct.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/models/pix2struct.gin -------------------------------------------------------------------------------- /pix2struct/configs/models/t5_1_1_flaxformer.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/models/t5_1_1_flaxformer.gin -------------------------------------------------------------------------------- /pix2struct/configs/optimizers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/optimizers/__init__.py -------------------------------------------------------------------------------- /pix2struct/configs/optimizers/adafactor.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/optimizers/adafactor.gin -------------------------------------------------------------------------------- /pix2struct/configs/runs/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/runs/__init__.py -------------------------------------------------------------------------------- /pix2struct/configs/runs/eval.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/runs/eval.gin -------------------------------------------------------------------------------- /pix2struct/configs/runs/inference.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/runs/inference.gin -------------------------------------------------------------------------------- /pix2struct/configs/runs/train.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/runs/train.gin -------------------------------------------------------------------------------- /pix2struct/configs/schedules/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/__init__.py -------------------------------------------------------------------------------- /pix2struct/configs/schedules/ai2d.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/ai2d.gin -------------------------------------------------------------------------------- /pix2struct/configs/schedules/chartqa.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/chartqa.gin -------------------------------------------------------------------------------- /pix2struct/configs/schedules/docvqa.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/docvqa.gin -------------------------------------------------------------------------------- /pix2struct/configs/schedules/infographicvqa.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/infographicvqa.gin -------------------------------------------------------------------------------- /pix2struct/configs/schedules/ocrvqa.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/ocrvqa.gin -------------------------------------------------------------------------------- /pix2struct/configs/schedules/refexp.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/refexp.gin -------------------------------------------------------------------------------- /pix2struct/configs/schedules/screen2words.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/screen2words.gin -------------------------------------------------------------------------------- /pix2struct/configs/schedules/textcaps.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/textcaps.gin -------------------------------------------------------------------------------- /pix2struct/configs/schedules/widget_captioning.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/schedules/widget_captioning.gin -------------------------------------------------------------------------------- /pix2struct/configs/sizes/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/sizes/__init__.py -------------------------------------------------------------------------------- /pix2struct/configs/sizes/base.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/sizes/base.gin -------------------------------------------------------------------------------- /pix2struct/configs/sizes/large.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/sizes/large.gin -------------------------------------------------------------------------------- /pix2struct/configs/sizes/tiny.gin: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/configs/sizes/tiny.gin -------------------------------------------------------------------------------- /pix2struct/demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/demo.py -------------------------------------------------------------------------------- /pix2struct/demo_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/demo_utils.py -------------------------------------------------------------------------------- /pix2struct/example_inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/example_inference.py -------------------------------------------------------------------------------- /pix2struct/inference_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/inference_utils.py -------------------------------------------------------------------------------- /pix2struct/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/metrics.py -------------------------------------------------------------------------------- /pix2struct/metrics_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/metrics_test.py -------------------------------------------------------------------------------- /pix2struct/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/models.py -------------------------------------------------------------------------------- /pix2struct/models_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/models_test.py -------------------------------------------------------------------------------- /pix2struct/postprocessors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/postprocessors.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/__init__.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/convert_ai2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/convert_ai2d.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/convert_chartqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/convert_chartqa.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/convert_docvqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/convert_docvqa.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/convert_ocrvqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/convert_ocrvqa.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/convert_refexp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/convert_refexp.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/convert_screen2words.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/convert_screen2words.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/convert_textcaps.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/convert_textcaps.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/convert_widget_captioning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/convert_widget_captioning.py -------------------------------------------------------------------------------- /pix2struct/preprocessing/preprocessing_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessing/preprocessing_utils.py -------------------------------------------------------------------------------- /pix2struct/preprocessors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessors.py -------------------------------------------------------------------------------- /pix2struct/preprocessors_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/preprocessors_test.py -------------------------------------------------------------------------------- /pix2struct/tasks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/tasks.py -------------------------------------------------------------------------------- /pix2struct/transfer_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/transfer_utils.py -------------------------------------------------------------------------------- /pix2struct/web/static/style.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/web/static/style.css -------------------------------------------------------------------------------- /pix2struct/web/templates/demo_screenshot.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/pix2struct/web/templates/demo_screenshot.html -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/google-research/pix2struct/HEAD/setup.py --------------------------------------------------------------------------------