├── .gitignore ├── LICENSE ├── README.md ├── alphabet ├── fintabnet │ ├── character_alphabet.txt │ └── structure_alphabet.txt └── pubtabnet │ ├── character_alphabet.txt │ └── structure_alphabet.txt ├── configs ├── fintabnet.py ├── pubtab250.py ├── pubtabfin.py └── pubtabnet.py ├── datasets ├── FinTabNet.yaml ├── FinTabSub.yaml ├── PubTab250.yaml ├── PubTabNet.yaml └── PubTabSub.yaml ├── mutab ├── __init__.py ├── apis │ ├── __init__.py │ ├── test.py │ └── train.py ├── datasets │ ├── __init__.py │ ├── dataset.py │ ├── loader.py │ └── pipeline.py ├── metrics │ ├── __init__.py │ ├── metric.py │ ├── sample_pred.json │ ├── sample_real.json │ └── sample_test.json ├── models │ ├── __init__.py │ ├── attention.py │ ├── backbone.py │ ├── decoder.py │ ├── encoder.py │ ├── factory.py │ ├── handler.py │ ├── loss.py │ ├── network.py │ ├── revisor.py │ └── scanner.py ├── optimizer │ ├── __init__.py │ └── factory.py ├── syntax │ ├── __init__.py │ ├── html_to_otsl.py │ ├── otsl_to_html.py │ ├── sample_html.json │ └── sample_otsl.json └── utils │ ├── __init__.py │ └── utils.py ├── preprocess.py ├── pyproject.toml ├── test.py ├── train.py └── train.sh /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/README.md -------------------------------------------------------------------------------- /alphabet/fintabnet/character_alphabet.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/alphabet/fintabnet/character_alphabet.txt -------------------------------------------------------------------------------- /alphabet/fintabnet/structure_alphabet.txt: -------------------------------------------------------------------------------- 1 | D 2 | L 3 | U 4 | X 5 | R 6 | eb 7 | -------------------------------------------------------------------------------- /alphabet/pubtabnet/character_alphabet.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/alphabet/pubtabnet/character_alphabet.txt -------------------------------------------------------------------------------- /alphabet/pubtabnet/structure_alphabet.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/alphabet/pubtabnet/structure_alphabet.txt -------------------------------------------------------------------------------- /configs/fintabnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/configs/fintabnet.py -------------------------------------------------------------------------------- /configs/pubtab250.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/configs/pubtab250.py -------------------------------------------------------------------------------- /configs/pubtabfin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/configs/pubtabfin.py -------------------------------------------------------------------------------- /configs/pubtabnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/configs/pubtabnet.py -------------------------------------------------------------------------------- /datasets/FinTabNet.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/datasets/FinTabNet.yaml -------------------------------------------------------------------------------- /datasets/FinTabSub.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/datasets/FinTabSub.yaml -------------------------------------------------------------------------------- /datasets/PubTab250.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/datasets/PubTab250.yaml -------------------------------------------------------------------------------- /datasets/PubTabNet.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/datasets/PubTabNet.yaml -------------------------------------------------------------------------------- /datasets/PubTabSub.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/datasets/PubTabSub.yaml -------------------------------------------------------------------------------- /mutab/__init__.py: -------------------------------------------------------------------------------- 1 | __version__ = "0.1.0" 2 | -------------------------------------------------------------------------------- /mutab/apis/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/apis/__init__.py -------------------------------------------------------------------------------- /mutab/apis/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/apis/test.py -------------------------------------------------------------------------------- /mutab/apis/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/apis/train.py -------------------------------------------------------------------------------- /mutab/datasets/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/datasets/__init__.py -------------------------------------------------------------------------------- /mutab/datasets/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/datasets/dataset.py -------------------------------------------------------------------------------- /mutab/datasets/loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/datasets/loader.py -------------------------------------------------------------------------------- /mutab/datasets/pipeline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/datasets/pipeline.py -------------------------------------------------------------------------------- /mutab/metrics/__init__.py: -------------------------------------------------------------------------------- 1 | from .metric import TEDS 2 | 3 | __all__ = ["TEDS"] 4 | -------------------------------------------------------------------------------- /mutab/metrics/metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/metrics/metric.py -------------------------------------------------------------------------------- /mutab/metrics/sample_pred.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/metrics/sample_pred.json -------------------------------------------------------------------------------- /mutab/metrics/sample_real.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/metrics/sample_real.json -------------------------------------------------------------------------------- /mutab/metrics/sample_test.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/metrics/sample_test.json -------------------------------------------------------------------------------- /mutab/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/__init__.py -------------------------------------------------------------------------------- /mutab/models/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/attention.py -------------------------------------------------------------------------------- /mutab/models/backbone.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/backbone.py -------------------------------------------------------------------------------- /mutab/models/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/decoder.py -------------------------------------------------------------------------------- /mutab/models/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/encoder.py -------------------------------------------------------------------------------- /mutab/models/factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/factory.py -------------------------------------------------------------------------------- /mutab/models/handler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/handler.py -------------------------------------------------------------------------------- /mutab/models/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/loss.py -------------------------------------------------------------------------------- /mutab/models/network.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/network.py -------------------------------------------------------------------------------- /mutab/models/revisor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/revisor.py -------------------------------------------------------------------------------- /mutab/models/scanner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/models/scanner.py -------------------------------------------------------------------------------- /mutab/optimizer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/optimizer/__init__.py -------------------------------------------------------------------------------- /mutab/optimizer/factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/optimizer/factory.py -------------------------------------------------------------------------------- /mutab/syntax/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/syntax/__init__.py -------------------------------------------------------------------------------- /mutab/syntax/html_to_otsl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/syntax/html_to_otsl.py -------------------------------------------------------------------------------- /mutab/syntax/otsl_to_html.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/syntax/otsl_to_html.py -------------------------------------------------------------------------------- /mutab/syntax/sample_html.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/syntax/sample_html.json -------------------------------------------------------------------------------- /mutab/syntax/sample_otsl.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/syntax/sample_otsl.json -------------------------------------------------------------------------------- /mutab/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/utils/__init__.py -------------------------------------------------------------------------------- /mutab/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/mutab/utils/utils.py -------------------------------------------------------------------------------- /preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/preprocess.py -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/pyproject.toml -------------------------------------------------------------------------------- /test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/test.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/train.py -------------------------------------------------------------------------------- /train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/JG1VPP/MuTabNet/HEAD/train.sh --------------------------------------------------------------------------------