├── README.md ├── data ├── fce │ ├── fce-split.us.tsv │ └── fce.tsv └── gtc │ ├── all.tsv │ ├── dev.tok.en │ ├── dev.tok.fr │ ├── train.tok.en │ └── train.tok.fr ├── requirements.txt ├── src ├── __init__.py ├── bt │ ├── filter_bitext.py │ └── format_monolingual.py ├── eval.py ├── extract_diffs.py ├── fce │ └── split_sents.py ├── format_fairseq_output.py ├── gtc │ └── format_gtc.py ├── normalize.py ├── run_aspell.py ├── run_baseline.sh ├── run_bt.sh ├── run_gtc.sh └── tokenize.py └── xfspell.png /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/README.md -------------------------------------------------------------------------------- /data/fce/fce-split.us.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/data/fce/fce-split.us.tsv -------------------------------------------------------------------------------- /data/fce/fce.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/data/fce/fce.tsv -------------------------------------------------------------------------------- /data/gtc/all.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/data/gtc/all.tsv -------------------------------------------------------------------------------- /data/gtc/dev.tok.en: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/data/gtc/dev.tok.en -------------------------------------------------------------------------------- /data/gtc/dev.tok.fr: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/data/gtc/dev.tok.fr -------------------------------------------------------------------------------- /data/gtc/train.tok.en: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/data/gtc/train.tok.en -------------------------------------------------------------------------------- /data/gtc/train.tok.fr: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/data/gtc/train.tok.fr -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/requirements.txt -------------------------------------------------------------------------------- /src/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/bt/filter_bitext.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/bt/filter_bitext.py -------------------------------------------------------------------------------- /src/bt/format_monolingual.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/bt/format_monolingual.py -------------------------------------------------------------------------------- /src/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/eval.py -------------------------------------------------------------------------------- /src/extract_diffs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/extract_diffs.py -------------------------------------------------------------------------------- /src/fce/split_sents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/fce/split_sents.py -------------------------------------------------------------------------------- /src/format_fairseq_output.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/format_fairseq_output.py -------------------------------------------------------------------------------- /src/gtc/format_gtc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/gtc/format_gtc.py -------------------------------------------------------------------------------- /src/normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/normalize.py -------------------------------------------------------------------------------- /src/run_aspell.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/run_aspell.py -------------------------------------------------------------------------------- /src/run_baseline.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/run_baseline.sh -------------------------------------------------------------------------------- /src/run_bt.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/run_bt.sh -------------------------------------------------------------------------------- /src/run_gtc.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/run_gtc.sh -------------------------------------------------------------------------------- /src/tokenize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/src/tokenize.py -------------------------------------------------------------------------------- /xfspell.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mhagiwara/xfspell/HEAD/xfspell.png --------------------------------------------------------------------------------