├── .github └── workflows │ ├── pypi.yml │ └── test.yml ├── .gitignore ├── LICENSE ├── Makefile ├── README.md ├── corus ├── __init__.py ├── io.py ├── path.py ├── readme.py ├── record.py ├── sources │ ├── __init__.py │ ├── bsnlp.py │ ├── buriy.py │ ├── corpora.py │ ├── factru.py │ ├── gareev.py │ ├── gramru.py │ ├── lenta.py │ ├── librusec.py │ ├── meta.py │ ├── mokoron.py │ ├── morphoru.py │ ├── ne5.py │ ├── ods.py │ ├── omnia.py │ ├── persons.py │ ├── ria.py │ ├── rudrec.py │ ├── russe.py │ ├── simlex.py │ ├── taiga │ │ ├── __init__.py │ │ ├── arzamas.py │ │ ├── common.py │ │ ├── fontanka.py │ │ ├── interfax.py │ │ ├── kp.py │ │ ├── lenta.py │ │ ├── magazines.py │ │ ├── nplus1.py │ │ ├── proza.py │ │ ├── social.py │ │ └── subtitles.py │ ├── toloka.py │ ├── ud.py │ ├── wiki.py │ └── wikiner.py ├── third │ ├── WikiExtractor.py │ └── __init__.py └── zip.py ├── data ├── Collection5 │ ├── 001.ann │ └── 001.txt ├── Persons-1000.zip ├── aij-wikiner-ru-wp3.bz2 ├── annot.opcorpora.xml.byfile.zip ├── bsnlp │ └── test_pl_cs_ru_bg │ │ ├── annotated │ │ └── nord_stream │ │ │ └── ru │ │ │ ├── Nord_Stream_2_extra.xml_file_1.out │ │ │ └── Nord_Stream_2_extra.xml_file_7.out │ │ └── raw │ │ └── nord_stream │ │ └── ru │ │ ├── Nord_Stream_2_extra.xml_file_1.txt │ │ └── Nord_Stream_2_extra.xml_file_7.txt ├── buriy │ ├── lenta.tar.bz2 │ ├── news-articles-2014.tar.bz2 │ ├── news-articles-2015-part1.tar.bz2 │ ├── news-articles-2015-part2.tar.bz2 │ └── webhose-2016.tar.bz2 ├── factRuEval-2016-master │ └── devset │ │ ├── book_58.coref │ │ ├── book_58.facts │ │ ├── book_58.objects │ │ ├── book_58.spans │ │ ├── book_58.tokens │ │ └── book_58.txt ├── gramru │ └── GramEval_private_test.conllu ├── lenta-ru-news.csv.bz2 ├── lenta-ru-news.csv.gz ├── librusec_fb2.plain.gz ├── mokoron │ └── db.sql ├── morphoru │ ├── RNCgoldInUD_Morpho.conll │ ├── gikrya_new_test.out │ └── unamb_sent_14_6.conllu ├── ods │ ├── gazeta.csv.gz │ ├── interfax.csv.gz │ ├── iz.csv.gz │ ├── meduza.csv.gz │ ├── ria.csv.gz │ ├── rt.csv.gz │ └── tass-001.csv.gz ├── ria.json.gz ├── ru_om1000a.x1_.xz ├── rudrec │ └── rudrec_annotated.json ├── rus-ner-news-corpus.iob │ └── biztass-1.txt.iob ├── russe │ └── sem │ │ ├── ae-train.csv │ │ ├── ae2.csv │ │ ├── hj.csv │ │ └── rt.csv ├── ruwiki-latest-pages-articles.xml.bz2 ├── sample.ipynb ├── simlex │ └── ru_simlex965_tagged.tsv ├── taiga │ ├── Arzamas.tar.gz │ ├── Fontanka.tar.gz │ ├── Interfax.tar.gz │ ├── KP.tar.gz │ ├── Lenta.tar.gz │ ├── Magazines.tar.gz │ ├── NPlus1.tar.gz │ ├── Subtitles.tar.gz │ ├── proza_ru.zip │ ├── social.tar.gz │ └── stihi_ru.zip ├── toloka │ ├── lrwc-1.1-aggregated.tsv │ └── ruadrect │ │ └── task2_ru_test.tsv └── ud │ ├── ru_gsd-ud-dev.conllu │ ├── ru_pud-ud-test.conllu │ ├── ru_syntagrus-ud-dev.conllu │ └── ru_taiga-ud-dev.conllu ├── docs.ipynb ├── requirements ├── ci.txt └── dev.txt ├── setup.cfg └── setup.py /.github/workflows/pypi.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/.github/workflows/pypi.yml -------------------------------------------------------------------------------- /.github/workflows/test.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/.github/workflows/test.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/Makefile -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/README.md -------------------------------------------------------------------------------- /corus/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | from .sources import * # noqa 3 | -------------------------------------------------------------------------------- /corus/io.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/io.py -------------------------------------------------------------------------------- /corus/path.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/path.py -------------------------------------------------------------------------------- /corus/readme.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/readme.py -------------------------------------------------------------------------------- /corus/record.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/record.py -------------------------------------------------------------------------------- /corus/sources/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/__init__.py -------------------------------------------------------------------------------- /corus/sources/bsnlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/bsnlp.py -------------------------------------------------------------------------------- /corus/sources/buriy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/buriy.py -------------------------------------------------------------------------------- /corus/sources/corpora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/corpora.py -------------------------------------------------------------------------------- /corus/sources/factru.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/factru.py -------------------------------------------------------------------------------- /corus/sources/gareev.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/gareev.py -------------------------------------------------------------------------------- /corus/sources/gramru.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/gramru.py -------------------------------------------------------------------------------- /corus/sources/lenta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/lenta.py -------------------------------------------------------------------------------- /corus/sources/librusec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/librusec.py -------------------------------------------------------------------------------- /corus/sources/meta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/meta.py -------------------------------------------------------------------------------- /corus/sources/mokoron.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/mokoron.py -------------------------------------------------------------------------------- /corus/sources/morphoru.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/morphoru.py -------------------------------------------------------------------------------- /corus/sources/ne5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/ne5.py -------------------------------------------------------------------------------- /corus/sources/ods.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/ods.py -------------------------------------------------------------------------------- /corus/sources/omnia.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/omnia.py -------------------------------------------------------------------------------- /corus/sources/persons.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/persons.py -------------------------------------------------------------------------------- /corus/sources/ria.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/ria.py -------------------------------------------------------------------------------- /corus/sources/rudrec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/rudrec.py -------------------------------------------------------------------------------- /corus/sources/russe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/russe.py -------------------------------------------------------------------------------- /corus/sources/simlex.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/simlex.py -------------------------------------------------------------------------------- /corus/sources/taiga/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/__init__.py -------------------------------------------------------------------------------- /corus/sources/taiga/arzamas.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/arzamas.py -------------------------------------------------------------------------------- /corus/sources/taiga/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/common.py -------------------------------------------------------------------------------- /corus/sources/taiga/fontanka.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/fontanka.py -------------------------------------------------------------------------------- /corus/sources/taiga/interfax.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/interfax.py -------------------------------------------------------------------------------- /corus/sources/taiga/kp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/kp.py -------------------------------------------------------------------------------- /corus/sources/taiga/lenta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/lenta.py -------------------------------------------------------------------------------- /corus/sources/taiga/magazines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/magazines.py -------------------------------------------------------------------------------- /corus/sources/taiga/nplus1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/nplus1.py -------------------------------------------------------------------------------- /corus/sources/taiga/proza.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/proza.py -------------------------------------------------------------------------------- /corus/sources/taiga/social.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/social.py -------------------------------------------------------------------------------- /corus/sources/taiga/subtitles.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/taiga/subtitles.py -------------------------------------------------------------------------------- /corus/sources/toloka.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/toloka.py -------------------------------------------------------------------------------- /corus/sources/ud.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/ud.py -------------------------------------------------------------------------------- /corus/sources/wiki.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/wiki.py -------------------------------------------------------------------------------- /corus/sources/wikiner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/sources/wikiner.py -------------------------------------------------------------------------------- /corus/third/WikiExtractor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/third/WikiExtractor.py -------------------------------------------------------------------------------- /corus/third/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /corus/zip.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/corus/zip.py -------------------------------------------------------------------------------- /data/Collection5/001.ann: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/Collection5/001.ann -------------------------------------------------------------------------------- /data/Collection5/001.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/Collection5/001.txt -------------------------------------------------------------------------------- /data/Persons-1000.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/Persons-1000.zip -------------------------------------------------------------------------------- /data/aij-wikiner-ru-wp3.bz2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/aij-wikiner-ru-wp3.bz2 -------------------------------------------------------------------------------- /data/annot.opcorpora.xml.byfile.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/annot.opcorpora.xml.byfile.zip -------------------------------------------------------------------------------- /data/bsnlp/test_pl_cs_ru_bg/annotated/nord_stream/ru/Nord_Stream_2_extra.xml_file_1.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/bsnlp/test_pl_cs_ru_bg/annotated/nord_stream/ru/Nord_Stream_2_extra.xml_file_1.out -------------------------------------------------------------------------------- /data/bsnlp/test_pl_cs_ru_bg/annotated/nord_stream/ru/Nord_Stream_2_extra.xml_file_7.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/bsnlp/test_pl_cs_ru_bg/annotated/nord_stream/ru/Nord_Stream_2_extra.xml_file_7.out -------------------------------------------------------------------------------- /data/bsnlp/test_pl_cs_ru_bg/raw/nord_stream/ru/Nord_Stream_2_extra.xml_file_1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/bsnlp/test_pl_cs_ru_bg/raw/nord_stream/ru/Nord_Stream_2_extra.xml_file_1.txt -------------------------------------------------------------------------------- /data/bsnlp/test_pl_cs_ru_bg/raw/nord_stream/ru/Nord_Stream_2_extra.xml_file_7.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/bsnlp/test_pl_cs_ru_bg/raw/nord_stream/ru/Nord_Stream_2_extra.xml_file_7.txt -------------------------------------------------------------------------------- /data/buriy/lenta.tar.bz2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/buriy/lenta.tar.bz2 -------------------------------------------------------------------------------- /data/buriy/news-articles-2014.tar.bz2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/buriy/news-articles-2014.tar.bz2 -------------------------------------------------------------------------------- /data/buriy/news-articles-2015-part1.tar.bz2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/buriy/news-articles-2015-part1.tar.bz2 -------------------------------------------------------------------------------- /data/buriy/news-articles-2015-part2.tar.bz2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/buriy/news-articles-2015-part2.tar.bz2 -------------------------------------------------------------------------------- /data/buriy/webhose-2016.tar.bz2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/buriy/webhose-2016.tar.bz2 -------------------------------------------------------------------------------- /data/factRuEval-2016-master/devset/book_58.coref: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/factRuEval-2016-master/devset/book_58.coref -------------------------------------------------------------------------------- /data/factRuEval-2016-master/devset/book_58.facts: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/factRuEval-2016-master/devset/book_58.facts -------------------------------------------------------------------------------- /data/factRuEval-2016-master/devset/book_58.objects: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/factRuEval-2016-master/devset/book_58.objects -------------------------------------------------------------------------------- /data/factRuEval-2016-master/devset/book_58.spans: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/factRuEval-2016-master/devset/book_58.spans -------------------------------------------------------------------------------- /data/factRuEval-2016-master/devset/book_58.tokens: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/factRuEval-2016-master/devset/book_58.tokens -------------------------------------------------------------------------------- /data/factRuEval-2016-master/devset/book_58.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/factRuEval-2016-master/devset/book_58.txt -------------------------------------------------------------------------------- /data/gramru/GramEval_private_test.conllu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/gramru/GramEval_private_test.conllu -------------------------------------------------------------------------------- /data/lenta-ru-news.csv.bz2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/lenta-ru-news.csv.bz2 -------------------------------------------------------------------------------- /data/lenta-ru-news.csv.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/lenta-ru-news.csv.gz -------------------------------------------------------------------------------- /data/librusec_fb2.plain.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/librusec_fb2.plain.gz -------------------------------------------------------------------------------- /data/mokoron/db.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/mokoron/db.sql -------------------------------------------------------------------------------- /data/morphoru/RNCgoldInUD_Morpho.conll: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/morphoru/RNCgoldInUD_Morpho.conll -------------------------------------------------------------------------------- /data/morphoru/gikrya_new_test.out: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/morphoru/gikrya_new_test.out -------------------------------------------------------------------------------- /data/morphoru/unamb_sent_14_6.conllu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/morphoru/unamb_sent_14_6.conllu -------------------------------------------------------------------------------- /data/ods/gazeta.csv.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ods/gazeta.csv.gz -------------------------------------------------------------------------------- /data/ods/interfax.csv.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ods/interfax.csv.gz -------------------------------------------------------------------------------- /data/ods/iz.csv.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ods/iz.csv.gz -------------------------------------------------------------------------------- /data/ods/meduza.csv.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ods/meduza.csv.gz -------------------------------------------------------------------------------- /data/ods/ria.csv.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ods/ria.csv.gz -------------------------------------------------------------------------------- /data/ods/rt.csv.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ods/rt.csv.gz -------------------------------------------------------------------------------- /data/ods/tass-001.csv.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ods/tass-001.csv.gz -------------------------------------------------------------------------------- /data/ria.json.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ria.json.gz -------------------------------------------------------------------------------- /data/ru_om1000a.x1_.xz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ru_om1000a.x1_.xz -------------------------------------------------------------------------------- /data/rudrec/rudrec_annotated.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/rudrec/rudrec_annotated.json -------------------------------------------------------------------------------- /data/rus-ner-news-corpus.iob/biztass-1.txt.iob: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/rus-ner-news-corpus.iob/biztass-1.txt.iob -------------------------------------------------------------------------------- /data/russe/sem/ae-train.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/russe/sem/ae-train.csv -------------------------------------------------------------------------------- /data/russe/sem/ae2.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/russe/sem/ae2.csv -------------------------------------------------------------------------------- /data/russe/sem/hj.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/russe/sem/hj.csv -------------------------------------------------------------------------------- /data/russe/sem/rt.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/russe/sem/rt.csv -------------------------------------------------------------------------------- /data/ruwiki-latest-pages-articles.xml.bz2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ruwiki-latest-pages-articles.xml.bz2 -------------------------------------------------------------------------------- /data/sample.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/sample.ipynb -------------------------------------------------------------------------------- /data/simlex/ru_simlex965_tagged.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/simlex/ru_simlex965_tagged.tsv -------------------------------------------------------------------------------- /data/taiga/Arzamas.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/Arzamas.tar.gz -------------------------------------------------------------------------------- /data/taiga/Fontanka.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/Fontanka.tar.gz -------------------------------------------------------------------------------- /data/taiga/Interfax.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/Interfax.tar.gz -------------------------------------------------------------------------------- /data/taiga/KP.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/KP.tar.gz -------------------------------------------------------------------------------- /data/taiga/Lenta.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/Lenta.tar.gz -------------------------------------------------------------------------------- /data/taiga/Magazines.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/Magazines.tar.gz -------------------------------------------------------------------------------- /data/taiga/NPlus1.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/NPlus1.tar.gz -------------------------------------------------------------------------------- /data/taiga/Subtitles.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/Subtitles.tar.gz -------------------------------------------------------------------------------- /data/taiga/proza_ru.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/proza_ru.zip -------------------------------------------------------------------------------- /data/taiga/social.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/social.tar.gz -------------------------------------------------------------------------------- /data/taiga/stihi_ru.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/taiga/stihi_ru.zip -------------------------------------------------------------------------------- /data/toloka/lrwc-1.1-aggregated.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/toloka/lrwc-1.1-aggregated.tsv -------------------------------------------------------------------------------- /data/toloka/ruadrect/task2_ru_test.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/toloka/ruadrect/task2_ru_test.tsv -------------------------------------------------------------------------------- /data/ud/ru_gsd-ud-dev.conllu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ud/ru_gsd-ud-dev.conllu -------------------------------------------------------------------------------- /data/ud/ru_pud-ud-test.conllu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ud/ru_pud-ud-test.conllu -------------------------------------------------------------------------------- /data/ud/ru_syntagrus-ud-dev.conllu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ud/ru_syntagrus-ud-dev.conllu -------------------------------------------------------------------------------- /data/ud/ru_taiga-ud-dev.conllu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/data/ud/ru_taiga-ud-dev.conllu -------------------------------------------------------------------------------- /docs.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/docs.ipynb -------------------------------------------------------------------------------- /requirements/ci.txt: -------------------------------------------------------------------------------- 1 | flake8==5.0.4 2 | jupyter==1.0.0 3 | nbconvert==7.2.8 4 | -------------------------------------------------------------------------------- /requirements/dev.txt: -------------------------------------------------------------------------------- 1 | flake8 2 | ipykernel 3 | nbconvert 4 | -------------------------------------------------------------------------------- /setup.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/setup.cfg -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/natasha/corus/HEAD/setup.py --------------------------------------------------------------------------------