├── .github ├── PULL_REQUEST_TEMPLATE.md └── workflows │ └── lint.yaml ├── .gitignore ├── Korpora ├── __init__.py ├── about.py ├── cli.py ├── korpora.py ├── korpus_aihub_kspon_speech.py ├── korpus_aihub_translation.py ├── korpus_chatbot_data.py ├── korpus_custom.py ├── korpus_kcbert.py ├── korpus_korean_hate_speech.py ├── korpus_korean_parallel.py ├── korpus_korean_petitions.py ├── korpus_kornli.py ├── korpus_korsts.py ├── korpus_kowiki.py ├── korpus_modu_messenger.py ├── korpus_modu_morpheme.py ├── korpus_modu_ne.py ├── korpus_modu_news.py ├── korpus_modu_spoken.py ├── korpus_modu_web.py ├── korpus_modu_written.py ├── korpus_namuwiki.py ├── korpus_naverchangwon_ner.py ├── korpus_nsmc.py ├── korpus_open_subtitles.py ├── korpus_question_pair.py ├── loader.py ├── task_fetch.py ├── task_lmdata.py └── utils.py ├── LICENSE ├── README.md ├── requirements.txt ├── setup.py ├── tests ├── manual.py ├── test_korean_chatbot_data.py ├── test_korean_hate_speech.py ├── test_korean_parallel.py ├── test_korean_petitions.py ├── test_kornli.py ├── test_korsts.py ├── test_naver_changwon_ner.py ├── test_nsmc.py └── test_question_pair.py └── tools └── lint.sh /.github/PULL_REQUEST_TEMPLATE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/.github/PULL_REQUEST_TEMPLATE.md -------------------------------------------------------------------------------- /.github/workflows/lint.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/.github/workflows/lint.yaml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/.gitignore -------------------------------------------------------------------------------- /Korpora/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/__init__.py -------------------------------------------------------------------------------- /Korpora/about.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/about.py -------------------------------------------------------------------------------- /Korpora/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/cli.py -------------------------------------------------------------------------------- /Korpora/korpora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpora.py -------------------------------------------------------------------------------- /Korpora/korpus_aihub_kspon_speech.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_aihub_kspon_speech.py -------------------------------------------------------------------------------- /Korpora/korpus_aihub_translation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_aihub_translation.py -------------------------------------------------------------------------------- /Korpora/korpus_chatbot_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_chatbot_data.py -------------------------------------------------------------------------------- /Korpora/korpus_custom.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_custom.py -------------------------------------------------------------------------------- /Korpora/korpus_kcbert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_kcbert.py -------------------------------------------------------------------------------- /Korpora/korpus_korean_hate_speech.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_korean_hate_speech.py -------------------------------------------------------------------------------- /Korpora/korpus_korean_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_korean_parallel.py -------------------------------------------------------------------------------- /Korpora/korpus_korean_petitions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_korean_petitions.py -------------------------------------------------------------------------------- /Korpora/korpus_kornli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_kornli.py -------------------------------------------------------------------------------- /Korpora/korpus_korsts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_korsts.py -------------------------------------------------------------------------------- /Korpora/korpus_kowiki.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_kowiki.py -------------------------------------------------------------------------------- /Korpora/korpus_modu_messenger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_modu_messenger.py -------------------------------------------------------------------------------- /Korpora/korpus_modu_morpheme.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_modu_morpheme.py -------------------------------------------------------------------------------- /Korpora/korpus_modu_ne.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_modu_ne.py -------------------------------------------------------------------------------- /Korpora/korpus_modu_news.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_modu_news.py -------------------------------------------------------------------------------- /Korpora/korpus_modu_spoken.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_modu_spoken.py -------------------------------------------------------------------------------- /Korpora/korpus_modu_web.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_modu_web.py -------------------------------------------------------------------------------- /Korpora/korpus_modu_written.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_modu_written.py -------------------------------------------------------------------------------- /Korpora/korpus_namuwiki.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_namuwiki.py -------------------------------------------------------------------------------- /Korpora/korpus_naverchangwon_ner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_naverchangwon_ner.py -------------------------------------------------------------------------------- /Korpora/korpus_nsmc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_nsmc.py -------------------------------------------------------------------------------- /Korpora/korpus_open_subtitles.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_open_subtitles.py -------------------------------------------------------------------------------- /Korpora/korpus_question_pair.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/korpus_question_pair.py -------------------------------------------------------------------------------- /Korpora/loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/loader.py -------------------------------------------------------------------------------- /Korpora/task_fetch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/task_fetch.py -------------------------------------------------------------------------------- /Korpora/task_lmdata.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/task_lmdata.py -------------------------------------------------------------------------------- /Korpora/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/Korpora/utils.py -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/README.md -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/requirements.txt -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/setup.py -------------------------------------------------------------------------------- /tests/manual.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/manual.py -------------------------------------------------------------------------------- /tests/test_korean_chatbot_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/test_korean_chatbot_data.py -------------------------------------------------------------------------------- /tests/test_korean_hate_speech.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/test_korean_hate_speech.py -------------------------------------------------------------------------------- /tests/test_korean_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/test_korean_parallel.py -------------------------------------------------------------------------------- /tests/test_korean_petitions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/test_korean_petitions.py -------------------------------------------------------------------------------- /tests/test_kornli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/test_kornli.py -------------------------------------------------------------------------------- /tests/test_korsts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/test_korsts.py -------------------------------------------------------------------------------- /tests/test_naver_changwon_ner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/test_naver_changwon_ner.py -------------------------------------------------------------------------------- /tests/test_nsmc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/test_nsmc.py -------------------------------------------------------------------------------- /tests/test_question_pair.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tests/test_question_pair.py -------------------------------------------------------------------------------- /tools/lint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ko-nlp/Korpora/HEAD/tools/lint.sh --------------------------------------------------------------------------------