├── .gitignore ├── README.md ├── aion ├── embeddings │ ├── cove.py │ ├── doc2vec.py │ ├── document_embeddings.py │ ├── elmo.py │ ├── embeddings.py │ ├── glove.py │ ├── infersent.py │ ├── infersent_lib │ │ ├── .gitignore │ │ ├── LICENSE │ │ ├── README.md │ │ ├── data.py │ │ ├── dataset │ │ │ ├── get_data.bash │ │ │ └── tokenizer.sed │ │ ├── encoder │ │ │ ├── demo.ipynb │ │ │ ├── extract_features.py │ │ │ ├── models.py │ │ │ └── samples.txt │ │ ├── models.py │ │ ├── mutils.py │ │ └── train_nli.py │ ├── sentence_embeddings.py │ ├── skip_thoughts.py │ └── word_embeddings.py ├── helper │ ├── __init__.py │ └── file_helper.py └── util │ ├── __init__.py │ └── spell_check.py └── sample ├── embeddings └── nlp-embeddings-document-doc2vec.ipynb ├── nlp-3_basic_distance_measurement_in_text_mining.ipynb ├── nlp-bag_of_words.ipynb ├── nlp-character_embedding.ipynb ├── nlp-distance-edit_distance.ipynb ├── nlp-embeddings-sentence-elmo.ipynb ├── nlp-embeddings-sentence-infersent.ipynb ├── nlp-embeddings-word-cove.ipynb ├── nlp-lsa_lda.ipynb ├── nlp-model_interpretation-201808.ipynb ├── nlp-model_interpretation.ipynb ├── nlp-model_interpretation_anchor.ipynb ├── nlp-model_interpretation_shap.ipynb ├── nlp-named_entity_recognition.ipynb ├── nlp-part_of_speech.ipynb ├── nlp-sentence_tokenization.ipynb ├── nlp-skip_thoughts.ipynb ├── nlp-stemming.ipynb ├── nlp-stop_words.ipynb ├── nlp-text_summarization_extractive.ipynb ├── nlp-word_embedding.ipynb ├── nlp-word_mover_distance.ipynb ├── nlp-word_tokenization.ipynb ├── nlp_lemmatization.ipynb ├── preprocessing └── nlp-preprocessing-string_matching-fuzzywuzzy.ipynb ├── resources └── LSI and LDA.pptx └── util ├── nlp-util-spell_corrector.ipynb └── nlp-util-symspell.ipynb /.gitignore: -------------------------------------------------------------------------------- 1 | *.pyc -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/README.md -------------------------------------------------------------------------------- /aion/embeddings/cove.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/cove.py -------------------------------------------------------------------------------- /aion/embeddings/doc2vec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/doc2vec.py -------------------------------------------------------------------------------- /aion/embeddings/document_embeddings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/document_embeddings.py -------------------------------------------------------------------------------- /aion/embeddings/elmo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/elmo.py -------------------------------------------------------------------------------- /aion/embeddings/embeddings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/embeddings.py -------------------------------------------------------------------------------- /aion/embeddings/glove.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/glove.py -------------------------------------------------------------------------------- /aion/embeddings/infersent.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent.py -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/.gitignore -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/LICENSE -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/README.md -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/data.py -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/dataset/get_data.bash: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/dataset/get_data.bash -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/dataset/tokenizer.sed: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/dataset/tokenizer.sed -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/encoder/demo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/encoder/demo.ipynb -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/encoder/extract_features.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/encoder/extract_features.py -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/encoder/models.py: -------------------------------------------------------------------------------- 1 | ../models.py -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/encoder/samples.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/encoder/samples.txt -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/models.py -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/mutils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/mutils.py -------------------------------------------------------------------------------- /aion/embeddings/infersent_lib/train_nli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/infersent_lib/train_nli.py -------------------------------------------------------------------------------- /aion/embeddings/sentence_embeddings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/sentence_embeddings.py -------------------------------------------------------------------------------- /aion/embeddings/skip_thoughts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/skip_thoughts.py -------------------------------------------------------------------------------- /aion/embeddings/word_embeddings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/embeddings/word_embeddings.py -------------------------------------------------------------------------------- /aion/helper/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /aion/helper/file_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/helper/file_helper.py -------------------------------------------------------------------------------- /aion/util/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /aion/util/spell_check.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/aion/util/spell_check.py -------------------------------------------------------------------------------- /sample/embeddings/nlp-embeddings-document-doc2vec.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/embeddings/nlp-embeddings-document-doc2vec.ipynb -------------------------------------------------------------------------------- /sample/nlp-3_basic_distance_measurement_in_text_mining.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-3_basic_distance_measurement_in_text_mining.ipynb -------------------------------------------------------------------------------- /sample/nlp-bag_of_words.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-bag_of_words.ipynb -------------------------------------------------------------------------------- /sample/nlp-character_embedding.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-character_embedding.ipynb -------------------------------------------------------------------------------- /sample/nlp-distance-edit_distance.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-distance-edit_distance.ipynb -------------------------------------------------------------------------------- /sample/nlp-embeddings-sentence-elmo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-embeddings-sentence-elmo.ipynb -------------------------------------------------------------------------------- /sample/nlp-embeddings-sentence-infersent.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-embeddings-sentence-infersent.ipynb -------------------------------------------------------------------------------- /sample/nlp-embeddings-word-cove.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-embeddings-word-cove.ipynb -------------------------------------------------------------------------------- /sample/nlp-lsa_lda.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-lsa_lda.ipynb -------------------------------------------------------------------------------- /sample/nlp-model_interpretation-201808.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-model_interpretation-201808.ipynb -------------------------------------------------------------------------------- /sample/nlp-model_interpretation.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-model_interpretation.ipynb -------------------------------------------------------------------------------- /sample/nlp-model_interpretation_anchor.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-model_interpretation_anchor.ipynb -------------------------------------------------------------------------------- /sample/nlp-model_interpretation_shap.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-model_interpretation_shap.ipynb -------------------------------------------------------------------------------- /sample/nlp-named_entity_recognition.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-named_entity_recognition.ipynb -------------------------------------------------------------------------------- /sample/nlp-part_of_speech.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-part_of_speech.ipynb -------------------------------------------------------------------------------- /sample/nlp-sentence_tokenization.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-sentence_tokenization.ipynb -------------------------------------------------------------------------------- /sample/nlp-skip_thoughts.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-skip_thoughts.ipynb -------------------------------------------------------------------------------- /sample/nlp-stemming.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-stemming.ipynb -------------------------------------------------------------------------------- /sample/nlp-stop_words.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-stop_words.ipynb -------------------------------------------------------------------------------- /sample/nlp-text_summarization_extractive.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-text_summarization_extractive.ipynb -------------------------------------------------------------------------------- /sample/nlp-word_embedding.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-word_embedding.ipynb -------------------------------------------------------------------------------- /sample/nlp-word_mover_distance.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-word_mover_distance.ipynb -------------------------------------------------------------------------------- /sample/nlp-word_tokenization.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp-word_tokenization.ipynb -------------------------------------------------------------------------------- /sample/nlp_lemmatization.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/nlp_lemmatization.ipynb -------------------------------------------------------------------------------- /sample/preprocessing/nlp-preprocessing-string_matching-fuzzywuzzy.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/preprocessing/nlp-preprocessing-string_matching-fuzzywuzzy.ipynb -------------------------------------------------------------------------------- /sample/resources/LSI and LDA.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/resources/LSI and LDA.pptx -------------------------------------------------------------------------------- /sample/util/nlp-util-spell_corrector.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/util/nlp-util-spell_corrector.ipynb -------------------------------------------------------------------------------- /sample/util/nlp-util-symspell.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/makcedward/nlp/HEAD/sample/util/nlp-util-symspell.ipynb --------------------------------------------------------------------------------