├── .gitignore ├── LICENSE ├── Main.py ├── README.md ├── baselines ├── BERT │ ├── bert_embedder.py │ ├── bert_tuning.py │ ├── hdf5_save.py │ └── neighbouring_sentences.py ├── README.md ├── cantreader_calculations │ ├── analysis.md │ ├── cantreader_precision_recall.py │ ├── dea_drug_list.pkl │ └── drug_predictions.tsv ├── embed │ └── embed_helper.py ├── identify_euphemisms │ ├── char_eu_detection.py │ ├── data_helper.py │ └── word2vec_eu_detection.py ├── identify_keywords │ ├── corpus_helper.py │ ├── identify_words_dict.py │ ├── identify_words_graph.py │ └── identify_words_tfidf.py ├── plot │ └── visualize.py ├── preprocess │ ├── preprocess_gab.py │ └── preprocess_reddit.py └── word2vec_sim │ └── word2vec_sim.py ├── classification_model.py ├── data ├── euphemism_answer_drug.txt ├── target_keywords_drug.txt └── text │ └── sample.txt ├── detection.py ├── identification.py ├── read_file.py └── requirements.txt /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/LICENSE -------------------------------------------------------------------------------- /Main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/Main.py -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/README.md -------------------------------------------------------------------------------- /baselines/BERT/bert_embedder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/BERT/bert_embedder.py -------------------------------------------------------------------------------- /baselines/BERT/bert_tuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/BERT/bert_tuning.py -------------------------------------------------------------------------------- /baselines/BERT/hdf5_save.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/BERT/hdf5_save.py -------------------------------------------------------------------------------- /baselines/BERT/neighbouring_sentences.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/BERT/neighbouring_sentences.py -------------------------------------------------------------------------------- /baselines/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/README.md -------------------------------------------------------------------------------- /baselines/cantreader_calculations/analysis.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/cantreader_calculations/analysis.md -------------------------------------------------------------------------------- /baselines/cantreader_calculations/cantreader_precision_recall.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/cantreader_calculations/cantreader_precision_recall.py -------------------------------------------------------------------------------- /baselines/cantreader_calculations/dea_drug_list.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/cantreader_calculations/dea_drug_list.pkl -------------------------------------------------------------------------------- /baselines/cantreader_calculations/drug_predictions.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/cantreader_calculations/drug_predictions.tsv -------------------------------------------------------------------------------- /baselines/embed/embed_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/embed/embed_helper.py -------------------------------------------------------------------------------- /baselines/identify_euphemisms/char_eu_detection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/identify_euphemisms/char_eu_detection.py -------------------------------------------------------------------------------- /baselines/identify_euphemisms/data_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/identify_euphemisms/data_helper.py -------------------------------------------------------------------------------- /baselines/identify_euphemisms/word2vec_eu_detection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/identify_euphemisms/word2vec_eu_detection.py -------------------------------------------------------------------------------- /baselines/identify_keywords/corpus_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/identify_keywords/corpus_helper.py -------------------------------------------------------------------------------- /baselines/identify_keywords/identify_words_dict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/identify_keywords/identify_words_dict.py -------------------------------------------------------------------------------- /baselines/identify_keywords/identify_words_graph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/identify_keywords/identify_words_graph.py -------------------------------------------------------------------------------- /baselines/identify_keywords/identify_words_tfidf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/identify_keywords/identify_words_tfidf.py -------------------------------------------------------------------------------- /baselines/plot/visualize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/plot/visualize.py -------------------------------------------------------------------------------- /baselines/preprocess/preprocess_gab.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/preprocess/preprocess_gab.py -------------------------------------------------------------------------------- /baselines/preprocess/preprocess_reddit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/preprocess/preprocess_reddit.py -------------------------------------------------------------------------------- /baselines/word2vec_sim/word2vec_sim.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/baselines/word2vec_sim/word2vec_sim.py -------------------------------------------------------------------------------- /classification_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/classification_model.py -------------------------------------------------------------------------------- /data/euphemism_answer_drug.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/data/euphemism_answer_drug.txt -------------------------------------------------------------------------------- /data/target_keywords_drug.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/data/target_keywords_drug.txt -------------------------------------------------------------------------------- /data/text/sample.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/data/text/sample.txt -------------------------------------------------------------------------------- /detection.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/detection.py -------------------------------------------------------------------------------- /identification.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/identification.py -------------------------------------------------------------------------------- /read_file.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/read_file.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WanzhengZhu/Euphemism/HEAD/requirements.txt --------------------------------------------------------------------------------