├── .DS_Store ├── LICENSE ├── README.md └── bib_citations ├── 10_must_reads.bib ├── Evaluation.bib ├── NMT_attention_mechanism.bib ├── NMT_decoding.bib ├── NMT_document_level.bib ├── NMT_domain_adaptation.bib ├── NMT_efficiency.bib ├── NMT_ensemble_and_reranking.bib ├── NMT_fairness_and_diversity.bib ├── NMT_human_centered_automatic_post-editing.bib ├── NMT_human_centered_interactive.bib ├── NMT_interpretability.bib ├── NMT_linguistic_interpretation.bib ├── NMT_low_resource_data_augmentation.bib ├── NMT_low_resource_meta.bib ├── NMT_low_resource_multitask.bib ├── NMT_low_resource_pivot_based.bib ├── NMT_low_resource_semi_supervised.bib ├── NMT_low_resource_transfer.bib ├── NMT_low_resource_unsupervised.bib ├── NMT_model_architecture.bib ├── NMT_multimodal.bib ├── NMT_open_vocabulary_and_char.bib ├── NMT_poetry_translation.bib ├── NMT_pretraining.bib ├── NMT_prior_knowledge_coverage.bib ├── NMT_prior_knowledge_syntactic_semantic.bib ├── NMT_prior_knowledge_word_phrase.bib ├── NMT_quality_estimation.bib ├── NMT_robustness.bib ├── NMT_speech_and_simultaneous.bib ├── NMT_training_framework.bib ├── NMT_tutorials_and_challenges.bib ├── SMT_discriminative_training.bib ├── SMT_human_centered.bib ├── SMT_phrase_based.bib ├── SMT_syntax_based.bib ├── SMT_system_combination.bib ├── SMT_tutorials.bib ├── SMT_word_based.bib └── Word_Translation.bib /.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/THUNLP-MT/MT-Reading-List/b79517bcf9e0862366a1bebc9c03a6139c13ab8c/.DS_Store -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | BSD 3-Clause License 2 | 3 | Copyright (c) 2018, THUNLP-MT 4 | All rights reserved. 
5 | 6 | Redistribution and use in source and binary forms, with or without 7 | modification, are permitted provided that the following conditions are met: 8 | 9 | * Redistributions of source code must retain the above copyright notice, this 10 | list of conditions and the following disclaimer. 11 | 12 | * Redistributions in binary form must reproduce the above copyright notice, 13 | this list of conditions and the following disclaimer in the documentation 14 | and/or other materials provided with the distribution. 15 | 16 | * Neither the name of the copyright holder nor the names of its 17 | contributors may be used to endorse or promote products derived from 18 | this software without specific prior written permission. 19 | 20 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" 21 | AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 22 | IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE 23 | DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE 24 | FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 25 | DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR 26 | SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER 27 | CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, 28 | OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 29 | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
30 | -------------------------------------------------------------------------------- /bib_citations/10_must_reads.bib: -------------------------------------------------------------------------------- 1 | @article{mathsmt, 2 | title={The mathematics of statistical machine translation: Parameter estimation}, 3 | author={Brown, Peter F and Pietra, Vincent J Della and Pietra, Stephen A Della and Mercer, Robert L}, 4 | journal={Computational Linguistics}, 5 | volume={19}, 6 | number={2}, 7 | pages={263--311}, 8 | year={1993}, 9 | publisher={MIT Press} 10 | } 11 | @inproceedings{bleu, 12 | title={BLEU: a method for automatic evaluation of machine translation}, 13 | author={Papineni, Kishore and Roukos, Salim and Ward, Todd and Zhu, Wei-Jing}, 14 | booktitle={Proceedings of ACL}, 15 | year={2002} 16 | } 17 | @inproceedings{spbt, 18 | title={Statistical phrase-based translation}, 19 | author={Koehn, Philipp and Och, Franz Josef and Marcu, Daniel}, 20 | booktitle={Proceedings of NAACL}, 21 | year={2003} 22 | } 23 | @inproceedings{mrt4smt, 24 | title={Minimum error rate training in statistical machine translation}, 25 | author={Och, Franz Josef}, 26 | booktitle={Proceedings of ACL}, 27 | year={2003} 28 | } 29 | @article{hpbt, 30 | title={Hierarchical phrase-based translation}, 31 | author={Chiang, David}, 32 | journal={Computational Linguistics}, 33 | volume={33}, 34 | number={2}, 35 | pages={201--228}, 36 | year={2007}, 37 | publisher={MIT Press} 38 | } 39 | @inproceedings{seq2seq, 40 | title={Sequence to sequence learning with neural networks}, 41 | author={Sutskever, Ilya and Vinyals, Oriol and Le, Quoc V}, 42 | booktitle={Advances in neural information processing systems}, 43 | year={2014} 44 | } 45 | @inproceedings{rnnsearch, 46 | author = {Bahdanau, Dzmitry and Cho, KyungHyun and Bengio, Yoshua}, 47 | title = {Neural Machine Translation by Jointly Learning to Align and Translate}, 48 | booktitle = {Proceedings of ICLR}, 49 | year = {2015} 50 | } 51 | 
@inproceedings{adam, 52 | author = {Kingma, Diederik P. and Ba, Jimmy}, 53 | title = {Adam: A Method for Stochastic Optimization}, 54 | booktitle = {Proceedings of ICLR}, 55 | year = {2015} 56 | } 57 | @InProceedings{bpe, 58 | author = {Sennrich, Rico and Haddow, Barry and Birch, Alexandra}, 59 | title = {Neural Machine Translation of Rare Words with Subword Units}, 60 | booktitle = {Proceedings of ACL}, 61 | year = {2016} 62 | } 63 | @inproceedings{transformer, 64 | title={Attention Is All You Need}, 65 | author={Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N and Kaiser, Lukasz and Polosukhin, Illia}, 66 | booktitle={Proceedings of NIPS}, 67 | year={2017} 68 | } -------------------------------------------------------------------------------- /bib_citations/Evaluation.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{bleu, 2 | title={BLEU: a method for automatic evaluation of machine translation}, 3 | author={Papineni, Kishore and Roukos, Salim and Ward, Todd and Zhu, Wei-Jing}, 4 | booktitle={Proceedings of ACL}, 5 | year={2002} 6 | } 7 | @inproceedings{koehn2004statistical, 8 | title={Statistical Significance Tests for Machine Translation Evaluation}, 9 | author={Koehn, Philipp}, 10 | booktitle={Proceedings of EMNLP}, 11 | year={2004} 12 | } 13 | @InProceedings{W05-0909, 14 | author = "Banerjee, Satanjeev 15 | and Lavie, Alon", 16 | title = "METEOR: An Automatic Metric for MT Evaluation with Improved Correlation with Human Judgments", 17 | booktitle = "Proceedings of the ACL Workshop on Intrinsic and Extrinsic Evaluation Measures for Machine Translation and/or Summarization", 18 | year = "2005" 19 | } 20 | @inproceedings{snover2006study, 21 | title={A study of translation edit rate with targeted human annotation}, 22 | author={Snover, Matthew and Dorr, Bonnie and Schwartz, Richard and Micciulla, Linnea and Makhoul, John}, 23 | booktitle={Proceedings 
of Association for Machine Translation in the Americas}, 24 | year={2006} 25 | } 26 | @InProceedings{P18-1083, 27 | author = "Wang, Xin 28 | and Chen, Wenhu 29 | and Wang, Yuan-Fang 30 | and Wang, William Yang", 31 | title = "No Metrics Are Perfect: Adversarial Reward Learning for Visual Storytelling", 32 | booktitle = "Proceedings of ACL", 33 | year = "2018" 34 | } -------------------------------------------------------------------------------- /bib_citations/NMT_attention_mechanism.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{rnnsearch, 2 | author = {Bahdanau, Dzmitry and Cho, KyungHyun and Bengio, Yoshua}, 3 | title = {Neural Machine Translation by Jointly Learning to Align and Translate}, 4 | booktitle = {Proceedings of ICLR}, 5 | year = {2015} 6 | } 7 | @InProceedings{D15-1166, 8 | author = "Luong, Thang 9 | and Pham, Hieu 10 | and Manning, Christopher D.", 11 | title = "Effective Approaches to Attention-based Neural Machine Translation", 12 | booktitle = "Proceedings of EMNLP", 13 | year = "2015" 14 | } 15 | @inproceedings{Feng2016Improving, 16 | author = {Shi Feng and 17 | Shujie Liu and 18 | Nan Yang and 19 | Mu Li and 20 | Ming Zhou and 21 | Kenny Q. 
Zhu}, 22 | title = {Improving Attention Modeling with Implicit Distortion and Fertility for Machine Translation}, 23 | booktitle = {{COLING} 2016, 26th International Conference on Computational Linguistics, 24 | Proceedings of the Conference: Technical Papers, December 11-16, 2016, 25 | Osaka, Japan}, 26 | pages = {3082--3092}, 27 | year = {2016}, 28 | } 29 | @InProceedings{D16-1249, 30 | author = "Mi, Haitao 31 | and Wang, Zhiguo 32 | and Ittycheriah, Abe", 33 | title = "Supervised Attentions for Neural Machine Translation", 34 | booktitle = "Proceedings of EMNLP", 35 | year = "2016" 36 | } 37 | @InProceedings{lin2017structured, 38 | author={Lin, Zhouhan and Feng, Minwei and Santos, Cicero Nogueira dos and Yu, Mo and Xiang, Bing and Zhou, Bowen and Bengio, Yoshua}, 39 | title = "A structured self-attentive sentence embedding", 40 | booktitle = "Proceedings of ICLR", 41 | year = "2017" 42 | } 43 | @InProceedings{shen2017disan, 44 | author={Shen, Tao and Zhou, Tianyi and Long, Guodong and Jiang, Jing and Pan, Shirui and Zhang, Chengqi}, 45 | title = "DiSAN: Directional Self-Attention Network for RNN/CNN-Free Language Understanding", 46 | booktitle = "Proceedings of AAAI", 47 | year = "2018" 48 | } 49 | @InProceedings{shen2018bi, 50 | author={Shen, Tao and Zhou, Tianyi and Long, Guodong and Jiang, Jing and Zhang, Chengqi}, 51 | title={Bi-directional block self-attention for fast and memory-efficient sequence modeling}, 52 | booktitle = "Proceedings of ICLR", 53 | year = "2018" 54 | } 55 | @InProceedings{shen2018reinforced, 56 | author={Shen, Tao and Zhou, Tianyi and Long, Guodong and Jiang, Jing and Wang, Sen and Zhang, Chengqi}, 57 | title={Reinforced Self-Attention Network: a Hybrid of Hard and Soft Attention for Sequence Modeling}, 58 | booktitle = "Proceedings of IJCAI", 59 | year = "2018" 60 | } 61 | @InProceedings{N18-2074, 62 | author = "Shaw, Peter 63 | and Uszkoreit, Jakob 64 | and Vaswani, Ashish", 65 | title = "Self-Attention with Relative Position 
Representations", 66 | booktitle = "Proceedings of NAACL", 67 | year = "2018" 68 | } 69 | @InProceedings{N18-1124, 70 | author = "Miculicich Werlen, Lesly 71 | and Pappas, Nikolaos 72 | and Ram, Dhananjay 73 | and Popescu-Belis, Andrei", 74 | title = "Self-Attentive Residual Decoder for Neural Machine Translation", 75 | booktitle = "Proceedings of NAACL", 76 | year = "2018" 77 | } 78 | @InProceedings{N18-1125, 79 | author = "Li, Xintong 80 | and Liu, Lemao 81 | and Tu, Zhaopeng 82 | and Shi, Shuming 83 | and Meng, Max", 84 | title = "Target Foresight Based Attention for Neural Machine Translation", 85 | booktitle = "Proceedings of NAACL", 86 | year = "2018" 87 | } 88 | @InProceedings{P18-1166, 89 | author = "Zhang, Biao 90 | and Xiong, Deyi 91 | and Su, Jinsong", 92 | title = "Accelerating Neural Transformer via an Average Attention Network", 93 | booktitle = "Proceedings of ACL", 94 | year = "2018" 95 | } 96 | @InProceedings{P18-1167, 97 | author = "Domhan, Tobias", 98 | title = "How Much Attention Do You Need? A Granular Analysis of Neural Machine Translation Architectures", 99 | booktitle = "Proceedings of ACL", 100 | year = "2018" 101 | } 102 | @InProceedings{P18-1164, 103 | author = "Kuang, Shaohui 104 | and Li, Junhui 105 | and Branco, Ant{\'o}nio 106 | and Luo, Weihua 107 | and Xiong, Deyi", 108 | title = "Attention Focusing for Neural Machine Translation by Bridging Source and Target Embeddings", 109 | booktitle = "Proceedings of ACL", 110 | year = "2018" 111 | } 112 | @InProceedings{P18-2059, 113 | author = "Malaviya, Chaitanya 114 | and Ferreira, Pedro 115 | and Martins, Andr{\'e} F. 
T.", 116 | title = "Sparse and Constrained Attention for Neural Machine Translation", 117 | booktitle = "Proceedings of ACL", 118 | year = "2018" 119 | } 120 | @InProceedings{D18-1065, 121 | author = "Shankar, Shiv 122 | and Garg, Siddhant 123 | and Sarawagi, Sunita", 124 | title = "Surprisingly Easy Hard-Attention for Sequence to Sequence Learning", 125 | booktitle = "Proceedings of EMNLP", 126 | year = "2018" 127 | } 128 | @InProceedings{D18-1317, 129 | author = "Li, Jian 130 | and Tu, Zhaopeng 131 | and Yang, Baosong 132 | and Lyu, Michael R. 133 | and Zhang, Tong", 134 | title = "Multi-Head Attention with Disagreement Regularization", 135 | booktitle = "Proceedings of EMNLP", 136 | year = "2018" 137 | } 138 | @InProceedings{D18-1408, 139 | author = "Wu, Wei 140 | and Wang, Houfeng 141 | and Liu, Tianyu 142 | and Ma, Shuming", 143 | title = "Phrase-level Self-Attention Networks for Universal Sentence Encoding", 144 | booktitle = "Proceedings of EMNLP", 145 | year = "2018" 146 | } 147 | @InProceedings{D18-1475, 148 | author = "Yang, Baosong 149 | and Tu, Zhaopeng 150 | and Wong, Derek F. 151 | and Meng, Fandong 152 | and Chao, Lidia S. 
153 | and Zhang, Tong", 154 | title = "Modeling Localness for Self-Attention Networks", 155 | booktitle = "Proceedings of EMNLP", 156 | year = "2018" 157 | } 158 | @InProceedings{D18-1331, 159 | author = "Lin, Junyang 160 | and Sun, Xu 161 | and Ren, Xuancheng 162 | and Li, Muyu 163 | and Su, Qi", 164 | title = "Learning When to Concentrate or Divert Attention: Self-Adaptive Attention Temperature for Neural Machine Translation", 165 | booktitle = "Proceedings of EMNLP", 166 | year = "2018" 167 | } 168 | @InProceedings{D18-1338, 169 | author = "Bapna, Ankur 170 | and Chen, Mia 171 | and Firat, Orhan 172 | and Cao, Yuan 173 | and Wu, Yonghui", 174 | title = "Training Deeper Neural Machine Translation Models with Transparent Attention", 175 | booktitle = "Proceedings of EMNLP", 176 | year = "2018" 177 | } 178 | @InProceedings{C18-1142, 179 | author = "Bahuleyan, Hareesh 180 | and Mou, Lili 181 | and Vechtomova, Olga 182 | and Poupart, Pascal", 183 | title = "Variational Attention for Sequence-to-Sequence Models", 184 | booktitle = "Proceedings of COLING", 185 | year = "2018" 186 | } 187 | @InProceedings{K18-1010, 188 | author = "Elbayad, Maha 189 | and Besacier, Laurent 190 | and Verbeek, Jakob", 191 | title = "Pervasive Attention: {2D} Convolutional Neural Networks for Sequence-to-Sequence Prediction", 192 | booktitle = "Proceedings of CoNLL", 193 | year = "2018" 194 | } 195 | @inproceedings{Deng2018LatentAA, 196 | title={Latent Alignment and Variational Attention}, 197 | author={Yuntian Deng and Yoon Kim and Justin Chiu and Demi Guo and Alexander M. 
Rush}, 198 | booktitle={NeurIPS}, 199 | year={2018} 200 | } 201 | @InProceedings{shankar2019posterior, 202 | title={Posterior Attention Models for Sequence to Sequence Learning}, 203 | author={Shankar, Shiv and Sarawagi, Sunita}, 204 | booktitle={Proceedings of ICLR}, 205 | year={2019} 206 | } 207 | @InProceedings{yang2019context-aware, 208 | author = "Yang, Baosong 209 | and Li, Jian 210 | and Wong, Derek 211 | and Chao, Lidia S 212 | and Wang, Xing 213 | and Tu, Zhaopeng", 214 | title = "Context-Aware Self-Attention Networks", 215 | booktitle = "Proceedings of AAAI", 216 | year = "2019" 217 | } -------------------------------------------------------------------------------- /bib_citations/NMT_decoding.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{D16-1027, 2 | author = "Wang, Mingxuan 3 | and Lu, Zhengdong 4 | and Li, Hang 5 | and Liu, Qun", 6 | title = "Memory-enhanced Decoder for Neural Machine Translation", 7 | booktitle = "Proceedings of EMNLP", 8 | year = "2016" 9 | } 10 | @InProceedings{P17-1174, 11 | author = "Ishiwatari, Shonosuke 12 | and Yao, Jingtao 13 | and Liu, Shujie 14 | and Li, Mu 15 | and Zhou, Ming 16 | and Yoshinaga, Naoki 17 | and Kitsuregawa, Masaru 18 | and Jia, Weijia", 19 | title = "Chunk-based Decoder for Neural Machine Translation", 20 | booktitle = "Proceedings of ACL", 21 | year = "2017" 22 | } 23 | @InProceedings{P17-2092, 24 | author = "Zhou, Hao 25 | and Tu, Zhaopeng 26 | and Huang, Shujian 27 | and Liu, Xiaohua 28 | and Li, Hang 29 | and Chen, Jiajun", 30 | title = "Chunk-Based Bi-Scale Decoder for Neural Machine Translation", 31 | booktitle = "Proceedings of ACL", 32 | year = "2017" 33 | } 34 | @InProceedings{E17-2061, 35 | author = "Yang, Zichao 36 | and Hu, Zhiting 37 | and Deng, Yuntian 38 | and Dyer, Chris 39 | and Smola, Alex", 40 | title = "Neural Machine Translation with Recurrent Attention Modeling", 41 | booktitle = "Proceedings of EACL", 42 | year = "2017" 43 | } 
44 | @InProceedings{W17-3207, 45 | author = "Freitag, Markus 46 | and Al-Onaizan, Yaser", 47 | title = "Beam Search Strategies for Neural Machine Translation", 48 | booktitle = "Proceedings of the First Workshop on Neural Machine Translation", 49 | year = "2017" 50 | } 51 | @InProceedings{W17-4716, 52 | author = "Chatterjee, Rajen 53 | and Negri, Matteo 54 | and Turchi, Marco 55 | and Federico, Marcello 56 | and Specia, Lucia 57 | and Blain, Fr{\'e}d{\'e}ric", 58 | title = "Guiding Neural Machine Translation Decoding with External Knowledge", 59 | booktitle = "Proceedings of the Second Conference on Machine Translation", 60 | year = "2017" 61 | } 62 | @InProceedings{D17-1014, 63 | author = "Hoang, Cong Duy Vu 64 | and Haffari, Gholamreza 65 | and Cohn, Trevor", 66 | title = "Towards Decoding as Continuous Optimisation in Neural Machine Translation", 67 | booktitle = "Proceedings of EMNLP", 68 | year = "2017" 69 | } 70 | @InProceedings{D17-1157, 71 | author = "Chang, Yin-Wen 72 | and Collins, Michael", 73 | title = "Source-Side Left-to-Right or Target-Side Left-to-Right? 
An Empirical Comparison of Two Phrase-Based Decoding Algorithms", 74 | booktitle = "Proceedings of EMNLP", 75 | year = "2017" 76 | } 77 | @InProceedings{D17-1210, 78 | author = "Gu, Jiatao 79 | and Cho, Kyunghyun 80 | and Li, Victor O.K.", 81 | title = "Trainable Greedy Decoding for Neural Machine Translation", 82 | booktitle = "Proceedings of EMNLP", 83 | year = "2017" 84 | } 85 | @inproceedings{Khayrallah:17, 86 | title={Neural Lattice Search for Domain Adaptation in Machine Translation}, 87 | author={Khayrallah, Huda and Kumar, Gaurav and Duh, Kevin and Post, Matt and Koehn, Philipp}, 88 | booktitle={Proceedings of IJCNLP}, 89 | year={2017} 90 | } 91 | @inproceedings{gu2017non, 92 | title={Non-autoregressive neural machine translation}, 93 | author={Gu, Jiatao and Bradbury, James and Xiong, Caiming and Li, Victor OK and Socher, Richard}, 94 | booktitle={Proceedings of ICLR}, 95 | year={2018} 96 | } 97 | @inproceedings{zhang2018asynchronous, 98 | title={Asynchronous Bidirectional Decoding for Neural Machine Translation}, 99 | author={Zhang, Xiangwen and Su, Jinsong and Qin, Yue and Liu, Yang and Ji, Rongrong and Wang, Hongji}, 100 | booktitle={Proceedings of AAAI}, 101 | year={2018} 102 | } 103 | @inproceedings{gu2018neural, 104 | title={Neural machine translation with gumbel-greedy decoding}, 105 | author={Gu, Jiatao and Im, Daniel Jiwoong and Li, Victor OK}, 106 | booktitle={Proceedings of AAAI}, 107 | year={2018} 108 | } 109 | @InProceedings{P18-1115, 110 | author = "Schulz, Philip 111 | and Aziz, Wilker 112 | and Cohn, Trevor", 113 | title = "A Stochastic Decoder for Neural Machine Translation", 114 | booktitle = "Proceedings of ACL", 115 | year = "2018" 116 | } 117 | @InProceedings{P18-2054, 118 | author = "Shu, Raphael 119 | and Nakayama, Hideki", 120 | title = "Improving Beam Search by Removing Monotonic Constraint for Neural Machine Translation", 121 | booktitle = "Proceedings of ACL", 122 | year = "2018" 123 | } 124 | @InProceedings{C18-1276, 125 | 
author = "Lin, Junyang 126 | and Sun, Xu 127 | and Ren, Xuancheng 128 | and Ma, Shuming 129 | and Su, Jinsong 130 | and Su, Qi", 131 | title = "Deconvolution-Based Global Decoding for Neural Machine Translation", 132 | booktitle = "Proceedings of COLING", 133 | year = "2018" 134 | } 135 | @InProceedings{D18-1044, 136 | author = "Wang, Chunqi 137 | and Zhang, Ji 138 | and Chen, Haiqing", 139 | title = "Semi-Autoregressive Neural Machine Translation", 140 | booktitle = "Proceedings of EMNLP", 141 | year = "2018" 142 | } 143 | @InProceedings{D18-1048, 144 | author = "Geng, Xinwei 145 | and Feng, Xiaocheng 146 | and Qin, Bing 147 | and Liu, Ting", 148 | title = "Adaptive Multi-pass Decoder for Neural Machine Translation", 149 | booktitle = "Proceedings of EMNLP", 150 | year = "2018" 151 | } 152 | @InProceedings{D18-1460, 153 | author = "Zhang, Wen 154 | and Huang, Liang 155 | and Feng, Yang 156 | and Shen, Lei 157 | and Liu, Qun", 158 | title = "Speeding Up Neural Machine Translation Decoding by Cube Pruning", 159 | booktitle = "Proceedings of EMNLP", 160 | year = "2018" 161 | } 162 | @InProceedings{D18-1509, 163 | author = "Wang, Xinyi 164 | and Pham, Hieu 165 | and Yin, Pengcheng 166 | and Neubig, Graham", 167 | title = "A Tree-based Decoder for Neural Machine Translation", 168 | booktitle = "Proceedings of EMNLP", 169 | year = "2018" 170 | } 171 | @InProceedings{D18-1510, 172 | author = "Shao, Chenze 173 | and Chen, Xilin 174 | and Feng, Yang", 175 | title = "Greedy Search with Probabilistic N-gram Matching for Neural Machine Translation", 176 | booktitle = "Proceedings of EMNLP", 177 | year = "2018" 178 | } 179 | @InProceedings{D18-1511, 180 | author = "Zhang, Zhisong 181 | and Wang, Rui 182 | and Utiyama, Masao 183 | and Sumita, Eiichiro 184 | and Zhao, Hai", 185 | title = "Exploring Recombination for Efficient Decoding of Neural Machine Translation", 186 | booktitle = "Proceedings of EMNLP", 187 | year = "2018" 188 | } 189 | @InProceedings{D18-1037, 190 | author 
= "G{\={u}}, Jetic 191 | and Shavarani, Hassan S. 192 | and Sarkar, Anoop", 193 | title = "Top-down Tree Structured Decoding with Syntactic Connections for Neural Machine Translation and Parsing", 194 | booktitle = "Proceedings of EMNLP", 195 | year = "2018" 196 | } 197 | @InProceedings{D18-1342, 198 | author = "Yang, Yilin 199 | and Huang, Liang 200 | and Ma, Mingbo", 201 | title = "Breaking the Beam Search Curse: A Study of (Re-)Scoring Methods and Stopping Criteria for Neural Machine Translation", 202 | booktitle = "Proceedings of EMNLP", 203 | year = "2018" 204 | } 205 | @InProceedings{D18-1035, 206 | author = "Chen, Yun 207 | and Li, Victor O.K. 208 | and Cho, Kyunghyun 209 | and Bowman, Samuel", 210 | title = "A Stable and Effective Learning Strategy for Trainable Greedy Decoding", 211 | booktitle = "Proceedings of EMNLP", 212 | year = "2018" 213 | } 214 | @InProceedings{guo2018non, 215 | title={Non-autoregressive neural machine translation with enhanced decoder input}, 216 | author={Guo, Junliang and Tan, Xu and He, Di and Qin, Tao and Xu, Linli and Liu, Tie-Yan}, 217 | booktitle={Proceedings of AAAI}, 218 | year={2019} 219 | } 220 | @InProceedings{wang2019non, 221 | title={Non-Autoregressive Machine Translation with Auxiliary Regularization}, 222 | author={Wang, Yiren and Tian, Fei and He, Di and Qin, Tao and Zhai, ChengXiang and Liu, Tie-Yan}, 223 | booktitle={Proceedings of AAAI}, 224 | year={2019} 225 | } -------------------------------------------------------------------------------- /bib_citations/NMT_document_level.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{D17-1301, 2 | author = "Wang, Longyue 3 | and Tu, Zhaopeng 4 | and Way, Andy 5 | and Liu, Qun", 6 | title = "Exploiting Cross-Sentence Context for Neural Machine Translation", 7 | booktitle = "Proceedings of EMNLP", 8 | year = "2017" 9 | } 10 | @InProceedings{W17-4811, 11 | author = "Tiedemann, J{\"o}rg 12 | and Scherrer, Yves", 13 | 
title = "Neural Machine Translation with Extended Context", 14 | booktitle = "Proceedings of the Third Workshop on Discourse in Machine Translation", 15 | year = "2017" 16 | } 17 | @InProceedings{N18-1118, 18 | author = "Bawden, Rachel 19 | and Sennrich, Rico 20 | and Birch, Alexandra 21 | and Haddow, Barry", 22 | title = "Evaluating Discourse Phenomena in Neural Machine Translation", 23 | booktitle = "Proceedings of NAACL", 24 | year = "2018" 25 | } 26 | @InProceedings{P18-1117, 27 | author = "Voita, Elena 28 | and Serdyukov, Pavel 29 | and Sennrich, Rico 30 | and Titov, Ivan", 31 | title = "Context-Aware Neural Machine Translation Learns Anaphora Resolution", 32 | booktitle = "Proceedings of ACL", 33 | year = "2018" 34 | } 35 | @InProceedings{P18-1118, 36 | author = "Maruf, Sameen 37 | and Haffari, Gholamreza", 38 | title = "Document Context Neural Machine Translation with Memory Networks", 39 | booktitle = "Proceedings of ACL", 40 | year = "2018" 41 | } 42 | @InProceedings{C18-1050, 43 | author = "Kuang, Shaohui 44 | and Xiong, Deyi 45 | and Luo, Weihua 46 | and Zhou, Guodong", 47 | title = "Modeling Coherence for Neural Machine Translation with Dynamic and Topic Caches", 48 | booktitle = "Proceedings of COLING", 49 | year = "2018" 50 | } 51 | @InProceedings{C18-1051, 52 | author = "Kuang, Shaohui 53 | and Xiong, Deyi", 54 | title = "Fusing Recency into Neural Machine Translation with an Inter-Sentence Gate Model", 55 | booktitle = "Proceedings of COLING", 56 | year = "2018" 57 | } 58 | @InProceedings{D18-1049, 59 | author = "Zhang, Jiacheng 60 | and Luan, Huanbo 61 | and Sun, Maosong 62 | and Zhai, Feifei 63 | and Xu, Jingfang 64 | and Zhang, Min 65 | and Liu, Yang", 66 | title = "Improving the Transformer Translation Model with Document-Level Context", 67 | booktitle = "Proceedings of EMNLP", 68 | year = "2018" 69 | } 70 | @InProceedings{D18-1512, 71 | author = "L{\"a}ubli, Samuel 72 | and Sennrich, Rico 73 | and Volk, Martin", 74 | title = "Has Machine 
Translation Achieved Human Parity? A Case for Document-level Evaluation", 75 | booktitle = "Proceedings of EMNLP", 76 | year = "2018" 77 | } 78 | @InProceedings{D18-1325, 79 | author = "Miculicich, Lesly 80 | and Ram, Dhananjay 81 | and Pappas, Nikolaos 82 | and Henderson, James", 83 | title = "Document-Level Neural Machine Translation with Hierarchical Attention Networks", 84 | booktitle = "Proceedings of EMNLP", 85 | year = "2018" 86 | } 87 | @Article{Q18-1029, 88 | author = "Tu, Zhaopeng 89 | and Liu, Yang 90 | and Shi, Shuming 91 | and Zhang, Tong", 92 | title = "Learning to Remember Translation History with a Continuous Cache", 93 | journal = "Transactions of the Association for Computational Linguistics", 94 | year = "2018", 95 | volume = "6", 96 | pages = "407--420" 97 | } -------------------------------------------------------------------------------- /bib_citations/NMT_domain_adaptation.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{P17-2061, 2 | author = "Chu, Chenhui 3 | and Dabre, Raj 4 | and Kurohashi, Sadao", 5 | title = "An Empirical Comparison of Domain Adaptation Methods for Neural Machine Translation", 6 | booktitle = "Proceedings of ACL", 7 | year = "2017" 8 | } 9 | @InProceedings{P17-2089, 10 | author = "Wang, Rui 11 | and Finch, Andrew 12 | and Utiyama, Masao 13 | and Sumita, Eiichiro", 14 | title = "Sentence Embedding for Neural Machine Translation Domain Adaptation", 15 | booktitle = "Proceedings of ACL", 16 | year = "2017" 17 | } 18 | @InProceedings{W17-3205, 19 | author = "Chen, Boxing 20 | and Cherry, Colin 21 | and Foster, George 22 | and Larkin, Samuel", 23 | title = "Cost Weighting for Neural Machine Translation Domain Adaptation", 24 | booktitle = "Proceedings of the First Workshop on Neural Machine Translation", 25 | year = "2017" 26 | } 27 | @InProceedings{W17-4712, 28 | author = "Britz, Denny 29 | and Le, Quoc 30 | and Pryzant, Reid", 31 | title = "Effective Domain Mixing for 
Neural Machine Translation", 32 | booktitle = "Proceedings of the Second Conference on Machine Translation", 33 | year = "2017" 34 | } 35 | @InProceedings{W17-4714, 36 | author = "Chinea-Rios, Mara 37 | and Peris, {\`A}lvaro 38 | and Casacuberta, Francisco", 39 | title = "Adapting Neural Machine Translation with Parallel Synthetic Data", 40 | booktitle = "Proceedings of the Second Conference on Machine Translation", 41 | year = "2017" 42 | } 43 | @InProceedings{D17-1155, 44 | author = "Wang, Rui 45 | and Utiyama, Masao 46 | and Liu, Lemao 47 | and Chen, Kehai 48 | and Sumita, Eiichiro", 49 | title = "Instance Weighting for Neural Machine Translation Domain Adaptation", 50 | booktitle = "Proceedings of EMNLP", 51 | year = "2017" 52 | } 53 | @InProceedings{D17-1156, 54 | author = "Miceli Barone, Antonio Valerio 55 | and Haddow, Barry 56 | and Germann, Ulrich 57 | and Sennrich, Rico", 58 | title = "Regularization techniques for fine-tuning in neural machine translation", 59 | booktitle = "Proceedings of EMNLP", 60 | year = "2017" 61 | } 62 | @InProceedings{N18-2080, 63 | author = "Vilar, David", 64 | title = "Learning Hidden Unit Contribution for Adapting Neural Machine Translation Models", 65 | booktitle = "Proceedings of NAACL", 66 | year = "2018" 67 | } 68 | @InProceedings{P18-2050, 69 | author = "Michel, Paul 70 | and Neubig, Graham", 71 | title = "Extreme Adaptation for Personalized Neural Machine Translation", 72 | booktitle = "Proceedings of ACL", 73 | year = "2018" 74 | } 75 | @InProceedings{C18-1269, 76 | author = "Zhang, Shiqi 77 | and Xiong, Deyi", 78 | title = "Sentence Weighting for Neural Machine Translation Domain Adaptation", 79 | booktitle = "Proceedings of COLING", 80 | year = "2018" 81 | } 82 | @InProceedings{C18-1111, 83 | author = "Chu, Chenhui 84 | and Wang, Rui", 85 | title = "A Survey of Domain Adaptation for Neural Machine Translation", 86 | booktitle = "Proceedings of COLING", 87 | year = "2018" 88 | } 89 | @InProceedings{D18-1041, 90 | 
author = "Zeng, Jiali 91 | and Su, Jinsong 92 | and Wen, Huating 93 | and Liu, Yang 94 | and Xie, Jun 95 | and Yin, Yongjing 96 | and Zhao, Jianqiang", 97 | title = "Multi-Domain Neural Machine Translation with Word-Level Domain Context Discrimination", 98 | booktitle = "Proceedings of EMNLP", 99 | year = "2018" 100 | } 101 | @InProceedings{D18-1103, 102 | author = "Neubig, Graham 103 | and Hu, Junjie", 104 | title = "Rapid Adaptation of Neural Machine Translation to New Languages", 105 | booktitle = "Proceedings of EMNLP", 106 | year = "2018" 107 | } 108 | @inproceedings{zeng-etal-2019-iterative, 109 | title = "Iterative Dual Domain Adaptation for Neural Machine Translation", 110 | author = "Zeng, Jiali and 111 | Liu, Yang and 112 | Su, Jinsong and 113 | Ge, Yubing and 114 | Lu, Yaojie and 115 | Yin, Yongjing and 116 | Luo, Jiebo", 117 | booktitle = "Proceedings of EMNLP", year = "2019", 118 | publisher = "Association for Computational Linguistics" 119 | } -------------------------------------------------------------------------------- /bib_citations/NMT_efficiency.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{K16-1029, 2 | author = "See, Abigail 3 | and Luong, Minh-Thang 4 | and Manning, Christopher D.", 5 | title = "Compression of Neural Machine Translation Models via Pruning", 6 | booktitle = "Proceedings of CoNLL", 7 | year = "2016" 8 | } 9 | @InProceedings{P17-1079, 10 | author = "Oda, Yusuke 11 | and Arthur, Philip 12 | and Neubig, Graham 13 | and Yoshino, Koichiro 14 | and Nakamura, Satoshi", 15 | title = "Neural Machine Translation via Binary Code Prediction", 16 | booktitle = "Proceedings of ACL", 17 | year = "2017" 18 | } 19 | @InProceedings{P17-2091, 20 | author = "Shi, Xing 21 | and Knight, Kevin", 22 | title = "Speeding Up Neural Machine Translation Decoding by Shrinking Run-time Vocabulary", 23 | booktitle = "Proceedings of ACL", 24 | year = "2017" 25 | } 26 | @InProceedings{E17-2025, 27 | author = "Press, 
Ofir 28 | and Wolf, Lior", 29 | title = "Using the Output Embedding to Improve Language Models", 30 | booktitle = "Proceedings of EACL", 31 | year = "2017" 32 | } 33 | @InProceedings{D17-1154, 34 | author = "Zhang, Xiaowei 35 | and Chen, Wei 36 | and Wang, Feng 37 | and Xu, Shuang 38 | and Xu, Bo", 39 | title = "Towards Compact and Fast Neural Machine Translation Using a Combined Method", 40 | booktitle = "Proceedings of EMNLP", 41 | year = "2017" 42 | } 43 | @InProceedings{D17-1300, 44 | author = "Devlin, Jacob", 45 | title = "Sharp Models on Dull Hardware: Fast and Accurate Neural Machine Translation Decoding on the CPU", 46 | booktitle = "Proceedings of EMNLP", 47 | year = "2017" 48 | } 49 | @InProceedings{I17-2046, 50 | author = "Zhang, Dakun 51 | and Kim, Jungi 52 | and Crego, Josep 53 | and Senellart, Jean", 54 | title = "Boosting Neural Machine Translation", 55 | booktitle = "Proceedings of IJCNLP", 56 | year = "2017" 57 | } 58 | @InProceedings{kaiser2018fast, 59 | title={Fast Decoding in Sequence Models Using Discrete Latent Variables}, 60 | author={Kaiser, {\L}ukasz and Roy, Aurko and Vaswani, Ashish and Parmar, Niki and Bengio, Samy and Uszkoreit, Jakob and Shazeer, Noam}, 61 | booktitle={Proceedings of ICML}, 62 | year={2018} 63 | } 64 | @InProceedings{N18-3013, 65 | author = "Iglesias, Gonzalo 66 | and Tambellini, William 67 | and de Gispert, Adri{\`a} 68 | and Hasler, Eva 69 | and Byrne, Bill", 70 | title = "Accelerating NMT Batched Beam Decoding with LMBR Posteriors for Deployment", 71 | booktitle = "Proceedings of NAACL", 72 | year = "2018" 73 | } 74 | @InProceedings{N18-3014, 75 | author = "Quinn, Jerry 76 | and Ballesteros, Miguel", 77 | title = "Pieces of Eight: 8-bit Neural Machine Translation", 78 | booktitle = "Proceedings of NAACL", 79 | year = "2018" 80 | } 81 | @InProceedings{N18-1119, 82 | author = "Post, Matt 83 | and Vilar, David", 84 | title = "Fast Lexically Constrained Decoding with Dynamic Beam Allocation for Neural Machine
Translation", 85 | booktitle = "Proceedings of NAACL", 86 | year = "2018" 87 | } 88 | @InProceedings{P18-1166, 89 | author = "Zhang, Biao 90 | and Xiong, Deyi 91 | and Su, Jinsong", 92 | title = "Accelerating Neural Transformer via an Average Attention Network", 93 | booktitle = "Proceedings of ACL", 94 | year = "2018" 95 | } 96 | @InProceedings{P18-2048, 97 | author = "Wang, Rui 98 | and Utiyama, Masao 99 | and Sumita, Eiichiro", 100 | title = "Dynamic Sentence Sampling for Efficient Training of Neural Machine Translation", 101 | booktitle = "Proceedings of ACL", 102 | year = "2018" 103 | } 104 | @InProceedings{W18-6301, 105 | author = "Ott, Myle 106 | and Edunov, Sergey 107 | and Grangier, David 108 | and Auli, Michael", 109 | title = "Scaling Neural Machine Translation", 110 | booktitle = "Proceedings of the Third Conference on Machine Translation: Research Papers", 111 | year = "2018" 112 | } 113 | @InProceedings{D18-1104, 114 | author = "Wuebker, Joern 115 | and Simianer, Patrick 116 | and DeNero, John", 117 | title = "Compact Personalized Models for Neural Machine Translation", 118 | booktitle = "Proceedings of EMNLP", 119 | year = "2018" 120 | } 121 | @InProceedings{D18-1460, 122 | author = "Zhang, Wen 123 | and Huang, Liang 124 | and Feng, Yang 125 | and Shen, Lei 126 | and Liu, Qun", 127 | title = "Speeding Up Neural Machine Translation Decoding by Cube Pruning", 128 | booktitle = "Proceedings of EMNLP", 129 | year = "2018" 130 | } 131 | @InProceedings{D18-1511, 132 | author = "Zhang, Zhisong 133 | and Wang, Rui 134 | and Utiyama, Masao 135 | and Sumita, Eiichiro 136 | and Zhao, Hai", 137 | title = "Exploring Recombination for Efficient Decoding of Neural Machine Translation", 138 | booktitle = "Proceedings of EMNLP", 139 | year = "2018" 140 | } 141 | @InProceedings{D18-1332, 142 | author = "Bogoychev, Nikolay 143 | and Heafield, Kenneth 144 | and Aji, Alham Fikri 145 | and Junczys-Dowmunt, Marcin", 146 | title = "Accelerating Asynchronous
Stochastic Gradient Descent for Neural Machine Translation", 147 | booktitle = "Proceedings of EMNLP", 148 | year = "2018" 149 | } 150 | @inproceedings{NIPS2018_8212, 151 | title = {Blockwise Parallel Decoding for Deep Autoregressive Models}, 152 | author = {Stern, Mitchell and Shazeer, Noam and Uszkoreit, Jakob}, 153 | booktitle = {Proceedings of NeurIPS}, 154 | year = {2018}, 155 | } 156 | 157 | -------------------------------------------------------------------------------- /bib_citations/NMT_ensemble_and_reranking.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{C16-1133, 2 | author = "Garmash, Ekaterina 3 | and Monz, Christof", 4 | title = "Ensemble Learning for Multi-Source Neural Machine Translation", 5 | booktitle = "Proceedings of COLING", 6 | year = "2016" 7 | } 8 | @InProceedings{P17-2060, 9 | author = "Zhou, Long 10 | and Hu, Wenpeng 11 | and Zhang, Jiajun 12 | and Zong, Chengqing", 13 | title = "Neural System Combination for Machine Translation", 14 | booktitle = "Proceedings of ACL", 15 | year = "2017" 16 | } 17 | @InProceedings{D18-1150, 18 | author = "Huang, Jiaji 19 | and Li, Yi 20 | and Ping, Wei 21 | and Huang, Liang", 22 | title = "Large Margin Neural Language Model", 23 | booktitle = "Proceedings of EMNLP", 24 | year = "2018" 25 | } 26 | -------------------------------------------------------------------------------- /bib_citations/NMT_fairness_and_diversity.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{W16-4620, 2 | author = "Yamagishi, Hayahide 3 | and Kanouchi, Shin 4 | and Sato, Takayuki 5 | and Komachi, Mamoru", 6 | title = "Controlling the Voice of a Sentence in Japanese-to-English Neural Machine Translation", 7 | booktitle = "Proceedings of the 3rd Workshop on Asian Translation (WAT2016)", 8 | year = "2016", 9 | } 10 | @InProceedings{N16-1005, 11 | author = "Sennrich, Rico 12 | and Haddow, Barry 13 | and Birch, Alexandra", 
14 | title = "Controlling Politeness in Neural Machine Translation via Side Constraints", 15 | booktitle = "Proceedings of NAACL", 16 | year = "2016", 17 | } 18 | @InProceedings{E17-1101, 19 | author = "Rabinovich, Ella 20 | and Patel, Raj Nath 21 | and Mirkin, Shachar 22 | and Specia, Lucia 23 | and Wintner, Shuly", 24 | title = "Personalized Machine Translation: Preserving Original Author Traits", 25 | booktitle = "Proceedings of EACL", 26 | year = "2017" 27 | } 28 | @InProceedings{ott2018analyzing, 29 | title={Analyzing uncertainty in neural machine translation}, 30 | author={Ott, Myle and Auli, Michael and Grangier, David and Ranzato, Marc'Aurelio}, 31 | booktitle={Proceedings of ICML}, 32 | year={2018} 33 | } 34 | @InProceedings{P18-2050, 35 | author = "Michel, Paul 36 | and Neubig, Graham", 37 | title = "Extreme Adaptation for Personalized Neural Machine Translation", 38 | booktitle = "Proceedings of ACL", 39 | year = "2018", 40 | } 41 | @InProceedings{P18-1115, 42 | author = "Schulz, Philip 43 | and Aziz, Wilker 44 | and Cohn, Trevor", 45 | title = "A Stochastic Decoder for Neural Machine Translation", 46 | booktitle = "Proceedings of ACL", 47 | year = "2018", 48 | } 49 | @InProceedings{D18-1334, 50 | author = "Vanmassenhove, Eva 51 | and Hardmeier, Christian 52 | and Way, Andy", 53 | title = "Getting Gender Right in Neural Machine Translation", 54 | booktitle = "Proceedings of EMNLP", 55 | year = "2018", 56 | } -------------------------------------------------------------------------------- /bib_citations/NMT_human_centered_automatic_post-editing.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{P16-2046, 2 | title={A neural network based approach to automatic post-editing}, 3 | author={Pal, Santanu and Naskar, Sudip Kumar and Vela, Mihaela and van Genabith, Josef}, 4 | booktitle={Proceedings of ACL}, 5 | year={2016} 6 | } 7 | @InProceedings{W16-2378, 8 | author = "Junczys-Dowmunt, Marcin 9 | and
Grundkiewicz, Roman", 10 | title = "Log-linear Combinations of Monolingual and Bilingual Neural Machine Translation Models for Automatic Post-Editing", 11 | booktitle = "Proceedings of the First Conference on Machine Translation: Volume 2, Shared Task Papers", 12 | year = "2016", 13 | } 14 | @InProceedings{E17-2056, 15 | author = "Pal, Santanu 16 | and Naskar, Sudip Kumar 17 | and Vela, Mihaela 18 | and Liu, Qun 19 | and van Genabith, Josef", 20 | title = "Neural Automatic Post-Editing Using Prior Alignment and Reranking", 21 | booktitle = "Proceedings of EACL", 22 | year = "2017", 23 | } 24 | @InProceedings{E17-1050, 25 | author = "Chatterjee, Rajen 26 | and Gebremelak, Gebremedhen 27 | and Negri, Matteo 28 | and Turchi, Marco", 29 | title = "Online Automatic Post-editing for MT in a Multi-Domain Translation Environment", 30 | booktitle = "Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics: Volume 1, Long Papers", 31 | year = "2017", 32 | publisher = "Association for Computational Linguistics", 33 | pages = "525--535", 34 | location = "Valencia, Spain", 35 | url = "http://aclweb.org/anthology/E17-1050" 36 | } 37 | @InProceedings{N18-1025, 38 | author = "Grangier, David 39 | and Auli, Michael", 40 | title = "QuickEdit: Editing Text {\&} Translations by Crossing Words Out", 41 | booktitle = "Proceedings of NAACL", 42 | year = "2018" 43 | } 44 | @InProceedings{D18-1341, 45 | author = "Vu, Thuy-Trang 46 | and Haffari, Gholamreza", 47 | title = "Automatic Post-Editing of Machine Translation: A Neural Programmer-Interpreter Approach", 48 | booktitle = "Proceedings of EMNLP", 49 | year = "2018" 50 | } 51 | @InProceedings{D19-1634, 52 | author = "Huang, Xuancheng and 53 | Liu, Yang and 54 | Luan, Huanbo and 55 | Xu, Jingfang and 56 | Sun, Maosong", 57 | title = "Learning to Copy for Automatic Post-Editing", 58 | booktitle = "Proceedings of EMNLP", 59 | year = "2019" 60 | } 61 | 
-------------------------------------------------------------------------------- /bib_citations/NMT_human_centered_interactive.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{P16-1007, 2 | author = "Wuebker, Joern 3 | and Green, Spence 4 | and DeNero, John 5 | and Hasan, Sasa 6 | and Luong, Minh-Thang", 7 | title = "Models and Inference for Prefix-Constrained Machine Translation", 8 | booktitle = "Proceedings of ACL", 9 | year = "2016" 10 | } 11 | @InProceedings{knowles2016neural, 12 | author="Knowles, Rebecca and Koehn, Philipp", 13 | title="Neural interactive translation prediction", 14 | booktitle="Proceedings of the Association for Machine Translation in the Americas", 15 | year="2016" 16 | } 17 | @article{peris2017interactive, 18 | author="Peris, {\'A}lvaro and Domingo, Miguel and Casacuberta, Francisco", 19 | title="Interactive neural machine translation", 20 | journal="Computer Speech \& Language", 21 | volume="45", 22 | pages="201--220", 23 | year="2017", 24 | publisher="Elsevier" 25 | } 26 | @InProceedings{D17-1153, 27 | author = "Nguyen, Khanh 28 | and Daum{\'e} III, Hal 29 | and Boyd-Graber, Jordan", 30 | title = "Reinforcement Learning for Bandit Neural Machine Translation with Simulated Human Feedback", 31 | booktitle = "Proceedings of EMNLP", 32 | year = "2017" 33 | } 34 | @InProceedings{K18-1015, 35 | author = "Peris, {\'A}lvaro 36 | and Casacuberta, Francisco", 37 | title = "Active Learning for Interactive Neural Machine Translation of Data Streams", 38 | booktitle = "Proceedings of CoNLL", 39 | year = "2018" 40 | } 41 | @InProceedings{lam2018reinforcement, 42 | author = "Lam, Tsz Kin 43 | and Kreutzer, Julia 44 | and Riezler, Stefan", 45 | title = "A Reinforcement Learning Approach to Interactive-Predictive Neural Machine Translation", 46 | booktitle = "Proceedings of EAMT", 47 | year = "2018" 48 | } 49 | @InProceedings{N18-3012, 50 | author = "Kreutzer, Julia 51 | and Khadivi, Shahram 52 |
and Matusov, Evgeny 53 | and Riezler, Stefan", 54 | title = "Can Neural Machine Translation be Improved with User Feedback?", 55 | booktitle = "Proceedings of NAACL", 56 | year = "2018" 57 | } 58 | @InProceedings{P18-2052, 59 | author = "Petrushkov, Pavel 60 | and Khadivi, Shahram 61 | and Matusov, Evgeny", 62 | title = "Learning from Chunk-based Feedback in Neural Machine Translation", 63 | booktitle = "Proceedings of ACL", 64 | year = "2018" 65 | } 66 | @InProceedings{P18-1165, 67 | author = "Kreutzer, Julia 68 | and Uyheng, Joshua 69 | and Riezler, Stefan", 70 | title = "Reliability and Learnability of Human Bandit Feedback for Sequence-to-Sequence Reinforcement Learning", 71 | booktitle = "Proceedings of ACL", 72 | year = "2018" 73 | } 74 | -------------------------------------------------------------------------------- /bib_citations/NMT_interpretability.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{ding2017visualizing, 2 | title={Visualizing and understanding neural machine translation}, 3 | author={Ding, Yanzhuo and Liu, Yang and Luan, Huanbo and Sun, Maosong}, 4 | booktitle={Proceedings of ACL}, 5 | year={2017} 6 | } 7 | @article{strobelt2019s, 8 | title={Seq2seq-Vis: A Visual Debugging Tool for Sequence-to-Sequence Models}, 9 | author={Strobelt, Hendrik and Gehrmann, Sebastian and Behrisch, Michael and Perer, Adam and Pfister, Hanspeter and Rush, Alexander M}, 10 | journal={IEEE transactions on visualization and computer graphics}, 11 | volume={25}, 12 | number={1}, 13 | pages={353--363}, 14 | year={2019}, 15 | publisher={IEEE} 16 | } 17 | @InProceedings{W18-5431, 18 | author = "Raganato, Alessandro 19 | and Tiedemann, J{\"o}rg", 20 | title = "An Analysis of Encoder Representations in Transformer-Based Machine Translation", 21 | booktitle = "Proceedings of the 2018 EMNLP Workshop BlackboxNLP: Analyzing and Interpreting Neural Networks for NLP", 22 | year = "2018", 23 | } 24 | 
@InProceedings{W18-5420, 25 | author = "Stahlberg, Felix 26 | and Saunders, Danielle 27 | and Byrne, Bill", 28 | title = "An Operation Sequence Model for Explainable Neural Machine Translation", 29 | booktitle = "Proceedings of the 2018 EMNLP Workshop BlackboxNLP: Analyzing and Interpreting Neural Networks for NLP", 30 | year = "2018", 31 | } 32 | @InProceedings{dalvi2018what, 33 | title={What Is One Grain of Sand in the Desert? Analyzing Individual Neurons in Deep NLP Models}, 34 | author={Dalvi, Fahim and Durrani, Nadir and Sajjad, Hassan and Belinkov, Yonatan and Bau, Anthony and Glass, James}, 35 | booktitle={Proceedings of AAAI}, 36 | year={2019} 37 | } 38 | @InProceedings{bau2018identifying, 39 | title={Identifying and Controlling Important Neurons in Neural Machine Translation}, 40 | author={Bau, Anthony and Belinkov, Yonatan and Sajjad, Hassan and Durrani, Nadir and Dalvi, Fahim and Glass, James}, 41 | booktitle={Proceedings of ICLR}, 42 | year={2019} 43 | } 44 | -------------------------------------------------------------------------------- /bib_citations/NMT_linguistic_interpretation.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{hill2015embedding, 2 | title={Embedding word similarity with neural machine translation}, 3 | author={Hill, Felix and Cho, Kyunghyun and Jean, Sebastien and Devin, Coline and Bengio, Yoshua}, 4 | booktitle={Proceedings of ICLR}, 5 | year={2015} 6 | } 7 | @InProceedings{D16-1159, 8 | author = "Shi, Xing 9 | and Padhi, Inkit 10 | and Knight, Kevin", 11 | title = "Does String-Based Neural MT Learn Source Syntax?", 12 | booktitle = "Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing ", 13 | year = "2016", 14 | } 15 | @InProceedings{P17-1080, 16 | author = "Belinkov, Yonatan 17 | and Durrani, Nadir 18 | and Dalvi, Fahim 19 | and Sajjad, Hassan 20 | and Glass, James", 21 | title = "What do Neural Machine Translation Models Learn about 
Morphology?", 22 | booktitle = "Proceedings of ACL", 23 | year = "2017" 24 | } 25 | @InProceedings{P17-1049, 26 | author = "Rabinovich, Ella 27 | and Ordan, Noam 28 | and Wintner, Shuly", 29 | title = "Found in Translation: Reconstructing Phylogenetic Language Trees from Translations", 30 | booktitle = "Proceedings of ACL", 31 | year = "2017" 32 | } 33 | @InProceedings{E17-2060, 34 | author = "Sennrich, Rico", 35 | title = "How Grammatical is Character-level Neural Machine Translation? Assessing MT Quality with Contrastive Translation Pairs", 36 | booktitle = "Proceedings of EACL", 37 | year = "2017" 38 | } 39 | @InProceedings{N18-2082, 40 | author = "Poliak, Adam 41 | and Belinkov, Yonatan 42 | and Glass, James 43 | and Van Durme, Benjamin", 44 | title = "On the Evaluation of Semantic Phenomena in Neural Machine Translation Using Natural Language Inference", 45 | booktitle = "Proceedings of NAACL", 46 | year = "2018" 47 | } 48 | @InProceedings{D18-1313, 49 | author = "Bisazza, Arianna 50 | and Tump, Clara", 51 | title = "The Lazy Encoder: A Fine-Grained Analysis of the Role of Morphology in Neural Machine Translation", 52 | booktitle = "Proceedings of EMNLP", 53 | year = "2018" 54 | } 55 | @InProceedings{D18-1396, 56 | author = "Wu, Lijun 57 | and Tan, Xu 58 | and He, Di 59 | and Tian, Fei 60 | and Qin, Tao 61 | and Lai, Jianhuang 62 | and Liu, Tie-Yan", 63 | title = "Beyond Error Propagation in Neural Machine Translation: Characteristics of Language Also Matter", 64 | booktitle = "Proceedings of EMNLP", 65 | year = "2018" 66 | } 67 | -------------------------------------------------------------------------------- /bib_citations/NMT_low_resource_data_augmentation.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{P17-2090, 2 | author = "Fadaee, Marzieh 3 | and Bisazza, Arianna 4 | and Monz, Christof", 5 | title = "Data Augmentation for Low-Resource Neural Machine Translation", 6 | booktitle = "Proceedings of 
ACL", 7 | year = "2017" 8 | } 9 | @InProceedings{D18-1040, 10 | author = "Fadaee, Marzieh 11 | and Monz, Christof", 12 | title = "Back-Translation Sampling by Targeting Difficult Words in Neural Machine Translation", 13 | booktitle = "Proceedings of EMNLP", 14 | year = "2018" 15 | } 16 | @InProceedings{D18-1045, 17 | author = "Edunov, Sergey 18 | and Ott, Myle 19 | and Auli, Michael 20 | and Grangier, David", 21 | title = "Understanding Back-Translation at Scale", 22 | booktitle = "Proceedings of EMNLP", 23 | year = "2018" 24 | } 25 | @InProceedings{D18-1100, 26 | author = "Wang, Xinyi 27 | and Pham, Hieu 28 | and Dai, Zihang 29 | and Neubig, Graham", 30 | title = "SwitchOut: an Efficient Data Augmentation Algorithm for Neural Machine Translation", 31 | booktitle = "Proceedings of EMNLP", 32 | year = "2018" 33 | } 34 | -------------------------------------------------------------------------------- /bib_citations/NMT_low_resource_meta.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{D18-1398, 2 | author = "Gu, Jiatao 3 | and Wang, Yong 4 | and Chen, Yun 5 | and Li, Victor O. K. 
6 | and Cho, Kyunghyun", 7 | title = "Meta-Learning for Low-Resource Neural Machine Translation", 8 | booktitle = "Proceedings of EMNLP", 9 | year = "2018" 10 | } 11 | -------------------------------------------------------------------------------- /bib_citations/NMT_low_resource_multitask.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{P15-1166, 2 | author = "Dong, Daxiang 3 | and Wu, Hua 4 | and He, Wei 5 | and Yu, Dianhai 6 | and Wang, Haifeng", 7 | title = "Multi-Task Learning for Multiple Language Translation", 8 | booktitle = "Proceedings of ACL", 9 | year = "2015" 10 | } 11 | @InProceedings{N16-1101, 12 | author = "Firat, Orhan 13 | and Cho, Kyunghyun 14 | and Bengio, Yoshua", 15 | title = "Multi-Way, Multilingual Neural Machine Translation with a Shared Attention Mechanism", 16 | booktitle = "Proceedings of NAACL", 17 | year = "2016" 18 | } 19 | @InProceedings{N16-1004, 20 | author = "Zoph, Barret 21 | and Knight, Kevin", 22 | title = "Multi-Source Neural Translation", 23 | booktitle = "Proceedings of NAACL", 24 | year = "2016" 25 | } 26 | @InProceedings{D16-1026, 27 | author = "Firat, Orhan 28 | and Sankaran, Baskaran 29 | and Al-Onaizan, Yaser 30 | and Yarman Vural, Fatos T. 31 | and Cho, Kyunghyun", 32 | title = "Zero-Resource Translation with Multi-Lingual Neural Machine Translation", 33 | booktitle = "Proceedings of EMNLP", 34 | year = "2016" 35 | } 36 | @Article{Q17-1024, 37 | author = "Johnson, Melvin 38 | and Schuster, Mike 39 | and Le, Quoc V. 
40 | and Krikun, Maxim 41 | and Wu, Yonghui 42 | and Chen, Zhifeng 43 | and Thorat, Nikhil 44 | and Vi{\'e}gas, Fernanda 45 | and Wattenberg, Martin 46 | and Corrado, Greg 47 | and Hughes, Macduff 48 | and Dean, Jeffrey", 49 | title = "Google's Multilingual Neural Machine Translation System: Enabling Zero-Shot Translation", 50 | journal = "Transactions of the Association for Computational Linguistics", 51 | year = "2017", 52 | volume = "5", 53 | pages = "339--351" 54 | } 55 | @InProceedings{N18-1123, 56 | author = "Zaremoodi, Poorya 57 | and Haffari, Gholamreza", 58 | title = "Neural Machine Translation for Bilingually Scarce Scenarios: a Deep Multi-Task Learning Approach", 59 | booktitle = "Proceedings of NAACL", 60 | year = "2018" 61 | } 62 | @InProceedings{P18-2104, 63 | author = "Zaremoodi, Poorya 64 | and Buntine, Wray 65 | and Haffari, Gholamreza", 66 | title = "Adaptive Knowledge Sharing in Multi-Task Learning: Improving Low-Resource Neural Machine Translation", 67 | booktitle = "Proceedings of ACL", 68 | year = "2018" 69 | } 70 | @InProceedings{C18-1054, 71 | author = "Lakew, Surafel Melaku 72 | and Cettolo, Mauro 73 | and Federico, Marcello", 74 | title = "A Comparison of Transformer and Recurrent Neural Networks on Multilingual Neural Machine Translation", 75 | booktitle = "Proceedings of COLING", 76 | year = "2018" 77 | } 78 | @InProceedings{C18-1263, 79 | author = "Blackwood, Graeme 80 | and Ballesteros, Miguel 81 | and Ward, Todd", 82 | title = "Multilingual Neural Machine Translation with Task-Specific Attention", 83 | booktitle = "Proceedings of COLING", 84 | year = "2018" 85 | } 86 | @InProceedings{W18-6327, 87 | author = "Sachan, Devendra 88 | and Neubig, Graham", 89 | title = "Parameter Sharing Methods for Multilingual Self-Attentional Translation Models", 90 | booktitle = "Proceedings of the Third Conference on Machine Translation: Research Papers", 91 | year = "2018" 92 | } 93 | @InProceedings{D18-1039, 94 | author = "Platanios, Emmanouil 
Antonios 95 | and Sachan, Mrinmaya 96 | and Neubig, Graham 97 | and Mitchell, Tom", 98 | title = "Contextual Parameter Generation for Universal Neural Machine Translation", 99 | booktitle = "Proceedings of EMNLP", 100 | year = "2018" 101 | } 102 | @InProceedings{D18-1326, 103 | author = "Wang, Yining 104 | and Zhang, Jiajun 105 | and Zhai, Feifei 106 | and Xu, Jingfang 107 | and Zong, Chengqing", 108 | title = "Three Strategies to Improve One-to-Many Multilingual Translation", 109 | booktitle = "Proceedings of EMNLP", 110 | year = "2018" 111 | } 112 | @inproceedings{tan2019multilingual, 113 | title={Multilingual Neural Machine Translation with Knowledge Distillation}, 114 | author={Tan, Xu and Ren, Yi and He, Di and Qin, Tao and Zhao, Zhou and Liu, Tie-Yan}, 115 | booktitle = {Proceedings of ICLR}, 116 | year = {2019} 117 | } 118 | @inproceedings{wang2019multilingual, 119 | title={Multilingual Neural Machine Translation With Soft Decoupled Encoding}, 120 | author={Wang, Xinyi and Pham, Hieu and Arthur, Philip and Neubig, Graham}, 121 | booktitle = {Proceedings of ICLR}, 122 | year = {2019} 123 | } -------------------------------------------------------------------------------- /bib_citations/NMT_low_resource_pivot_based.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{D16-1026, 2 | author = "Firat, Orhan 3 | and Sankaran, Baskaran 4 | and Al-Onaizan, Yaser 5 | and Yarman Vural, Fatos T. 
6 | and Cho, Kyunghyun", 7 | title = "Zero-Resource Translation with Multi-Lingual Neural Machine Translation", 8 | booktitle = "Proceedings of EMNLP", 9 | year = "2016" 10 | } 11 | @inproceedings{zheng2017maximum, 12 | title={Maximum expected likelihood estimation for zero-resource neural machine translation}, 13 | author={Zheng, Hao and Cheng, Yong and Liu, Yang}, 14 | booktitle={Proceedings of IJCAI}, 15 | year={2017} 16 | } 17 | @InProceedings{P17-1176, 18 | author = "Chen, Yun 19 | and Liu, Yang 20 | and Cheng, Yong 21 | and Li, Victor O.K.", 22 | title = "A Teacher-Student Framework for Zero-Resource Neural Machine Translation", 23 | booktitle = "Proceedings of ACL", 24 | year = "2017" 25 | } 26 | @inproceedings{cheng2017joint, 27 | title={Joint training for pivot-based neural machine translation}, 28 | author={Cheng, Yong and Yang, Qian and Liu, Yang and Sun, Maosong and Xu, Wei}, 29 | booktitle={Proceedings of IJCAI}, 30 | year={2017} 31 | } 32 | @inproceedings{chen2018zero, 33 | title={Zero-Resource Neural Machine Translation with Multi-Agent Communication Game}, 34 | author={Chen, Yun and Liu, Yang and Li, Victor OK}, 35 | booktitle={Proceedings of AAAI}, 36 | year={2018} 37 | } 38 | @InProceedings{P18-1006, 39 | author = "Ren, Shuo 40 | and Chen, Wenhu 41 | and Liu, Shujie 42 | and Li, Mu 43 | and Zhou, Ming 44 | and Ma, Shuai", 45 | title = "Triangular Architecture for Rare Language Translation", 46 | booktitle = "Proceedings of ACL", 47 | year = "2018" 48 | } 49 | -------------------------------------------------------------------------------- /bib_citations/NMT_low_resource_semi_supervised.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{P16-1009, 2 | author = "Sennrich, Rico 3 | and Haddow, Barry 4 | and Birch, Alexandra", 5 | title = "Improving Neural Machine Translation Models with Monolingual Data", 6 | booktitle = "Proceedings of ACL", 7 | year = "2016" 8 | } 9 | @InProceedings{P16-1185, 10 
| author = "Cheng, Yong 11 | and Xu, Wei 12 | and He, Zhongjun 13 | and He, Wei 14 | and Wu, Hua 15 | and Sun, Maosong 16 | and Liu, Yang", 17 | title = "Semi-Supervised Learning for Neural Machine Translation", 18 | booktitle = "Proceedings of ACL", 19 | year = "2016" 20 | } 21 | @InProceedings{D17-1158, 22 | author = "Domhan, Tobias 23 | and Hieber, Felix", 24 | title = "Using Target-side Monolingual Data for Neural Machine Translation through Multi-task Learning", 25 | booktitle = "Proceedings of EMNLP", 26 | year = "2017" 27 | } 28 | @InProceedings{W17-4715, 29 | author = "Currey, Anna 30 | and Miceli Barone, Antonio Valerio 31 | and Heafield, Kenneth", 32 | title = "Copied Monolingual Data Improves Low-Resource Neural Machine Translation", 33 | booktitle = "Proceedings of the Second Conference on Machine Translation", 34 | year = "2017" 35 | } -------------------------------------------------------------------------------- /bib_citations/NMT_low_resource_transfer.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{D16-1163, 2 | author = "Zoph, Barret 3 | and Yuret, Deniz 4 | and May, Jonathan 5 | and Knight, Kevin", 6 | title = "Transfer Learning for Low-Resource Neural Machine Translation", 7 | booktitle = "Proceedings of EMNLP", 8 | year = "2016" 9 | } 10 | @InProceedings{N18-1032, 11 | author = "Gu, Jiatao 12 | and Hassan, Hany 13 | and Devlin, Jacob 14 | and Li, Victor O.K.", 15 | title = "Universal Neural Machine Translation for Extremely Low Resource Languages", 16 | booktitle = "Proceedings of NAACL", 17 | year = "2018" 18 | } 19 | @InProceedings{W18-6325, 20 | author = "Kocmi, Tom 21 | and Bojar, Ond{\v{r}}ej", 22 | title = "Trivial Transfer Learning for Low-Resource Neural Machine Translation", 23 | booktitle = "Proceedings of the Third Conference on Machine Translation: Research Papers", 24 | year = "2018" 25 | } 26 | -------------------------------------------------------------------------------- 
/bib_citations/NMT_low_resource_unsupervised.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{D17-1266, 2 | author = "Pourdamghani, Nima 3 | and Knight, Kevin", 4 | title = "Deciphering Related Languages", 5 | booktitle = "Proceedings of EMNLP", 6 | year = "2017" 7 | } 8 | @InProceedings{artetxe2017unsupervised, 9 | title={Unsupervised neural machine translation}, 10 | author={Artetxe, Mikel and Labaka, Gorka and Agirre, Eneko and Cho, Kyunghyun}, 11 | booktitle = "Proceedings of ICLR", 12 | year={2018} 13 | } 14 | @InProceedings{lample2017unsupervised, 15 | title={Unsupervised machine translation using monolingual corpora only}, 16 | author={Lample, Guillaume and Conneau, Alexis and Denoyer, Ludovic and Ranzato, Marc'Aurelio}, 17 | booktitle={Proceedings of ICLR}, 18 | year={2018} 19 | } 20 | @InProceedings{P18-1005, 21 | author = "Yang, Zhen 22 | and Chen, Wei 23 | and Wang, Feng 24 | and Xu, Bo", 25 | title = "Unsupervised Neural Machine Translation with Weight Sharing", 26 | booktitle = "Proceedings of ACL", 27 | year = "2018" 28 | } 29 | @InProceedings{D18-1549, 30 | author = "Lample, Guillaume 31 | and Ott, Myle 32 | and Conneau, Alexis 33 | and Denoyer, Ludovic 34 | and Ranzato, Marc'Aurelio", 35 | title = "Phrase-Based {\&} Neural Unsupervised Machine Translation", 36 | booktitle = "Proceedings of EMNLP", 37 | year = "2018" 38 | } 39 | @Article{J18-3006, 40 | author = "Naim, Iftekhar 41 | and Riley, Parker 42 | and Gildea, Daniel", 43 | title = "Feature-Based Decipherment for Machine Translation", 44 | journal = "Computational Linguistics", 45 | year = "2018", 46 | volume = "44", 47 | number = "3", 48 | pages = "525--546" 49 | } 50 | @InProceedings{ren-etal-2019-explicit, 51 | title = "Explicit Cross-lingual Pre-training for Unsupervised Machine Translation", 52 | author = "Ren, Shuo and 53 | Wu, Yu and 54 | Liu, Shujie and 55 | Zhou, Ming and 56 | Ma, Shuai", 57 | booktitle = "Proceedings of EMNLP", 
58 | year = "2019", 59 | } -------------------------------------------------------------------------------- /bib_citations/NMT_model_architecture.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{D13-1176, 2 | author = "Kalchbrenner, Nal 3 | and Blunsom, Phil", 4 | title = "Recurrent Continuous Translation Models", 5 | booktitle = "Proceedings of EMNLP", 6 | year = "2013" 7 | } 8 | @inproceedings{seq2seq, 9 | title={Sequence to sequence learning with neural networks}, 10 | author={Sutskever, Ilya and Vinyals, Oriol and Le, Quoc V}, 11 | booktitle={Advances in neural information processing systems}, 12 | year={2014} 13 | } 14 | @inproceedings{rnnsearch, 15 | author = {Bahdanau, Dzmitry and Cho, KyungHyun and Bengio, Yoshua}, 16 | title = {Neural Machine Translation by Jointly Learning to Align and Translate}, 17 | booktitle = {Proceedings of ICLR}, 18 | year = {2015} 19 | } 20 | @InProceedings{gnmt, 21 | author= {Yonghui Wu and 22 | Mike Schuster and 23 | Zhifeng Chen and 24 | Quoc V. 
Le and 25 | Mohammad Norouzi and 26 | Wolfgang Macherey and 27 | Maxim Krikun and 28 | Yuan Cao and 29 | Qin Gao and 30 | Klaus Macherey and 31 | Jeff Klingner and 32 | Apurva Shah and 33 | Melvin Johnson and 34 | Xiaobing Liu and 35 | Lukasz Kaiser and 36 | Stephan Gouws and 37 | Yoshikiyo Kato and 38 | Taku Kudo and 39 | Hideto Kazawa and 40 | Keith Stevens and 41 | George Kurian and 42 | Nishant Patil and 43 | Wei Wang and 44 | Cliff Young and 45 | Jason Smith and 46 | Jason Riesa and 47 | Alex Rudnick and 48 | Oriol Vinyals and 49 | Greg Corrado and 50 | Macduff Hughes and 51 | Jeffrey Dean}, 52 | title = {Google's Neural Machine Translation System: Bridging the Gap between Human and Machine Translation}, 53 | booktitle = "Proceedings of NIPS", 54 | year = {2016}, 55 | } 56 | @Article{Q16-1027, 57 | author = "Zhou, Jie 58 | and Cao, Ying 59 | and Wang, Xuguang 60 | and Li, Peng 61 | and Xu, Wei", 62 | title = "Deep Recurrent Models with Fast-Forward Connections for Neural Machine Translation", 63 | journal = "Transactions of the Association for Computational Linguistics", 64 | year = "2016", 65 | volume = "4", 66 | pages = "371--383" 67 | } 68 | @InProceedings{P16-1154, 69 | author = "Gu, Jiatao 70 | and Lu, Zhengdong 71 | and Li, Hang 72 | and Li, Victor O.K.", 73 | title = "Incorporating Copying Mechanism in Sequence-to-Sequence Learning", 74 | booktitle = "Proceedings of ACL", 75 | year = "2016" 76 | } 77 | @InProceedings{D16-1050, 78 | author = "Zhang, Biao 79 | and Xiong, Deyi 80 | and Su, Jinsong 81 | and Duan, Hong 82 | and Zhang, Min", 83 | title = "Variational Neural Machine Translation", 84 | booktitle = "Proceedings of EMNLP", 85 | year = "2016" 86 | } 87 | @InProceedings{convs2s, 88 | title={Convolutional Sequence to Sequence Learning}, 89 | author={Gehring, Jonas and Auli, Michael and Grangier, David and Yarats, Denis and Dauphin, Yann N}, 90 | booktitle={Proceedings of ICML}, 91 | year={2017} 92 | } 93 | @InProceedings{P17-1012, 94 | author =
"Gehring, Jonas 95 | and Auli, Michael 96 | and Grangier, David 97 | and Dauphin, Yann", 98 | title = "A Convolutional Encoder Model for Neural Machine Translation", 99 | booktitle = "Proceedings of ACL", 100 | year = "2017" 101 | } 102 | @InProceedings{P17-1013, 103 | author = "Wang, Mingxuan 104 | and Lu, Zhengdong 105 | and Zhou, Jie 106 | and Liu, Qun", 107 | title = "Deep Neural Machine Translation with Linear Associative Unit", 108 | booktitle = "Proceedings of ACL", 109 | year = "2017" 110 | } 111 | @InProceedings{D17-1145, 112 | author = "Sperber, Matthias 113 | and Neubig, Graham 114 | and Niehues, Jan 115 | and Waibel, Alex", 116 | title = "Neural Lattice-to-Sequence Models for Uncertain Inputs", 117 | booktitle = "Proceedings of EMNLP", 118 | year = "2017" 119 | } 120 | @InProceedings{D17-1151, 121 | author = "Britz, Denny 122 | and Goldie, Anna 123 | and Luong, Minh-Thang 124 | and Le, Quoc", 125 | title = "Massive Exploration of Neural Machine Translation Architectures", 126 | booktitle = "Proceedings of EMNLP", 127 | year = "2017" 128 | } 129 | @inproceedings{transformer, 130 | title={Attention Is All You Need}, 131 | author={Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N and Kaiser, Lukasz and Polosukhin, Illia}, 132 | booktitle={Proceedings of NIPS}, 133 | year={2017} 134 | } 135 | @inproceedings{tu2017neural, 136 | title={Neural machine translation with reconstruction}, 137 | author={Tu, Zhaopeng and Liu, Yang and Shang, Lifeng and Liu, Xiaohua and Li, Hang}, 138 | booktitle={Thirty-First AAAI Conference on Artificial Intelligence}, 139 | year={2017} 140 | } 141 | @inproceedings{kaiser2017depthwise, 142 | title={Depthwise separable convolutions for neural machine translation}, 143 | author={Kaiser, Lukasz and Gomez, Aidan N and Chollet, Francois}, 144 | booktitle={Proceedings of ICLR}, 145 | year={2018} 146 | } 147 | @InProceedings{kaiser2018fast, 148 | title={Fast Decoding in Sequence 
Models Using Discrete Latent Variables}, 149 | author={Kaiser, {\L}ukasz and Roy, Aurko and Vaswani, Ashish and Parmar, Niki and Bengio, Samy and Uszkoreit, Jakob and Shazeer, Noam}, 150 | booktitle={Proceedings of ICML}, 151 | year={2018} 152 | } 153 | @InProceedings{N18-1117, 154 | author = "Shen, Yanyao 155 | and Tan, Xu 156 | and He, Di 157 | and Qin, Tao 158 | and Liu, Tie-Yan", 159 | title = "Dense Information Flow for Neural Machine Translation", 160 | booktitle = "Proceedings of NAACL", 161 | year = "2018" 162 | } 163 | @InProceedings{N18-1154, 164 | author = "Chen, Wenhu 165 | and Li, Guanlin 166 | and Ren, Shuo 167 | and Liu, Shujie 168 | and Zhang, Zhirui 169 | and Li, Mu 170 | and Zhou, Ming", 171 | title = "Generative Bridging Network for Neural Sequence Prediction", 172 | booktitle = "Proceedings of NAACL", 173 | year = "2018" 174 | } 175 | @InProceedings{P18-1008, 176 | author = "Chen, Mia Xu 177 | and Firat, Orhan 178 | and Bapna, Ankur 179 | and Johnson, Melvin 180 | and Macherey, Wolfgang 181 | and Foster, George 182 | and Jones, Llion 183 | and Schuster, Mike 184 | and Shazeer, Noam 185 | and Parmar, Niki 186 | and Vaswani, Ashish 187 | and Uszkoreit, Jakob 188 | and Kaiser, Lukasz 189 | and Chen, Zhifeng 190 | and Wu, Yonghui 191 | and Hughes, Macduff", 192 | title = "The Best of Both Worlds: Combining Recent Advances in Neural Machine Translation", 193 | booktitle = "Proceedings of ACL", 194 | year = "2018" 195 | } 196 | @InProceedings{P18-2060, 197 | author = "Wang, Weiyue 198 | and Zhu, Derui 199 | and Alkhouli, Tamer 200 | and Gan, Zixuan 201 | and Ney, Hermann", 202 | title = "Neural Hidden Markov Model for Machine Translation", 203 | booktitle = "Proceedings of ACL", 204 | year = "2018" 205 | } 206 | @InProceedings{C18-1232, 207 | author = "Gong, Jingjing 208 | and Qiu, Xipeng 209 | and Wang, Shaojing 210 | and Huang, Xuanjing", 211 | title = "Information Aggregation via Dynamic Routing for Sequence Encoding", 212 | booktitle = "Proceedings 
of COLING", 213 | year = "2018" 214 | } 215 | @InProceedings{C18-1255, 216 | author = "Wang, Qiang 217 | and Li, Fuxue 218 | and Xiao, Tong 219 | and Li, Yanyang 220 | and Li, Yinqiao 221 | and Zhu, Jingbo", 222 | title = "Multi-layer Representation Fusion for Neural Machine Translation", 223 | booktitle = "Proceedings of COLING", 224 | year = "2018" 225 | } 226 | @InProceedings{C18-1257, 227 | author = "Li, Yachao 228 | and Li, Junhui 229 | and Zhang, Min", 230 | title = "Adaptive Weighting for Neural Machine Translation", 231 | booktitle = "Proceedings of COLING", 232 | year = "2018" 233 | } 234 | @InProceedings{C18-1259, 235 | author = "Song, Kaitao 236 | and Tan, Xu 237 | and He, Di 238 | and Lu, Jianfeng 239 | and Qin, Tao 240 | and Liu, Tie-Yan", 241 | title = "Double Path Networks for Sequence to Sequence Learning", 242 | booktitle = "Proceedings of COLING", 243 | year = "2018" 244 | } 245 | @InProceedings{D18-1457, 246 | author = "Dou, Zi-Yi 247 | and Tu, Zhaopeng 248 | and Wang, Xing 249 | and Shi, Shuming 250 | and Zhang, Tong", 251 | title = "Exploiting Deep Representations for Neural Machine Translation", 252 | booktitle = "Proceedings of EMNLP", 253 | year = "2018" 254 | } 255 | @InProceedings{D18-1459, 256 | author = "Zhang, Biao 257 | and Xiong, Deyi 258 | and Su, Jinsong 259 | and Lin, Qian 260 | and Zhang, Huiji", 261 | title = "Simplifying Neural Machine Translation with Addition-Subtraction Twin-Gated Recurrent Networks", 262 | booktitle = "Proceedings of EMNLP", 263 | year = "2018" 264 | } 265 | @InProceedings{D18-1458, 266 | author = "Tang, Gongbo 267 | and M{\"u}ller, Mathias 268 | and Rios, Annette 269 | and Sennrich, Rico", 270 | title = "Why Self-Attention?
A Targeted Evaluation of Neural Machine Translation Architectures", 271 | booktitle = "Proceedings of EMNLP", 272 | year = "2018" 273 | } 274 | @InProceedings{D18-1503, 275 | author = "Tran, Ke 276 | and Bisazza, Arianna 277 | and Monz, Christof", 278 | title = "The Importance of Being Recurrent for Modeling Hierarchical Structure", 279 | booktitle = "Proceedings of EMNLP", 280 | year = "2018" 281 | } 282 | @InProceedings{D18-1335, 283 | author = "Bahar, Parnia 284 | and Brix, Christopher 285 | and Ney, Hermann", 286 | title = "Towards Two-Dimensional Sequence to Sequence Model in Neural Machine Translation", 287 | booktitle = "Proceedings of EMNLP", 288 | year = "2018" 289 | } 290 | @inproceedings{he2018layer, 291 | title={Layer-wise coordination between encoder and decoder for neural machine translation}, 292 | author={He, Tianyu and Tan, Xu and Xia, Yingce and He, Di and Qin, Tao and Chen, Zhibo and Liu, Tie-Yan}, 293 | booktitle={Proceedings of NeurIPS}, 294 | year={2018} 295 | } 296 | @article{hassan2018achieving, 297 | title={Achieving human parity on automatic chinese to english news translation}, 298 | author={Hassan, Hany and Aue, Anthony and Chen, Chang and Chowdhary, Vishal and Clark, Jonathan and Federmann, Christian and Huang, Xuedong and Junczys-Dowmunt, Marcin and Lewis, William and Li, Mu and others}, 299 | year={Technical report. 
Microsoft AI \& Research} 300 | } 301 | @inproceedings{dehghani2018universal, 302 | title={Universal Transformers}, 303 | author={Dehghani, Mostafa and Gouws, Stephan and Vinyals, Oriol and Uszkoreit, Jakob and Kaiser, {\L}ukasz}, 304 | booktitle = {Proceedings of ICLR}, 305 | year = {2019} 306 | } 307 | @inproceedings{wu2019pay, 308 | title={Pay Less Attention with Lightweight and Dynamic Convolutions}, 309 | author={Wu, Felix and Fan, Angela and Baevski, Alexei and Dauphin, Yann N and Auli, Michael}, 310 | booktitle = {Proceedings of ICLR}, 311 | year = {2019} 312 | } 313 | @InProceedings{dou2019dynamic, 314 | author = "Dou, Zi-yi 315 | and Tu, Zhaopeng 316 | and Wang, Xing 317 | and Wang, Longyue 318 | and Shi, Shuming 319 | and Zhang, Tong", 320 | title = "Dynamic Layer Aggregation for Neural Machine Translation with Routing-by-Agreement", 321 | booktitle = "Proceedings of AAAI", 322 | year = "2019" 323 | } 324 | @inproceedings{wang-2019-towards, 325 | title = "Towards Linear Time Neural Machine Translation with Capsule Networks", 326 | author = "Wang, Mingxuan", 327 | booktitle = "Proceedings of EMNLP", 328 | publisher = "Association for Computational Linguistics", 329 | } 330 | @inproceedings{zhang-etal-2019-improving, 331 | title = "Improving Deep Transformer with Depth-Scaled Initialization and Merged Attention", 332 | author = "Zhang, Biao and 333 | Titov, Ivan and 334 | Sennrich, Rico", 335 | booktitle = "Proceedings of EMNLP", 336 | year = "2019", 337 | } -------------------------------------------------------------------------------- /bib_citations/NMT_multimodal.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{P16-1227, 2 | author = "Hitschler, Julian 3 | and Schamoni, Shigehiko 4 | and Riezler, Stefan", 5 | title = "Multimodal Pivots for Image Caption Translation", 6 | booktitle = "Proceedings of ACL", 7 | year = "2016" 8 | } 9 | @InProceedings{W16-2346, 10 | author = "Specia, Lucia 11 | and Frank, 
Stella 12 | and Sima'an, Khalil 13 | and Elliott, Desmond", 14 | title = "A Shared Task on Multimodal Machine Translation and Crosslingual Image Description", 15 | booktitle = "Proceedings of the First Conference on Machine Translation: Volume 2, Shared Task Papers", 16 | year = "2016" 17 | } 18 | @InProceedings{W16-2362, 19 | author = "Rodr{\'i}guez Guasch, Sergio 20 | and Costa-juss{\`a}, Marta R.", 21 | title = "WMT 2016 Multimodal Translation System Description based on Bidirectional Recurrent Neural Networks with Double-Embeddings", 22 | booktitle = "Proceedings of the First Conference on Machine Translation: Volume 2, Shared Task Papers", 23 | year = "2016" 24 | } 25 | @InProceedings{W16-2360, 26 | author = "Huang, Po-Yao 27 | and Liu, Frederick 28 | and Shiang, Sz-Rung 29 | and Oh, Jean 30 | and Dyer, Chris", 31 | title = "Attention-based Multimodal Neural Machine Translation", 32 | booktitle = "Proceedings of the First Conference on Machine Translation: Volume 2, Shared Task Papers", 33 | year = "2016" 34 | } 35 | @InProceedings{W16-2362, 36 | author = "Rodr{\'i}guez Guasch, Sergio 37 | and Costa-juss{\`a}, Marta R.", 38 | title = "WMT 2016 Multimodal Translation System Description based on Bidirectional Recurrent Neural Networks with Double-Embeddings", 39 | booktitle = "Proceedings of the First Conference on Machine Translation: Volume 2, Shared Task Papers", 40 | year = "2016" 41 | } 42 | @InProceedings{W16-2359, 43 | author = "Calixto, Iacer 44 | and Elliott, Desmond 45 | and Frank, Stella", 46 | title = "DCU-UvA Multimodal MT System Report", 47 | booktitle = "Proceedings of the First Conference on Machine Translation: Volume 2, Shared Task Papers", 48 | year = "2016" 49 | } 50 | @InProceedings{W17-4718, 51 | author = "Elliott, Desmond 52 | and Frank, Stella 53 | and Barrault, Lo{\"i}c 54 | and Bougares, Fethi 55 | and Specia, Lucia", 56 | title = "Findings of the Second Shared Task on Multimodal Machine Translation and Multilingual Image Description", 
57 | booktitle = "Proceedings of the Second Conference on Machine Translation", 58 | year = "2017" 59 | } 60 | @InProceedings{P17-1175, 61 | author = "Calixto, Iacer 62 | and Liu, Qun 63 | and Campbell, Nick", 64 | title = "Doubly-Attentive Decoder for Multi-modal Neural Machine Translation", 65 | booktitle = "Proceedings of ACL", 66 | year = "2017" 67 | } 68 | @InProceedings{D17-1095, 69 | author = "Delbrouck, Jean-Benoit 70 | and Dupont, St{\'e}phane", 71 | title = "An empirical study on the effectiveness of images in Multimodal Neural Machine Translation", 72 | booktitle = "Proceedings of EMNLP", 73 | year = "2017" 74 | } 75 | @InProceedings{D17-1105, 76 | author = "Calixto, Iacer 77 | and Liu, Qun", 78 | title = "Incorporating Global Visual Features into Attention-based Neural Machine Translation", 79 | booktitle = "Proceedings of EMNLP", 80 | year = "2017" 81 | } 82 | @InProceedings{lee2017emergent, 83 | title={Emergent translation in multi-agent communication}, 84 | author={Lee, Jason and Cho, Kyunghyun and Weston, Jason and Kiela, Douwe}, 85 | booktitle={Proceedings of ICLR}, 86 | year={2018} 87 | } 88 | @InProceedings{chen2018zero, 89 | title={Zero-Resource Neural Machine Translation with Multi-Agent Communication Game}, 90 | author={Chen, Yun and Liu, Yang and Li, Victor OK}, 91 | booktitle={Proceedings of AAAI}, 92 | year={2018} 93 | } 94 | @InProceedings{W18-6402, 95 | author = "Barrault, Lo{\"i}c 96 | and Bougares, Fethi 97 | and Specia, Lucia 98 | and Lala, Chiraag 99 | and Elliott, Desmond 100 | and Frank, Stella", 101 | title = "Findings of the Third Shared Task on Multimodal Machine Translation", 102 | booktitle = "Proceedings of the Third Conference on Machine Translation: Shared Task Papers", 103 | year = "2018" 104 | } 105 | @InProceedings{P18-1239, 106 | author = "Hewitt, John 107 | and Ippolito, Daphne 108 | and Callahan, Brendan 109 | and Kriz, Reno 110 | and Wijaya, Derry Tanti 111 | and Callison-Burch, Chris", 112 | title = "Learning 
Translations via Images with a Massively Multilingual Image Dataset", 113 | booktitle = "Proceedings of ACL", 114 | year = "2018" 115 | } 116 | @InProceedings{D18-1400, 117 | author = "Zhou, Mingyang 118 | and Cheng, Runxiang 119 | and Lee, Yong Jae 120 | and Yu, Zhou", 121 | title = "A Visual Attention Grounding Neural Model for Multimodal Machine Translation", 122 | booktitle = "Proceedings of EMNLP", 123 | year = "2018" 124 | } 125 | @InProceedings{D18-1329, 126 | author = "Elliott, Desmond", 127 | title = "Adversarial Evaluation of Multimodal Machine Translation", 128 | booktitle = "Proceedings of EMNLP", 129 | year = "2018" 130 | } -------------------------------------------------------------------------------- /bib_citations/NMT_open_vocabulary_and_char.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{hill2014embedding, 2 | title={Embedding word similarity with neural machine translation}, 3 | author={Hill, Felix and Cho, Kyunghyun and Jean, Sebastien and Devin, Coline and Bengio, Yoshua}, 4 | booktitle={Proceedings of ICLR}, 5 | year={2015} 6 | } 7 | @InProceedings{P15-1002, 8 | author = "Luong, Thang 9 | and Sutskever, Ilya 10 | and Le, Quoc 11 | and Vinyals, Oriol 12 | and Zaremba, Wojciech", 13 | title = "Addressing the Rare Word Problem in Neural Machine Translation", 14 | booktitle = "Proceedings of ACL", 15 | year = "2015" 16 | } 17 | @InProceedings{P15-1001, 18 | author = "Jean, S{\'e}bastien 19 | and Cho, Kyunghyun 20 | and Memisevic, Roland 21 | and Bengio, Yoshua", 22 | title = "On Using Very Large Target Vocabulary for Neural Machine Translation", 23 | booktitle = "Proceedings of ACL", 24 | year = "2015" 25 | } 26 | @InProceedings{P16-1162, 27 | author = "Sennrich, Rico 28 | and Haddow, Barry 29 | and Birch, Alexandra", 30 | title = "Neural Machine Translation of Rare Words with Subword Units", 31 | booktitle = "Proceedings of ACL", 32 | year = "2016" 33 | } 34 | @InProceedings{P16-1100, 35 | 
author = "Luong, Minh-Thang 36 | and Manning, Christopher D.", 37 | title = "Achieving Open Vocabulary Neural Machine Translation with Hybrid Word-Character Models", 38 | booktitle = "Proceedings of ACL", 39 | year = "2016" 40 | } 41 | @InProceedings{P16-1160, 42 | author = "Chung, Junyoung 43 | and Cho, Kyunghyun 44 | and Bengio, Yoshua", 45 | title = "A Character-level Decoder without Explicit Segmentation for Neural Machine Translation", 46 | booktitle = "Proceedings of ACL", 47 | year = "2016" 48 | } 49 | @Article{Q17-1026, 50 | author = "Lee, Jason 51 | and Cho, Kyunghyun 52 | and Hofmann, Thomas", 53 | title = "Fully Character-Level Neural Machine Translation without Explicit Segmentation", 54 | journal = "Transactions of the Association for Computational Linguistics", 55 | year = "2017" 56 | } 57 | @InProceedings{D17-1146, 58 | author = "Feng, Yang 59 | and Zhang, Shiyue 60 | and Zhang, Andi 61 | and Wang, Dong 62 | and Abel, Andrew", 63 | title = "Memory-augmented Neural Machine Translation", 64 | booktitle = "Proceedings of EMNLP", 65 | year = "2017" 66 | } 67 | @InProceedings{D17-1150, 68 | author = "Yang, Baosong 69 | and Wong, Derek F. 70 | and Xiao, Tong 71 | and Chao, Lidia S. 
72 | and Zhu, Jingbo", 73 | title = "Towards Bidirectional Hierarchical Representations for Attention-based Neural Machine Translation", 74 | booktitle = "Proceedings of EMNLP", 75 | year = "2017" 76 | } 77 | @InProceedings{N18-1006, 78 | author = "Passban, Peyman 79 | and Liu, Qun 80 | and Way, Andy", 81 | title = "Improving Character-Based Decoding Using Target-Side Morphological Information for Neural Machine Translation", 82 | booktitle = "Proceedings of NAACL", 83 | year = "2018" 84 | } 85 | @InProceedings{N18-1116, 86 | author = "Chen, Huadong 87 | and Huang, Shujian 88 | and Chiang, David 89 | and Dai, Xinyu 90 | and Chen, Jiajun", 91 | title = "Combining Character and Word Information in Neural Machine Translation Using a Multi-Level Attention", 92 | booktitle = "Proceedings of NAACL", 93 | year = "2018" 94 | } 95 | @InProceedings{N18-1121, 96 | author = "Liu, Frederick 97 | and Lu, Han 98 | and Neubig, Graham", 99 | title = "Handling Homographs in Neural Machine Translation", 100 | booktitle = "Proceedings of NAACL", 101 | year = "2018" 102 | } 103 | @InProceedings{P18-1007, 104 | author = "Kudo, Taku", 105 | title = "Subword Regularization: Improving Neural Network Translation Models with Multiple Subword Candidates", 106 | booktitle = "Proceedings of ACL", 107 | year = "2018" 108 | } 109 | @InProceedings{C18-1052, 110 | author = "Morishita, Makoto 111 | and Suzuki, Jun 112 | and Nagata, Masaaki", 113 | title = "Improving Neural Machine Translation by Incorporating Hierarchical Subword Features", 114 | booktitle = "Proceedings of COLING", 115 | year = "2018" 116 | } 117 | @InProceedings{D18-1036, 118 | author = "Zhao, Yang 119 | and Zhang, Jiajun 120 | and He, Zhongjun 121 | and Zong, Chengqing 122 | and Wu, Hua", 123 | title = "Addressing Troublesome Words in Neural Machine Translation", 124 | booktitle = "Proceedings of EMNLP", 125 | year = "2018" 126 | } 127 | @InProceedings{D18-1461, 128 | author = "Cherry, Colin 129 | and Foster, George 130 | and 
Bapna, Ankur 131 | and Firat, Orhan 132 | and Macherey, Wolfgang", 133 | title = "Revisiting Character-Based Neural Machine Translation with Capacity and Compression", 134 | booktitle = "Proceedings of EMNLP", 135 | year = "2018" 136 | } 137 | @InProceedings{D18-1339, 138 | author = "Knowles, Rebecca 139 | and Koehn, Philipp", 140 | title = "Context and Copying in Neural Machine Translation", 141 | booktitle = "Proceedings of EMNLP", 142 | year = "2018" 143 | } 144 | -------------------------------------------------------------------------------- /bib_citations/NMT_poetry_translation.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{N18-2011, 2 | author = "Ghazvininejad, Marjan 3 | and Choi, Yejin 4 | and Knight, Kevin", 5 | title = "Neural Poetry Translation", 6 | booktitle = "Proceedings of NAACL", 7 | year = "2018" 8 | } 9 | -------------------------------------------------------------------------------- /bib_citations/NMT_pretraining.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{mccann2017learned, 2 | title={Learned in translation: Contextualized word vectors}, 3 | author={McCann, Bryan and Bradbury, James and Xiong, Caiming and Socher, Richard}, 4 | booktitle={Proceedings of NIPS}, 5 | year={2017} 6 | } 7 | @InProceedings{N18-2084, 8 | author = "Qi, Ye 9 | and Sachan, Devendra 10 | and Felix, Matthieu 11 | and Padmanabhan, Sarguna 12 | and Neubig, Graham", 13 | title = "When and Why Are Pre-Trained Word Embeddings Useful for Neural Machine Translation?", 14 | booktitle = "Proceedings of NAACL", 15 | year = "2018" 16 | } 17 | @InProceedings{N18-1202, 18 | author = "Peters, Matthew 19 | and Neumann, Mark 20 | and Iyyer, Mohit 21 | and Gardner, Matt 22 | and Clark, Christopher 23 | and Lee, Kenton 24 | and Zettlemoyer, Luke", 25 | title = "Deep Contextualized Word Representations", 26 | booktitle = "Proceedings of NAACL", 27 | year = "2018" 28 | } 29 
| @InProceedings{P18-1031, 30 | author = "Howard, Jeremy 31 | and Ruder, Sebastian", 32 | title = "Universal Language Model Fine-tuning for Text Classification", 33 | booktitle = "Proceedings of ACL", 34 | year = "2018" 35 | } 36 | @article{radford2018improving, 37 | title={Improving language understanding by generative pre-training}, 38 | author={Radford, Alec and Narasimhan, Karthik and Salimans, Tim and Sutskever, Ilya}, 39 | year={Technical report. OpenAI} 40 | } 41 | @article{devlin2018bert, 42 | title={Bert: Pre-training of deep bidirectional transformers for language understanding}, 43 | author={Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina}, 44 | journal={arXiv preprint arXiv:1810.04805}, 45 | year={2018} 46 | } 47 | @article{radford2019language, 48 | title={Language Models are Unsupervised Multitask Learners}, 49 | author={Radford, Alec and Wu, Jeffrey and Child, Rewon and Luan, David and Amodei, Dario and Sutskever, Ilya}, 50 | year={Technical report. OpenAI} 51 | } -------------------------------------------------------------------------------- /bib_citations/NMT_prior_knowledge_coverage.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{P16-1008, 2 | author = "Tu, Zhaopeng 3 | and Lu, Zhengdong 4 | and Liu, Yang 5 | and Liu, Xiaohua 6 | and Li, Hang", 7 | title = "Modeling Coverage for Neural Machine Translation", 8 | booktitle = "Proceedings of ACL", 9 | year = "2016" 10 | } 11 | @InProceedings{gnmt, 12 | author= {Yonghui Wu and 13 | Mike Schuster and 14 | Zhifeng Chen and 15 | Quoc V. 
Le and 16 | Mohammad Norouzi and 17 | Wolfgang Macherey and 18 | Maxim Krikun and 19 | Yuan Cao and 20 | Qin Gao and 21 | Klaus Macherey and 22 | Jeff Klingner and 23 | Apurva Shah and 24 | Melvin Johnson and 25 | Xiaobing Liu and 26 | Lukasz Kaiser and 27 | Stephan Gouws and 28 | Yoshikiyo Kato and 29 | Taku Kudo and 30 | Hideto Kazawa and 31 | Keith Stevens and 32 | George Kurian and 33 | Nishant Patil and 34 | Wei Wang and 35 | Cliff Young and 36 | Jason Smith and 37 | Jason Riesa and 38 | Alex Rudnick and 39 | Oriol Vinyals and 40 | Greg Corrado and 41 | Macduff Hughes and 42 | Jeffrey Dean}, 43 | title = {Google's Neural Machine Translation System: Bridging the Gap between Human and Machine Translation}, 44 | booktitle = "Proceedings of NIPS", 45 | year = {2016}, 46 | } 47 | @InProceedings{D16-1096, 48 | author = "Mi, Haitao 49 | and Sankaran, Baskaran 50 | and Wang, Zhiguo 51 | and Ittycheriah, Abe", 52 | title = "Coverage Embedding Models for Neural Machine Translation", 53 | booktitle = "Proceedings of EMNLP", 54 | year = "2016" 55 | } 56 | @Article{Q17-1007, 57 | author = "Tu, Zhaopeng 58 | and Liu, Yang 59 | and Lu, Zhengdong 60 | and Liu, Xiaohua 61 | and Li, Hang", 62 | title = "Context Gates for Neural Machine Translation", 63 | journal = "Transactions of the Association for Computational Linguistics", 64 | year = "2017", 65 | volume = "5", 66 | pages = "87--99", 67 | } 68 | @InProceedings{P18-2047, 69 | author = "Li, Yanyang 70 | and Xiao, Tong 71 | and Li, Yinqiao 72 | and Wang, Qiang 73 | and Xu, Changming 74 | and Zhu, Jingbo", 75 | title = "A Simple and Effective Approach to Coverage-Aware Neural Machine Translation", 76 | booktitle = "Proceedings of ACL", 77 | year = "2018" 78 | } 79 | @Article{Q18-1011, 80 | author = "Zheng, Zaixiang 81 | and Zhou, Hao 82 | and Huang, Shujian 83 | and Mou, Lili 84 | and Dai, Xinyu 85 | and Chen, Jiajun 86 | and Tu, Zhaopeng", 87 | title = "Modeling Past and Future for Neural Machine Translation", 88 | journal = 
"Transactions of the Association for Computational Linguistics", 89 | year = "2018", 90 | volume = "6", 91 | pages = "145--157", 92 | } 93 | @InProceedings{kong2018neural, 94 | author = "Kong, Xiang 95 | and Tu, Zhaopeng 96 | and Shi, Shuming 97 | and Hovy, Eduard 98 | and Zhang, Tong", 99 | title = "Neural Machine Translation with Adequacy-Oriented Learning", 100 | booktitle = "Proceedings of AAAI", 101 | year = "2019" 102 | } -------------------------------------------------------------------------------- /bib_citations/NMT_prior_knowledge_syntactic_semantic.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{N16-1102, 2 | author = "Cohn, Trevor 3 | and Hoang, Cong Duy Vu 4 | and Vymolova, Ekaterina 5 | and Yao, Kaisheng 6 | and Dyer, Chris 7 | and Haffari, Gholamreza", 8 | title = "Incorporating Structural Alignment Biases into an Attentional Neural Translation Model", 9 | booktitle = "Proceedings of NAACL", 10 | year = "2016" 11 | } 12 | @inproceedings{cheng2016agreement, 13 | title={Agreement-based joint training for bidirectional attention-based neural machine translation}, 14 | author={Cheng, Yong and Shen, Shiqi and He, Zhongjun and He, Wei and Wu, Hua and Sun, Maosong and Liu, Yang}, 15 | booktitle={Proceedings of AAAI}, 16 | year={2016} 17 | } 18 | @InProceedings{D16-1159, 19 | author = "Shi, Xing 20 | and Padhi, Inkit 21 | and Knight, Kevin", 22 | title = "Does String-Based Neural MT Learn Source Syntax?", 23 | booktitle = "Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing ", 24 | year = "2016", 25 | } 26 | @InProceedings{P17-1064, 27 | author = "Li, Junhui 28 | and Xiong, Deyi 29 | and Tu, Zhaopeng 30 | and Zhu, Muhua 31 | and Zhang, Min 32 | and Zhou, Guodong", 33 | title = "Modeling Source Syntax for Neural Machine Translation", 34 | booktitle = "Proceedings of ACL", 35 | year = "2017" 36 | } 37 | @InProceedings{P17-1065, 38 | author = "Wu, Shuangzhi 39 | and 
Zhang, Dongdong 40 | and Yang, Nan 41 | and Li, Mu 42 | and Zhou, Ming", 43 | title = "Sequence-to-Dependency Neural Machine Translation", 44 | booktitle = "Proceedings of ACL", 45 | year = "2017" 46 | } 47 | @InProceedings{P17-1140, 48 | author = "Zhang, Jinchao 49 | and Wang, Mingxuan 50 | and Liu, Qun 51 | and Zhou, Jie", 52 | title = "Incorporating Word Reordering Knowledge into Attention-based Neural Machine Translation", 53 | booktitle = "Proceedings of ACL", 54 | year = "2017" 55 | } 56 | @InProceedings{P17-1177, 57 | author = "Chen, Huadong 58 | and Huang, Shujian 59 | and Chiang, David 60 | and Chen, Jiajun", 61 | title = "Improved Neural Machine Translation with a Syntax-Aware Encoder and Decoder", 62 | booktitle = "Proceedings of ACL", 63 | year = "2017" 64 | } 65 | @InProceedings{P17-2012, 66 | author = "Eriguchi, Akiko 67 | and Tsuruoka, Yoshimasa 68 | and Cho, Kyunghyun", 69 | title = "Learning to Parse and Translate Improves Neural Machine Translation", 70 | booktitle = "Proceedings of ACL", 71 | year = "2017" 72 | } 73 | @InProceedings{P17-2021, 74 | author = "Aharoni, Roee 75 | and Goldberg, Yoav", 76 | title = "Towards String-To-Tree Neural Machine Translation", 77 | booktitle = "Proceedings of ACL", 78 | year = "2017" 79 | } 80 | @InProceedings{D17-1012, 81 | author = "Hashimoto, Kazuma 82 | and Tsuruoka, Yoshimasa", 83 | title = "Neural Machine Translation with Source-Side Latent Graph Parsing", 84 | booktitle = "Proceedings of EMNLP", 85 | year = "2017" 86 | } 87 | @InProceedings{D17-1209, 88 | author = "Bastings, Joost 89 | and Titov, Ivan 90 | and Aziz, Wilker 91 | and Marcheggiani, Diego 92 | and Sima'an, Khalil", 93 | title = "Graph Convolutional Encoders for Syntax-aware Neural Machine Translation", 94 | booktitle = "Proceedings of EMNLP", 95 | year = "2017" 96 | } 97 | @InProceedings{D17-1304, 98 | author = "Chen, Kehai 99 | and Wang, Rui 100 | and Utiyama, Masao 101 | and Liu, Lemao 102 | and Tamura, Akihiro 103 | and Sumita, Eiichiro 104 
| and Zhao, Tiejun", 105 | title = "Neural Machine Translation with Source Dependency Representation", 106 | booktitle = "Proceedings of EMNLP", 107 | year = "2017" 108 | } 109 | @InProceedings{N18-1006, 110 | author = "Passban, Peyman 111 | and Liu, Qun 112 | and Way, Andy", 113 | title = "Improving Character-Based Decoding Using Target-Side Morphological Information for Neural Machine Translation ", 114 | booktitle = "Proceedings of NAACL", 115 | year = "2018" 116 | } 117 | @InProceedings{N18-2078, 118 | author = "Marcheggiani, Diego 119 | and Bastings, Joost 120 | and Titov, Ivan", 121 | title = "Exploiting Semantics in Neural Machine Translation with Graph Convolutional Networks ", 122 | booktitle = "Proceedings of NAACL", 123 | year = "2018" 124 | } 125 | @InProceedings{P18-1116, 126 | author = "Ma, Chunpeng 127 | and Tamura, Akihiro 128 | and Utiyama, Masao 129 | and Zhao, Tiejun 130 | and Sumita, Eiichiro", 131 | title = "Forest-Based Neural Machine Translation", 132 | booktitle = "Proceedings of ACL", 133 | year = "2018" 134 | } 135 | @InProceedings{P18-1164, 136 | author = "Kuang, Shaohui 137 | and Li, Junhui 138 | and Branco, Ant{\'o}nio 139 | and Luo, Weihua 140 | and Xiong, Deyi", 141 | title = "Attention Focusing for Neural Machine Translation by Bridging Source and Target Embeddings", 142 | booktitle = "Proceedings of ACL", 143 | year = "2018" 144 | } 145 | @InProceedings{P18-2049, 146 | author = "Ataman, Duygu 147 | and Federico, Marcello", 148 | title = "Compositional Representation of Morphologically-Rich Input for Neural Machine Translation", 149 | booktitle = "Proceedings of ACL", 150 | year = "2018" 151 | } 152 | @InProceedings{P18-1026, 153 | author= "Beck, Daniel 154 | and Haffari, Gholamreza 155 | and Cohn, Trevor", 156 | title= "Graph-to-Sequence Learning using Gated Graph Neural Networks", 157 | booktitle = "Proceedings of ACL", 158 | year= "2018", 159 | } 160 | @InProceedings{P18-2051, 161 | author = "Saunders, Danielle 162 | and 
Stahlberg, Felix 163 | and de Gispert, Adri{\`a} 164 | and Byrne, Bill", 165 | title = "Multi-representation ensembles and delayed SGD updates improve syntax-based NMT", 166 | booktitle = "Proceedings of ACL", 167 | year = "2018" 168 | } 169 | @InProceedings{C18-1110, 170 | author = "Zhang, Wen 171 | and Hu, Jiawei 172 | and Feng, Yang 173 | and Liu, Qun", 174 | title = "Refining Source Representations with Relation Networks for Neural Machine Translation", 175 | booktitle = "Proceedings of COLING", 176 | year = "2018" 177 | } 178 | @InProceedings{C18-1120, 179 | author = "Zaremoodi, Poorya 180 | and Haffari, Gholamreza", 181 | title = "Incorporating Syntactic Uncertainty in Neural Machine Translation with a Forest-to-Sequence Model", 182 | booktitle = "Proceedings of COLING", 183 | year = "2018" 184 | } 185 | @InProceedings{C18-1123, 186 | author = "Zhang, Hao 187 | and Ng, Axel 188 | and Sproat, Richard", 189 | title = "Fast and Accurate Reordering with ITG Transition RNN", 190 | booktitle = "Proceedings of COLING", 191 | year = "2018" 192 | } 193 | @InProceedings{D18-1037, 194 | author = "G{\={u}}, Jetic 195 | and Shavarani, Hassan S. 
196 | and Sarkar, Anoop", 197 | title = "Top-down Tree Structured Decoding with Syntactic Connections for Neural Machine Translation and Parsing", 198 | booktitle = "Proceedings of EMNLP", 199 | year = "2018" 200 | } 201 | @InProceedings{D18-1327, 202 | author = "Currey, Anna 203 | and Heafield, Kenneth", 204 | title = "Multi-Source Syntactic Neural Machine Translation", 205 | booktitle = "Proceedings of EMNLP", 206 | year = "2018" 207 | } 208 | @InProceedings{D18-1509, 209 | author = "Wang, Xinyi 210 | and Pham, Hieu 211 | and Yin, Pengcheng 212 | and Neubig, Graham", 213 | title = "A Tree-based Decoder for Neural Machine Translation", 214 | booktitle = "Proceedings of EMNLP", 215 | year = "2018" 216 | } 217 | @Article{Q18-1017, 218 | author = "Kiperwasser, Eliyahu 219 | and Ballesteros, Miguel", 220 | title = "Scheduled Multi-Task Learning: From Syntax to Translation", 221 | journal = "Transactions of the Association for Computational Linguistics", 222 | year = "2018", 223 | volume = "6", 224 | pages = "225--240" 225 | } 226 | -------------------------------------------------------------------------------- /bib_citations/NMT_prior_knowledge_word_phrase.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{he2016improved, 2 | author = "He, Wei 3 | and He, Zhongjun 4 | and Wu, Hua and 5 | Wang, Haifeng", 6 | title = "Improved Neural Machine Translation with SMT Features.", 7 | booktitle = "Proceedings of AAAI", 8 | year = "2016" 9 | } 10 | @InProceedings{P16-2021, 11 | author = "Mi, Haitao 12 | and Wang, Zhiguo and 13 | Ittycheriah, Abe", 14 | title = "Vocabulary manipulation for neural machine translation", 15 | booktitle = "Proceedings of ACL", 16 | year = "2016" 17 | } 18 | @InProceedings{D16-1162, 19 | author = "Arthur, Philip 20 | and Neubig, Graham 21 | and Nakamura, Satoshi", 22 | title = "Incorporating Discrete Translation Lexicons into Neural Machine Translation", 23 | booktitle = "Proceedings of EMNLP", 
24 | year = "2016" 25 | } 26 | @InProceedings{P17-1139, 27 | author = "Zhang, Jiacheng 28 | and Liu, Yang 29 | and Luan, Huanbo 30 | and Xu, Jingfang 31 | and Sun, Maosong", 32 | title = "Prior Knowledge Integration for Neural Machine Translation using Posterior Regularization", 33 | booktitle = "Proceedings of ACL", 34 | year = "2017" 35 | } 36 | @InProceedings{P17-1141, 37 | author = "Hokamp, Chris 38 | and Liu, Qun", 39 | title = "Lexically Constrained Decoding for Sequence Generation Using Grid Beam Search", 40 | booktitle = "Proceedings of ACL", 41 | year = "2017" 42 | } 43 | @InProceedings{E17-2061, 44 | author = "Yang, Zichao 45 | and Hu, Zhiting 46 | and Deng, Yuntian 47 | and Dyer, Chris 48 | and Smola, Alex", 49 | title = "Neural Machine Translation with Recurrent Attention Modeling", 50 | booktitle = "Proceedings of EACL", 51 | year = "2017" 52 | } 53 | @InProceedings{E17-2025, 54 | author = "Press, Ofir 55 | and Wolf, Lior", 56 | title = "Using the Output Embedding to Improve Language Models", 57 | booktitle = "Proceedings of EACL", 58 | year = "2017" 59 | } 60 | @InProceedings{W17-4716, 61 | author = "Chatterjee, Rajen 62 | and Negri, Matteo 63 | and Turchi, Marco 64 | and Federico, Marcello 65 | and Specia, Lucia 66 | and Blain, Fr{\'e}d{\'e}ric", 67 | title = "Guiding Neural Machine Translation Decoding with External Knowledge", 68 | booktitle = "Proceedings of the Second Conference on Machine Translation", 69 | year = "2017" 70 | } 71 | @InProceedings{D17-1013, 72 | author = "Weng, Rongxiang 73 | and Huang, Shujian 74 | and Zheng, Zaixiang 75 | and Dai, Xin-Yu 76 | and Chen, Jiajun", 77 | title = "Neural Machine Translation with Word Predictions", 78 | booktitle = "Proceedings of EMNLP", 79 | year = "2017" 80 | } 81 | @InProceedings{D17-1146, 82 | author = "Feng, Yang 83 | and Zhang, Shiyue 84 | and Zhang, Andi 85 | and Wang, Dong 86 | and Abel, Andrew", 87 | title = "Memory-augmented Neural Machine Translation", 88 | booktitle = "Proceedings of 
EMNLP", 89 | year = "2017" 90 | } 91 | @InProceedings{D17-1148, 92 | author = "Dahlmann, Leonard 93 | and Matusov, Evgeny 94 | and Petrushkov, Pavel 95 | and Khadivi, Shahram", 96 | title = "Neural Machine Translation Leveraging Phrase-based Models in a Hybrid Search", 97 | booktitle = "Proceedings of EMNLP", 98 | year = "2017" 99 | } 100 | @InProceedings{D17-1149, 101 | author = "Wang, Xing 102 | and Tu, Zhaopeng 103 | and Xiong, Deyi 104 | and Zhang, Min", 105 | title = "Translating Phrases in Neural Machine Translation", 106 | booktitle = "Proceedings of EMNLP", 107 | year = "2017" 108 | } 109 | @InProceedings{D17-1150, 110 | author = "Yang, Baosong 111 | and Wong, Derek F. 112 | and Xiao, Tong 113 | and Chao, Lidia S. 114 | and Zhu, Jingbo", 115 | title = "Towards Bidirectional Hierarchical Representations for Attention-based Neural Machine Translation", 116 | booktitle = "Proceedings of EMNLP", 117 | year = "2017" 118 | } 119 | @InProceedings{huang2017towards, 120 | title={Towards Neural Phrase-based Machine Translation}, 121 | author={Huang, Po-Sen and Wang, Chong and Huang, Sitao and Zhou, Dengyong and Deng, Li}, 122 | booktitle={Proceedings of ICLR}, 123 | year={2017} 124 | } 125 | @InProceedings{N18-1031, 126 | author = "Nguyen, Toan 127 | and Chiang, David", 128 | title = "Improving Lexical Choice in Neural Machine Translation", 129 | booktitle = "Proceedings of NAACL", 130 | year = "2018" 131 | } 132 | @InProceedings{N18-1116, 133 | author = "Chen, Huadong 134 | and Huang, Shujian 135 | and Chiang, David 136 | and Dai, Xinyu 137 | and Chen, Jiajun", 138 | title = "Combining Character and Word Information in Neural Machine Translation Using a Multi-Level Attention", 139 | booktitle = "Proceedings of NAACL", 140 | year = "2018" 141 | } 142 | @InProceedings{N18-1119, 143 | author = "Post, Matt 144 | and Vilar, David", 145 | title = "Fast Lexically Constrained Decoding with Dynamic Beam Allocation for Neural Machine Translation", 146 | booktitle = 
"Proceedings of NAACL", 147 | year = "2018" 148 | } 149 | @InProceedings{N18-1120, 150 | author = "Zhang, Jingyi 151 | and Utiyama, Masao 152 | and Sumita, Eiichro 153 | and Neubig, Graham 154 | and Nakamura, Satoshi", 155 | title = "Guiding Neural Machine Translation with Retrieved Translation Pieces", 156 | booktitle = "Proceedings of NAACL", 157 | year = "2018" 158 | } 159 | @InProceedings{N18-2081, 160 | author = "Hasler, Eva 161 | and de Gispert, Adri{\`a} 162 | and Iglesias, Gonzalo 163 | and Byrne, Bill", 164 | title = "Neural Machine Translation Decoding with Terminology Constraints", 165 | booktitle = "Proceedings of NAACL", 166 | year = "2018" 167 | } 168 | @InProceedings{N18-2083, 169 | author = "Pourdamghani, Nima 170 | and Ghazvininejad, Marjan 171 | and Knight, Kevin", 172 | title = "Using Word Vectors to Improve Word Alignments for Low Resource Machine Translation", 173 | booktitle = "Proceedings of NAACL", 174 | year = "2018" 175 | } 176 | @InProceedings{P18-2053, 177 | author = "Ma, Shuming 178 | and SUN, Xu 179 | and Wang, Yizhong 180 | and Lin, Junyang", 181 | title = "Bag-of-Words as Target for Neural Machine Translation", 182 | booktitle = "Proceedings of ACL", 183 | year = "2018" 184 | } 185 | @InProceedings{C18-1124, 186 | author = "Wang, Mingxuan 187 | and Xie, Jun 188 | and Tan, Zhixing 189 | and Su, Jinsong 190 | and Xiong, Deyi 191 | and Bian, Chao", 192 | title = "Neural Machine Translation with Decoding History Enhanced Attention", 193 | booktitle = "Proceedings of COLING", 194 | year = "2018" 195 | } 196 | @InProceedings{C18-1274, 197 | author = "Ugawa, Arata 198 | and Tamura, Akihiro 199 | and Ninomiya, Takashi 200 | and Takamura, Hiroya 201 | and Okumura, Manabu", 202 | title = "Neural Machine Translation Incorporating Named Entity", 203 | booktitle = "Proceedings of COLING", 204 | year = "2018" 205 | } 206 | @InProceedings{D18-1333, 207 | author = "Wang, Longyue 208 | and Tu, Zhaopeng 209 | and Way, Andy 210 | and Liu, Qun", 211 | 
title = "Learning to Jointly Translate and Predict Dropped Pronouns with a Shared Reconstruction Mechanism", 212 | booktitle = "Proceedings of EMNLP", 213 | year = "2018" 214 | } 215 | @InProceedings{D18-1340, 216 | author = "Cao, Qian 217 | and Xiong, Deyi", 218 | title = "Encoding Gated Translation Memory into Neural Machine Translation", 219 | booktitle = "Proceedings of EMNLP", 220 | year = "2018" 221 | } 222 | @inproceedings{gong2018frage, 223 | title={FRAGE: frequency-agnostic word representation}, 224 | author={Gong, Chengyue and He, Di and Tan, Xu and Qin, Tao and Wang, Liwei and Liu, Tie-Yan}, 225 | booktitle={Proceedings of NeurIPS}, 226 | year={2018} 227 | } 228 | @inproceedings{wang-etal-2019-one, 229 | title = "One Model to Learn Both: Zero Pronoun Prediction and Translation", 230 | author = "Wang, Longyue and 231 | Tu, Zhaopeng and 232 | Wang, Xing and 233 | Shi, Shuming", 234 | year = "2019", 235 | booktitle = "Proceedings of EMNLP", 236 | } -------------------------------------------------------------------------------- /bib_citations/NMT_quality_estimation.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{W15-3037, 2 | author = "Kreutzer, Julia 3 | and Schamoni, Shigehiko 4 | and Riezler, Stefan", 5 | title = "QUality Estimation from ScraTCH (QUETCH): Deep Learning for Word-level Translation Quality Estimation", 6 | booktitle = "Proceedings of the Tenth Workshop on Statistical Machine Translation", 7 | year = "2015" 8 | } 9 | @InProceedings{N16-1059, 10 | author = "Kim, Hyun 11 | and Lee, Jong-Hyeok", 12 | title = "A Recurrent Neural Networks Approach for Estimating the Quality of Machine Translation Output", 13 | booktitle = "Proceedings of NAACL", 14 | year = "2016" 15 | } 16 | @InProceedings{W17-4763, 17 | author = "Kim, Hyun 18 | and Lee, Jong-Hyeok 19 | and Na, Seung-Hoon", 20 | title = "Predictor-Estimator using Multilevel Task Learning with Stack Propagation for Neural Quality 
Estimation", 21 | booktitle = "Proceedings of the Second Conference on Machine Translation", 22 | year = "2017" 23 | } 24 | @InProceedings{E17-1020, 25 | author = "Baskaya, Osman 26 | and Yildiz, Eray 27 | and Tunaoglu, Doruk 28 | and Eren, Mustafa Tolga 29 | and Do{\u{g}}ru{\"o}z, A. Seza", 30 | title = "Integrating Meaning into Quality Evaluation of Machine Translation", 31 | booktitle = "Proceedings of EACL", 32 | year = "2017" 33 | } 34 | @InProceedings{E17-2057, 35 | author = "Graham, Yvette 36 | and Ma, Qingsong 37 | and Baldwin, Timothy 38 | and Liu, Qun 39 | and Parra, Carla 40 | and Scarton, Carolina", 41 | title = "Improving Evaluation of Document-level Machine Translation Quality Estimation", 42 | booktitle = "Proceedings of EACL", 43 | year = "2017" 44 | } 45 | @InProceedings{E17-2060, 46 | author = "Sennrich, Rico", 47 | title = "How Grammatical is Character-level Neural Machine Translation? Assessing MT Quality with Contrastive Translation Pairs", 48 | booktitle = "Proceedings of EACL", 49 | year = "2017" 50 | } 51 | @InProceedings{D17-1263, 52 | author = "Isabelle, Pierre 53 | and Cherry, Colin 54 | and Foster, George", 55 | title = "A Challenge Set Approach to Evaluating Machine Translation", 56 | booktitle = "Proceedings of EMNLP", 57 | year = "2017" 58 | } 59 | @InProceedings{D17-1147, 60 | author = "van der Wees, Marlies 61 | and Bisazza, Arianna 62 | and Monz, Christof", 63 | title = "Dynamic Data Selection for Neural Machine Translation", 64 | booktitle = "Proceedings of EMNLP", 65 | year = "2017" 66 | } 67 | @Article{Q17-1015, 68 | author = "Martins, Andr{\'e} F.T. 69 | and Junczys-Dowmunt, Marcin 70 | and Kepler, Fabio N. 
71 | and Astudillo, Ram{\'o}n 72 | and Hokamp, Chris 73 | and Grundkiewicz, Roman", 74 | title = "Pushing the Limits of Translation Quality Estimation", 75 | journal = "Transactions of the Association for Computational Linguistics", 76 | year = "2017", 77 | volume = "5", 78 | pages = "205--218", 79 | } 80 | @article{li2018unified, 81 | title={A Unified Neural Network for Quality Estimation of Machine Translation}, 82 | author={Li, Maoxi and Xiang, Qingyu and Chen, Zhiming and Wang, Mingwen}, 83 | journal={IEICE Transactions on Information and Systems}, 84 | volume={101}, 85 | number={9}, 86 | pages={2417--2421}, 87 | year={2018}, 88 | publisher={The Institute of Electronics, Information and Communication Engineers} 89 | } 90 | @InProceedings{W18-6451, 91 | author = "Specia, Lucia 92 | and Blain, Fr{\'e}d{\'e}ric 93 | and Logacheva, Varvara 94 | and Astudillo, Ram{\'o}n 95 | and Martins, Andr{\'e} F. T.", 96 | title = "Findings of the WMT 2018 Shared Task on Quality Estimation", 97 | booktitle = "Proceedings of the Third Conference on Machine Translation: Shared Task Papers", 98 | year = "2018" 99 | } 100 | @InProceedings{W18-6314, 101 | author = "Wang, Wei 102 | and Watanabe, Taro 103 | and Hughes, Macduff 104 | and Nakagawa, Tetsuji 105 | and Chelba, Ciprian", 106 | title = "Denoising Neural Machine Translation Training with Trusted Data and Online Data Selection", 107 | booktitle = "Proceedings of the Third Conference on Machine Translation: Research Papers", 108 | year = "2018" 109 | } 110 | @InProceedings{P18-2037, 111 | author = "Schwenk, Holger", 112 | title = "Filtering and Mining Parallel Data in a Joint Multilingual Space", 113 | booktitle = "Proceedings of ACL", 114 | year = "2018" 115 | } 116 | @InProceedings{P18-2105, 117 | author = "Stewart, Craig 118 | and Vogler, Nikolai 119 | and Hu, Junjie 120 | and Boyd-Graber, Jordan 121 | and Neubig, Graham", 122 | title = "Automatic Estimation of Simultaneous Interpreter Performance", 123 | booktitle = 
"Proceedings of ACL", 124 | year = "2018" 125 | } 126 | @InProceedings{C18-1266, 127 | author = "Ive, Julia 128 | and Blain, Fr{\'e}d{\'e}ric 129 | and Specia, Lucia", 130 | title = "deepQuest: A Framework for Neural-based Quality Estimation", 131 | booktitle = "Proceedings of COLING", 132 | year = "2018" 133 | } 134 | @InProceedings{D18-1328, 135 | author = "Pham, Minh Quang 136 | and Crego, Josep 137 | and Senellart, Jean 138 | and Yvon, Fran{\c{c}}ois", 139 | title = "Fixing Translation Divergences in Parallel Corpora for Neural MT", 140 | booktitle = "Proceedings of EMNLP", 141 | year = "2018" 142 | } 143 | @InProceedings{fan2019bilingual, comment = {Citation currently taken from ResearchGate}, 144 | author = {Fan, Kai and Li, Bo and Zhou, Fengming and Wang, Jiayi}, 145 | title = {"Bilingual Expert" Can Find Translation Errors}, 146 | booktitle = {Proceedings of AAAI}, 147 | year = {2019}, 148 | } -------------------------------------------------------------------------------- /bib_citations/NMT_robustness.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{belinkov2017synthetic, 2 | title={Synthetic and Natural Noise Both Break Neural Machine Translation}, 3 | author={Belinkov, Yonatan and Bisk, Yonatan}, 4 | booktitle = {Proceedings of ICLR}, 5 | year = {2018} 6 | } 7 | @inproceedings{zhao2017generating, 8 | title={Generating natural adversarial examples}, 9 | author={Zhao, Zhengli and Dua, Dheeru and Singh, Sameer}, 10 | booktitle = {Proceedings of ICLR}, 11 | year = {2018} 12 | } 13 | @InProceedings{P18-1163, 14 | author = "Cheng, Yong 15 | and Tu, Zhaopeng 16 | and Meng, Fandong 17 | and Zhai, Junjie 18 | and Liu, Yang", 19 | title = "Towards Robust Neural Machine Translation", 20 | booktitle = "Proceedings of ACL", 21 | year = "2018" 22 | } 23 | @InProceedings{P18-1079, 24 | author = "Ribeiro, Marco Tulio 25 | and Singh, Sameer 26 | and Guestrin, Carlos", 27 | title = "Semantically Equivalent 
Adversarial Rules for Debugging NLP models", 28 | booktitle = "Proceedings of ACL", 29 | year = "2018" 30 | } 31 | @InProceedings{C18-1055, 32 | author = "Ebrahimi, Javid 33 | and Lowd, Daniel 34 | and Dou, Dejing", 35 | title = "On Adversarial Examples for Character-Level Neural Machine Translation", 36 | booktitle = "Proceedings of COLING", 37 | year = "2018" 38 | } 39 | @InProceedings{D18-1050, 40 | author = "Michel, Paul 41 | and Neubig, Graham", 42 | title = "MTNT: A Testbed for Machine Translation of Noisy Text", 43 | booktitle = "Proceedings of EMNLP", 44 | year = "2018" 45 | } -------------------------------------------------------------------------------- /bib_citations/NMT_speech_and_simultaneous.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{post2013improved, 2 | title={Improved speech-to-text translation with the Fisher and Callhome Spanish--English speech translation corpus}, 3 | author={Post, Matt and Kumar, Gaurav and Lopez, Adam and Karakos, Damianos and Callison-Burch, Chris and Khudanpur, Sanjeev}, 4 | booktitle={Proceedings of IWSLT}, 5 | year={2013} 6 | } 7 | @inproceedings{kumar2014some, 8 | title={Some insights from translating conversational telephone speech}, 9 | author={Kumar, Gaurav and Post, Matt and Povey, Daniel and Khudanpur, Sanjeev}, 10 | booktitle={Acoustics, Speech and Signal Processing (ICASSP), 2014 IEEE International Conference on}, 11 | year={2014} 12 | } 13 | @InProceedings{N16-1109, 14 | author = "Duong, Long 15 | and Anastasopoulos, Antonios 16 | and Chiang, David 17 | and Bird, Steven 18 | and Cohn, Trevor", 19 | title = "An Attentional Model for Speech Translation Without Transcription", 20 | booktitle = "Proceedings of NAACL", 21 | year = "2016" 22 | } 23 | @InProceedings{D16-1133, 24 | author = "Anastasopoulos, Antonios 25 | and Chiang, David 26 | and Duong, Long", 27 | title = "An Unsupervised Probability Model for Speech-to-Translation Alignment of Low-Resource 
Languages", 28 | booktitle = "Proceedings of EMNLP", 29 | year = "2016" 30 | } 31 | @InProceedings{weiss2017sequence, 32 | author={Weiss, Ron J and Chorowski, Jan and Jaitly, Navdeep and Wu, Yonghui and Chen, Zhifeng}, 33 | title={Sequence-to-sequence models can directly translate foreign speech}, 34 | booktitle={Proceedings of Interspeech}, 35 | year={2017} 36 | } 37 | @InProceedings{E17-1099, 38 | author = "Gu, Jiatao 39 | and Neubig, Graham 40 | and Cho, Kyunghyun 41 | and Li, Victor O.K.", 42 | title = "Learning to Translate in Real-time with Neural Machine Translation", 43 | booktitle = "Proceedings of EACL", 44 | year = "2017" 45 | } 46 | @InProceedings{E17-2076, 47 | author = "Bansal, Sameer 48 | and Kamper, Herman 49 | and Lopez, Adam 50 | and Goldwater, Sharon", 51 | title = "Towards speech-to-text translation without speech recognition", 52 | booktitle = "Proceedings of EACL", 53 | year = "2017" 54 | } 55 | @inproceedings{gu2017non, 56 | title={Non-autoregressive neural machine translation}, 57 | author={Gu, Jiatao and Bradbury, James and Xiong, Caiming and Li, Victor OK and Socher, Richard}, 58 | booktitle={Proceedings of ICLR}, 59 | year={2018} 60 | } 61 | @InProceedings{N18-1008, 62 | author = "Anastasopoulos, Antonios 63 | and Chiang, David", 64 | title = "Tied Multitask Learning for Neural Speech Translation", 65 | booktitle = "Proceedings of NAACL", 66 | year = "2018" 67 | } 68 | @InProceedings{N18-2079, 69 | author = "Dalvi, Fahim 70 | and Durrani, Nadir 71 | and Sajjad, Hassan 72 | and Vogel, Stephan", 73 | title = "Incremental Decoding and Training Methods for Simultaneous Translation in Neural Machine Translation", 74 | booktitle = "Proceedings of NAACL", 75 | year = "2018" 76 | } 77 | @InProceedings{P18-2105, 78 | author = "Stewart, Craig 79 | and Vogler, Nikolai 80 | and Hu, Junjie 81 | and Boyd-Graber, Jordan 82 | and Neubig, Graham", 83 | title = "Automatic Estimation of Simultaneous Interpreter Performance", 84 | booktitle = "Proceedings of 
ACL", 85 | year = "2018" 86 | } 87 | @InProceedings{C18-2020, 88 | author = "Dessloch, Florian 89 | and Ha, Thanh-Le 90 | and M{\"u}ller, Markus 91 | and Niehues, Jan 92 | and Nguyen, Thai Son 93 | and Pham, Ngoc-Quan 94 | and Salesky, Elizabeth 95 | and Sperber, Matthias 96 | and St{\"u}ker, Sebastian 97 | and Zenkel, Thomas 98 | and Waibel, Alexander", 99 | title = "KIT Lecture Translator: Multilingual Speech Translation with One-Shot Learning", 100 | booktitle = "Proceedings of COLING", 101 | year = "2018" 102 | } 103 | @InProceedings{D18-1044, 104 | author = "Wang, Chunqi 105 | and Zhang, Ji 106 | and Chen, Haiqing", 107 | title = "Semi-Autoregressive Neural Machine Translation", 108 | booktitle = "Proceedings of EMNLP", 109 | year = "2018" 110 | } 111 | @InProceedings{D18-1336, 112 | author = "Libovick{\'y}, Jind{\v{r}}ich 113 | and Helcl, Jind{\v{r}}ich", 114 | title = "End-to-End Non-Autoregressive Neural Machine Translation with Connectionist Temporal Classification", 115 | booktitle = "Proceedings of EMNLP", 116 | year = "2018" 117 | } 118 | @InProceedings{D18-1337, 119 | author = "Alinejad, Ashkan 120 | and Siahbani, Maryam 121 | and Sarkar, Anoop", 122 | title = "Prediction Improves Simultaneous Neural Machine Translation", 123 | booktitle = "Proceedings of EMNLP", 124 | year = "2018" 125 | } 126 | @article{ma2018stacl, 127 | title={Stacl: Simultaneous translation with integrated anticipation and controllable latency}, 128 | author={Ma, Mingbo and Huang, Liang and Xiong, Hao and Liu, Kaibo and Zhang, Chuanqiang and He, Zhongjun and Liu, Hairong and Li, Xing and Wang, Haifeng}, 129 | journal={arXiv preprint arXiv:1810.08398}, 130 | year={2018} 131 | } -------------------------------------------------------------------------------- /bib_citations/NMT_training_framework.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{ranzato2016sequence, 2 | title={Sequence level training with recurrent neural 
networks}, 3 | author={Ranzato, Marc'Aurelio and Chopra, Sumit and Auli, Michael and Zaremba, Wojciech}, 4 | booktitle={Proceedings of ICLR}, 5 | year={2016} 6 | } 7 | @inproceedings{luong2016multi, 8 | title={Multi-task sequence to sequence learning}, 9 | author={Luong, Minh-Thang and Le, Quoc V and Sutskever, Ilya and Vinyals, Oriol and Kaiser, Lukasz}, 10 | booktitle={Proceedings of ICLR}, 11 | year={2016} 12 | } 13 | @InProceedings{P16-1159, 14 | author = "Shen, Shiqi 15 | and Cheng, Yong 16 | and He, Zhongjun 17 | and He, Wei 18 | and Wu, Hua 19 | and Sun, Maosong 20 | and Liu, Yang", 21 | title = "Minimum Risk Training for Neural Machine Translation", 22 | booktitle = "Proceedings of ACL", 23 | year = "2016" 24 | } 25 | @InProceedings{D16-1137, 26 | author = "Wiseman, Sam 27 | and Rush, Alexander M.", 28 | title = "Sequence-to-Sequence Learning as Beam-Search Optimization", 29 | booktitle = "Proceedings of EMNLP", 30 | year = "2016" 31 | } 32 | @inproceedings{he2016dual, 33 | title={Dual learning for machine translation}, 34 | author={He, Di and Xia, Yingce and Qin, Tao and Wang, Liwei and Yu, Nenghai and Liu, Tie-Yan and Ma, Wei-Ying}, 35 | booktitle={Proceedings of NIPS}, 36 | year={2016} 37 | } 38 | @inproceedings{sokolov2016stochastic, 39 | title={Stochastic structured prediction under bandit feedback}, 40 | author={Sokolov, Artem and Kreutzer, Julia and Riezler, Stefan and Lo, Christopher}, 41 | booktitle={Proceedings of NIPS}, 42 | year={2016} 43 | } 44 | @inproceedings{bahdanau2017actor, 45 | title={An actor-critic algorithm for sequence prediction}, 46 | author={Bahdanau, Dzmitry and Brakel, Philemon and Xu, Kelvin and Goyal, Anirudh and Lowe, Ryan and Pineau, Joelle and Courville, Aaron and Bengio, Yoshua}, 47 | booktitle={Proceedings of ICLR}, 48 | year={2017} 49 | } 50 | @inproceedings{xia2017dualsupervised, 51 | title={Dual Supervised Learning}, 52 | author={Xia, Yingce and Qin, Tao and Chen, Wei and Bian, Jiang and Yu, Nenghai and Liu, Tieyan}, 
53 | booktitle={Proceedings of ICML}, 54 | pages={3789--3798}, 55 | year={2017} 56 | } 57 | @inproceedings{Xia2017DualInference, 58 | author = {Yingce Xia and 59 | Jiang Bian and 60 | Tao Qin and 61 | Nenghai Yu and 62 | Tie{-}Yan Liu}, 63 | title = {Dual Inference for Machine Learning}, 64 | booktitle = {Proceedings of the Twenty-Sixth International Joint Conference on 65 | Artificial Intelligence, {IJCAI} 2017, Melbourne, Australia, August 66 | 19-25, 2017}, 67 | pages = {3112--3118}, 68 | year = {2017} 69 | } 70 | @InProceedings{P17-1138, 71 | author = "Kreutzer, Julia 72 | and Sokolov, Artem 73 | and Riezler, Stefan", 74 | title = "Bandit Structured Prediction for Neural Sequence-to-Sequence Learning", 75 | booktitle = "Proceedings of ACL", 76 | year = "2017" 77 | } 78 | @inproceedings{he2017decoding, 79 | title={Decoding with value networks for neural machine translation}, 80 | author={He, Di and Lu, Hanqing and Xia, Yingce and Qin, Tao and Wang, Liwei and Liu, Tie-Yan}, 81 | booktitle={Proceedings of NIPS}, 82 | year={2017} 83 | } 84 | @InProceedings{N18-1033, 85 | author = "Edunov, Sergey 86 | and Ott, Myle 87 | and Auli, Michael 88 | and Grangier, David 89 | and Ranzato, Marc'Aurelio", 90 | title = "Classical Structured Prediction Losses for Sequence to Sequence Learning", 91 | booktitle = "Proceedings of NAACL", 92 | year = "2018" 93 | } 94 | @InProceedings{N18-1122, 95 | author = "Yang, Zhen 96 | and Chen, Wei 97 | and Wang, Feng 98 | and Xu, Bo", 99 | title = "Improving Neural Machine Translation with Conditional Sequence Generative Adversarial Nets", 100 | booktitle = "Proceedings of NAACL", 101 | year = "2018" 102 | } 103 | @InProceedings{P18-1155, 104 | author = "Dai, Zihang 105 | and Xie, Qizhe 106 | and Hovy, Eduard", 107 | title = "From Credit Assignment to Entropy Regularization: Two New Algorithms for Neural Sequence Prediction", 108 | booktitle = "Proceedings of ACL", 109 | year = "2018" 110 | } 111 | 
@InProceedings{D18-1149, 112 | author = "Lee, Jason 113 | and Mansimov, Elman 114 | and Cho, Kyunghyun", 115 | title = "Deterministic Non-Autoregressive Neural Sequence Modeling by Iterative Refinement", 116 | booktitle = "Proceedings of EMNLP", 117 | year = "2018" 118 | } 119 | @InProceedings{D18-1217, 120 | author = "Clark, Kevin 121 | and Luong, Minh-Thang 122 | and Manning, Christopher D. 123 | and Le, Quoc", 124 | title = "Semi-Supervised Sequence Modeling with Cross-View Training", 125 | booktitle = "Proceedings of EMNLP", 126 | year = "2018" 127 | } 128 | @InProceedings{D18-1397, 129 | author = "Wu, Lijun 130 | and Tian, Fei 131 | and Qin, Tao 132 | and Lai, Jianhuang 133 | and Liu, Tie-Yan", 134 | title = "A Study of Reinforcement Learning for Neural Machine Translation", 135 | booktitle = "Proceedings of EMNLP", 136 | year = "2018" 137 | } 138 | @InProceedings{D18-1398, 139 | author = "Gu, Jiatao 140 | and Wang, Yong 141 | and Chen, Yun 142 | and Li, Victor O. K. 143 | and Cho, Kyunghyun", 144 | title = "Meta-Learning for Low-Resource Neural Machine Translation", 145 | booktitle = "Proceedings of EMNLP", 146 | year = "2018" 147 | } 148 | @InProceedings{D18-1406, 149 | author = "Yavuz, Semih 150 | and Chiu, Chung-Cheng 151 | and Nguyen, Patrick 152 | and Wu, Yonghui", 153 | title = "CaLcs: Continuously Approximating Longest Common Subsequence for Sequence Level Optimization", 154 | booktitle = "Proceedings of EMNLP", 155 | year = "2018" 156 | } 157 | @InProceedings{shah2018generative, 158 | author = {Shah, Harshil and 159 | Barber, David}, 160 | title = {Generative Neural Machine Translation}, 161 | booktitle = {Proceedings of NeurIPS}, 162 | year = {2018} 163 | } 164 | @InProceedings{wu2018learning, 165 | author = {Wu, Lijun and 166 | Tian, Fei and 167 | Xia, Yingce and 168 | Fan, Yang and 169 | Qin, Tao and 170 | Lai, Jianhuang and 171 | Liu, Tie{-}Yan}, 172 | title = {Learning to Teach with Dynamic Loss Functions}, 173 | booktitle = {Proceedings of 
NeurIPS}, 174 | year = {2018} 175 | } 176 | @inproceedings{wang2019multi, 177 | title={Multi-Agent Dual Learning}, 178 | author={Wang, Yiren and Xia, Yingce and He, Tianyu and Tian, Fei and Qin, Tao and Zhai, ChengXiang and Liu, Tie-Yan}, 179 | booktitle={Proceedings of ICLR}, 180 | year={2019} 181 | } 182 | @inproceedings{chen2019improving, 183 | title={Improving Sequence-to-Sequence Learning via Optimal Transport}, 184 | author={Chen, Liqun and Zhang, Yizhe and Zhang, Ruiyi and Tao, Chenyang and Gan, Zhe and Zhang, Haichao and Li, Bai and Shen, Dinghan and Chen, Changyou and Carin, Lawrence}, 185 | booktitle={Proceedings of ICLR}, 186 | year={2019} 187 | } 188 | @inproceedings{kumar2019von, 189 | title={Von Mises-Fisher Loss for Training Sequence to Sequence Models with Continuous Outputs}, 190 | author={Kumar, Sachin and Tsvetkov, Yulia}, 191 | booktitle={Proceedings of ICLR}, 192 | year={2019} 193 | } 194 | @inproceedings{bi-etal-2019-multi, 195 | title = "Multi-agent Learning for Neural Machine Translation", 196 | author = "Bi, Tianchi and 197 | Xiong, Hao and 198 | He, Zhongjun and 199 | Wu, Hua and 200 | Wang, Haifeng", 201 | booktitle = "Proceedings of EMNLP", year = "2019", 202 | } -------------------------------------------------------------------------------- /bib_citations/NMT_tutorials_and_challenges.bib: -------------------------------------------------------------------------------- 1 | @misc{thang2016neural, 2 | author = {Luong, Thang 3 | and Cho, Kyunghyun 4 | and Manning, Christopher}, 5 | title = {Neural Machine Translation}, 6 | howpublished = {ACL Tutorial}, 7 | year = {2016}, 8 | } 9 | @article{neubig2017neural, 10 | author = {Neubig, Graham}, 11 | title = {Neural Machine Translation and Sequence-to-sequence Models: {A} Tutorial}, 12 | journal = {CoRR}, 13 | year = {2017} 14 | } 15 | @misc{vinyals2017seq2seq, 16 | author = {Vinyals, Oriol 17 | and Jaitly, Navdeep}, 18 | title = {Seq2Seq ICML Tutorial}, 19 | howpublished = {ICML Tutorial}, 20 | year = {2017}, 
21 | } 22 | @article{philipp2017neural, 23 | author = {Koehn, Philipp}, 24 | title = {Neural Machine Translation}, 25 | journal = {CoRR}, 26 | volume = {abs/1709.07809}, 27 | year = {2017} 28 | } 29 | @InProceedings{W17-3204, 30 | author = "Koehn, Philipp 31 | and Knowles, Rebecca", 32 | title = "Six Challenges for Neural Machine Translation", 33 | booktitle = "Proceedings of the First Workshop on Neural Machine Translation", 34 | year = "2017" 35 | } 36 | -------------------------------------------------------------------------------- /bib_citations/SMT_discriminative_training.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{P02-1038, 2 | author = "Och, Franz Josef 3 | and Ney, Hermann ", 4 | title = "Discriminative Training and Maximum Entropy Models for Statistical Machine Translation", 5 | booktitle = "Proceedings of ACL", 6 | year = "2002" 7 | } 8 | @inproceedings{mrt4smt, 9 | title={Minimum error rate training in statistical machine translation}, 10 | author={Och, Franz Josef}, 11 | booktitle={Proceedings of ACL}, 12 | year={2003} 13 | } 14 | @InProceedings{D07-1080, 15 | author = "Watanabe, Taro 16 | and Suzuki, Jun 17 | and Tsukada, Hajime 18 | and Isozaki, Hideki", 19 | title = "Online Large-Margin Training for Statistical Machine Translation", 20 | booktitle = "Proceedings of EMNLP-CoNLL", 21 | year = "2007", 22 | url = "http://aclweb.org/anthology/D07-1080" 23 | } 24 | @InProceedings{N09-1025, 25 | author = "Chiang, David 26 | and Knight, Kevin 27 | and Wang, Wei", 28 | title = "11,001 New Features for Statistical Machine Translation", 29 | booktitle = "Proceedings of NAACL", 30 | year = "2009" 31 | } -------------------------------------------------------------------------------- /bib_citations/SMT_human_centered.bib: -------------------------------------------------------------------------------- 1 | @article{foster1997target, 2 | author = "Foster, George and Isabelle, Pierre and Plamondon, 
Pierre", 3 | title = "Target-Text Mediated Interactive Machine Translation", 4 | journal = "Machine Translation", 5 | year = "1997", 6 | volume = "12", 7 | pages = "175--194" 8 | } 9 | @article{langlais2002transtype, 10 | author = "Langlais, Philippe and Lapalme, Guy and Lorange, Marie", 11 | title = "{TransType}: Development-Evaluation Cycles to Boost Translator's Productivity", 12 | journal = "Machine Translation", 13 | volume = "17", 14 | number = "2", 15 | pages = "77--98", 16 | year = "2002" 17 | } 18 | @inproceedings{tomas2006statistical, 19 | title = "Statistical Phrase-Based Models for Interactive Computer-Assisted Translation", 20 | author = "Tom{\'a}s, Jes{\'u}s and Casacuberta, Francisco", 21 | booktitle = "Proceedings of the International Conference on Computational Linguistics/Association for Computational Linguistics", 22 | pages = "835--841", 23 | year = "2006" 24 | } 25 | @article{vidal2006computer, 26 | title = "Computer-assisted translation using speech recognition", 27 | author = "Vidal, Enrique and Casacuberta, Francisco and Rodriguez, Luis and Civera, Jorge and Hinarejos, Carlos D Mart{\'\i}nez", 28 | journal = "IEEE Transactions on Audio, Speech, and Language Processing", 29 | volume = "14", 30 | number = "3", 31 | pages = "941--951", 32 | year = "2006", 33 | publisher = "IEEE" 34 | } 35 | @article{khadivi2008integration, 36 | title = "Integration of speech recognition and machine translation in computer-assisted translation", 37 | author = "Khadivi, Shahram and Ney, Hermann", 38 | journal = "IEEE Transactions on Audio, Speech, and Language Processing", 39 | volume = "16", 40 | number = "8", 41 | pages = "1551--1564", 42 | year = "2008", 43 | publisher = "IEEE" 44 | } 45 | @article{barrachina2009statistical, 46 | author = "Barrachina, Sergio and Bender, Oliver and Casacuberta, Francisco and Civera, Jorge and Cubel, Elsa and Khadivi, Shahram and Lagarda, Antonio and Ney, Hermann and Tom\'{a}s, Jes\'{u}s and Vidal, Enrique and Vilar, Juan-Miguel", 
47 | title = "Statistical Approaches to Computer-Assisted Translation", 48 | journal = "Computational Linguistics", 49 | volume = "35", 50 | number = "1", 51 | year = "2009", 52 | pages = "3--28" 53 | } 54 | @article{casacuberta2009human, 55 | title = "Human interaction for high-quality machine translation", 56 | author = "Casacuberta, Francisco and Civera, Jorge and Cubel, Elsa and Lagarda, Antonio L and Lapalme, Guy and Macklovitch, Elliott and Vidal, Enrique", 57 | journal = "Communications of the ACM", 58 | volume = "52", 59 | number = "10", 60 | pages = "135--138", 61 | year = "2009" 62 | } 63 | @article{alabau2014improving, 64 | author = "Alabau, Vicent and Sanchis, Alberto and Casacuberta, Francisco", 65 | title = "Improving On-line Handwritten Recognition in Interactive Machine Translation", 66 | journal = "Pattern Recognition", 67 | year = "2014", 68 | volume = "47", 69 | number = "3", 70 | pages = "1217--1228" 71 | } 72 | @InProceedings{cheng2016primt, 73 | author = "Cheng, Shanbo and Huang, Shujian and Chen, Huadong and Dai, Xin-Yu and Chen, Jiajun", 74 | title = "{PRIMT}: A Pick-Revise Framework for Interactive Machine Translation", 75 | booktitle = "Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies", 76 | year = "2016", 77 | pages = "1240--1249" 78 | } 79 | 80 | @article{domingo2018segment, 81 | title = "Segment-based interactive-predictive machine translation", 82 | author = "Domingo, Miguel and Peris, {\'A}lvaro and Casacuberta, Francisco", 83 | journal = "Machine Translation", 84 | pages = "1--23", 85 | year = "2018" 86 | } 87 | @article{martinez2012online, 88 | author = "Mart\'{i}nez-G\'{o}mez, Pascual and Sanchis-Trilles, Germ\'{a}n and Casacuberta, Francisco", 89 | title = "Online Adaptation Strategies for Statistical Machine Translation in Post-Editing Scenarios", 90 | journal = "Pattern Recognition", 91 | year = "2012", 92 | volume = "45", 93 | number = 
"9", 94 | pages = "3193--3203" 95 | } 96 | 97 | @article{gonzalez14cost, 98 | title= "Cost-sensitive active learning for computer-assisted translation", 99 | author= "Gonz{\'a}lez-Rubio, Jes{\'u}s and Casacuberta, Francisco", 100 | journal= "Pattern Recognition Letters", 101 | volume= "37", 102 | pages= "124--134", 103 | year= "2014" 104 | } 105 | @article{lagarda15translating, 106 | title = "Translating without in-domain corpus: Machine translation post-editing with online learning techniques", 107 | author = "Lagarda, Antonio L and Ortiz-Mart{\'\i}nez, Daniel and Alabau, Vicent and Casacuberta, Francisco", 108 | journal = "Computer Speech \& Language", 109 | volume = "32", 110 | number = "1", 111 | pages = "109--134", 112 | year = "2015" 113 | } 114 | @article{sanchis2015improving, 115 | title = "Improving translation quality stability using Bayesian predictive adaptation", 116 | author = "Sanchis-Trilles, Germ{\'a}n and Casacuberta, Francisco", 117 | journal = "Computer Speech \& Language", 118 | volume = "34", 119 | number = "1", 120 | pages = "1--17", 121 | year = "2015" 122 | } 123 | @article{ortiz16online, 124 | title = "Online Learning for Statistical Machine Translation", 125 | author = "Ortiz-Mart{\'\i}nez, Daniel", 126 | journal = "Computational Linguistics", 127 | volume = "42", 128 | number = "1", 129 | pages = "121--161", 130 | year = "2016" 131 | } -------------------------------------------------------------------------------- /bib_citations/SMT_phrase_based.bib: -------------------------------------------------------------------------------- 1 | @inproceedings{spbt, 2 | title={Statistical phrase-based translation}, 3 | author={Koehn, Philipp and Och, Franz Josef and Marcu, Daniel}, 4 | booktitle={Proceedings of NAACL}, 5 | year={2003} 6 | } 7 | @InProceedings{D08-1089, 8 | author = "Galley, Michel 9 | and Manning, Christopher D.", 10 | title = "A Simple and Effective Hierarchical Phrase Reordering Model", 11 | booktitle = "Proceedings of EMNLP", 12 
| year = "2008" 13 | } 14 | -------------------------------------------------------------------------------- /bib_citations/SMT_syntax_based.bib: -------------------------------------------------------------------------------- 1 | @Article{J97-3002, 2 | author = "Wu, Dekai", 3 | title = "Stochastic Inversion Transduction Grammars and Bilingual Parsing of Parallel Corpora", 4 | journal = "Computational Linguistics", 5 | year = "1997", 6 | volume = "23", 7 | number = "3", 8 | url = "http://aclweb.org/anthology/J97-3002" 9 | } 10 | @InProceedings{P06-1121, 11 | author = "Galley, Michel 12 | and Graehl, Jonathan 13 | and Knight, Kevin 14 | and Marcu, Daniel 15 | and DeNeefe, Steve 16 | and Wang, Wei 17 | and Thayer, Ignacio", 18 | title = "Scalable Inference and Training of Context-Rich Syntactic Translation Models", 19 | booktitle = "Proceedings of COLING/ACL", 20 | year = "2006" 21 | } 22 | @InProceedings{P06-1077, 23 | author = "Liu, Yang (1) 24 | and Liu, Qun 25 | and Lin, Shouxun", 26 | title = "Tree-to-String Alignment Template for Statistical Machine Translation", 27 | booktitle = "Proceedings of COLING/ACL", 28 | year = "2006" 29 | } 30 | @InProceedings{P06-1066, 31 | author = "Xiong, Deyi 32 | and Liu, Qun 33 | and Lin, Shouxun", 34 | title = "Maximum Entropy Based Phrase Reordering Model for Statistical Machine Translation", 35 | booktitle = "Proceedings of COLING/ACL", 36 | year = "2006" 37 | } 38 | @article{hpbt, 39 | title={Hierarchical phrase-based translation}, 40 | author={Chiang, David}, 41 | journal={computational linguistics}, 42 | volume={33}, 43 | number={2}, 44 | pages={201--228}, 45 | year={2007}, 46 | publisher={MIT Press} 47 | } 48 | @InProceedings{P07-1019, 49 | author = "Huang, Liang 50 | and Chiang, David", 51 | title = "Forest Rescoring: Faster Decoding with Integrated Language Models", 52 | booktitle = "Proceedings of ACL", 53 | year = "2007" 54 | } 55 | @InProceedings{P08-1023, 56 | author = "Mi, Haitao 57 | and Huang, Liang 58 | and Liu, 
Qun", 59 | title = "Forest-Based Translation", 60 | booktitle = "Proceedings of ACL", 61 | year = "2008" 62 | } 63 | @InProceedings{P08-1064, 64 | author = "Zhang, Min 65 | and Jiang, Hongfei 66 | and Aw, Aiti 67 | and Li, Haizhou 68 | and Tan, Chew Lim 69 | and Li, Sheng", 70 | title = "A Tree Sequence Alignment-based Tree-to-Tree Translation Model", 71 | booktitle = "Proceedings of ACL", 72 | year = "2008" 73 | } 74 | @InProceedings{P08-1066, 75 | author = "Shen, Libin 76 | and Xu, Jinxi 77 | and Weischedel, Ralph", 78 | title = "A New String-to-Dependency Machine Translation Algorithm with a Target Dependency Language Model", 79 | booktitle = "Proceedings of ACL", 80 | year = "2008" 81 | } 82 | @InProceedings{D08-1022, 83 | author = "Mi, Haitao 84 | and Huang, Liang", 85 | title = "Forest-based Translation Rule Extraction", 86 | booktitle = "Proceedings of EMNLP", 87 | year = "2008", 88 | } 89 | @InProceedings{P09-1063, 90 | author = "Liu, Yang 91 | and L{\"u}, Yajuan 92 | and Liu, Qun", 93 | title = "Improving Tree-to-Tree Translation with Packed Forests", 94 | booktitle = "Proceedings of ACL/IJCNLP", 95 | year = "2009" 96 | } 97 | @InProceedings{P10-1146, 98 | author = "Chiang, David", 99 | title = "Learning to Translate with Source and Target Syntax", 100 | booktitle = "Proceedings of ACL", 101 | year = "2010" 102 | } 103 | -------------------------------------------------------------------------------- /bib_citations/SMT_system_combination.bib: -------------------------------------------------------------------------------- 1 | @InProceedings{P07-1040, 2 | author = "Rosti, Antti-Veikko 3 | and Matsoukas, Spyros 4 | and Schwartz, Richard", 5 | title = "Improved Word-Level System Combination for Machine Translation", 6 | booktitle = "Proceedings of ACL", 7 | year = "2007" 8 | } 9 | @InProceedings{D08-1011, 10 | author = "He, Xiaodong 11 | and Yang, Mei 12 | and Gao, Jianfeng 13 | and Nguyen, Patrick 14 | and Moore, Robert", 15 | title = "Indirect-HMM-based 
Hypothesis Alignment for Combining Outputs from Machine Translation Systems", 16 | booktitle = "Proceedings of EMNLP", 17 | year = "2008" 18 | } -------------------------------------------------------------------------------- /bib_citations/SMT_tutorials.bib: -------------------------------------------------------------------------------- 1 | @misc{koehn2006statistical, 2 | title={Statistical machine translation: the basic, the novel, and the speculative}, 3 | author={Koehn, Philipp}, 4 | howpublished={EACL Tutorial}, 5 | year={2006} 6 | } 7 | @article{Lopez2008statistical, 8 | author = {Lopez, Adam}, 9 | title = {Statistical Machine Translation}, 10 | journal = {ACM Comput. Surv.}, 11 | issue_date = {August 2008}, 12 | volume = {40}, 13 | number = {3}, 14 | month = aug, 15 | year = {2008}, 16 | issn = {0360-0300}, 17 | pages = {8:1--8:49}, 18 | articleno = {8}, 19 | numpages = {49}, 20 | url = {http://doi.acm.org/10.1145/1380584.1380586}, 21 | doi = {10.1145/1380584.1380586}, 22 | acmid = {1380586}, 23 | publisher = {ACM}, 24 | address = {New York, NY, USA}, 25 | keywords = {Natural language processing, machine translation}, 26 | } 27 | -------------------------------------------------------------------------------- /bib_citations/SMT_word_based.bib: -------------------------------------------------------------------------------- 1 | @article{mathsmt, 2 | title={The mathematics of statistical machine translation: Parameter estimation}, 3 | author={Brown, Peter F and Pietra, Vincent J Della and Pietra, Stephen A Della and Mercer, Robert L}, 4 | journal={Computational linguistics}, 5 | volume={19}, 6 | number={2}, 7 | pages={263--311}, 8 | year={1993}, 9 | publisher={MIT Press} 10 | } 11 | @InProceedings{C96-2141, 12 | author = "Vogel, Stephan 13 | and Ney, Hermann 14 | and Tillmann, Christoph", 15 | title = "HMM-Based Word Alignment in Statistical Translation", 16 | booktitle = "Proceedings of COLING", 17 | year = "1996", 18 | } 19 | @Article{J03-1002, 20 | author = 
"Och, Franz Josef 21 | and Ney, Hermann", 22 | title = "A Systematic Comparison of Various Statistical Alignment Models", 23 | journal = "Computational Linguistics", 24 | year = "2003", 25 | volume = "29", 26 | number = "1", 27 | url = "http://aclweb.org/anthology/J03-1002" 28 | } 29 | @InProceedings{N06-1014, 30 | author = "Liang, Percy 31 | and Taskar, Ben 32 | and Klein, Dan", 33 | title = "Alignment by Agreement", 34 | booktitle = "Proceedings of NAACL", 35 | year = "2006" 36 | } 37 | @InProceedings{N13-1073, 38 | author = "Dyer, Chris 39 | and Chahuneau, Victor 40 | and Smith, Noah A.", 41 | title = "A Simple, Fast, and Effective Reparameterization of IBM Model 2", 42 | booktitle = "Proceedings of NAACL", 43 | year = "2013" 44 | } 45 | -------------------------------------------------------------------------------- /bib_citations/Word_Translation.bib: -------------------------------------------------------------------------------- 1 | @article{mikolov2013exploiting, 2 | author = {Mikolov, Tomas and 3 | Le, Quoc and 4 | Sutskever, Ilya}, 5 | title = {Exploiting Similarities among Languages for Machine Translation}, 6 | journal={arXiv preprint arXiv:1309.4168}, 7 | year = {2013} 8 | } 9 | @InProceedings{N15-1104, 10 | author = "Xing, Chao 11 | and Wang, Dong 12 | and Liu, Chao 13 | and Lin, Yiye", 14 | title = "Normalized Word Embedding and Orthogonal Transform for Bilingual Word Translation", 15 | booktitle = "Proceedings of NAACL", 16 | year = "2015" 17 | } 18 | @InProceedings{dinu2015improving, 19 | title={Improving Zero-shot Learning by Mitigating the Hubness Problem}, 20 | 21 | author={Dinu, Georgiana and Lazaridou, Angeliki and Baroni, Marco}, 22 | booktitle={Proceedings of ICLR}, 23 | year={2015} 24 | } 25 | @inproceedings{zhang2016building, 26 | title={Building Earth Mover's Distance on Bilingual Word Embeddings for Machine Translation}, 27 | author={Zhang, Meng and Liu, Yang and Luan, Huan-Bo and Sun, 
Maosong and Izuha, Tatsuya and Hao, Jie}, 28 | booktitle={AAAI}, 29 | year={2016} 30 | } 31 | @InProceedings{C16-1300, 32 | author = "Zhang, Meng 33 | and Liu, Yang 34 | and Luan, Huanbo 35 | and Liu, Yiqun 36 | and Sun, Maosong", 37 | title = "Inducing Bilingual Lexica From Non-Parallel Data With Earth Mover's Distance Regularization", 38 | booktitle = "Proceedings of COLING", 39 | year = "2016" 40 | } 41 | @InProceedings{P16-1024, 42 | author = "Vuli{\'{c}}, Ivan 43 | and Korhonen, Anna", 44 | title = "On the Role of Seed Lexicons in Learning Bilingual Word Embeddings", 45 | booktitle = "Proceedings of ACL", 46 | year = "2016" 47 | } 48 | @InProceedings{D16-1250, 49 | author = "Artetxe, Mikel 50 | and Labaka, Gorka 51 | and Agirre, Eneko", 52 | title = "Learning principled bilingual mappings of word embeddings while preserving monolingual invariance", 53 | booktitle = "Proceedings of EMNLP", 54 | year = "2016" 55 | } 56 | @inproceedings{zhang2017bilingual, 57 | title={Bilingual Lexicon Induction from Non-Parallel Data with Minimal Supervision.}, 58 | author={Zhang, Meng and Peng, Haoruo and Liu, Yang and Luan, Huan-Bo and Sun, Maosong}, 59 | booktitle={AAAI}, 60 | year={2017} 61 | } 62 | @Article{J17-2001, 63 | author = "Irvine, Ann 64 | and Callison-Burch, Chris", 65 | title = "A Comprehensive Analysis of Bilingual Lexicon Induction", 66 | journal = "Computational Linguistics", 67 | year = "2017", 68 | volume = "43", 69 | number = "2", 70 | pages = "273--310" 71 | } 72 | @InProceedings{P17-1042, 73 | author = "Artetxe, Mikel 74 | and Labaka, Gorka 75 | and Agirre, Eneko", 76 | title = "Learning bilingual word embeddings with (almost) no bilingual data", 77 | booktitle = "Proceedings of ACL", 78 | year = "2017" 79 | } 80 | @InProceedings{P17-1179, 81 | author = "Zhang, Meng 82 | and Liu, Yang 83 | and Luan, Huanbo 84 | and Sun, Maosong", 85 | title = "Adversarial Training for Unsupervised Bilingual Lexicon Induction", 86 | booktitle = "Proceedings of ACL", 87 | 
year = "2017" 88 | } 89 | @InProceedings{E17-1102, 90 | author = "Heyman, Geert 91 | and Vuli{\'{c}}, Ivan 92 | and Moens, Marie-Francine", 93 | title = "Bilingual Lexicon Induction by Learning to Combine Word-Level and Character-Level Representations", 94 | booktitle = "Proceedings of EACL", 95 | year = "2017" 96 | } 97 | @InProceedings{E17-2098, 98 | author = "Hauer, Bradley 99 | and Nicolai, Garrett 100 | and Kondrak, Grzegorz", 101 | title = "Bootstrapping Unsupervised Bilingual Lexicon Induction", 102 | booktitle = "Proceedings of EACL", 103 | year = "2017" 104 | } 105 | @InProceedings{E17-2103, 106 | author = "Kim, Yunsu 107 | and Schamper, Julian 108 | and Ney, Hermann", 109 | title = "Unsupervised Training for Large Vocabulary Translation Using Sparse Lexicon and Word Classes", 110 | booktitle = "Proceedings of EACL", 111 | year = "2017" 112 | } 113 | @InProceedings{D17-1152, 114 | author = "Wijaya, Derry Tanti 115 | and Callahan, Brendan 116 | and Hewitt, John 117 | and Gao, Jie 118 | and Ling, Xiao 119 | and Apidianaki, Marianna 120 | and Callison-Burch, Chris", 121 | title = "Learning Translations via Matrix Completion", 122 | booktitle = "Proceedings of EMNLP", 123 | year = "2017" 124 | } 125 | @InProceedings{D17-1207, 126 | author = "Zhang, Meng 127 | and Liu, Yang 128 | and Luan, Huanbo 129 | and Sun, Maosong", 130 | title = "Earth Mover's Distance Minimization for Unsupervised Bilingual Lexicon Induction", 131 | booktitle = "Proceedings of EMNLP", 132 | year = "2017" 133 | } 134 | @InProceedings{D17-1264, 135 | author = "Nakashole, Ndapandula 136 | and Flauger, Raphael", 137 | title = "Knowledge Distillation for Bilingual Dictionary Induction", 138 | booktitle = "Proceedings of EMNLP", 139 | year = "2017" 140 | } 141 | @Article{Q18-1014, 142 | author = "Aldarmaki, Hanan 143 | and Mohan, Mahesh 144 | and Diab, Mona", 145 | title = "Unsupervised Word Mapping Using Structural Similarities in Monolingual Embeddings", 146 | journal = "Transactions of the 
Association for Computational Linguistics", 147 | year = "2018", 148 | volume = "6", 149 | pages = "185--196" 150 | } 151 | @InProceedings{conneau2017word, 152 | title={Word translation without parallel data}, 153 | author={Conneau, Alexis and Lample, Guillaume and Ranzato, Marc'Aurelio and Denoyer, Ludovic and J{\'e}gou, Herv{\'e}}, 154 | booktitle={Proceedings of ICLR}, 155 | year={2018} 156 | } 157 | @InProceedings{N18-2030, 158 | author = "Braune, Fabienne 159 | and Hangya, Viktor 160 | and Eder, Tobias 161 | and Fraser, Alexander", 162 | title = "Evaluating bilingual word embeddings on the long tail", 163 | booktitle = "Proceedings of NAACL", 164 | year = "2018" 165 | } 166 | @InProceedings{P18-2036, 167 | author = "Nakashole, Ndapa 168 | and Flauger, Raphael", 169 | title = "Characterizing Departures from Linearity in Word Translation", 170 | booktitle = "Proceedings of ACL", 171 | year = "2018" 172 | } 173 | @InProceedings{P18-1072, 174 | author = "S{\o}gaard, Anders 175 | and Ruder, Sebastian 176 | and Vuli{\'{c}}, Ivan", 177 | title = "On the Limitations of Unsupervised Bilingual Dictionary Induction", 178 | booktitle = "Proceedings of ACL", 179 | year = "2018" 180 | } 181 | @InProceedings{P18-1073, 182 | author = "Artetxe, Mikel 183 | and Labaka, Gorka 184 | and Agirre, Eneko", 185 | title = "A robust self-learning method for fully unsupervised cross-lingual mappings of word embeddings", 186 | booktitle = "Proceedings of ACL", 187 | year = "2018" 188 | } 189 | @InProceedings{P18-2062, 190 | author = "Riley, Parker 191 | and Gildea, Daniel", 192 | title = "Orthographic Features for Bilingual Lexicon Induction", 193 | booktitle = "Proceedings of ACL", 194 | year = "2018" 195 | } 196 | @InProceedings{C18-1080, 197 | author = "Hazem, Amir 198 | and Morin, Emmanuel", 199 | title = "Leveraging Meta-Embeddings for Bilingual Lexicon Extraction from Specialized Comparable Corpora", 200 | booktitle = "Proceedings of COLING", 201 | year = "2018" 202 | } 203 | 
@InProceedings{D18-1023, 204 | author = "Huang, Lifu 205 | and Cho, Kyunghyun 206 | and Zhang, Boliang 207 | and Ji, Heng 208 | and Knight, Kevin", 209 | title = "Multi-lingual Common Semantic Space Construction via Cluster-consistent Word Embedding", 210 | booktitle = "Proceedings of EMNLP", 211 | year = "2018" 212 | } 213 | @InProceedings{D18-1024, 214 | author = "Chen, Xilun 215 | and Cardie, Claire", 216 | title = "Unsupervised Multilingual Word Embeddings", 217 | booktitle = "Proceedings of EMNLP", 218 | year = "2018" 219 | } 220 | @InProceedings{D18-1025, 221 | author = "Chi, Ta Chung 222 | and Chen, Yun-Nung", 223 | title = "CLUSE: Cross-Lingual Unsupervised Sense Embeddings", 224 | booktitle = "Proceedings of EMNLP", 225 | year = "2018", 226 | } 227 | @InProceedings{D18-1027, 228 | author = "Doval, Yerai 229 | and Camacho-Collados, Jose 230 | and Espinosa Anke, Luis 231 | and Schockaert, Steven", 232 | title = "Improving Cross-Lingual Word Embeddings by Meeting in the Middle", 233 | booktitle = "Proceedings of EMNLP", 234 | year = "2018" 235 | } 236 | @InProceedings{D18-1042, 237 | author = "Ruder, Sebastian 238 | and Cotterell, Ryan 239 | and Kementchedjhieva, Yova 240 | and S{\o}gaard, Anders", 241 | title = "A Discriminative Latent-Variable Model for Bilingual Lexicon Induction", 242 | booktitle = "Proceedings of EMNLP", 243 | year = "2018" 244 | } 245 | @InProceedings{D18-1043, 246 | author = "Hoshen, Yedid 247 | and Wolf, Lior", 248 | title = "Non-Adversarial Unsupervised Word Translation", 249 | booktitle = "Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing", 250 | year = "2018", 251 | publisher = "Association for Computational Linguistics", 252 | pages = "469--478", 253 | location = "Brussels, Belgium", 254 | url = "http://aclweb.org/anthology/D18-1043" 255 | } 256 | @InProceedings{D18-1047, 257 | author = "Nakashole, Ndapa", 258 | title = "NORMA: Neighborhood Sensitive Maps for Multilingual Word Embeddings", 259 
| booktitle = "Proceedings of EMNLP", 260 | year = "2018" 261 | } 262 | @InProceedings{D18-1056, 263 | author = "Hartmann, Mareike 264 | and Kementchedjhieva, Yova 265 | and S{\o}gaard, Anders", 266 | title = "Why is unsupervised alignment of English embeddings from different algorithms so hard?", 267 | booktitle = "Proceedings of EMNLP", 268 | year = "2018" 269 | } 270 | @InProceedings{D18-1062, 271 | author = "Dou, Zi-Yi 272 | and Zhou, Zhi-Hao 273 | and Huang, Shujian", 274 | title = "Unsupervised Bilingual Lexicon Induction via Latent Variable Models", 275 | booktitle = "Proceedings of EMNLP", 276 | year = "2018" 277 | } 278 | @InProceedings{D18-1063, 279 | author = "Mukherjee, Tanmoy 280 | and Yamada, Makoto 281 | and Hospedales, Timothy", 282 | title = "Learning Unsupervised Word Translations Without Adversaries", 283 | booktitle = "Proceedings of EMNLP", 284 | year = "2018" 285 | } 286 | @InProceedings{D18-1214, 287 | author = "Alvarez-Melis, David 288 | and Jaakkola, Tommi", 289 | title = "Gromov-Wasserstein Alignment of Word Embedding Spaces", 290 | booktitle = "Proceedings of EMNLP", 291 | year = "2018" 292 | } 293 | @InProceedings{D18-1268, 294 | author = "Xu, Ruochen 295 | and Yang, Yiming 296 | and Otani, Naoki 297 | and Wu, Yuexin", 298 | title = "Unsupervised Cross-lingual Transfer of Word Embedding Spaces", 299 | booktitle = "Proceedings of EMNLP", 300 | year = "2018" 301 | } 302 | @InProceedings{D18-1330, 303 | author = "Joulin, Armand 304 | and Bojanowski, Piotr 305 | and Mikolov, Tomas 306 | and J{\'e}gou, Herv{\'e} 307 | and Grave, Edouard", 308 | title = "Loss in Translation: Learning Bilingual Word Mapping with a Retrieval Criterion", 309 | booktitle = "Proceedings of EMNLP", 310 | year = "2018" 311 | } 312 | @article{ruder2019survey, 313 | author = {Ruder, Sebastian and Vulić, Ivan and Søgaard, Anders}, 314 | title = {A survey of cross-lingual embedding models}, 315 | journal={Journal of Artificial Intelligence Research}, 316 | volume={}, 
317 | pages={}, note={To appear}, 318 | year={2019} 319 | } 320 | @Article{Q19-XXXX, 321 | author = "Jawanpuria, Pratik 322 | and Balgovind, Arjun 323 | and Kunchukuttan, Anoop 324 | and Mishra, Bamdev", 325 | title = "Learning Multilingual Word Embeddings in Latent Metric Space: A Geometric Approach", 326 | journal = "Transactions of the Association for Computational Linguistics", 327 | year = "2019", 328 | volume = "7", 329 | pages = "", note = "To appear" 330 | } 331 | 332 | --------------------------------------------------------------------------------