Commit 51cd432f by 曹润柘

更新 bibliography.bib

parent 99300e4f
......@@ -186,7 +186,6 @@
Keith Stevens and
George Kurian and
Nishant Patil and
Wei Wang and
Cliff Young and
Jason Smith and
Jason Riesa and
......@@ -221,7 +220,6 @@
Yann N. Dauphin},
title = {Convolutional Sequence to Sequence Learning},
publisher = {International Conference on Machine Learning},
//series = {Proceedings of Machine Learning Research},
volume = {70},
pages = {1243--1252},
year = {2017}
......@@ -270,10 +268,8 @@
author = {Ian J. Goodfellow and
Yoshua Bengio and
Aaron C. Courville},
title = {Deep Learning},
//series = {Adaptive computation and machine learning},
publisher = {{MIT} Press},
year = {2016}
......@@ -386,7 +382,6 @@
publisher={International Conference on Acoustics, Speech, and Signal Processing},
//organization={IEEE Computer Society}
......@@ -425,7 +420,6 @@
title = {Speech and language processing: an introduction to natural language
processing, computational linguistics, and speech recognition, 2nd
//series = {Prentice Hall series in artificial intelligence},
publisher = {Prentice Hall, Pearson Education International},
year = {2009}
......@@ -743,7 +737,6 @@
author = {Philipp Koehn and
Hieu Hoang and
Alexandra Birch and
Chris Callison-Burch and
Marcello Federico and
Nicola Bertoldi and
......@@ -824,7 +817,6 @@
Kevin Knight and
Daniel Marcu and
Steve DeNeefe and
Wei Wang and
Ignacio Thayer},
title = {Scalable Inference and Training of Context-Rich Syntactic Translation
......@@ -847,28 +839,25 @@
%%%%% chapter 3------------------------------------------------------
author = {Andrew Y. Ng and
Michael I. Jordan},
title = {On Discriminative vs. Generative Classifiers: {A} comparison of logistic
regression and naive Bayes},
pages = {841--848},
publisher = {{MIT} Press},
year = {2001},
title ={On discriminative vs. generative classifiers: A comparison of logistic regression and naive bayes},
author ={Ng, Andrew Y and Jordan, Michael I},
pages ={841--848},
year ={2002}
author = {Huang, Liang},
title = {Coling 2008: Advanced Dynamic Programming in Computational Linguistics: Theory, Algorithms and Applications-Tutorial notes},
title = {Coling 2008: Advanced Dynamic Programming in Computational Linguistics: Theory, Algorithms and Applications - Tutorial notes},
year = {2008},
publisher = {International Conference on Computational Linguistics},
address = {Manchester, UK},
publisher = {Coling 2008 Organizing Committee},
author = {Aho, Alfred V and
Ullman, Jeffrey D},
title = {The theory of parsing, translation, and compiling},
publisher = {Prentice-Hall Englewood Cliffs, NJ},
author = {Alfred V. Aho and
Jeffrey D. Ullman},
title = {The theory of parsing, translation, and compiling. 2: Compiling},
publisher = {Prentice-Hall},
year = {1973},
......@@ -877,7 +866,6 @@
author={Rau, Lisa F},
publisher={IEEE Conference on Artificial Intelligence Application},
......@@ -890,16 +878,11 @@
author = {Guillaume Lample and
Miguel Ballesteros and
Sandeep Subramanian and
Kazuya Kawakami and
Chris Dyer},
title = {Neural Architectures for Named Entity Recognition},
pages = {260--270},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2016},
title={Neural architectures for named entity recognition},
author={Lample, Guillaume and Ballesteros, Miguel and Subramanian, Sandeep and Kawakami, Kazuya and Dyer, Chris},
journal={arXiv preprint arXiv:1603.01360},
......@@ -920,6 +903,7 @@
......@@ -933,13 +917,19 @@
title={Error bounds for convolutional codes and an asymptotically optimum decoding algorithm},
author={ Viterbi, Andrew J. },
journal={IEEE Transactions on Information Theory},
journal={IEEE Transactions on Information Theory},
title={Conditional random fields: Probabilistic models for segmenting and labeling sequence data},
author={Lafferty, John and McCallum, Andrew and Pereira, Fernando CN},
author={Harrington, Peter},
......@@ -952,36 +942,41 @@
author = {Brants, Thorsten},
month = apr,
year = {2000},
address = {Seattle, Washington, USA},
publisher = {Association for Computational Linguistics},
doi = {10.3115/974147.974178},
pages = {224--231},
title = {Chunk Parsing Revisited},
author = {Yoshimasa Tsuruoka and
Jun'ichi Tsujii},
author = {Tsuruoka, Yoshimasa and
Tsujii, Jun{'}ichi},
month = oct,
year = {2005},
publisher = {Annual Meeting of the Association for Computational Linguistics},
address = {Vancouver, British Columbia},
publisher = {Association for Computational Linguistics},
pages = {133--140},
title = {News-Oriented Automatic Chinese Keyword Indexing},
title = {News-Oriented Automatic {C}hinese Keyword Indexing},
author = {Li, Sujian and
Wang, Houfeng and
Yu, Shiwen and
Xin, Chengsheng},
month = jul,
year = {2003},
publisher = {Annual Meeting of the Association for Computational Linguistics},
address = {Sapporo, Japan},
publisher = {Association for Computational Linguistics},
doi = {10.3115/1119250.1119263},
pages = {92--97},
title={Bidirectional LSTM-CRF Models for Sequence Tagging},
author={ Huang, Zhiheng and Xu, Wei and Yu, Kai },
journal={arXiv preprint arXiv:1508.01991},
......@@ -996,13 +991,10 @@
author = {Andrej Zukov Gregoric and
Yoram Bachrach and
Sam Coope},
title = {Named Entity Recognition With Parallel Recurrent Neural Networks},
pages = {69--74},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2018},
title={Named entity recognition with parallel recurrent neural networks},
author={{\v{Z}}ukov-Gregori{\v{c}}, Andrej and Bachrach, Yoram and Coope, Sam},
......@@ -1015,196 +1007,29 @@
title={{BERT}: Pre-training of deep bidirectional transformers for language understanding},
author={Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
pages = {4171--4186},
journal = {Annual Conference of the North American Chapter of the Association for Computational Linguistics},
author = {Alexis Conneau and
Kartikay Khandelwal and
Naman Goyal and
Vishrav Chaudhary and
Guillaume Wenzek and
Francisco Guzm{\'{a}}n and
Edouard Grave and
Myle Ott and
Luke Zettlemoyer and
Veselin Stoyanov},
title = {Unsupervised Cross-lingual Representation Learning at Scale},
pages = {8440--8451},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2020},
journal={arXiv preprint arXiv:1810.04805},
title={Unsupervised cross-lingual representation learning at scale},
author={Conneau, Alexis and Khandelwal, Kartikay and Goyal, Naman and Chaudhary, Vishrav and Wenzek, Guillaume and Guzm{\'a}n, Francisco and Grave, Edouard and Ott, Myle and Zettlemoyer, Luke and Stoyanov, Veselin},
journal={arXiv preprint arXiv:1911.02116},
title={Lectures on government and binding: The Pisa lectures},
author={Chomsky, Noam},
publisher={Walter de Gruyter}
author = {Rico Sennrich and
Barry Haddow and
Alexandra Birch},
title = {Neural Machine Translation of Rare Words with Subword Units},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2016},
author={刘挺 and 吴岩 and 王开铸},
title = {University of Sheffield: Description of the LaSIE-II system as used for MUC-7},
author = {Kevin Humphreys and
Robert J. Gaizauskas and
Saliha Azzam and
Charles Huyck and
Brian Mitchell and
Hamish Cunningham and
Yorick Wilks},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {1995},
title={IsoQuest Inc.: Description of the NetOwl™ Extractor System as Used for MUC-7},
author={Krupka, George and Hausman, Kevin},
publisher = {Annual Meeting of the Association for Computational Linguistics},
author = {William J. Black and
Fabio Rinaldi and
David Mowatt},
title = {{FACILE:} Description of the {NE} System Used for {MUC-7}},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {1998},
title={Hidden Markov models.},
author={ Eddy, Sean R },
journal={Current Opinion in Structural Biology},
author = {John D. Lafferty and
Andrew McCallum and
Fernando C. N. Pereira},
title = {Conditional Random Fields: Probabilistic Models for Segmenting and
Labeling Sequence Data},
pages = {282--289},
publisher = {proceedings of the Eighteenth International Conference on Machine
year = {2001},
title={Maximum-entropy models in science and engineering},
author={Kapur, Jagat Narain},
publisher={John Wiley \& Sons}
title={Support vector machines},
author={Hearst, Marti A. and Dumais, Susan T and Osuna, Edgar and Platt, John and Sch{\"o}lkopf, Bernhard},
journal={IEEE Intelligent Systems \& Their Applications},
title={Natural Language Processing (almost) from Scratch},
author={ Collobert, Ronan and Weston, Jason and Bottou, Léon and Karlen, Michael and Kavukcuoglu, Koray and Kuksa, Pavel },
journal={Journal of Machine Learning Research},
title={Introduction to information retrieval},
author={Manning, Christopher D and Sch{\"u}tze, Hinrich and Raghavan, Prabhakar},
publisher={Cambridge university press}
title={A maximum entropy approach to natural language processing},
author={Berger, Adam and Della Pietra, Stephen A and Della Pietra, Vincent J},
journal={Computational linguistics},
title={Machine Learning},
author={Mitchell, Tom},
journal={McGraw Hill},
author = {Franz Josef Och and
Hermann Ney},
title = {Discriminative Training and Maximum Entropy Models for Statistical
Machine Translation},
pages = {295--302},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2002},
title={Speech recognition with weighted finite-state transducers},
author={Mohri, Mehryar and Pereira, Fernando and Riley, Michael},
title={Dynamic programming},
author={Bellman, Richard},
publisher={American Association for the Advancement of Science}
%%%%% chapter 3------------------------------------------------------
......@@ -1647,7 +1472,6 @@
author = {Chris Callison-Burch and
Cameron S. Fordyce and
Philipp Koehn and
Christof Monz and
Josh Schroeder},
title = {(Meta-) Evaluation of Machine Translation},
......@@ -1657,7 +1481,6 @@
author = {Chris Callison-Burch and
Philipp Koehn and
Christof Monz and
Matt Post and
Radu Soricut and
......@@ -1681,7 +1504,6 @@
Barry Haddow and
Matthias Huck and
Chris Hokamp and
Philipp Koehn and
Varvara Logacheva and
Christof Monz and
Matteo Negri and
......@@ -2056,16 +1878,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2013}
author = {Alexander M. Fraser and
Daniel Marcu},
title = {Measuring Word Alignment Quality for Statistical Machine Translation},
journal = {Computational Linguistics},
volume = {33},
number = {3},
pages = {293--303},
year = {2007}
author = {John DeNero and
Dan Klein},
......@@ -2252,17 +2064,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2005},
author = {Jiatao Gu and
James Bradbury and
Caiming Xiong and
Victor O. K. Li and
Richard Socher},
title = {Non-Autoregressive Neural Machine Translation},
publisher = {},
year = {2018}
%%%%% chapter 6------------------------------------------------------
......@@ -2297,15 +2098,6 @@
publisher = {AAAI Press},
year = {2000}
author = {Chris Dyer and
Victor Chahuneau and
Noah A. Smith},
title = {A Simple, Fast, and Effective Reparameterization of {IBM} Model 2},
pages = {644--648},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2013}
author = {Benjamin Taskar and
Simon Lacoste-Julien and
......@@ -2366,13 +2158,7 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2014}
author = {Franz Josef Och},
title = {Minimum Error Rate Training in Statistical Machine Translation},
pages = {160--167},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2003}
author = {M. J. D. Powell},
title = {An efficient method for finding the minimum of a function of several
......@@ -2605,7 +2391,6 @@
author = {Michael Collins and
Philipp Koehn and
Ivona Kucerova},
title = {Clause Restructuring for Statistical Machine Translation},
pages = {531--540},
......@@ -2721,16 +2506,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2003}
author = {David Chiang and
Yuval Marton and
Philip Resnik},
title = {Online Large-Margin Training of Syntactic and Structural Translation
pages = {224--233},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2008}
author = {Phil Blunsom and
Trevor Cohn and
......@@ -2811,15 +2586,6 @@
publisher={University of Southern California},
author = {Richard Zens and
Hermann Ney},
title = {Improvements in dynamic programming beam search for phrase-based statistical
machine translation},
pages = {198--205},
publisher = {International Workshop on Spoken Language Translation},
year = {2008}
author = {Holger Schwenk and
Marta R. Costa-juss{\`{a}} and
......@@ -2968,13 +2734,6 @@
pages = {1159--1187},
year = {2012}
author = {David Chiang},
title = {A Hierarchical Phrase-Based Model for Statistical Machine Translation},
pages = {263--270},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2005}
title={Hierarchical Phrase-Based Translation},
author ={Chiang, David},
......@@ -3031,20 +2790,6 @@
year ={2006},
publisher ={Computationally Hard Problems \& Joint Inference in Speech \& Language Processing}
author = {Michel Galley and
Jonathan Graehl and
Kevin Knight and
Daniel Marcu and
Steve DeNeefe and
Wei Wang and
Ignacio Thayer},
title = {Scalable Inference and Training of Context-Rich Syntactic Translation
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2006}
title ={What’s in a translation rule?},
author ={Galley, Michel and Hopkins, Mark and Knight, Kevin and Marcu, Daniel},
......@@ -3089,7 +2834,6 @@
author = {Daniel Marcu and
Wei Wang and
Abdessamad Echihabi and
Kevin Knight},
title = {{SPMT:} Statistical Machine Translation with Syntactified Target Language
......@@ -3216,15 +2960,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2011}
author = {Hao Zhang and
Liang Huang and
Daniel Gildea and
Kevin Knight},
title = {Synchronous Binarization for Machine Translation},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2006}
author = {Hiyan Alshawi and
Adam L. Buchsbaum and
......@@ -3304,7 +3039,6 @@
author = {Steve DeNeefe and
Kevin Knight and
Wei Wang and
Daniel Marcu},
title = {What Can Syntax-Based {MT} Learn from Phrase-Based MT?},
pages = {755--763},
......@@ -3319,30 +3053,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2008}
author = {Yang Liu and
Qun Liu and
Shouxun Lin},
title = {Tree-to-String Alignment Template for Statistical Machine Translation},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2006}
author = {Andreas Zollmann and
Ashish Venugopal},
title = {Syntax Augmented Machine Translation via Chart Parsing},
pages = {138--141},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2006}
author = {Yuval Marton and
Philip Resnik},
title = {Soft Syntactic Constraints for Hierarchical Phrased-Based Translation},
pages = {1003--1011},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2008}
author = {Rebecca Nesson and Stuart M. Shieber and Alexander Rush},
title = {Induction of probabilistic synchronous tree-insertion grammars for machine translation},
......@@ -3355,15 +3065,6 @@
year = {2007},
publisher = {Machine Translation Summit}
author = {Yang Liu and
Yajuan L{\"{u}} and
Qun Liu},
title = {Improving Tree-to-Tree Translation with Packed Forests},
pages = {558--566},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2009}
author = {Wei Wang and
Kevin Knight and
......@@ -3391,14 +3092,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2008}
author = {Jingbo Zhu and
Tong Xiao},
title = {Improving Decoding Generalization for Tree-to-String Translation},
pages = {418--423},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2011}
author = {Jiajun Zhang and
Feifei Zhai and
......@@ -3783,11 +3476,6 @@
number = {1},
pages = {145--151},
year = {1999},
//url = {},
//doi = {10.1016/S0893-6080(98)00116-6},
//timestamp = {Wed, 14 Nov 2018 10:30:22 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -3799,10 +3487,6 @@
volume = {12},
pages = {2121--2159},
year = {2011},
//url = {},
//timestamp = {Wed, 10 Jul 2019 15:28:02 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -3818,23 +3502,15 @@
author = {Diederik P. Kingma and
Jimmy Ba},
//editor = {Yoshua Bengio and
Yann LeCun},
title = {Adam: {A} Method for Stochastic Optimization},
booktitle = {3rd International Conference on Learning Representations, {ICLR} 2015,
San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
year = {2015},
//url = {},
//timestamp = {Thu, 25 Jul 2019 14:25:37 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Sergey Ioffe and
Christian Szegedy},
//editor = {Francis R. Bach and
David M. Blei},
title = {Batch Normalization: Accelerating Deep Network Training by Reducing
Internal Covariate Shift},
booktitle = {Proceedings of the 32nd International Conference on Machine Learning,
......@@ -3844,10 +3520,6 @@
pages = {448--456},
publisher = {},
year = {2015},
//url = {},
//timestamp = {Wed, 29 May 2019 08:41:45 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -3858,30 +3530,6 @@
journal = {CoRR},
volume = {abs/1607.06450},
year = {2016},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1607.06450},
//timestamp = {Tue, 23 Jul 2019 17:33:23 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Kaiming He and
Xiangyu Zhang and
Shaoqing Ren and
Jian Sun},
title = {Deep Residual Learning for Image Recognition},
booktitle = {2016 {IEEE} Conference on Computer Vision and Pattern Recognition,
{CVPR} 2016, Las Vegas, NV, USA, June 27-30, 2016},
pages = {770--778},
publisher = {{IEEE} Computer Society},
year = {2016},
//url = {},
//doi = {10.1109/CVPR.2016.90},
//timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -3890,20 +3538,12 @@
Kai Chen and
Gregory S. Corrado and
Jeffrey Dean},
//editor = {Christopher J. C. Burges and
L{\'{e}}on Bottou and
Zoubin Ghahramani and
Kilian Q. Weinberger},
title = {Distributed Representations of Words and Phrases and their Compositionality},
booktitle = {Advances in Neural Information Processing Systems 26: 27th Annual
Conference on Neural Information Processing Systems 2013. Proceedings
of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
pages = {3111--3119},
year = {2013},
//url = {},
//timestamp = {Fri, 06 Mar 2020 17:00:12 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -3919,39 +3559,23 @@
number = {5},
pages = {93:1--93:42},
year = {2019},
//url = {},
//doi = {10.1145/3236009},
//timestamp = {Thu, 09 May 2019 16:06:21 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Pang Wei Koh and
Percy Liang},
//editor = {Doina Precup and
Yee Whye Teh},
title = {Understanding Black-box Predictions via Influence Functions},
booktitle = {Proceedings of the 34th International Conference on Machine Learning,
{ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
series = {Proceedings of Machine Learning Research},
volume = {70},
pages = {1885--1894},
publisher = {{PMLR}},
year = {2017},
//url = {},
//timestamp = {Wed, 29 May 2019 08:41:45 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Philip Arthur and
Graham Neubig and
Satoshi Nakamura},
//editor = {Jian Su and
Xavier Carreras and
Kevin Duh},
title = {Incorporating Discrete Translation Lexicons into Neural Machine Translation},
booktitle = {Proceedings of the 2016 Conference on Empirical Methods in Natural
Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4,
......@@ -3959,28 +3583,6 @@
pages = {1557--1567},
publisher = {The Association for Computational Linguistics},
year = {2016},
//url = {},
//doi = {10.18653/v1/d16-1162},
//timestamp = {Tue, 28 Jan 2020 10:28:31 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Andreas Zollmann and
Ashish Venugopal},
//editor = {Philipp Koehn and
Christof Monz},
title = {Syntax Augmented Machine Translation via Chart Parsing},
booktitle = {Proceedings on the Workshop on Statistical Machine Translation, WMT@HLT-NAACL
2006, New York City, NY, USA, June 8-9, 2006},
pages = {138--141},
publisher = {Association for Computational Linguistics},
year = {2006},
//url = {},
//timestamp = {Fri, 13 Sep 2019 13:08:46 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -4001,11 +3603,6 @@
2: Short Papers},
publisher = {The Association for Computational Linguistics},
year = {2016},
//url = {},
//doi = {10.18653/v1/p16-2049},
//timestamp = {Tue, 28 Jan 2020 10:27:31 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -4019,21 +3616,12 @@
pages = {1498--1507},
publisher = {The Association for Computational Linguistics},
year = {2013},
//url = {},
//timestamp = {Mon, 19 Aug 2019 18:10:05 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Bryan Perozzi and
Rami Al-Rfou and
Steven Skiena},
//editor = {Sofus A. Macskassy and
Claudia Perlich and
Jure Leskovec and
Wei Wang and
Rayid Ghani},
title = {DeepWalk: online learning of social representations},
booktitle = {The 20th {ACM} {SIGKDD} International Conference on Knowledge Discovery
and Data Mining, {KDD} '14, New York, NY, {USA} - August 24 - 27,
......@@ -4041,17 +3629,11 @@
pages = {701--710},
publisher = {{ACM}},
year = {2014},
//url = {},
//doi = {10.1145/2623330.2623732},
//timestamp = {Sun, 02 Jun 2019 21:11:52 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Ronan Collobert and
Jason Weston and
L{\'{e}}on Bottou and
Michael Karlen and
Koray Kavukcuoglu and
Pavel P. Kuksa},
......@@ -4060,10 +3642,6 @@
volume = {12},
pages = {2493--2537},
year = {2011},
//url = {},
//timestamp = {Wed, 10 Jul 2019 15:28:44 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -4071,23 +3649,12 @@
James Bradbury and
Caiming Xiong and
Richard Socher},
//editor = {Isabelle Guyon and
Ulrike von Luxburg and
Samy Bengio and
Hanna M. Wallach and
Rob Fergus and
S. V. N. Vishwanathan and
Roman Garnett},
title = {Learned in Translation: Contextualized Word Vectors},
booktitle = {Advances in Neural Information Processing Systems 30: Annual Conference
on Neural Information Processing Systems 2017, 4-9 December 2017,
Long Beach, CA, {USA}},
pages = {6294--6305},
year = {2017},
//url = {},
//timestamp = {Fri, 06 Mar 2020 16:57:53 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
%%%%% chapter 9------------------------------------------------------
......@@ -4110,16 +3677,9 @@
pages = {1370--1380},
//publisher = {The Association for Computer Linguistics},
year = {2014},
//url = {},
//doi = {10.3115/v1/p14-1129},
//timestamp = {Tue, 28 Jan 2020 10:27:56 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Holger Schwenk},
//editor = {Martin Kay and
Christian Boitet},
title = {Continuous Space Translation Models for Phrase-Based Statistical Machine
publisher = {{COLING} 2012, 24th International Conference on Computational Linguistics,
......@@ -4128,10 +3688,6 @@
pages = {1071--1080},
//publisher = {Indian Institute of Technology Bombay},
year = {2012},
//url = {},
//timestamp = {Wed, 18 Sep 2019 12:15:53 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Nal Kalchbrenner and
......@@ -4144,10 +3700,6 @@
pages = {1700--1709},
//publisher = {{ACL}},
year = {2013},
//url = {},
//timestamp = {Fri, 13 Sep 2019 13:08:45 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Sepp Hochreiter},
......@@ -4159,11 +3711,6 @@
number = {2},
pages = {107--116},
year = {1998},
//url = {},
//doi = {10.1142/S0218488598000094},
//timestamp = {Wed, 14 Nov 2018 10:41:42 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author ={Y. {Bengio} and P. {Simard} and P. {Frasconi}},
......@@ -4183,23 +3730,12 @@ pages ={157-166},
Aidan N. Gomez and
Lukasz Kaiser and
Illia Polosukhin},
//editor = {Isabelle Guyon and
Ulrike von Luxburg and
Samy Bengio and
Hanna M. Wallach and
Rob Fergus and
S. V. N. Vishwanathan and
Roman Garnett},
title = {Attention is All you Need},
publisher = {Advances in Neural Information Processing Systems 30: Annual Conference
on Neural Information Processing Systems 2017, 4-9 December 2017,
Long Beach, CA, {USA}},
pages = {5998--6008},
year = {2017},
//url = {},
//timestamp = {Fri, 06 Mar 2020 17:00:11 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Felix Stahlberg},
......@@ -4207,21 +3743,12 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1912.02047},
year = {2019},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1912.02047},
//timestamp = {Thu, 02 Jan 2020 18:08:18 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Luisa Bentivogli and
Arianna Bisazza and
Mauro Cettolo and
Marcello Federico},
//editor = {Jian Su and
Xavier Carreras and
Kevin Duh},
title = {Neural versus Phrase-Based Machine Translation Quality: a Case Study},
publisher = {Proceedings of the 2016 Conference on Empirical Methods in Natural
Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4,
......@@ -4229,11 +3756,6 @@ pages ={157-166},
pages = {257--267},
//publisher = {The Association for Computational Linguistics},
year = {2016},
//url = {},
//doi = {10.18653/v1/d16-1025},
//timestamp = {Tue, 28 Jan 2020 10:28:39 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Hany Hassan and
......@@ -4264,12 +3786,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1803.05567},
year = {2018},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1803.05567},
//timestamp = {Mon, 13 Aug 2018 16:47:23 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Qiang Wang and
......@@ -4279,9 +3795,6 @@ pages ={157-166},
Changliang Li and
Derek F. Wong and
Lidia S. Chao},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {Learning Deep Transformer Models for Machine Translation},
publisher = {Proceedings of the 57th Conference of the Association for Computational
Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
......@@ -4289,11 +3802,6 @@ pages ={157-166},
pages = {1810--1822},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {},
//doi = {10.18653/v1/p19-1176},
//timestamp = {Tue, 28 Jan 2020 10:27:53 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Yanyang Li and
......@@ -4305,12 +3813,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/2002.06546},
year = {2020},
//url = {},
//archivePrefix = {arXiv},
//eprint = {2002.06546},
//timestamp = {Mon, 02 Mar 2020 16:46:06 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Hochreiter, Sepp and Schmidhuber, Jürgen},
......@@ -4320,7 +3822,6 @@ pages ={157-166},
title = {Long Short-term Memory},
volume = {9},
journal = {Neural computation},
//doi = {10.1162/neco.1997.9.8.1735}
author = {Kyunghyun Cho and
......@@ -4330,9 +3831,6 @@ pages ={157-166},
Fethi Bougares and
Holger Schwenk and
Yoshua Bengio},
//editor = {Alessandro Moschitti and
Bo Pang and
Walter Daelemans},
title = {Learning Phrase Representations using {RNN} Encoder-Decoder for Statistical
Machine Translation},
publisher = {Proceedings of the 2014 Conference on Empirical Methods in Natural
......@@ -4341,37 +3839,24 @@ pages ={157-166},
pages = {1724--1734},
//publisher = {{ACL}},
year = {2014},
//url = {},
//doi = {10.3115/v1/d14-1179},
//timestamp = {Tue, 28 Jan 2020 10:28:17 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Xavier Glorot and
Yoshua Bengio},
//editor = {Yee Whye Teh and
D. Mike Titterington},
title = {Understanding the difficulty of training deep feedforward neural networks},
publisher = {Proceedings of the Thirteenth International Conference on Artificial
Intelligence and Statistics, {AISTATS} 2010, Chia Laguna Resort, Sardinia,
Italy, May 13-15, 2010},
//series = {{JMLR} Proceedings},
volume = {9},
pages = {249--256},
//publisher = {},
year = {2010},
//url = {},
//timestamp = {Wed, 29 May 2019 08:41:47 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Tong Xiao and
Jingbo Zhu and
Tongran Liu and
Chunliang Zhang},
//editor = {Carles Sierra},
title = {Fast Parallel Training of Neural Language Models},
publisher = {Proceedings of the Twenty-Sixth International Joint Conference on
Artificial Intelligence, {IJCAI} 2017, Melbourne, Australia, August
......@@ -4379,11 +3864,6 @@ pages ={157-166},
pages = {4193--4199},
//publisher = {},
year = {2017},
//url = {},
//doi = {10.24963/ijcai.2017/586},
//timestamp = {Tue, 20 Aug 2019 16:17:12 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Jiatao Gu and
......@@ -4392,14 +3872,8 @@ pages ={157-166},
Victor O. K. Li and
Richard Socher},
title = {Non-Autoregressive Neural Machine Translation},
publisher = {6th International Conference on Learning Representations, {ICLR} 2018,
Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
//publisher = {},
publisher = {International Conference on Learning Representations},
year = {2018},
//url = {},
//timestamp = {Thu, 25 Jul 2019 14:25:57 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Yanyang Li and
......@@ -4408,8 +3882,6 @@ pages ={157-166},
Qiang Wang and
Changming Xu and
Jingbo Zhu},
//editor = {Iryna Gurevych and
Yusuke Miyao},
title = {A Simple and Effective Approach to Coverage-Aware Neural Machine Translation},
publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
......@@ -4417,11 +3889,6 @@ pages ={157-166},
pages = {292--297},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {},
//doi = {10.18653/v1/P18-2047},
//timestamp = {Mon, 16 Sep 2019 13:46:41 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Zhaopeng Tu and
......@@ -4435,17 +3902,11 @@ pages ={157-166},
1: Long Papers},
//publisher = {The Association for Computer Linguistics},
year = {2016},
//url = {},
//doi = {10.18653/v1/p16-1008},
//timestamp = {Tue, 28 Jan 2020 10:27:13 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Rico Sennrich and
Orhan Firat and
Kyunghyun Cho and
Alexandra Birch and
Barry Haddow and
Julian Hitschler and
Marcin Junczys-Dowmunt and
......@@ -4453,8 +3914,6 @@ pages ={157-166},
Antonio Valerio Miceli Barone and
Jozef Mokry and
Maria Nadejde},
//editor = {Andre Martins and
Anselmo Pe{\~{n}}as},
title = {Nematus: a Toolkit for Neural Machine Translation},
publisher = {Proceedings of the 15th Conference of the European Chapter of the
Association for Computational Linguistics, {EACL} 2017, Valencia,
......@@ -4462,18 +3921,10 @@ pages ={157-166},
pages = {65--68},
//publisher = {Association for Computational Linguistics},
year = {2017},
//url = {},
//doi = {10.18653/v1/e17-3017},
//timestamp = {Tue, 28 Jan 2020 10:31:12 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Biao Zhang and
Rico Sennrich},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {A Lightweight Recurrent Network for Sequence Modeling},
publisher = {Proceedings of the 57th Conference of the Association for Computational
Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
......@@ -4481,11 +3932,6 @@ pages ={157-166},
pages = {1538--1548},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {},
//doi = {10.18653/v1/p19-1149},
//timestamp = {Tue, 28 Jan 2020 10:28:03 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Tao Lei and
......@@ -4495,12 +3941,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1709.02755},
year = {2017},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1709.02755},
//timestamp = {Mon, 13 Aug 2018 16:46:29 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Biao Zhang and
......@@ -4508,10 +3948,6 @@ pages ={157-166},
Jinsong Su and
Qian Lin and
Huiji Zhang},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Simplifying Neural Machine Translation with Addition-Subtraction Twin-Gated
Recurrent Networks},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
......@@ -4519,10 +3955,6 @@ pages ={157-166},
pages = {4273--4283},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {},
//timestamp = {Fri, 13 Sep 2019 13:08:45 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Shikun Liu and
......@@ -4534,50 +3966,23 @@ pages ={157-166},
pages = {1871--1880},
//publisher = {Computer Vision Foundation / {IEEE}},
year = {2019},
//url = {\_CVPR\_2019/html/Liu\_End-To-End\_Multi-Task\_Learning\_With\_Attention\_CVPR\_2019\_paper.html},
//doi = {10.1109/CVPR.2019.00197},
//timestamp = {Mon, 20 Jan 2020 15:36:04 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Ra{\'{u}}l V{\'{a}}zquez and
Alessandro Raganato and
J{\"{o}}rg Tiedemann and
Mathias Creutz},
//editor = {Isabelle Augenstein and
Spandana Gella and
Sebastian Ruder and
Katharina Kann and
Burcu Can and
Johannes Welbl and
Alexis Conneau and
Xiang Ren and
Marek Rei},
title = {Multilingual {NMT} with a Language-Independent Attention Bridge},
publisher = {Proceedings of the 4th Workshop on Representation Learning for NLP,
RepL4NLP@ACL 2019, Florence, Italy, August 2, 2019},
pages = {33--39},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {},
//doi = {10.18653/v1/w19-4305},
//timestamp = {Fri, 27 Mar 2020 08:52:29 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Pooya Moradi and
Nishant Kambhatla and
Anoop Sarkar},
//editor = {Alexandra Birch and
Andrew M. Finch and
Hiroaki Hayashi and
Ioannis Konstas and
Thang Luong and
Graham Neubig and
Yusuke Oda and
Katsuhito Sudoh},
title = {Interrogating the Explanatory Power of Attention in Neural Machine
publisher = {Proceedings of the 3rd Workshop on Neural Generation and Translation@EMNLP-IJCNLP
......@@ -4585,11 +3990,6 @@ pages ={157-166},
pages = {221--230},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {},
//doi = {10.18653/v1/D19-5624},
//timestamp = {Tue, 24 Mar 2020 15:04:09 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Xing Wang and
......@@ -4598,18 +3998,12 @@ pages ={157-166},
Hang Li and
Deyi Xiong and
Min Zhang},
//editor = {Satinder P. Singh and
Shaul Markovitch},
title = {Neural Machine Translation Advised by Statistical Machine Translation},
publisher = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
February 4-9, 2017, San Francisco, California, {USA}},
pages = {3330--3336},
//publisher = {{AAAI} Press},
year = {2017},
//url = {},
//timestamp = {Tue, 15 Jan 2019 11:48:13 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Elena Voita and
......@@ -4617,9 +4011,6 @@ pages ={157-166},
Fedor Moiseev and
Rico Sennrich and
Ivan Titov},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {Analyzing Multi-Head Self-Attention: Specialized Heads Do the Heavy
Lifting, the Rest Can Be Pruned},
publisher = {Proceedings of the 57th Conference of the Association for Computational
......@@ -4628,11 +4019,6 @@ pages ={157-166},
pages = {5797--5808},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {},
//doi = {10.18653/v1/p19-1580},
//timestamp = {Tue, 28 Jan 2020 10:27:29 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Tong Xiao and
......@@ -4640,7 +4026,6 @@ pages ={157-166},
Jingbo Zhu and
Zhengtao Yu and
Tongran Liu},
//editor = {Sarit Kraus},
title = {Sharing Attention Weights for Fast Transformer},
publisher = {Proceedings of the Twenty-Eighth International Joint Conference on
Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16,
......@@ -4648,11 +4033,6 @@ pages ={157-166},
pages = {5292--5298},
//publisher = {},
year = {2019},
//url = {},
//doi = {10.24963/ijcai.2019/735},
//timestamp = {Tue, 20 Aug 2019 16:18:18 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Baosong Yang and
......@@ -4660,9 +4040,6 @@ pages ={157-166},
Tong Xiao and
Lidia S. Chao and
Jingbo Zhu},
//editor = {Martha Palmer and
Rebecca Hwa and
Sebastian Riedel},
title = {Towards Bidirectional Hierarchical Representations for Attention-based
Neural Machine Translation},
publisher = {Proceedings of the 2017 Conference on Empirical Methods in Natural
......@@ -4671,20 +4048,11 @@ pages ={157-166},
pages = {1432--1441},
//publisher = {Association for Computational Linguistics},
year = {2017},
//url = {},
//doi = {10.18653/v1/d17-1150},
//timestamp = {Tue, 28 Jan 2020 10:28:08 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Yau-Shian Wang and
Hung-yi Lee and
Yun-Nung Chen},
//editor = {Kentaro Inui and
Jing Jiang and
Vincent Ng and
Xiaojun Wan},
title = {Tree Transformer: Integrating Tree Structures into Self-Attention},
publisher = {Proceedings of the 2019 Conference on Empirical Methods in Natural
Language Processing and the 9th International Joint Conference on
......@@ -4693,51 +4061,29 @@ pages ={157-166},
//publisher = {Association for Computational Linguistics},
pages = {1061--1070},
year = {2019},
//url = {},
//doi = {10.18653/v1/D19-1098},
//timestamp = {Thu, 12 Dec 2019 13:23:46 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Jetic Gu and
Hassan S. Shavarani and
Anoop Sarkar},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Top-down Tree Structured Decoding with Syntactic Connections for Neural Machine Translation and Parsing},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
pages = {401--413},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {},
//doi = {10.18653/v1/d18-1037},
//timestamp = {Tue, 28 Jan 2020 10:28:48 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Xinyi Wang and
Hieu Pham and
Pengcheng Yin and
Graham Neubig},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {A Tree-based Decoder for Neural Machine Translation},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
pages = {4772--4777},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {},
//timestamp = {Fri, 13 Sep 2019 13:08:45 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Jiajun Zhang and
......@@ -4746,12 +4092,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1610.07272},
year = {2016},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1610.07272},
//timestamp = {Mon, 13 Aug 2018 16:47:14 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Zihang Dai and
......@@ -4764,12 +4104,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1901.02860},
year = {2019},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1901.02860},
//timestamp = {Fri, 01 Feb 2019 13:39:59 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Xintong Li and
......@@ -4777,9 +4111,6 @@ pages ={157-166},
Lemao Liu and
Max Meng and
Shuming Shi},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {On the Word Alignment from Neural Machine Translation},
publisher = {Proceedings of the 57th Conference of the Association for Computational
Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
......@@ -4787,11 +4118,6 @@ pages ={157-166},
pages = {1293--1303},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {},
//doi = {10.18653/v1/p19-1124},
//timestamp = {Tue, 28 Jan 2020 10:27:51 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -4799,10 +4125,6 @@ pages ={157-166},
Dhananjay Ram and
Nikolaos Pappas and
James Henderson},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Document-Level Neural Machine Translation with Hierarchical Attention
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
......@@ -4810,19 +4132,12 @@ pages ={157-166},
pages = {2947--2954},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {},
//doi = {10.18653/v1/d18-1325},
//timestamp = {Fri, 27 Mar 2020 08:46:30 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Elena Voita and
Pavel Serdyukov and
Rico Sennrich and
Ivan Titov},
//editor = {Iryna Gurevych and
Yusuke Miyao},
title = {Context-Aware Neural Machine Translation Learns Anaphora Resolution},
publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
......@@ -4830,11 +4145,6 @@ pages ={157-166},
pages = {1264--1274},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {},
//doi = {10.18653/v1/P18-1117},
//timestamp = {Mon, 16 Sep 2019 13:46:41 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Aishwarya Bhandare and
......@@ -4849,12 +4159,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1906.00532},
year = {2019},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1906.00532},
//timestamp = {Thu, 13 Jun 2019 13:36:00 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -4863,46 +4167,29 @@ pages ={157-166},
Yang Feng and
Lei Shen and
Qun Liu},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Speeding Up Neural Machine Translation Decoding by Cube Pruning},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
pages = {4284--4294},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {},
//timestamp = {Fri, 29 Nov 2019 14:00:46 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Abigail See and
Minh-Thang Luong and
Christopher D. Manning},
//editor = {Yoav Goldberg and
Stefan Riezler},
title = {Compression of Neural Machine Translation Models via Pruning},
publisher = {Proceedings of the 20th {SIGNLL} Conference on Computational Natural
Language Learning, CoNLL 2016, Berlin, Germany, August 11-12, 2016},
pages = {291--301},
//publisher = {{ACL}},
year = {2016},
//url = {},
//doi = {10.18653/v1/k16-1029},
//timestamp = {Tue, 28 Jan 2020 10:29:27 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Yun Chen and
Yang Liu and
Yong Cheng and
Victor O. K. Li},
//editor = {Regina Barzilay and
Min-Yen Kan},
title = {A Teacher-Student Framework for Zero-Resource Neural Machine Translation},
publisher = {Proceedings of the 55th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume
......@@ -4910,11 +4197,6 @@ pages ={157-166},
pages = {1925--1935},
//publisher = {Association for Computational Linguistics},
year = {2017},
//url = {},
//doi = {10.18653/v1/P17-1176},
//timestamp = {Tue, 20 Aug 2019 11:59:05 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Geoffrey E. Hinton and
......@@ -4924,12 +4206,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1503.02531},
year = {2015},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1503.02531},
//timestamp = {Mon, 13 Aug 2018 16:48:36 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
......@@ -4953,8 +4229,6 @@ pages ={157-166},
year = "2016",
//address = "Austin, Texas",
//publisher = "Association for Computational Linguistics",
//url = "",
//doi = "10.18653/v1/D16-1139",
pages = "1317--1327",
......@@ -4982,18 +4256,11 @@ pages ={157-166},
Toulon, France, April 24-26, 2017, Conference Track Proceedings},
//publisher = {},
year = {2017},
//url = {\_jUqxe},
//timestamp = {Thu, 25 Jul 2019 14:25:44 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Peter Shaw and
Jakob Uszkoreit and
Ashish Vaswani},
//editor = {Marilyn A. Walker and
Heng Ji and
Amanda Stent},
title = {Self-Attention with Relative Position Representations},
publisher = {Proceedings of the 2018 Conference of the North American Chapter of
the Association for Computational Linguistics: Human Language Technologies,
......@@ -5002,11 +4269,6 @@ pages ={157-166},
pages = {464--468},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {},
//doi = {10.18653/v1/n18-2074},
//timestamp = {Tue, 28 Jan 2020 10:30:17 +0100},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Kaiming He and
......@@ -5019,26 +4281,6 @@ pages ={157-166},
pages = {770--778},
//publisher = {{IEEE} Computer Society},
year = {2016},
//url = {},
//doi = {10.1109/CVPR.2016.90},
//timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Lei Jimmy Ba and
Jamie Ryan Kiros and
Geoffrey E. Hinton},
title = {Layer Normalization},
journal = {CoRR},
volume = {abs/1607.06450},
year = {2016},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1607.06450},
//timestamp = {Tue, 23 Jul 2019 17:33:23 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Nitish Srivastava and Geoffrey Hinton and Alex Krizhevsky and Ilya Sutskever and Ruslan Salakhutdinov},
......@@ -5047,7 +4289,6 @@ pages ={157-166},
year = {2014},
volume = {15},
pages = {1929-1958},
//url = {}
author = {Christian Szegedy and
......@@ -5061,18 +4302,11 @@ pages ={157-166},
pages = {2818--2826},
//publisher = {{IEEE} Computer Society},
year = {2016},
//url = {},
//doi = {10.1109/CVPR.2016.308},
//timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Biao Zhang and
Deyi Xiong and
Jinsong Su},
//editor = {Iryna Gurevych and
Yusuke Miyao},
title = {Accelerating Neural Transformer via an Average Attention Network},
publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
......@@ -5080,11 +4314,6 @@ pages ={157-166},
pages = {1789--1798},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {},
//doi = {10.18653/v1/P18-1166},
//timestamp = {Mon, 16 Sep 2019 13:46:41 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
author = {Matthieu Courbariaux and
......@@ -5094,12 +4323,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1602.02830},
year = {2016},
//url = {},
//archivePrefix = {arXiv},
//eprint = {1602.02830},
//timestamp = {Mon, 13 Aug 2018 16:46:57 +0200},
//biburl = {},
//bibsource = {dblp computer science bibliography,}
%%%%% chapter 12------------------------------------------------------
Markdown 格式
您添加了 0 到此讨论。请谨慎行事。
注册 或者 后发表评论