Commit 51cd432f by 曹润柘

更新 bibliography.bib

parent 99300e4f
...@@ -186,7 +186,6 @@ ...@@ -186,7 +186,6 @@
Keith Stevens and Keith Stevens and
George Kurian and George Kurian and
Nishant Patil and Nishant Patil and
Wei Wang and
Cliff Young and Cliff Young and
Jason Smith and Jason Smith and
Jason Riesa and Jason Riesa and
...@@ -221,7 +220,6 @@ ...@@ -221,7 +220,6 @@
Yann N. Dauphin}, Yann N. Dauphin},
title = {Convolutional Sequence to Sequence Learning}, title = {Convolutional Sequence to Sequence Learning},
publisher = {International Conference on Machine Learning}, publisher = {International Conference on Machine Learning},
//series = {Proceedings of Machine Learning Research},
volume = {70}, volume = {70},
pages = {1243--1252}, pages = {1243--1252},
year = {2017} year = {2017}
...@@ -270,10 +268,8 @@ ...@@ -270,10 +268,8 @@
@book{Goodfellow-et-al-2016, @book{Goodfellow-et-al-2016,
author = {Ian J. Goodfellow and author = {Ian J. Goodfellow and
Yoshua Bengio and
Aaron C. Courville}, Aaron C. Courville},
title = {Deep Learning}, title = {Deep Learning},
//series = {Adaptive computation and machine learning},
publisher = {{MIT} Press}, publisher = {{MIT} Press},
year = {2016} year = {2016}
} }
...@@ -386,7 +382,6 @@ ...@@ -386,7 +382,6 @@
publisher={International Conference on Acoustics, Speech, and Signal Processing}, publisher={International Conference on Acoustics, Speech, and Signal Processing},
pages={825--828}, pages={825--828},
year={1991}, year={1991},
//organization={IEEE Computer Society}
} }
@inproceedings{stolcke2002srilm, @inproceedings{stolcke2002srilm,
...@@ -425,7 +420,6 @@ ...@@ -425,7 +420,6 @@
title = {Speech and language processing: an introduction to natural language title = {Speech and language processing: an introduction to natural language
processing, computational linguistics, and speech recognition, 2nd processing, computational linguistics, and speech recognition, 2nd
Edition}, Edition},
//series = {Prentice Hall series in artificial intelligence},
publisher = {Prentice Hall, Pearson Education International}, publisher = {Prentice Hall, Pearson Education International},
year = {2009} year = {2009}
} }
...@@ -743,7 +737,6 @@ ...@@ -743,7 +737,6 @@
@inproceedings{Koehn2007Moses, @inproceedings{Koehn2007Moses,
author = {Philipp Koehn and author = {Philipp Koehn and
Hieu Hoang and Hieu Hoang and
Alexandra Birch and
Chris Callison-Burch and Chris Callison-Burch and
Marcello Federico and Marcello Federico and
Nicola Bertoldi and Nicola Bertoldi and
...@@ -824,7 +817,6 @@ ...@@ -824,7 +817,6 @@
Kevin Knight and Kevin Knight and
Daniel Marcu and Daniel Marcu and
Steve DeNeefe and Steve DeNeefe and
Wei Wang and
Ignacio Thayer}, Ignacio Thayer},
title = {Scalable Inference and Training of Context-Rich Syntactic Translation title = {Scalable Inference and Training of Context-Rich Syntactic Translation
Models}, Models},
...@@ -847,28 +839,25 @@ ...@@ -847,28 +839,25 @@
%%%%% chapter 3------------------------------------------------------ %%%%% chapter 3------------------------------------------------------
@inproceedings{ng2002discriminative, @inproceedings{ng2002discriminative,
author = {Andrew Y. Ng and title ={On discriminative vs. generative classifiers: A comparison of logistic regression and naive bayes},
Michael I. Jordan}, author ={Ng, Andrew Y and Jordan, Michael I},
title = {On Discriminative vs. Generative Classifiers: {A} comparison of logistic pages ={841--848},
regression and naive Bayes}, year ={2002}
pages = {841--848},
publisher = {{MIT} Press},
year = {2001},
} }
@inproceedings{huang2008coling, @proceedings{huang2008advanced,
author = {Huang, Liang}, title = {Coling 2008: Advanced Dynamic Programming in Computational Linguistics: Theory, Algorithms and Applications - Tutorial notes},
title = {Coling 2008: Advanced Dynamic Programming in Computational Linguistics: Theory, Algorithms and Applications-Tutorial notes},
year = {2008}, year = {2008},
publisher = {International Conference on Computational Linguistics}, address = {Manchester, UK},
publisher = {Coling 2008 Organizing Committee},
} }
@book{aho1972theory, @book{aho1972theory,
author = {Aho, Alfred V and author = {Alfred V. Aho and
Ullman, Jeffrey D}, Jeffrey D. Ullman},
title = {The theory of parsing, translation, and compiling}, title = {The theory of parsing, translation, and compiling. 2: Compiling},
publisher = {Prentice-Hall Englewood Cliffs, NJ}, publisher = {Prentice-Hall},
year = {1973}, year = {1973},
} }
...@@ -877,7 +866,6 @@ ...@@ -877,7 +866,6 @@
author={Rau, Lisa F}, author={Rau, Lisa F},
pages={29--30}, pages={29--30},
year={1991}, year={1991},
publisher={IEEE Conference on Artificial Intelligence Application},
} }
@article{张小衡1997中文机构名称的识别与分析, @article{张小衡1997中文机构名称的识别与分析,
...@@ -890,16 +878,11 @@ ...@@ -890,16 +878,11 @@
year={1997}, year={1997},
} }
@inproceedings{lample2016neural, @article{lample2016neural,
author = {Guillaume Lample and title={Neural architectures for named entity recognition},
Miguel Ballesteros and author={Lample, Guillaume and Ballesteros, Miguel and Subramanian, Sandeep and Kawakami, Kazuya and Dyer, Chris},
Sandeep Subramanian and journal={arXiv preprint arXiv:1603.01360},
Kazuya Kawakami and year={2016}
Chris Dyer},
title = {Neural Architectures for Named Entity Recognition},
pages = {260--270},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2016},
} }
@article{Baum1966Statistical, @article{Baum1966Statistical,
...@@ -920,6 +903,7 @@ ...@@ -920,6 +903,7 @@
number={1}, number={1},
pages={164--171}, pages={164--171},
year={1970}, year={1970},
publisher={JSTOR}
} }
@article{1977Maximum, @article{1977Maximum,
...@@ -933,13 +917,19 @@ ...@@ -933,13 +917,19 @@
@article{1967Error, @article{1967Error,
title={Error bounds for convolutional codes and an asymptotically optimum decoding algorithm}, title={Error bounds for convolutional codes and an asymptotically optimum decoding algorithm},
author={ Viterbi, Andrew J. }, author={ Viterbi, Andrew J. },
journal={IEEE Transactions on Information Theory}, journal={IEEE Trans.informat.theory},
volume={13}, volume={13},
number={2}, number={2},
pages={260-269}, pages={260-269},
year={1967}, year={1967},
} }
% Lafferty, McCallum and Pereira (2001): conditional random fields for
% segmenting and labeling sequence data. This is a conference paper, so it is
% typed as inproceedings; the venue is stored in the publisher field, which is
% the convention used by the conference entries of this file.
@inproceedings{lafferty2001conditional,
  author    = {Lafferty, John D. and McCallum, Andrew and Pereira, Fernando C. N.},
  title     = {Conditional Random Fields: Probabilistic Models for Segmenting and Labeling Sequence Data},
  pages     = {282--289},
  publisher = {International Conference on Machine Learning},
  year      = {2001},
}
@article{harrington2013机器学习实战, @article{harrington2013机器学习实战,
title={机器学习实战}, title={机器学习实战},
author={Harrington, Peter}, author={Harrington, Peter},
...@@ -952,36 +942,41 @@ ...@@ -952,36 +942,41 @@
author = {Brants, Thorsten}, author = {Brants, Thorsten},
month = apr, month = apr,
year = {2000}, year = {2000},
address = {Seattle, Washington, USA},
publisher = {Association for Computational Linguistics}, publisher = {Association for Computational Linguistics},
doi = {10.3115/974147.974178},
pages = {224--231}, pages = {224--231},
} }
@inproceedings{tsuruoka-tsujii-2005-chunk, @inproceedings{tsuruoka-tsujii-2005-chunk,
title = {Chunk Parsing Revisited}, title = {Chunk Parsing Revisited},
author = {Yoshimasa Tsuruoka and author = {Tsuruoka, Yoshimasa and
Jun'ichi Tsujii}, Tsujii, Jun{'}ichi},
month = oct, month = oct,
year = {2005}, year = {2005},
publisher = {Annual Meeting of the Association for Computational Linguistics}, address = {Vancouver, British Columbia},
publisher = {Association for Computational Linguistics},
pages = {133--140}, pages = {133--140},
} }
@inproceedings{li-etal-2003-news-oriented, @inproceedings{li-etal-2003-news-oriented,
title = {News-Oriented Automatic Chinese Keyword Indexing}, title = {News-Oriented Automatic {C}hinese Keyword Indexing},
author = {Li, Sujian and author = {Li, Sujian and
Wang, Houfeng and Wang, Houfeng and
Yu, Shiwen and Yu, Shiwen and
Xin, Chengsheng}, Xin, Chengsheng},
month = jul, month = jul,
year = {2003}, year = {2003},
publisher = {Annual Meeting of the Association for Computational Linguistics}, address = {Sapporo, Japan},
publisher = {Association for Computational Linguistics},
doi = {10.3115/1119250.1119263},
pages = {92--97}, pages = {92--97},
} }
@article{2015Bidirectional, @article{2015Bidirectional,
title={Bidirectional LSTM-CRF Models for Sequence Tagging}, title={Bidirectional LSTM-CRF Models for Sequence Tagging},
author={ Huang, Zhiheng and Xu, Wei and Yu, Kai }, author={ Huang, Zhiheng and Xu, Wei and Yu, Kai },
journal={CoRR}, journal={Computer ence},
year={2015}, year={2015},
} }
...@@ -996,13 +991,10 @@ ...@@ -996,13 +991,10 @@
} }
@inproceedings{vzukov2018named, @inproceedings{vzukov2018named,
author = {Andrej Zukov Gregoric and title={Named entity recognition with parallel recurrent neural networks},
Yoram Bachrach and author={{\v{Z}}ukov-Gregori{\v{c}}, Andrej and Bachrach, Yoram and Coope, Sam},
Sam Coope}, pages={69--74},
title = {Named Entity Recognition With Parallel Recurrent Neural Networks}, year={2018}
pages = {69--74},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2018},
} }
@article{Li2020A, @article{Li2020A,
...@@ -1015,196 +1007,29 @@ ...@@ -1015,196 +1007,29 @@
year={2020}, year={2020},
} }
@article{devlin2019bert, @article{devlin2018bert,
title={Bert: Pre-training of deep bidirectional transformers for language understanding}, title={Bert: Pre-training of deep bidirectional transformers for language understanding},
author={Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina}, author={Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
year={2019}, journal={arXiv preprint arXiv:1810.04805},
pages = {4171--4186}, year={2018}
journal = {Annual Meeting of the Association for Computational Linguistics}, }
}
@inproceedings{conneau2019unsupervised, @article{conneau2019unsupervised,
author = {Alexis Conneau and title={Unsupervised cross-lingual representation learning at scale},
Kartikay Khandelwal and author={Conneau, Alexis and Khandelwal, Kartikay and Goyal, Naman and Chaudhary, Vishrav and Wenzek, Guillaume and Guzm{\'a}n, Francisco and Grave, Edouard and Ott, Myle and Zettlemoyer, Luke and Stoyanov, Veselin},
Naman Goyal and journal={arXiv preprint arXiv:1911.02116},
Vishrav Chaudhary and year={2019}
Guillaume Wenzek and
Francisco Guzm{\'{a}}n and
Edouard Grave and
Myle Ott and
Luke Zettlemoyer and
Veselin Stoyanov},
title = {Unsupervised Cross-lingual Representation Learning at Scale},
pages = {8440--8451},
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2020},
} }
@book{chomsky1993lectures, @book{chomsky1993lectures,
title={Lectures on government and binding: The Pisa lectures}, title={Lectures on government and binding: The Pisa lectures},
author={Chomsky, Noam}, author={Chomsky, Noam},
number={9},
year={1993}, year={1993},
publisher={Walter de Gruyter} publisher={Walter de Gruyter}
} }
% Sennrich, Haddow and Birch (2016): neural machine translation of rare words
% with subword units.
@inproceedings{DBLP:conf/acl/SennrichHB16a,
  title     = {Neural Machine Translation of Rare Words with Subword Units},
  author    = {Sennrich, Rico and Haddow, Barry and Birch, Alexandra},
  year      = {2016},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
% Chinese-language journal article (1998) on the maximum-probability word
% segmentation problem and its solution. Page range uses the en-dash form.
@article{刘挺1998最大概率分词问题及其解法,
  author  = {刘挺 and 吴岩 and 王开铸},
  title   = {最大概率分词问题及其解法},
  journal = {哈尔滨工业大学学报},
  number  = {06},
  pages   = {37--41},
  year    = {1998},
}
% Chinese-language journal article (2010) on a Chinese word segmentation
% method based on the maximum-probability segmentation algorithm.
% The article occupies a single page, so it is given as one page, not a range.
@article{丁洁2010基于最大概率分词算法的中文分词方法研究,
  author  = {丁洁},
  title   = {基于最大概率分词算法的中文分词方法研究},
  journal = {科技信息},
  number  = {21},
  pages   = {I0075},
  year    = {2010},
}
% Humphreys et al.: description of the LaSIE-II system as used for MUC-7.
% A system-description paper, so it is typed as inproceedings like the other
% MUC-7 entries in this file rather than as a book. MUC-7 took place in 1998;
% the citation key is left unchanged so existing citations keep resolving.
@inproceedings{1995University,
  author    = {Humphreys, Kevin and
               Gaizauskas, Robert J. and
               Azzam, Saliha and
               Huyck, Charles and
               Mitchell, Brian and
               Cunningham, Hamish and
               Wilks, Yorick},
  title     = {University of {Sheffield}: Description of the {LaSIE-II} System as Used for {MUC-7}},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {1998},
}
% Krupka and Hausman (1998): description of the NetOwl extractor system as
% used for MUC-7. Product names and acronyms are brace-protected so that
% sentence-casing styles do not lowercase them; the trademark sign is written
% as a LaTeX command instead of a raw glyph.
@inproceedings{krupka1998isoquest,
  author    = {Krupka, George and Hausman, Kevin},
  title     = {{IsoQuest} {Inc.}: Description of the {NetOwl\texttrademark} Extractor System as Used for {MUC-7}},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {1998},
}
% Black, Rinaldi and Mowatt (1998): description of the FACILE named-entity
% system used for MUC-7.
@inproceedings{DBLP:conf/muc/BlackRM98,
  title     = {{FACILE:} Description of the {NE} System Used for {MUC-7}},
  author    = {Black, William J. and Rinaldi, Fabio and Mowatt, David},
  year      = {1998},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
% Eddy (1996): review article on hidden Markov models.
% The title carries no trailing period (the style adds punctuation), and the
% page range is written out in full with an en-dash.
@article{1996Hidden,
  author  = {Eddy, Sean R.},
  title   = {Hidden {Markov} Models},
  journal = {Current Opinion in Structural Biology},
  volume  = {6},
  number  = {3},
  pages   = {361--365},
  year    = {1996},
}
% Lafferty, McCallum and Pereira (2001): conditional random fields for
% segmenting and labeling sequence data. The venue is stored in the publisher
% field, following this file's convention; its first word is capitalised so
% it prints consistently with the other venue names.
@inproceedings{lafferty2001conditional,
  author    = {Lafferty, John D. and McCallum, Andrew and Pereira, Fernando C. N.},
  title     = {Conditional Random Fields: Probabilistic Models for Segmenting and Labeling Sequence Data},
  pages     = {282--289},
  publisher = {Proceedings of the Eighteenth International Conference on Machine Learning},
  year      = {2001},
}
% Kapur (1989): book on maximum-entropy models in science and engineering.
@book{kapur1989maximum,
  author    = {Kapur, Jagat Narain},
  title     = {Maximum-entropy models in science and engineering},
  publisher = {John Wiley \& Sons},
  year      = {1989},
}
% Hearst et al. (1998): magazine article on support vector machines.
% Page range uses an en-dash, the umlaut in the last author's surname is
% written as a BibTeX special character, and the middle initial gets its period.
@article{1998Support,
  author  = {Hearst, Marti A. and
             Dumais, Susan T. and
             Osuna, Edgar and
             Platt, John and
             Sch{\"o}lkopf, Bernhard},
  title   = {Support Vector Machines},
  journal = {IEEE Intelligent Systems \& Their Applications},
  volume  = {13},
  number  = {4},
  pages   = {18--28},
  year    = {1998},
}
% Collobert et al. (2011): natural language processing (almost) from scratch.
% The accented given name is written with a LaTeX escape, matching how the
% same name is spelled elsewhere in this file; the page range uses an en-dash.
@article{2011Natural,
  author  = {Collobert, Ronan and
             Weston, Jason and
             Bottou, L{\'e}on and
             Karlen, Michael and
             Kavukcuoglu, Koray and
             Kuksa, Pavel},
  title   = {Natural Language Processing (almost) from Scratch},
  journal = {Journal of Machine Learning Research},
  volume  = {12},
  number  = {1},
  pages   = {2493--2537},
  year    = {2011},
}
% Manning, Schuetze and Raghavan (2008): textbook on information retrieval.
% Publisher name is capitalised as a proper noun; the title is stored in
% title case so styles can downcase it if they wish.
@book{manning2008introduction,
  author    = {Manning, Christopher D. and Sch{\"u}tze, Hinrich and Raghavan, Prabhakar},
  title     = {Introduction to Information Retrieval},
  publisher = {Cambridge University Press},
  year      = {2008},
}
% Berger, Della Pietra and Della Pietra (1996): a maximum entropy approach to
% natural language processing. The journal name is capitalised the same way as
% in the other Computational Linguistics entries of this file.
@article{berger1996maximum,
  author  = {Berger, Adam and Della Pietra, Stephen A. and Della Pietra, Vincent J.},
  title   = {A Maximum Entropy Approach to Natural Language Processing},
  journal = {Computational Linguistics},
  volume  = {22},
  number  = {1},
  pages   = {39--71},
  year    = {1996},
}
% Mitchell: the textbook "Machine Learning". It is a book, so the publishing
% house belongs in the publisher field (spelling corrected to McGraw-Hill)
% rather than in journal. The book was published in 1997; the citation key is
% left unchanged so existing citations keep resolving.
@book{mitchell1996m,
  author    = {Mitchell, Tom},
  title     = {Machine Learning},
  publisher = {McGraw-Hill},
  year      = {1997},
}
% Och and Ney (2002): discriminative training and maximum entropy models for
% statistical machine translation.
@inproceedings{DBLP:conf/acl/OchN02,
  title     = {Discriminative Training and Maximum Entropy Models for Statistical Machine Translation},
  author    = {Och, Franz Josef and Ney, Hermann},
  year      = {2002},
  pages     = {295--302},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
% Mohri, Pereira and Riley (2008): speech recognition with weighted
% finite-state transducers. A chapter in an edited handbook, so the containing
% book is named in booktitle (a required field for incollection).
@incollection{mohri2008speech,
  author    = {Mohri, Mehryar and Pereira, Fernando and Riley, Michael},
  title     = {Speech Recognition with Weighted Finite-State Transducers},
  booktitle = {Springer Handbook of Speech Processing},
  pages     = {559--584},
  publisher = {Springer},
  year      = {2008},
}
% Bellman (1966): article on dynamic programming in Science.
@article{bellman1966dynamic,
  author    = {Bellman, Richard},
  title     = {Dynamic programming},
  journal   = {Science},
  publisher = {American Association for the Advancement of Science},
  volume    = {153},
  number    = {3731},
  pages     = {34--37},
  year      = {1966},
}
%%%%% chapter 3------------------------------------------------------ %%%%% chapter 3------------------------------------------------------
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
...@@ -1647,7 +1472,6 @@ ...@@ -1647,7 +1472,6 @@
@inproceedings{DBLP:conf/wmt/Callison-BurchF07, @inproceedings{DBLP:conf/wmt/Callison-BurchF07,
author = {Chris Callison-Burch and author = {Chris Callison-Burch and
Cameron S. Fordyce and Cameron S. Fordyce and
Philipp Koehn and
Christof Monz and Christof Monz and
Josh Schroeder}, Josh Schroeder},
title = {(Meta-) Evaluation of Machine Translation}, title = {(Meta-) Evaluation of Machine Translation},
...@@ -1657,7 +1481,6 @@ ...@@ -1657,7 +1481,6 @@
} }
@inproceedings{DBLP:conf/wmt/Callison-BurchK12, @inproceedings{DBLP:conf/wmt/Callison-BurchK12,
author = {Chris Callison-Burch and author = {Chris Callison-Burch and
Philipp Koehn and
Christof Monz and Christof Monz and
Matt Post and Matt Post and
Radu Soricut and Radu Soricut and
...@@ -1681,7 +1504,6 @@ ...@@ -1681,7 +1504,6 @@
Barry Haddow and Barry Haddow and
Matthias Huck and Matthias Huck and
Chris Hokamp and Chris Hokamp and
Philipp Koehn and
Varvara Logacheva and Varvara Logacheva and
Christof Monz and Christof Monz and
Matteo Negri and Matteo Negri and
...@@ -2056,16 +1878,6 @@ ...@@ -2056,16 +1878,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics}, publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2013} year = {2013}
} }
% Fraser and Marcu (2007): measuring word alignment quality for statistical
% machine translation.
@article{DBLP:journals/coling/FraserM07,
  title   = {Measuring Word Alignment Quality for Statistical Machine Translation},
  author  = {Fraser, Alexander M. and Marcu, Daniel},
  year    = {2007},
  journal = {Computational Linguistics},
  volume  = {33},
  number  = {3},
  pages   = {293--303},
}
@inproceedings{DBLP:conf/acl/DeNeroK07, @inproceedings{DBLP:conf/acl/DeNeroK07,
author = {John DeNero and author = {John DeNero and
Dan Klein}, Dan Klein},
...@@ -2252,17 +2064,6 @@ ...@@ -2252,17 +2064,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics}, publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2005}, year = {2005},
} }
% Gu et al. (2018): non-autoregressive neural machine translation.
@inproceedings{2018Non,
  title     = {Non-Autoregressive Neural Machine Translation},
  author    = {Gu, Jiatao and
               Bradbury, James and
               Xiong, Caiming and
               Li, Victor O. K. and
               Socher, Richard},
  year      = {2018},
  publisher = {OpenReview.net},
}
%%%%% chapter 6------------------------------------------------------ %%%%% chapter 6------------------------------------------------------
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
...@@ -2297,15 +2098,6 @@ ...@@ -2297,15 +2098,6 @@
publisher = {AAAI Press}, publisher = {AAAI Press},
year = {2000} year = {2000}
} }
% Dyer, Chahuneau and Smith (2013): a simple, fast and effective
% reparameterization of IBM Model 2.
@inproceedings{dyer2013a,
  title     = {A Simple, Fast, and Effective Reparameterization of {IBM} Model 2},
  author    = {Dyer, Chris and Chahuneau, Victor and Smith, Noah A.},
  year      = {2013},
  pages     = {644--648},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
@inproceedings{taskar2005a, @inproceedings{taskar2005a,
author = {Benjamin Taskar and author = {Benjamin Taskar and
Simon Lacoste-Julien and Simon Lacoste-Julien and
...@@ -2366,13 +2158,7 @@ ...@@ -2366,13 +2158,7 @@
publisher = {Annual Meeting of the Association for Computational Linguistics}, publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2014} year = {2014}
} }
% Och (2003): minimum error rate training in statistical machine translation.
@inproceedings{och2003minimum,
  title     = {Minimum Error Rate Training in Statistical Machine Translation},
  author    = {Och, Franz Josef},
  year      = {2003},
  pages     = {160--167},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
@article{powell1964an, @article{powell1964an,
author = {M. J. D. Powell}, author = {M. J. D. Powell},
title = {An efficient method for finding the minimum of a function of several title = {An efficient method for finding the minimum of a function of several
...@@ -2605,7 +2391,6 @@ ...@@ -2605,7 +2391,6 @@
} }
@inproceedings{DBLP:conf/acl/CollinsKK05, @inproceedings{DBLP:conf/acl/CollinsKK05,
author = {Michael Collins and author = {Michael Collins and
Philipp Koehn and
Ivona Kucerova}, Ivona Kucerova},
title = {Clause Restructuring for Statistical Machine Translation}, title = {Clause Restructuring for Statistical Machine Translation},
pages = {531--540}, pages = {531--540},
...@@ -2721,16 +2506,6 @@ ...@@ -2721,16 +2506,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics}, publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2003} year = {2003}
} }
% Chiang, Marton and Resnik (2008): online large-margin training of syntactic
% and structural translation features.
@inproceedings{chiang2008online,
  title     = {Online Large-Margin Training of Syntactic and Structural Translation Features},
  author    = {Chiang, David and Marton, Yuval and Resnik, Philip},
  year      = {2008},
  pages     = {224--233},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
@inproceedings{Blunsom2008A, @inproceedings{Blunsom2008A,
author = {Phil Blunsom and author = {Phil Blunsom and
Trevor Cohn and Trevor Cohn and
...@@ -2811,15 +2586,6 @@ ...@@ -2811,15 +2586,6 @@
publisher={University of Southern California}, publisher={University of Southern California},
year={2006}, year={2006},
} }
% Zens and Ney (2008): improvements in dynamic-programming beam search for
% phrase-based statistical machine translation.
% The venue (stored in the publisher field, per this file's convention) is the
% IWSLT workshop indicated by the citation key, not a computer-architecture
% symposium.
@inproceedings{DBLP:conf/iwslt/ZensN08,
  author    = {Zens, Richard and Ney, Hermann},
  title     = {Improvements in Dynamic Programming Beam Search for Phrase-Based Statistical Machine Translation},
  pages     = {198--205},
  publisher = {International Workshop on Spoken Language Translation},
  year      = {2008},
}
@inproceedings{DBLP:conf/emnlp/SchwenkCF07, @inproceedings{DBLP:conf/emnlp/SchwenkCF07,
author = {Holger Schwenk and author = {Holger Schwenk and
Marta R. Costa-juss{\`{a}} and Marta R. Costa-juss{\`{a}} and
...@@ -2968,13 +2734,6 @@ ...@@ -2968,13 +2734,6 @@
pages = {1159--1187}, pages = {1159--1187},
year = {2012} year = {2012}
} }
% Chiang (2005): a hierarchical phrase-based model for statistical machine
% translation.
@inproceedings{chiang2005a,
  title     = {A Hierarchical Phrase-Based Model for Statistical Machine Translation},
  author    = {Chiang, David},
  year      = {2005},
  pages     = {263--270},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
@article{chiang2007hierarchical, @article{chiang2007hierarchical,
title={Hierarchical Phrase-Based Translation}, title={Hierarchical Phrase-Based Translation},
author ={Chiang David}, author ={Chiang David},
...@@ -3031,20 +2790,6 @@ ...@@ -3031,20 +2790,6 @@
year ={2006}, year ={2006},
publisher ={Computationally Hard Problems \& Joint Inference in Speech \& Language Processing} publisher ={Computationally Hard Problems \& Joint Inference in Speech \& Language Processing}
} }
% Galley et al. (2006): scalable inference and training of context-rich
% syntactic translation models.
@inproceedings{galley2006scalable,
  title     = {Scalable Inference and Training of Context-Rich Syntactic Translation Models},
  author    = {Galley, Michel and
               Graehl, Jonathan and
               Knight, Kevin and
               Marcu, Daniel and
               DeNeefe, Steve and
               Wang, Wei and
               Thayer, Ignacio},
  year      = {2006},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
@inproceedings{galley2004s, @inproceedings{galley2004s,
title ={What’s in a translation rule?}, title ={What’s in a translation rule?},
author ={Galley, Michel and Hopkins, Mark and Knight, Kevin and Marcu, Daniel}, author ={Galley, Michel and Hopkins, Mark and Knight, Kevin and Marcu, Daniel},
...@@ -3089,7 +2834,6 @@ ...@@ -3089,7 +2834,6 @@
} }
@inproceedings{marcu2006spmt, @inproceedings{marcu2006spmt,
author = {Daniel Marcu and author = {Daniel Marcu and
Wei Wang and
Abdessamad Echihabi and Abdessamad Echihabi and
Kevin Knight}, Kevin Knight},
title = {{SPMT:} Statistical Machine Translation with Syntactified Target Language title = {{SPMT:} Statistical Machine Translation with Syntactified Target Language
...@@ -3216,15 +2960,6 @@ ...@@ -3216,15 +2960,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics}, publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2011} year = {2011}
} }
% Zhang, Huang, Gildea and Knight (2006): synchronous binarization for
% machine translation.
@inproceedings{zhang2006synchronous,
  title     = {Synchronous Binarization for Machine Translation},
  author    = {Zhang, Hao and Huang, Liang and Gildea, Daniel and Knight, Kevin},
  year      = {2006},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
@inproceedings{DBLP:conf/acl/AlshawiBX97, @inproceedings{DBLP:conf/acl/AlshawiBX97,
author = {Hiyan Alshawi and author = {Hiyan Alshawi and
Adam L. Buchsbaum and Adam L. Buchsbaum and
...@@ -3304,7 +3039,6 @@ ...@@ -3304,7 +3039,6 @@
@inproceedings{DBLP:conf/emnlp/DeNeefeKWM07, @inproceedings{DBLP:conf/emnlp/DeNeefeKWM07,
author = {Steve DeNeefe and author = {Steve DeNeefe and
Kevin Knight and Kevin Knight and
Wei Wang and
Daniel Marcu}, Daniel Marcu},
title = {What Can Syntax-Based {MT} Learn from Phrase-Based MT?}, title = {What Can Syntax-Based {MT} Learn from Phrase-Based MT?},
pages = {755--763}, pages = {755--763},
...@@ -3319,30 +3053,6 @@ ...@@ -3319,30 +3053,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics}, publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2008} year = {2008}
} }
% Liu, Liu and Lin (2006): tree-to-string alignment template for statistical
% machine translation.
@inproceedings{DBLP:conf/acl/LiuLL06,
  title     = {Tree-to-String Alignment Template for Statistical Machine Translation},
  author    = {Liu, Yang and Liu, Qun and Lin, Shouxun},
  year      = {2006},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
% Zollmann and Venugopal (2006): syntax-augmented machine translation via
% chart parsing.
@inproceedings{zollmann2006syntax,
  title     = {Syntax Augmented Machine Translation via Chart Parsing},
  author    = {Zollmann, Andreas and Venugopal, Ashish},
  year      = {2006},
  pages     = {138--141},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
% Marton and Resnik (2008): soft syntactic constraints for hierarchical
% phrase-based translation. The title is reproduced exactly as recorded.
@inproceedings{DBLP:conf/acl/MartonR08,
  title     = {Soft Syntactic Constraints for Hierarchical Phrased-Based Translation},
  author    = {Marton, Yuval and Resnik, Philip},
  year      = {2008},
  pages     = {1003--1011},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
@INPROCEEDINGS{Nesson06inductionof, @INPROCEEDINGS{Nesson06inductionof,
author = {Rebecca Nesson and Stuart M. Shieber and Alexander Rush}, author = {Rebecca Nesson and Stuart M. Shieber and Alexander Rush},
title = {Induction of probabilistic synchronous tree-insertion grammars for machine translation}, title = {Induction of probabilistic synchronous tree-insertion grammars for machine translation},
...@@ -3355,15 +3065,6 @@ ...@@ -3355,15 +3065,6 @@
year = {2007}, year = {2007},
publisher = {Machine Translation Summit} publisher = {Machine Translation Summit}
} }
% Liu, Lu and Liu (2009): improving tree-to-tree translation with packed
% forests.
@inproceedings{DBLP:conf/acl/LiuLL09,
  title     = {Improving Tree-to-Tree Translation with Packed Forests},
  author    = {Liu, Yang and L{\"{u}}, Yajuan and Liu, Qun},
  year      = {2009},
  pages     = {558--566},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
@inproceedings{DBLP:conf/emnlp/WangKM07, @inproceedings{DBLP:conf/emnlp/WangKM07,
author = {Wei Wang and author = {Wei Wang and
Kevin Knight and Kevin Knight and
...@@ -3391,14 +3092,6 @@ ...@@ -3391,14 +3092,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics}, publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2008} year = {2008}
} }
% Zhu and Xiao (2011): improving decoding generalization for tree-to-string
% translation.
@inproceedings{DBLP:conf/acl/ZhuX11,
  title     = {Improving Decoding Generalization for Tree-to-String Translation},
  author    = {Zhu, Jingbo and Xiao, Tong},
  year      = {2011},
  pages     = {418--423},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
}
@inproceedings{DBLP:conf/emnlp/ZhangZZ11, @inproceedings{DBLP:conf/emnlp/ZhangZZ11,
author = {Jiajun Zhang and author = {Jiajun Zhang and
Feifei Zhai and Feifei Zhai and
...@@ -3783,11 +3476,6 @@ ...@@ -3783,11 +3476,6 @@
number = {1}, number = {1},
pages = {145--151}, pages = {145--151},
year = {1999}, year = {1999},
//url = {https://doi.org/10.1016/S0893-6080(98)00116-6},
//doi = {10.1016/S0893-6080(98)00116-6},
//timestamp = {Wed, 14 Nov 2018 10:30:22 +0100},
//biburl = {https://dblp.org/rec/journals/nn/Qian99.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{duchi2011adaptive, @article{duchi2011adaptive,
...@@ -3799,10 +3487,6 @@ ...@@ -3799,10 +3487,6 @@
volume = {12}, volume = {12},
pages = {2121--2159}, pages = {2121--2159},
year = {2011}, year = {2011},
//url = {http://dl.acm.org/citation.cfm?id=2021068},
//timestamp = {Wed, 10 Jul 2019 15:28:02 +0200},
//biburl = {https://dblp.org/rec/journals/jmlr/DuchiHS11.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{tieleman2012rmsprop, @article{tieleman2012rmsprop,
...@@ -3818,23 +3502,15 @@ ...@@ -3818,23 +3502,15 @@
@inproceedings{kingma2014adam, @inproceedings{kingma2014adam,
author = {Diederik P. Kingma and author = {Diederik P. Kingma and
Jimmy Ba}, Jimmy Ba},
//editor = {Yoshua Bengio and
Yann LeCun},
title = {Adam: {A} Method for Stochastic Optimization}, title = {Adam: {A} Method for Stochastic Optimization},
booktitle = {3rd International Conference on Learning Representations, {ICLR} 2015, booktitle = {3rd International Conference on Learning Representations, {ICLR} 2015,
San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings}, San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
year = {2015}, year = {2015},
//url = {http://arxiv.org/abs/1412.6980},
//timestamp = {Thu, 25 Jul 2019 14:25:37 +0200},
//biburl = {https://dblp.org/rec/journals/corr/KingmaB14.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{ioffe2015batch, @inproceedings{ioffe2015batch,
author = {Sergey Ioffe and author = {Sergey Ioffe and
Christian Szegedy}, Christian Szegedy},
//editor = {Francis R. Bach and
David M. Blei},
title = {Batch Normalization: Accelerating Deep Network Training by Reducing title = {Batch Normalization: Accelerating Deep Network Training by Reducing
Internal Covariate Shift}, Internal Covariate Shift},
booktitle = {Proceedings of the 32nd International Conference on Machine Learning, booktitle = {Proceedings of the 32nd International Conference on Machine Learning,
...@@ -3844,10 +3520,6 @@ ...@@ -3844,10 +3520,6 @@
pages = {448--456}, pages = {448--456},
publisher = {JMLR.org}, publisher = {JMLR.org},
year = {2015}, year = {2015},
//url = {http://proceedings.mlr.press/v37/ioffe15.html},
//timestamp = {Wed, 29 May 2019 08:41:45 +0200},
//biburl = {https://dblp.org/rec/conf/icml/IoffeS15.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{Ba2016LayerN, @article{Ba2016LayerN,
...@@ -3858,30 +3530,6 @@ ...@@ -3858,30 +3530,6 @@
journal = {CoRR}, journal = {CoRR},
volume = {abs/1607.06450}, volume = {abs/1607.06450},
year = {2016}, year = {2016},
//url = {http://arxiv.org/abs/1607.06450},
//archivePrefix = {arXiv},
//eprint = {1607.06450},
//timestamp = {Tue, 23 Jul 2019 17:33:23 +0200},
//biburl = {https://dblp.org/rec/journals/corr/BaKH16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
% He, Zhang, Ren and Sun (2016): deep residual learning for image recognition.
% BibTeX has no line-comment syntax inside an entry, so a leading double slash
% does not comment a field out; it merely creates a field with an odd name.
% The disabled fields are therefore kept under OPT-prefixed names, which
% styles ignore and which read unambiguously as "switched off".
@inproceedings{DBLP:journals/corr/HeZRS15,
  author       = {He, Kaiming and
                  Zhang, Xiangyu and
                  Ren, Shaoqing and
                  Sun, Jian},
  title        = {Deep Residual Learning for Image Recognition},
  booktitle    = {2016 {IEEE} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2016, Las Vegas, NV, USA, June 27-30, 2016},
  pages        = {770--778},
  publisher    = {{IEEE} Computer Society},
  year         = {2016},
  OPTurl       = {https://doi.org/10.1109/CVPR.2016.90},
  OPTdoi       = {10.1109/CVPR.2016.90},
  OPTtimestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
  OPTbiburl    = {https://dblp.org/rec/conf/cvpr/HeZRS16.bib},
  OPTbibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{mikolov2013distributed, @inproceedings{mikolov2013distributed,
...@@ -3890,20 +3538,12 @@ ...@@ -3890,20 +3538,12 @@
Kai Chen and Kai Chen and
Gregory S. Corrado and Gregory S. Corrado and
Jeffrey Dean}, Jeffrey Dean},
//editor = {Christopher J. C. Burges and
L{\'{e}}on Bottou and
Zoubin Ghahramani and
Kilian Q. Weinberger},
title = {Distributed Representations of Words and Phrases and their Compositionality}, title = {Distributed Representations of Words and Phrases and their Compositionality},
booktitle = {Advances in Neural Information Processing Systems 26: 27th Annual booktitle = {Advances in Neural Information Processing Systems 26: 27th Annual
Conference on Neural Information Processing Systems 2013. Proceedings Conference on Neural Information Processing Systems 2013. Proceedings
of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States}, of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
pages = {3111--3119}, pages = {3111--3119},
year = {2013}, year = {2013},
//url = {http://papers.nips.cc/paper/5021-distributed-representations-of-words-and-phrases-and-their-compositionality},
//timestamp = {Fri, 06 Mar 2020 17:00:12 +0100},
//biburl = {https://dblp.org/rec/conf/nips/MikolovSCCD13.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{guidotti2018survey, @article{guidotti2018survey,
...@@ -3919,39 +3559,23 @@ ...@@ -3919,39 +3559,23 @@
number = {5}, number = {5},
pages = {93:1--93:42}, pages = {93:1--93:42},
year = {2019}, year = {2019},
//url = {https://doi.org/10.1145/3236009},
//doi = {10.1145/3236009},
//timestamp = {Thu, 09 May 2019 16:06:21 +0200},
//biburl = {https://dblp.org/rec/journals/csur/GuidottiMRTGP19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{koh2017understanding, @inproceedings{koh2017understanding,
author = {Pang Wei Koh and author = {Pang Wei Koh and
Percy Liang}, Percy Liang},
//editor = {Doina Precup and
Yee Whye Teh},
title = {Understanding Black-box Predictions via Influence Functions}, title = {Understanding Black-box Predictions via Influence Functions},
booktitle = {Proceedings of the 34th International Conference on Machine Learning, booktitle = {Proceedings of the 34th International Conference on Machine Learning,
{ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017}, {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
series = {Proceedings of Machine Learning Research},
volume = {70}, volume = {70},
pages = {1885--1894}, pages = {1885--1894},
publisher = {{PMLR}}, publisher = {{PMLR}},
year = {2017}, year = {2017},
//url = {http://proceedings.mlr.press/v70/koh17a.html},
//timestamp = {Wed, 29 May 2019 08:41:45 +0200},
//biburl = {https://dblp.org/rec/conf/icml/KohL17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{arthur2016incorporating, @inproceedings{arthur2016incorporating,
author = {Philip Arthur and author = {Philip Arthur and
Graham Neubig and
Satoshi Nakamura}, Satoshi Nakamura},
//editor = {Jian Su and
Xavier Carreras and
Kevin Duh},
title = {Incorporating Discrete Translation Lexicons into Neural Machine Translation}, title = {Incorporating Discrete Translation Lexicons into Neural Machine Translation},
booktitle = {Proceedings of the 2016 Conference on Empirical Methods in Natural booktitle = {Proceedings of the 2016 Conference on Empirical Methods in Natural
Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4, Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4,
...@@ -3959,28 +3583,6 @@ ...@@ -3959,28 +3583,6 @@
pages = {1557--1567}, pages = {1557--1567},
publisher = {The Association for Computational Linguistics}, publisher = {The Association for Computational Linguistics},
year = {2016}, year = {2016},
//url = {https://doi.org/10.18653/v1/d16-1162},
//doi = {10.18653/v1/d16-1162},
//timestamp = {Tue, 28 Jan 2020 10:28:31 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/ArthurNN16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{zollmann2006syntax,
author = {Andreas Zollmann and
Ashish Venugopal},
//editor = {Philipp Koehn and
Christof Monz},
title = {Syntax Augmented Machine Translation via Chart Parsing},
booktitle = {Proceedings on the Workshop on Statistical Machine Translation, WMT@HLT-NAACL
2006, New York City, NY, USA, June 8-9, 2006},
pages = {138--141},
publisher = {Association for Computational Linguistics},
year = {2006},
//url = {https://www.aclweb.org/anthology/W06-3119/},
//timestamp = {Fri, 13 Sep 2019 13:08:46 +0200},
//biburl = {https://dblp.org/rec/conf/wmt/ZollmannV06.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@INPROCEEDINGS{charniak2003syntax, @INPROCEEDINGS{charniak2003syntax,
...@@ -4001,11 +3603,6 @@ ...@@ -4001,11 +3603,6 @@
2: Short Papers}, 2: Short Papers},
publisher = {The Association for Computer Linguistics}, publisher = {The Association for Computer Linguistics},
year = {2016}, year = {2016},
//url = {https://doi.org/10.18653/v1/p16-2049},
//doi = {10.18653/v1/p16-2049},
//timestamp = {Tue, 28 Jan 2020 10:27:31 +0100},
//biburl = {https://dblp.org/rec/conf/acl/StahlbergHWB16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{plank2013embedding, @inproceedings{plank2013embedding,
...@@ -4019,21 +3616,12 @@ ...@@ -4019,21 +3616,12 @@
pages = {1498--1507}, pages = {1498--1507},
publisher = {The Association for Computer Linguistics}, publisher = {The Association for Computer Linguistics},
year = {2013}, year = {2013},
//url = {https://www.aclweb.org/anthology/P13-1147/},
//timestamp = {Mon, 19 Aug 2019 18:10:05 +0200},
//biburl = {https://dblp.org/rec/conf/acl/PlankM13.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{perozzi2014deepwalk, @inproceedings{perozzi2014deepwalk,
author = {Bryan Perozzi and author = {Bryan Perozzi and
Rami Al-Rfou and Rami Al-Rfou and
Steven Skiena}, Steven Skiena},
//editor = {Sofus A. Macskassy and
Claudia Perlich and
Jure Leskovec and
Wei Wang and
Rayid Ghani},
title = {DeepWalk: online learning of social representations}, title = {DeepWalk: online learning of social representations},
booktitle = {The 20th {ACM} {SIGKDD} International Conference on Knowledge Discovery booktitle = {The 20th {ACM} {SIGKDD} International Conference on Knowledge Discovery
and Data Mining, {KDD} '14, New York, NY, {USA} - August 24 - 27, and Data Mining, {KDD} '14, New York, NY, {USA} - August 24 - 27,
...@@ -4041,17 +3629,11 @@ ...@@ -4041,17 +3629,11 @@
pages = {701--710}, pages = {701--710},
publisher = {{ACM}}, publisher = {{ACM}},
year = {2014}, year = {2014},
//url = {https://doi.org/10.1145/2623330.2623732},
//doi = {10.1145/2623330.2623732},
//timestamp = {Sun, 02 Jun 2019 21:11:52 +0200},
//biburl = {https://dblp.org/rec/conf/kdd/PerozziAS14.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{collobert2011natural, @article{collobert2011natural,
author = {Ronan Collobert and author = {Ronan Collobert and
Jason Weston and Jason Weston and
L{\'{e}}on Bottou and
Michael Karlen and Michael Karlen and
Koray Kavukcuoglu and Koray Kavukcuoglu and
Pavel P. Kuksa}, Pavel P. Kuksa},
...@@ -4060,10 +3642,6 @@ ...@@ -4060,10 +3642,6 @@
volume = {12}, volume = {12},
pages = {2493--2537}, pages = {2493--2537},
year = {2011}, year = {2011},
//url = {http://dl.acm.org/citation.cfm?id=2078186},
//timestamp = {Wed, 10 Jul 2019 15:28:44 +0200},
//biburl = {https://dblp.org/rec/journals/jmlr/CollobertWBKKK11.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{mccann2017learned, @inproceedings{mccann2017learned,
...@@ -4071,23 +3649,12 @@ ...@@ -4071,23 +3649,12 @@
James Bradbury and James Bradbury and
Caiming Xiong and Caiming Xiong and
Richard Socher}, Richard Socher},
//editor = {Isabelle Guyon and
Ulrike von Luxburg and
Samy Bengio and
Hanna M. Wallach and
Rob Fergus and
S. V. N. Vishwanathan and
Roman Garnett},
title = {Learned in Translation: Contextualized Word Vectors}, title = {Learned in Translation: Contextualized Word Vectors},
booktitle = {Advances in Neural Information Processing Systems 30: Annual Conference booktitle = {Advances in Neural Information Processing Systems 30: Annual Conference
on Neural Information Processing Systems 2017, 4-9 December 2017, on Neural Information Processing Systems 2017, 4-9 December 2017,
Long Beach, CA, {USA}}, Long Beach, CA, {USA}},
pages = {6294--6305}, pages = {6294--6305},
year = {2017}, year = {2017},
//url = {http://papers.nips.cc/paper/7209-learned-in-translation-contextualized-word-vectors},
//timestamp = {Fri, 06 Mar 2020 16:57:53 +0100},
//biburl = {https://dblp.org/rec/conf/nips/McCannBXS17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
%%%%% chapter 9------------------------------------------------------ %%%%% chapter 9------------------------------------------------------
...@@ -4110,16 +3677,9 @@ ...@@ -4110,16 +3677,9 @@
pages = {1370--1380}, pages = {1370--1380},
//publisher = {The Association for Computer Linguistics}, //publisher = {The Association for Computer Linguistics},
year = {2014}, year = {2014},
//url = {https://doi.org/10.3115/v1/p14-1129},
//doi = {10.3115/v1/p14-1129},
//timestamp = {Tue, 28 Jan 2020 10:27:56 +0100},
//biburl = {https://dblp.org/rec/conf/acl/DevlinZHLSM14.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Schwenk_continuousspace, @inproceedings{Schwenk_continuousspace,
author = {Holger Schwenk}, author = {Holger Schwenk},
//editor = {Martin Kay and
Christian Boitet},
title = {Continuous Space Translation Models for Phrase-Based Statistical Machine title = {Continuous Space Translation Models for Phrase-Based Statistical Machine
Translation}, Translation},
publisher = {{COLING} 2012, 24th International Conference on Computational Linguistics, publisher = {{COLING} 2012, 24th International Conference on Computational Linguistics,
...@@ -4128,10 +3688,6 @@ ...@@ -4128,10 +3688,6 @@
pages = {1071--1080}, pages = {1071--1080},
//publisher = {Indian Institute of Technology Bombay}, //publisher = {Indian Institute of Technology Bombay},
year = {2012}, year = {2012},
//url = {https://www.aclweb.org/anthology/C12-2104/},
//timestamp = {Wed, 18 Sep 2019 12:15:53 +0200},
//biburl = {https://dblp.org/rec/conf/coling/Schwenk12.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{kalchbrenner-blunsom-2013-recurrent, @inproceedings{kalchbrenner-blunsom-2013-recurrent,
author = {Nal Kalchbrenner and author = {Nal Kalchbrenner and
...@@ -4144,10 +3700,6 @@ ...@@ -4144,10 +3700,6 @@
pages = {1700--1709}, pages = {1700--1709},
//publisher = {{ACL}}, //publisher = {{ACL}},
year = {2013}, year = {2013},
//url = {https://www.aclweb.org/anthology/D13-1176/},
//timestamp = {Fri, 13 Sep 2019 13:08:45 +0200},
//biburl = {https://dblp.org/rec/conf/emnlp/KalchbrennerB13.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{HochreiterThe, @article{HochreiterThe,
author = {Sepp Hochreiter}, author = {Sepp Hochreiter},
...@@ -4159,11 +3711,6 @@ ...@@ -4159,11 +3711,6 @@
number = {2}, number = {2},
pages = {107--116}, pages = {107--116},
year = {1998}, year = {1998},
//url = {https://doi.org/10.1142/S0218488598000094},
//doi = {10.1142/S0218488598000094},
//timestamp = {Wed, 14 Nov 2018 10:41:42 +0100},
//biburl = {https://dblp.org/rec/journals/ijufks/Hochreiter98.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{BENGIO1994Learning, @article{BENGIO1994Learning,
author ={Y. {Bengio} and P. {Simard} and P. {Frasconi}}, author ={Y. {Bengio} and P. {Simard} and P. {Frasconi}},
...@@ -4183,23 +3730,12 @@ pages ={157-166}, ...@@ -4183,23 +3730,12 @@ pages ={157-166},
Aidan N. Gomez and Aidan N. Gomez and
Lukasz Kaiser and Lukasz Kaiser and
Illia Polosukhin}, Illia Polosukhin},
//editor = {Isabelle Guyon and
Ulrike von Luxburg and
Samy Bengio and
Hanna M. Wallach and
Rob Fergus and
S. V. N. Vishwanathan and
Roman Garnett},
title = {Attention is All you Need}, title = {Attention is All you Need},
publisher = {Advances in Neural Information Processing Systems 30: Annual Conference publisher = {Advances in Neural Information Processing Systems 30: Annual Conference
on Neural Information Processing Systems 2017, 4-9 December 2017, on Neural Information Processing Systems 2017, 4-9 December 2017,
Long Beach, CA, {USA}}, Long Beach, CA, {USA}},
pages = {5998--6008}, pages = {5998--6008},
year = {2017}, year = {2017},
//url = {http://papers.nips.cc/paper/7181-attention-is-all-you-need},
//timestamp = {Fri, 06 Mar 2020 17:00:11 +0100},
//biburl = {https://dblp.org/rec/conf/nips/VaswaniSPUJGKP17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{StahlbergNeural, @article{StahlbergNeural,
author = {Felix Stahlberg}, author = {Felix Stahlberg},
...@@ -4207,21 +3743,12 @@ pages ={157-166}, ...@@ -4207,21 +3743,12 @@ pages ={157-166},
journal = {CoRR}, journal = {CoRR},
volume = {abs/1912.02047}, volume = {abs/1912.02047},
year = {2019}, year = {2019},
//url = {http://arxiv.org/abs/1912.02047},
//archivePrefix = {arXiv},
//eprint = {1912.02047},
//timestamp = {Thu, 02 Jan 2020 18:08:18 +0100},
//biburl = {https://dblp.org/rec/journals/corr/abs-1912-02047.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Bentivogli2016NeuralVP, @inproceedings{Bentivogli2016NeuralVP,
author = {Luisa Bentivogli and author = {Luisa Bentivogli and
Arianna Bisazza and Arianna Bisazza and
Mauro Cettolo and Mauro Cettolo and
Marcello Federico}, Marcello Federico},
//editor = {Jian Su and
Xavier Carreras and
Kevin Duh},
title = {Neural versus Phrase-Based Machine Translation Quality: a Case Study}, title = {Neural versus Phrase-Based Machine Translation Quality: a Case Study},
publisher = {Proceedings of the 2016 Conference on Empirical Methods in Natural publisher = {Proceedings of the 2016 Conference on Empirical Methods in Natural
Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4, Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4,
...@@ -4229,11 +3756,6 @@ pages ={157-166}, ...@@ -4229,11 +3756,6 @@ pages ={157-166},
pages = {257--267}, pages = {257--267},
//publisher = {The Association for Computational Linguistics}, //publisher = {The Association for Computational Linguistics},
year = {2016}, year = {2016},
//url = {https://doi.org/10.18653/v1/d16-1025},
//doi = {10.18653/v1/d16-1025},
//timestamp = {Tue, 28 Jan 2020 10:28:39 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/BentivogliBCF16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{Hassan2018AchievingHP, @article{Hassan2018AchievingHP,
author = {Hany Hassan and author = {Hany Hassan and
...@@ -4264,12 +3786,6 @@ pages ={157-166}, ...@@ -4264,12 +3786,6 @@ pages ={157-166},
journal = {CoRR}, journal = {CoRR},
volume = {abs/1803.05567}, volume = {abs/1803.05567},
year = {2018}, year = {2018},
//url = {http://arxiv.org/abs/1803.05567},
//archivePrefix = {arXiv},
//eprint = {1803.05567},
//timestamp = {Mon, 13 Aug 2018 16:47:23 +0200},
//biburl = {https://dblp.org/rec/journals/corr/abs-1803-05567.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{WangLearning, @inproceedings{WangLearning,
author = {Qiang Wang and author = {Qiang Wang and
...@@ -4279,9 +3795,6 @@ pages ={157-166}, ...@@ -4279,9 +3795,6 @@ pages ={157-166},
Changliang Li and Changliang Li and
Derek F. Wong and Derek F. Wong and
Lidia S. Chao}, Lidia S. Chao},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {Learning Deep Transformer Models for Machine Translation}, title = {Learning Deep Transformer Models for Machine Translation},
publisher = {Proceedings of the 57th Conference of the Association for Computational publisher = {Proceedings of the 57th Conference of the Association for Computational
Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019, Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
...@@ -4289,11 +3802,6 @@ pages ={157-166}, ...@@ -4289,11 +3802,6 @@ pages ={157-166},
pages = {1810--1822}, pages = {1810--1822},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2019}, year = {2019},
//url = {https://doi.org/10.18653/v1/p19-1176},
//doi = {10.18653/v1/p19-1176},
//timestamp = {Tue, 28 Jan 2020 10:27:53 +0100},
//biburl = {https://dblp.org/rec/conf/acl/WangLXZLWC19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{Li2020NeuralMT, @article{Li2020NeuralMT,
author = {Yanyang Li and author = {Yanyang Li and
...@@ -4305,12 +3813,6 @@ pages ={157-166}, ...@@ -4305,12 +3813,6 @@ pages ={157-166},
journal = {CoRR}, journal = {CoRR},
volume = {abs/2002.06546}, volume = {abs/2002.06546},
year = {2020}, year = {2020},
//url = {https://arxiv.org/abs/2002.06546},
//archivePrefix = {arXiv},
//eprint = {2002.06546},
//timestamp = {Mon, 02 Mar 2020 16:46:06 +0100},
//biburl = {https://dblp.org/rec/journals/corr/abs-2002-06546.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{HochreiterLong, @article{HochreiterLong,
author = {Hochreiter, Sepp and Schmidhuber, Jürgen}, author = {Hochreiter, Sepp and Schmidhuber, Jürgen},
...@@ -4320,7 +3822,6 @@ pages ={157-166}, ...@@ -4320,7 +3822,6 @@ pages ={157-166},
title = {Long Short-term Memory}, title = {Long Short-term Memory},
volume = {9}, volume = {9},
journal = {Neural computation}, journal = {Neural computation},
//doi = {10.1162/neco.1997.9.8.1735}
} }
@inproceedings{Cho2014Learning, @inproceedings{Cho2014Learning,
author = {Kyunghyun Cho and author = {Kyunghyun Cho and
...@@ -4330,9 +3831,6 @@ pages ={157-166}, ...@@ -4330,9 +3831,6 @@ pages ={157-166},
Fethi Bougares and Fethi Bougares and
Holger Schwenk and Holger Schwenk and
Yoshua Bengio}, Yoshua Bengio},
//editor = {Alessandro Moschitti and
Bo Pang and
Walter Daelemans},
title = {Learning Phrase Representations using {RNN} Encoder-Decoder for Statistical title = {Learning Phrase Representations using {RNN} Encoder-Decoder for Statistical
Machine Translation}, Machine Translation},
publisher = {Proceedings of the 2014 Conference on Empirical Methods in Natural publisher = {Proceedings of the 2014 Conference on Empirical Methods in Natural
...@@ -4341,37 +3839,24 @@ pages ={157-166}, ...@@ -4341,37 +3839,24 @@ pages ={157-166},
pages = {1724--1734}, pages = {1724--1734},
//publisher = {{ACL}}, //publisher = {{ACL}},
year = {2014}, year = {2014},
//url = {https://doi.org/10.3115/v1/d14-1179},
//doi = {10.3115/v1/d14-1179},
//timestamp = {Tue, 28 Jan 2020 10:28:17 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/ChoMGBBSB14.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{pmlr-v9-glorot10a, @inproceedings{pmlr-v9-glorot10a,
author = {Xavier Glorot and author = {Xavier Glorot and
Yoshua Bengio}, Yoshua Bengio},
//editor = {Yee Whye Teh and
D. Mike Titterington},
title = {Understanding the difficulty of training deep feedforward neural networks}, title = {Understanding the difficulty of training deep feedforward neural networks},
publisher = {Proceedings of the Thirteenth International Conference on Artificial publisher = {Proceedings of the Thirteenth International Conference on Artificial
Intelligence and Statistics, {AISTATS} 2010, Chia Laguna Resort, Sardinia, Intelligence and Statistics, {AISTATS} 2010, Chia Laguna Resort, Sardinia,
Italy, May 13-15, 2010}, Italy, May 13-15, 2010},
//series = {{JMLR} Proceedings},
volume = {9}, volume = {9},
pages = {249--256}, pages = {249--256},
//publisher = {JMLR.org}, //publisher = {JMLR.org},
year = {2010}, year = {2010},
//url = {http://proceedings.mlr.press/v9/glorot10a.html},
//timestamp = {Wed, 29 May 2019 08:41:47 +0200},
//biburl = {https://dblp.org/rec/journals/jmlr/GlorotB10.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{xiao2017fast, @inproceedings{xiao2017fast,
author = {Tong Xiao and author = {Tong Xiao and
Jingbo Zhu and Jingbo Zhu and
Tongran Liu and Tongran Liu and
Chunliang Zhang}, Chunliang Zhang},
//editor = {Carles Sierra},
title = {Fast Parallel Training of Neural Language Models}, title = {Fast Parallel Training of Neural Language Models},
publisher = {Proceedings of the Twenty-Sixth International Joint Conference on publisher = {Proceedings of the Twenty-Sixth International Joint Conference on
Artificial Intelligence, {IJCAI} 2017, Melbourne, Australia, August Artificial Intelligence, {IJCAI} 2017, Melbourne, Australia, August
...@@ -4379,11 +3864,6 @@ pages ={157-166}, ...@@ -4379,11 +3864,6 @@ pages ={157-166},
pages = {4193--4199}, pages = {4193--4199},
//publisher = {ijcai.org}, //publisher = {ijcai.org},
year = {2017}, year = {2017},
//url = {https://doi.org/10.24963/ijcai.2017/586},
//doi = {10.24963/ijcai.2017/586},
//timestamp = {Tue, 20 Aug 2019 16:17:12 +0200},
//biburl = {https://dblp.org/rec/conf/ijcai/XiaoZLZ17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Gu2017NonAutoregressiveNM, @inproceedings{Gu2017NonAutoregressiveNM,
author = {Jiatao Gu and author = {Jiatao Gu and
...@@ -4392,14 +3872,8 @@ pages ={157-166}, ...@@ -4392,14 +3872,8 @@ pages ={157-166},
Victor O. K. Li and Victor O. K. Li and
Richard Socher}, Richard Socher},
title = {Non-Autoregressive Neural Machine Translation}, title = {Non-Autoregressive Neural Machine Translation},
publisher = {6th International Conference on Learning Representations, {ICLR} 2018, publisher = {International Conference on Learning Representations},
Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
//publisher = {OpenReview.net},
year = {2018}, year = {2018},
//url = {https://openreview.net/forum?id=B1l8BtlCb},
//timestamp = {Thu, 25 Jul 2019 14:25:57 +0200},
//biburl = {https://dblp.org/rec/conf/iclr/Gu0XLS18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{li-etal-2018-simple, @inproceedings{li-etal-2018-simple,
author = {Yanyang Li and author = {Yanyang Li and
...@@ -4408,8 +3882,6 @@ pages ={157-166}, ...@@ -4408,8 +3882,6 @@ pages ={157-166},
Qiang Wang and Qiang Wang and
Changming Xu and Changming Xu and
Jingbo Zhu}, Jingbo Zhu},
//editor = {Iryna Gurevych and
Yusuke Miyao},
title = {A Simple and Effective Approach to Coverage-Aware Neural Machine Translation}, title = {A Simple and Effective Approach to Coverage-Aware Neural Machine Translation},
publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
...@@ -4417,11 +3889,6 @@ pages ={157-166}, ...@@ -4417,11 +3889,6 @@ pages ={157-166},
pages = {292--297}, pages = {292--297},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2018}, year = {2018},
//url = {https://www.aclweb.org/anthology/P18-2047/},
//doi = {10.18653/v1/P18-2047},
//timestamp = {Mon, 16 Sep 2019 13:46:41 +0200},
//biburl = {https://dblp.org/rec/conf/acl/LiXLWXZ18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{TuModeling, @inproceedings{TuModeling,
author = {Zhaopeng Tu and author = {Zhaopeng Tu and
...@@ -4435,17 +3902,11 @@ pages ={157-166}, ...@@ -4435,17 +3902,11 @@ pages ={157-166},
1: Long Papers}, 1: Long Papers},
//publisher = {The Association for Computer Linguistics}, //publisher = {The Association for Computer Linguistics},
year = {2016}, year = {2016},
//url = {https://doi.org/10.18653/v1/p16-1008},
//doi = {10.18653/v1/p16-1008},
//timestamp = {Tue, 28 Jan 2020 10:27:13 +0100},
//biburl = {https://dblp.org/rec/conf/acl/TuLLLL16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/SennrichFCBHHJL17, @inproceedings{DBLP:journals/corr/SennrichFCBHHJL17,
author = {Rico Sennrich and author = {Rico Sennrich and
Orhan Firat and Orhan Firat and
Kyunghyun Cho and Kyunghyun Cho and
Alexandra Birch and
Barry Haddow and Barry Haddow and
Julian Hitschler and Julian Hitschler and
Marcin Junczys-Dowmunt and Marcin Junczys-Dowmunt and
...@@ -4453,8 +3914,6 @@ pages ={157-166}, ...@@ -4453,8 +3914,6 @@ pages ={157-166},
Antonio Valerio Miceli Barone and Antonio Valerio Miceli Barone and
Jozef Mokry and Jozef Mokry and
Maria Nadejde}, Maria Nadejde},
//editor = {Andre Martins and
Anselmo Pe{\~{n}}as},
title = {Nematus: a Toolkit for Neural Machine Translation}, title = {Nematus: a Toolkit for Neural Machine Translation},
publisher = {Proceedings of the 15th Conference of the European Chapter of the publisher = {Proceedings of the 15th Conference of the European Chapter of the
Association for Computational Linguistics, {EACL} 2017, Valencia, Association for Computational Linguistics, {EACL} 2017, Valencia,
...@@ -4462,18 +3921,10 @@ pages ={157-166}, ...@@ -4462,18 +3921,10 @@ pages ={157-166},
pages = {65--68}, pages = {65--68},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2017}, year = {2017},
//url = {https://doi.org/10.18653/v1/e17-3017},
//doi = {10.18653/v1/e17-3017},
//timestamp = {Tue, 28 Jan 2020 10:31:12 +0100},
//biburl = {https://dblp.org/rec/conf/eacl/SennrichFCBHHJL17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/abs-1905-13324, @inproceedings{DBLP:journals/corr/abs-1905-13324,
author = {Biao Zhang and author = {Biao Zhang and
Rico Sennrich}, Rico Sennrich},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {A Lightweight Recurrent Network for Sequence Modeling}, title = {A Lightweight Recurrent Network for Sequence Modeling},
publisher = {Proceedings of the 57th Conference of the Association for Computational publisher = {Proceedings of the 57th Conference of the Association for Computational
Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019, Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
...@@ -4481,11 +3932,6 @@ pages ={157-166}, ...@@ -4481,11 +3932,6 @@ pages ={157-166},
pages = {1538--1548}, pages = {1538--1548},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2019}, year = {2019},
//url = {https://doi.org/10.18653/v1/p19-1149},
//doi = {10.18653/v1/p19-1149},
//timestamp = {Tue, 28 Jan 2020 10:28:03 +0100},
//biburl = {https://dblp.org/rec/conf/acl/ZhangS19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{Lei2017TrainingRA, @article{Lei2017TrainingRA,
author = {Tao Lei and author = {Tao Lei and
...@@ -4495,12 +3941,6 @@ pages ={157-166}, ...@@ -4495,12 +3941,6 @@ pages ={157-166},
journal = {CoRR}, journal = {CoRR},
volume = {abs/1709.02755}, volume = {abs/1709.02755},
year = {2017}, year = {2017},
//url = {http://arxiv.org/abs/1709.02755},
//archivePrefix = {arXiv},
//eprint = {1709.02755},
//timestamp = {Mon, 13 Aug 2018 16:46:29 +0200},
//biburl = {https://dblp.org/rec/journals/corr/abs-1709-02755.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Zhang2018SimplifyingNM, @inproceedings{Zhang2018SimplifyingNM,
author = {Biao Zhang and author = {Biao Zhang and
...@@ -4508,10 +3948,6 @@ pages ={157-166}, ...@@ -4508,10 +3948,6 @@ pages ={157-166},
Jinsong Su and Jinsong Su and
Qian Lin and Qian Lin and
Huiji Zhang}, Huiji Zhang},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Simplifying Neural Machine Translation with Addition-Subtraction Twin-Gated title = {Simplifying Neural Machine Translation with Addition-Subtraction Twin-Gated
Recurrent Networks}, Recurrent Networks},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
...@@ -4519,10 +3955,6 @@ pages ={157-166}, ...@@ -4519,10 +3955,6 @@ pages ={157-166},
pages = {4273--4283}, pages = {4273--4283},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2018}, year = {2018},
//url = {https://www.aclweb.org/anthology/D18-1459/},
//timestamp = {Fri, 13 Sep 2019 13:08:45 +0200},
//biburl = {https://dblp.org/rec/conf/emnlp/ZhangXSLZ18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Liu_2019_CVPR, @inproceedings{Liu_2019_CVPR,
author = {Shikun Liu and author = {Shikun Liu and
...@@ -4534,50 +3966,23 @@ pages ={157-166}, ...@@ -4534,50 +3966,23 @@ pages ={157-166},
pages = {1871--1880}, pages = {1871--1880},
//publisher = {Computer Vision Foundation / {IEEE}}, //publisher = {Computer Vision Foundation / {IEEE}},
year = {2019}, year = {2019},
//url = {http://openaccess.thecvf.com/content\_CVPR\_2019/html/Liu\_End-To-End\_Multi-Task\_Learning\_With\_Attention\_CVPR\_2019\_paper.html},
//doi = {10.1109/CVPR.2019.00197},
//timestamp = {Mon, 20 Jan 2020 15:36:04 +0100},
//biburl = {https://dblp.org/rec/conf/cvpr/LiuJD19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/abs-1811-00498, @inproceedings{DBLP:journals/corr/abs-1811-00498,
author = {Ra{\'{u}}l V{\'{a}}zquez and author = {Ra{\'{u}}l V{\'{a}}zquez and
Alessandro Raganato and Alessandro Raganato and
J{\"{o}}rg Tiedemann and J{\"{o}}rg Tiedemann and
Mathias Creutz}, Mathias Creutz},
//editor = {Isabelle Augenstein and
Spandana Gella and
Sebastian Ruder and
Katharina Kann and
Burcu Can and
Johannes Welbl and
Alexis Conneau and
Xiang Ren and
Marek Rei},
title = {Multilingual {NMT} with a Language-Independent Attention Bridge}, title = {Multilingual {NMT} with a Language-Independent Attention Bridge},
publisher = {Proceedings of the 4th Workshop on Representation Learning for NLP, publisher = {Proceedings of the 4th Workshop on Representation Learning for NLP,
RepL4NLP@ACL 2019, Florence, Italy, August 2, 2019}, RepL4NLP@ACL 2019, Florence, Italy, August 2, 2019},
pages = {33--39}, pages = {33--39},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2019}, year = {2019},
//url = {https://doi.org/10.18653/v1/w19-4305},
//doi = {10.18653/v1/w19-4305},
//timestamp = {Fri, 27 Mar 2020 08:52:29 +0100},
//biburl = {https://dblp.org/rec/conf/rep4nlp/VazquezRTC19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{MoradiInterrogating, @inproceedings{MoradiInterrogating,
author = {Pooya Moradi and author = {Pooya Moradi and
Nishant Kambhatla and Nishant Kambhatla and
Anoop Sarkar}, Anoop Sarkar},
//editor = {Alexandra Birch and
Andrew M. Finch and
Hiroaki Hayashi and
Ioannis Konstas and
Thang Luong and
Graham Neubig and
Yusuke Oda and
Katsuhito Sudoh},
title = {Interrogating the Explanatory Power of Attention in Neural Machine title = {Interrogating the Explanatory Power of Attention in Neural Machine
Translation}, Translation},
publisher = {Proceedings of the 3rd Workshop on Neural Generation and Translation@EMNLP-IJCNLP publisher = {Proceedings of the 3rd Workshop on Neural Generation and Translation@EMNLP-IJCNLP
...@@ -4585,11 +3990,6 @@ pages ={157-166}, ...@@ -4585,11 +3990,6 @@ pages ={157-166},
pages = {221--230}, pages = {221--230},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2019}, year = {2019},
//url = {https://doi.org/10.18653/v1/D19-5624},
//doi = {10.18653/v1/D19-5624},
//timestamp = {Tue, 24 Mar 2020 15:04:09 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/MoradiKS19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{WangNeural, @inproceedings{WangNeural,
author = {Xing Wang and author = {Xing Wang and
...@@ -4598,18 +3998,12 @@ pages ={157-166}, ...@@ -4598,18 +3998,12 @@ pages ={157-166},
Hang Li and Hang Li and
Deyi Xiong and Deyi Xiong and
Min Zhang}, Min Zhang},
//editor = {Satinder P. Singh and
Shaul Markovitch},
title = {Neural Machine Translation Advised by Statistical Machine Translation}, title = {Neural Machine Translation Advised by Statistical Machine Translation},
publisher = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, publisher = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
February 4-9, 2017, San Francisco, California, {USA}}, February 4-9, 2017, San Francisco, California, {USA}},
pages = {3330--3336}, pages = {3330--3336},
//publisher = {{AAAI} Press}, //publisher = {{AAAI} Press},
year = {2017}, year = {2017},
//url = {http://aaai.org/ocs/index.php/AAAI/AAAI17/paper/view/14451},
//timestamp = {Tue, 15 Jan 2019 11:48:13 +0100},
//biburl = {https://dblp.org/rec/conf/aaai/WangLTLXZ17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/abs-1905-09418, @inproceedings{DBLP:journals/corr/abs-1905-09418,
author = {Elena Voita and author = {Elena Voita and
...@@ -4617,9 +4011,6 @@ pages ={157-166}, ...@@ -4617,9 +4011,6 @@ pages ={157-166},
Fedor Moiseev and Fedor Moiseev and
Rico Sennrich and Rico Sennrich and
Ivan Titov}, Ivan Titov},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {Analyzing Multi-Head Self-Attention: Specialized Heads Do the Heavy title = {Analyzing Multi-Head Self-Attention: Specialized Heads Do the Heavy
Lifting, the Rest Can Be Pruned}, Lifting, the Rest Can Be Pruned},
publisher = {Proceedings of the 57th Conference of the Association for Computational publisher = {Proceedings of the 57th Conference of the Association for Computational
...@@ -4628,11 +4019,6 @@ pages ={157-166}, ...@@ -4628,11 +4019,6 @@ pages ={157-166},
pages = {5797--5808}, pages = {5797--5808},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2019}, year = {2019},
//url = {https://doi.org/10.18653/v1/p19-1580},
//doi = {10.18653/v1/p19-1580},
//timestamp = {Tue, 28 Jan 2020 10:27:29 +0100},
//biburl = {https://dblp.org/rec/conf/acl/VoitaTMST19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Xiao2019SharingAW, @inproceedings{Xiao2019SharingAW,
author = {Tong Xiao and author = {Tong Xiao and
...@@ -4640,7 +4026,6 @@ pages ={157-166}, ...@@ -4640,7 +4026,6 @@ pages ={157-166},
Jingbo Zhu and Jingbo Zhu and
Zhengtao Yu and Zhengtao Yu and
Tongran Liu}, Tongran Liu},
//editor = {Sarit Kraus},
title = {Sharing Attention Weights for Fast Transformer}, title = {Sharing Attention Weights for Fast Transformer},
publisher = {Proceedings of the Twenty-Eighth International Joint Conference on publisher = {Proceedings of the Twenty-Eighth International Joint Conference on
Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16, Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16,
...@@ -4648,11 +4033,6 @@ pages ={157-166}, ...@@ -4648,11 +4033,6 @@ pages ={157-166},
pages = {5292--5298}, pages = {5292--5298},
//publisher = {ijcai.org}, //publisher = {ijcai.org},
year = {2019}, year = {2019},
//url = {https://doi.org/10.24963/ijcai.2019/735},
//doi = {10.24963/ijcai.2019/735},
//timestamp = {Tue, 20 Aug 2019 16:18:18 +0200},
//biburl = {https://dblp.org/rec/conf/ijcai/XiaoLZ0L19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Yang2017TowardsBH, @inproceedings{Yang2017TowardsBH,
author = {Baosong Yang and author = {Baosong Yang and
...@@ -4660,9 +4040,6 @@ pages ={157-166}, ...@@ -4660,9 +4040,6 @@ pages ={157-166},
Tong Xiao and Tong Xiao and
Lidia S. Chao and Lidia S. Chao and
Jingbo Zhu}, Jingbo Zhu},
//editor = {Martha Palmer and
Rebecca Hwa and
Sebastian Riedel},
title = {Towards Bidirectional Hierarchical Representations for Attention-based title = {Towards Bidirectional Hierarchical Representations for Attention-based
Neural Machine Translation}, Neural Machine Translation},
publisher = {Proceedings of the 2017 Conference on Empirical Methods in Natural publisher = {Proceedings of the 2017 Conference on Empirical Methods in Natural
...@@ -4671,20 +4048,11 @@ pages ={157-166}, ...@@ -4671,20 +4048,11 @@ pages ={157-166},
pages = {1432--1441}, pages = {1432--1441},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2017}, year = {2017},
//url = {https://doi.org/10.18653/v1/d17-1150},
//doi = {10.18653/v1/d17-1150},
//timestamp = {Tue, 28 Jan 2020 10:28:08 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/YangWXCZ17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Wang2019TreeTI, @inproceedings{Wang2019TreeTI,
author = {Yau-Shian Wang and author = {Yau-Shian Wang and
Hung-yi Lee and Hung-yi Lee and
Yun-Nung Chen}, Yun-Nung Chen},
//editor = {Kentaro Inui and
Jing Jiang and
Vincent Ng and
Xiaojun Wan},
title = {Tree Transformer: Integrating Tree Structures into Self-Attention}, title = {Tree Transformer: Integrating Tree Structures into Self-Attention},
publisher = {Proceedings of the 2019 Conference on Empirical Methods in Natural publisher = {Proceedings of the 2019 Conference on Empirical Methods in Natural
Language Processing and the 9th International Joint Conference on Language Processing and the 9th International Joint Conference on
...@@ -4693,51 +4061,29 @@ pages ={157-166}, ...@@ -4693,51 +4061,29 @@ pages ={157-166},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
pages = {1061--1070}, pages = {1061--1070},
year = {2019}, year = {2019},
//url = {https://doi.org/10.18653/v1/D19-1098},
//doi = {10.18653/v1/D19-1098},
//timestamp = {Thu, 12 Dec 2019 13:23:46 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/WangLC19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/abs-1809-01854, @inproceedings{DBLP:journals/corr/abs-1809-01854,
author = {Jetic Gu and author = {Jetic Gu and
Hassan S. Shavarani and Hassan S. Shavarani and
Anoop Sarkar}, Anoop Sarkar},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Top-down Tree Structured Decoding with Syntactic Connections for Neural Machine Translation and Parsing}, title = {Top-down Tree Structured Decoding with Syntactic Connections for Neural Machine Translation and Parsing},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
Language Processing, Brussels, Belgium, October 31 - November 4, 2018}, Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
pages = {401--413}, pages = {401--413},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2018}, year = {2018},
//url = {https://doi.org/10.18653/v1/d18-1037},
//doi = {10.18653/v1/d18-1037},
//timestamp = {Tue, 28 Jan 2020 10:28:48 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/GuSS18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/abs-1808-09374, @inproceedings{DBLP:journals/corr/abs-1808-09374,
author = {Xinyi Wang and author = {Xinyi Wang and
Hieu Pham and Hieu Pham and
Pengcheng Yin and Pengcheng Yin and
Graham Neubig}, Graham Neubig},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {A Tree-based Decoder for Neural Machine Translation}, title = {A Tree-based Decoder for Neural Machine Translation},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
Language Processing, Brussels, Belgium, October 31 - November 4, 2018}, Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
pages = {4772--4777}, pages = {4772--4777},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2018}, year = {2018},
//url = {https://www.aclweb.org/anthology/D18-1509/},
//timestamp = {Fri, 13 Sep 2019 13:08:45 +0200},
//biburl = {https://dblp.org/rec/conf/emnlp/WangPYN18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{DBLP:journals/corr/ZhangZ16c, @article{DBLP:journals/corr/ZhangZ16c,
author = {Jiajun Zhang and author = {Jiajun Zhang and
...@@ -4746,12 +4092,6 @@ pages ={157-166}, ...@@ -4746,12 +4092,6 @@ pages ={157-166},
journal = {CoRR}, journal = {CoRR},
volume = {abs/1610.07272}, volume = {abs/1610.07272},
year = {2016}, year = {2016},
//url = {http://arxiv.org/abs/1610.07272},
//archivePrefix = {arXiv},
//eprint = {1610.07272},
//timestamp = {Mon, 13 Aug 2018 16:47:14 +0200},
//biburl = {https://dblp.org/rec/journals/corr/ZhangZ16c.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{Dai2019TransformerXLAL, @article{Dai2019TransformerXLAL,
author = {Zihang Dai and author = {Zihang Dai and
...@@ -4764,12 +4104,6 @@ pages ={157-166}, ...@@ -4764,12 +4104,6 @@ pages ={157-166},
journal = {CoRR}, journal = {CoRR},
volume = {abs/1901.02860}, volume = {abs/1901.02860},
year = {2019}, year = {2019},
//url = {http://arxiv.org/abs/1901.02860},
//archivePrefix = {arXiv},
//eprint = {1901.02860},
//timestamp = {Fri, 01 Feb 2019 13:39:59 +0100},
//biburl = {https://dblp.org/rec/journals/corr/abs-1901-02860.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{li-etal-2019-word, @inproceedings{li-etal-2019-word,
author = {Xintong Li and author = {Xintong Li and
...@@ -4777,9 +4111,6 @@ pages ={157-166}, ...@@ -4777,9 +4111,6 @@ pages ={157-166},
Lemao Liu and Lemao Liu and
Max Meng and Max Meng and
Shuming Shi}, Shuming Shi},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {On the Word Alignment from Neural Machine Translation}, title = {On the Word Alignment from Neural Machine Translation},
publisher = {Proceedings of the 57th Conference of the Association for Computational publisher = {Proceedings of the 57th Conference of the Association for Computational
Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019, Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
...@@ -4787,11 +4118,6 @@ pages ={157-166}, ...@@ -4787,11 +4118,6 @@ pages ={157-166},
pages = {1293--1303}, pages = {1293--1303},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2019}, year = {2019},
//url = {https://doi.org/10.18653/v1/p19-1124},
//doi = {10.18653/v1/p19-1124},
//timestamp = {Tue, 28 Jan 2020 10:27:51 +0100},
//biburl = {https://dblp.org/rec/conf/acl/LiLLMS19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Werlen2018DocumentLevelNM, @inproceedings{Werlen2018DocumentLevelNM,
...@@ -4799,10 +4125,6 @@ pages ={157-166}, ...@@ -4799,10 +4125,6 @@ pages ={157-166},
Dhananjay Ram and Dhananjay Ram and
Nikolaos Pappas and Nikolaos Pappas and
James Henderson}, James Henderson},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Document-Level Neural Machine Translation with Hierarchical Attention title = {Document-Level Neural Machine Translation with Hierarchical Attention
Networks}, Networks},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
...@@ -4810,19 +4132,12 @@ pages ={157-166}, ...@@ -4810,19 +4132,12 @@ pages ={157-166},
pages = {2947--2954}, pages = {2947--2954},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2018}, year = {2018},
//url = {https://doi.org/10.18653/v1/d18-1325},
//doi = {10.18653/v1/d18-1325},
//timestamp = {Fri, 27 Mar 2020 08:46:30 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/WerlenRPH18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/abs-1805-10163, @inproceedings{DBLP:journals/corr/abs-1805-10163,
author = {Elena Voita and author = {Elena Voita and
Pavel Serdyukov and Pavel Serdyukov and
Rico Sennrich and Rico Sennrich and
Ivan Titov}, Ivan Titov},
//editor = {Iryna Gurevych and
Yusuke Miyao},
title = {Context-Aware Neural Machine Translation Learns Anaphora Resolution}, title = {Context-Aware Neural Machine Translation Learns Anaphora Resolution},
publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
...@@ -4830,11 +4145,6 @@ pages ={157-166}, ...@@ -4830,11 +4145,6 @@ pages ={157-166},
pages = {1264--1274}, pages = {1264--1274},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2018}, year = {2018},
//url = {https://www.aclweb.org/anthology/P18-1117/},
//doi = {10.18653/v1/P18-1117},
//timestamp = {Mon, 16 Sep 2019 13:46:41 +0200},
//biburl = {https://dblp.org/rec/conf/acl/TitovSSV18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{DBLP:journals/corr/abs-1906-00532, @article{DBLP:journals/corr/abs-1906-00532,
author = {Aishwarya Bhandare and author = {Aishwarya Bhandare and
...@@ -4849,12 +4159,6 @@ pages ={157-166}, ...@@ -4849,12 +4159,6 @@ pages ={157-166},
journal = {CoRR}, journal = {CoRR},
volume = {abs/1906.00532}, volume = {abs/1906.00532},
year = {2019}, year = {2019},
//url = {http://arxiv.org/abs/1906.00532},
//archivePrefix = {arXiv},
//eprint = {1906.00532},
//timestamp = {Thu, 13 Jun 2019 13:36:00 +0200},
//biburl = {https://dblp.org/rec/journals/corr/abs-1906-00532.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Zhang2018SpeedingUN, @inproceedings{Zhang2018SpeedingUN,
...@@ -4863,46 +4167,29 @@ pages ={157-166}, ...@@ -4863,46 +4167,29 @@ pages ={157-166},
Yang Feng and Yang Feng and
Lei Shen and Lei Shen and
Qun Liu}, Qun Liu},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Speeding Up Neural Machine Translation Decoding by Cube Pruning}, title = {Speeding Up Neural Machine Translation Decoding by Cube Pruning},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
Language Processing, Brussels, Belgium, October 31 - November 4, 2018}, Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
pages = {4284--4294}, pages = {4284--4294},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2018}, year = {2018},
//url = {https://www.aclweb.org/anthology/D18-1460/},
//timestamp = {Fri, 29 Nov 2019 14:00:46 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/Zhang0FSL18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/SeeLM16, @inproceedings{DBLP:journals/corr/SeeLM16,
author = {Abigail See and author = {Abigail See and
Minh-Thang Luong and Minh-Thang Luong and
Christopher D. Manning}, Christopher D. Manning},
//editor = {Yoav Goldberg and
Stefan Riezler},
title = {Compression of Neural Machine Translation Models via Pruning}, title = {Compression of Neural Machine Translation Models via Pruning},
publisher = {Proceedings of the 20th {SIGNLL} Conference on Computational Natural publisher = {Proceedings of the 20th {SIGNLL} Conference on Computational Natural
Language Learning, CoNLL 2016, Berlin, Germany, August 11-12, 2016}, Language Learning, CoNLL 2016, Berlin, Germany, August 11-12, 2016},
pages = {291--301}, pages = {291--301},
//publisher = {{ACL}}, //publisher = {{ACL}},
year = {2016}, year = {2016},
//url = {https://doi.org/10.18653/v1/k16-1029},
//doi = {10.18653/v1/k16-1029},
//timestamp = {Tue, 28 Jan 2020 10:29:27 +0100},
//biburl = {https://dblp.org/rec/conf/conll/SeeLM16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/ChenLCL17, @inproceedings{DBLP:journals/corr/ChenLCL17,
author = {Yun Chen and author = {Yun Chen and
Yang Liu and Yang Liu and
Yong Cheng and Yong Cheng and
Victor O. K. Li}, Victor O. K. Li},
//editor = {Regina Barzilay and
Min-Yen Kan},
title = {A Teacher-Student Framework for Zero-Resource Neural Machine Translation}, title = {A Teacher-Student Framework for Zero-Resource Neural Machine Translation},
publisher = {Proceedings of the 55th Annual Meeting of the Association for Computational publisher = {Proceedings of the 55th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume
...@@ -4910,11 +4197,6 @@ pages ={157-166}, ...@@ -4910,11 +4197,6 @@ pages ={157-166},
pages = {1925--1935}, pages = {1925--1935},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2017}, year = {2017},
//url = {https://doi.org/10.18653/v1/P17-1176},
//doi = {10.18653/v1/P17-1176},
//timestamp = {Tue, 20 Aug 2019 11:59:05 +0200},
//biburl = {https://dblp.org/rec/conf/acl/ChenLCL17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{Hinton2015Distilling, @article{Hinton2015Distilling,
author = {Geoffrey E. Hinton and author = {Geoffrey E. Hinton and
...@@ -4924,12 +4206,6 @@ pages ={157-166}, ...@@ -4924,12 +4206,6 @@ pages ={157-166},
journal = {CoRR}, journal = {CoRR},
volume = {abs/1503.02531}, volume = {abs/1503.02531},
year = {2015}, year = {2015},
//url = {http://arxiv.org/abs/1503.02531},
//archivePrefix = {arXiv},
//eprint = {1503.02531},
//timestamp = {Mon, 13 Aug 2018 16:48:36 +0200},
//biburl = {https://dblp.org/rec/journals/corr/HintonVD15.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Ott2018ScalingNM, @inproceedings{Ott2018ScalingNM,
...@@ -4953,8 +4229,6 @@ pages ={157-166}, ...@@ -4953,8 +4229,6 @@ pages ={157-166},
year = "2016", year = "2016",
//address = "Austin, Texas", //address = "Austin, Texas",
//publisher = "Association for Computational Linguistics", //publisher = "Association for Computational Linguistics",
//url = "https://www.aclweb.org/anthology/D16-1139",
//doi = "10.18653/v1/D16-1139",
pages = "1317--1327", pages = "1317--1327",
} }
...@@ -4982,18 +4256,11 @@ pages ={157-166}, ...@@ -4982,18 +4256,11 @@ pages ={157-166},
Toulon, France, April 24-26, 2017, Conference Track Proceedings}, Toulon, France, April 24-26, 2017, Conference Track Proceedings},
//publisher = {OpenReview.net}, //publisher = {OpenReview.net},
year = {2017}, year = {2017},
//url = {https://openreview.net/forum?id=BJC\_jUqxe},
//timestamp = {Thu, 25 Jul 2019 14:25:44 +0200},
//biburl = {https://dblp.org/rec/conf/iclr/LinFSYXZB17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{Shaw2018SelfAttentionWR, @inproceedings{Shaw2018SelfAttentionWR,
author = {Peter Shaw and author = {Peter Shaw and
Jakob Uszkoreit and Jakob Uszkoreit and
Ashish Vaswani}, Ashish Vaswani},
//editor = {Marilyn A. Walker and
Heng Ji and
Amanda Stent},
title = {Self-Attention with Relative Position Representations}, title = {Self-Attention with Relative Position Representations},
publisher = {Proceedings of the 2018 Conference of the North American Chapter of publisher = {Proceedings of the 2018 Conference of the North American Chapter of
the Association for Computational Linguistics: Human Language Technologies, the Association for Computational Linguistics: Human Language Technologies,
...@@ -5002,11 +4269,6 @@ pages ={157-166}, ...@@ -5002,11 +4269,6 @@ pages ={157-166},
pages = {464--468}, pages = {464--468},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2018}, year = {2018},
//url = {https://doi.org/10.18653/v1/n18-2074},
//doi = {10.18653/v1/n18-2074},
//timestamp = {Tue, 28 Jan 2020 10:30:17 +0100},
//biburl = {https://dblp.org/rec/conf/naacl/ShawUV18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/HeZRS15, @inproceedings{DBLP:journals/corr/HeZRS15,
author = {Kaiming He and author = {Kaiming He and
...@@ -5019,26 +4281,6 @@ pages ={157-166}, ...@@ -5019,26 +4281,6 @@ pages ={157-166},
pages = {770--778}, pages = {770--778},
//publisher = {{IEEE} Computer Society}, //publisher = {{IEEE} Computer Society},
year = {2016}, year = {2016},
//url = {https://doi.org/10.1109/CVPR.2016.90},
//doi = {10.1109/CVPR.2016.90},
//timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
//biburl = {https://dblp.org/rec/conf/cvpr/HeZRS16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{Ba2016LayerN,
author = {Lei Jimmy Ba and
Jamie Ryan Kiros and
Geoffrey E. Hinton},
title = {Layer Normalization},
journal = {CoRR},
volume = {abs/1607.06450},
year = {2016},
//url = {http://arxiv.org/abs/1607.06450},
//archivePrefix = {arXiv},
//eprint = {1607.06450},
//timestamp = {Tue, 23 Jul 2019 17:33:23 +0200},
//biburl = {https://dblp.org/rec/journals/corr/BaKH16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{JMLR:v15:srivastava14a, @article{JMLR:v15:srivastava14a,
author = {Nitish Srivastava and Geoffrey Hinton and Alex Krizhevsky and Ilya Sutskever and Ruslan Salakhutdinov}, author = {Nitish Srivastava and Geoffrey Hinton and Alex Krizhevsky and Ilya Sutskever and Ruslan Salakhutdinov},
...@@ -5047,7 +4289,6 @@ pages ={157-166}, ...@@ -5047,7 +4289,6 @@ pages ={157-166},
year = {2014}, year = {2014},
volume = {15}, volume = {15},
pages = {1929-1958}, pages = {1929-1958},
//url = {http://jmlr.org/papers/v15/srivastava14a.html}
} }
@inproceedings{Szegedy_2016_CVPR, @inproceedings{Szegedy_2016_CVPR,
author = {Christian Szegedy and author = {Christian Szegedy and
...@@ -5061,18 +4302,11 @@ pages ={157-166}, ...@@ -5061,18 +4302,11 @@ pages ={157-166},
pages = {2818--2826}, pages = {2818--2826},
//publisher = {{IEEE} Computer Society}, //publisher = {{IEEE} Computer Society},
year = {2016}, year = {2016},
//url = {https://doi.org/10.1109/CVPR.2016.308},
//doi = {10.1109/CVPR.2016.308},
//timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
//biburl = {https://dblp.org/rec/conf/cvpr/SzegedyVISW16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@inproceedings{DBLP:journals/corr/abs-1805-00631, @inproceedings{DBLP:journals/corr/abs-1805-00631,
author = {Biao Zhang and author = {Biao Zhang and
Deyi Xiong and Deyi Xiong and
Jinsong Su}, Jinsong Su},
//editor = {Iryna Gurevych and
Yusuke Miyao},
title = {Accelerating Neural Transformer via an Average Attention Network}, title = {Accelerating Neural Transformer via an Average Attention Network},
publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
...@@ -5080,11 +4314,6 @@ pages ={157-166}, ...@@ -5080,11 +4314,6 @@ pages ={157-166},
pages = {1789--1798}, pages = {1789--1798},
//publisher = {Association for Computational Linguistics}, //publisher = {Association for Computational Linguistics},
year = {2018}, year = {2018},
//url = {https://www.aclweb.org/anthology/P18-1166/},
//doi = {10.18653/v1/P18-1166},
//timestamp = {Mon, 16 Sep 2019 13:46:41 +0200},
//biburl = {https://dblp.org/rec/conf/acl/XiongZS18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
@article{DBLP:journals/corr/CourbariauxB16, @article{DBLP:journals/corr/CourbariauxB16,
author = {Matthieu Courbariaux and author = {Matthieu Courbariaux and
...@@ -5094,12 +4323,6 @@ pages ={157-166}, ...@@ -5094,12 +4323,6 @@ pages ={157-166},
journal = {CoRR}, journal = {CoRR},
volume = {abs/1602.02830}, volume = {abs/1602.02830},
year = {2016}, year = {2016},
//url = {http://arxiv.org/abs/1602.02830},
//archivePrefix = {arXiv},
//eprint = {1602.02830},
//timestamp = {Mon, 13 Aug 2018 16:46:57 +0200},
//biburl = {https://dblp.org/rec/journals/corr/CourbariauxB16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
} }
%%%%% chapter 12------------------------------------------------------ %%%%% chapter 12------------------------------------------------------
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论