Commit 51cd432f by 曹润柘

更新 bibliography.bib

parent 99300e4f
......@@ -186,7 +186,6 @@
Keith Stevens and
George Kurian and
Nishant Patil and
Wei Wang and
Cliff Young and
Jason Smith and
Jason Riesa and
......@@ -221,7 +220,6 @@
Yann N. Dauphin},
title = {Convolutional Sequence to Sequence Learning},
publisher = {International Conference on Machine Learning},
//series = {Proceedings of Machine Learning Research},
volume = {70},
pages = {1243--1252},
year = {2017}
......@@ -270,10 +268,8 @@
@book{Goodfellow-et-al-2016,
  author    = {Goodfellow, Ian J. and
               Bengio, Yoshua and
               Courville, Aaron C.},
  title     = {Deep Learning},
  //series  = {Adaptive computation and machine learning},
  publisher = {{MIT} Press},
  year      = {2016}
}
......@@ -386,7 +382,6 @@
publisher={International Conference on Acoustics, Speech, and Signal Processing},
pages={825--828},
year={1991},
//organization={IEEE Computer Society}
}
@inproceedings{stolcke2002srilm,
......@@ -425,7 +420,6 @@
title = {Speech and language processing: an introduction to natural language
processing, computational linguistics, and speech recognition, 2nd
Edition},
//series = {Prentice Hall series in artificial intelligence},
publisher = {Prentice Hall, Pearson Education International},
year = {2009}
}
......@@ -743,7 +737,6 @@
@inproceedings{Koehn2007Moses,
author = {Philipp Koehn and
Hieu Hoang and
Alexandra Birch and
Chris Callison-Burch and
Marcello Federico and
Nicola Bertoldi and
......@@ -824,7 +817,6 @@
Kevin Knight and
Daniel Marcu and
Steve DeNeefe and
Wei Wang and
Ignacio Thayer},
title = {Scalable Inference and Training of Context-Rich Syntactic Translation
Models},
......@@ -847,28 +839,25 @@
%%%%% chapter 3------------------------------------------------------
% Ng and Jordan, discriminative vs. generative classifiers.
% The entry carried two interleaved copies of author/title/pages/year; the
% first value of each repeated field is kept (classic BibTeX ignores the extras).
% NOTE(review): the dropped copy gave year 2002 -- confirm which year is wanted.
@inproceedings{ng2002discriminative,
  author    = {Ng, Andrew Y. and
               Jordan, Michael I.},
  title     = {On Discriminative vs. Generative Classifiers: {A} comparison of logistic
               regression and naive {Bayes}},
  pages     = {841--848},
  publisher = {{MIT} Press},
  year      = {2001},
}
% Liang Huang's Coling 2008 tutorial notes.
% The original span opened a second entry header inside an unfinished entry and
% listed publisher twice; it is separated into two well-formed entries here.
% NOTE(review): both keys describe the same work and are kept so that either
% citation key keeps resolving -- consolidate on one key once citing chapters are checked.
@inproceedings{huang2008coling,
  author    = {Huang, Liang},
  title     = {Coling 2008: Advanced Dynamic Programming in Computational Linguistics: Theory, Algorithms and Applications-Tutorial notes},
  year      = {2008},
  publisher = {International Conference on Computational Linguistics},
}
@proceedings{huang2008advanced,
  title     = {Coling 2008: Advanced Dynamic Programming in Computational Linguistics: Theory, Algorithms and Applications - Tutorial notes},
  year      = {2008},
  address   = {Manchester, UK},
  publisher = {Coling 2008 Organizing Committee},
}
% Aho and Ullman, parsing/translation/compiling.
% Duplicate author/title/publisher fields are collapsed to one each. The city is
% moved out of the publisher string into address, and the "2: Compiling" suffix of
% the second title copy is recorded as the volume number.
% NOTE(review): volume 2 is inferred from that title suffix and the 1973 year -- confirm.
@book{aho1972theory,
  author    = {Aho, Alfred V. and
               Ullman, Jeffrey D.},
  title     = {The theory of parsing, translation, and compiling},
  volume    = {2},
  publisher = {Prentice-Hall},
  address   = {Englewood Cliffs, NJ},
  year      = {1973},
}
......@@ -877,7 +866,6 @@
author={Rau, Lisa F},
pages={29--30},
year={1991},
publisher={IEEE Conference on Artificial Intelligence Application},
}
@article{张小衡1997中文机构名称的识别与分析,
......@@ -890,16 +878,11 @@
year={1997},
}
% Lample et al., neural architectures for NER.
% The span held a conference revision and an arXiv revision under the same key,
% with the second header nested inside the first entry. The conference data is
% kept; the arXiv identifier is retained in disabled fields (this file's
% double-slash convention) instead of being stored as a journal name.
@inproceedings{lample2016neural,
  author    = {Lample, Guillaume and
               Ballesteros, Miguel and
               Subramanian, Sandeep and
               Kawakami, Kazuya and
               Dyer, Chris},
  title     = {Neural Architectures for Named Entity Recognition},
  pages     = {260--270},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2016},
  //archivePrefix = {arXiv},
  //eprint  = {1603.01360},
}
@article{Baum1966Statistical,
......@@ -920,6 +903,7 @@
number={1},
pages={164--171},
year={1970},
publisher={JSTOR}
}
@article{1977Maximum,
......@@ -933,13 +917,19 @@
% Viterbi's decoding-algorithm paper. One journal field (full name) is kept and
% the page range uses the double hyphen.
@article{1967Error,
  author  = {Viterbi, Andrew J.},
  title   = {Error bounds for convolutional codes and an asymptotically optimum decoding algorithm},
  journal = {IEEE Transactions on Information Theory},
  volume  = {13},
  number  = {2},
  pages   = {260--269},
  year    = {1967},
}
% Lafferty et al., conditional random fields (ICML 2001).
% The original was typed as an article but had no journal; pages and venue are
% filled in from the conference record of the same paper found elsewhere in this file.
% NOTE(review): this key is defined a second time further down in this file;
% classic BibTeX reports a repeated entry -- keep only one definition.
@inproceedings{lafferty2001conditional,
  author    = {Lafferty, John and
               McCallum, Andrew and
               Pereira, Fernando C. N.},
  title     = {Conditional random fields: Probabilistic models for segmenting and labeling sequence data},
  pages     = {282--289},
  publisher = {Proceedings of the Eighteenth International Conference on Machine Learning},
  year      = {2001}
}
@article{harrington2013机器学习实战,
title={机器学习实战},
author={Harrington, Peter},
......@@ -952,36 +942,41 @@
author = {Brants, Thorsten},
month = apr,
year = {2000},
address = {Seattle, Washington, USA},
publisher = {Association for Computational Linguistics},
doi = {10.3115/974147.974178},
pages = {224--231},
}
% Tsuruoka and Tsujii, chunk parsing. Repeated author and publisher fields are
% collapsed; the first publisher value is kept because it follows this file's
% venue-in-publisher convention.
% NOTE(review): the dropped publisher value was "Association for Computational
% Linguistics"; verify the venue string and address against the paper.
@inproceedings{tsuruoka-tsujii-2005-chunk,
  author    = {Tsuruoka, Yoshimasa and
               Tsujii, Jun'ichi},
  title     = {Chunk Parsing Revisited},
  month     = oct,
  year      = {2005},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  address   = {Vancouver, British Columbia},
  pages     = {133--140},
}
% Li et al., Chinese keyword indexing. One title (with the language name
% brace-protected as a whole word) and one publisher are kept; the first
% publisher value follows this file's venue-in-publisher convention.
@inproceedings{li-etal-2003-news-oriented,
  author    = {Li, Sujian and
               Wang, Houfeng and
               Yu, Shiwen and
               Xin, Chengsheng},
  title     = {News-Oriented Automatic {Chinese} Keyword Indexing},
  month     = jul,
  year      = {2003},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  address   = {Sapporo, Japan},
  doi       = {10.3115/1119250.1119263},
  pages     = {92--97},
}
% Huang, Xu and Yu, BiLSTM-CRF tagging. The garbled second journal value
% ("Computer ence") is dropped and the model acronym is protected from recasing.
@article{2015Bidirectional,
  author  = {Huang, Zhiheng and
             Xu, Wei and
             Yu, Kai},
  title   = {Bidirectional {LSTM-CRF} Models for Sequence Tagging},
  journal = {CoRR},
  year    = {2015},
}
......@@ -996,13 +991,10 @@
}
% Zukov-Gregoric et al., parallel RNNs for NER. Duplicate fields are collapsed.
% The comma-form author list is used because the "First Last" copy made
% "Zukov" part of the given name instead of the compound surname.
@inproceedings{vzukov2018named,
  author    = {{\v{Z}}ukov-Gregori{\v{c}}, Andrej and
               Bachrach, Yoram and
               Coope, Sam},
  title     = {Named Entity Recognition With Parallel Recurrent Neural Networks},
  pages     = {69--74},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2018},
}
@article{Li2020A,
......@@ -1015,196 +1007,29 @@
year={2020},
}
% BERT (two keys) and XLM-R.
% The original span stacked two entry headers, stored a conference name in the
% journal field, left the BERT arXiv id and a second year inside the Conneau
% entry, and defined the Conneau key twice. It is untangled into three entries.
% arXiv records use this file's CoRR + abs/<id> convention or disabled
% double-slash fields.
% NOTE(review): devlin2019bert and devlin2018bert are the same work; both keys
% are kept so existing citations resolve -- consolidate once callers are checked.
@inproceedings{devlin2019bert,
  author    = {Devlin, Jacob and
               Chang, Ming-Wei and
               Lee, Kenton and
               Toutanova, Kristina},
  title     = {{BERT}: Pre-training of deep bidirectional transformers for language understanding},
  pages     = {4171--4186},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2019},
}
@article{devlin2018bert,
  author  = {Devlin, Jacob and
             Chang, Ming-Wei and
             Lee, Kenton and
             Toutanova, Kristina},
  title   = {{BERT}: Pre-training of deep bidirectional transformers for language understanding},
  journal = {CoRR},
  volume  = {abs/1810.04805},
  year    = {2018},
}
@inproceedings{conneau2019unsupervised,
  author    = {Conneau, Alexis and
               Khandelwal, Kartikay and
               Goyal, Naman and
               Chaudhary, Vishrav and
               Wenzek, Guillaume and
               Guzm{\'{a}}n, Francisco and
               Grave, Edouard and
               Ott, Myle and
               Zettlemoyer, Luke and
               Stoyanov, Veselin},
  title     = {Unsupervised Cross-lingual Representation Learning at Scale},
  pages     = {8440--8451},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2020},
  //archivePrefix = {arXiv},
  //eprint  = {1911.02116},
}
% Chomsky, Lectures on Government and Binding. The place name in the subtitle is
% brace-protected so sentence-casing styles do not lowercase it.
@book{chomsky1993lectures,
  author    = {Chomsky, Noam},
  title     = {Lectures on government and binding: The {Pisa} lectures},
  number    = {9},
  publisher = {Walter de Gruyter},
  year      = {1993},
}
@inproceedings{DBLP:conf/acl/SennrichHB16a,
  author    = {Sennrich, Rico and
               Haddow, Barry and
               Birch, Alexandra},
  title     = {Neural Machine Translation of Rare Words with Subword Units},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2016},
}
% Page range now uses the double hyphen expected by BibTeX styles.
@article{刘挺1998最大概率分词问题及其解法,
  author  = {刘挺 and 吴岩 and 王开铸},
  title   = {最大概率分词问题及其解法},
  journal = {哈尔滨工业大学学报},
  number  = {06},
  pages   = {37--41},
  year    = {1998},
}
@article{丁洁2010基于最大概率分词算法的中文分词方法研究,
  author  = {丁洁},
  title   = {基于最大概率分词算法的中文分词方法研究},
  journal = {科技信息},
  number  = {21},
  pages   = {I0075--I0075},
  year    = {2010}
}
% Sheffield's LaSIE-II system description for MUC-7.
% Typed as a conference paper to match the other MUC-7 system descriptions in
% this file; system and evaluation names are brace-protected.
% NOTE(review): year changed from 1995 to 1998 to agree with the sibling MUC-7
% entries in this file -- confirm against the proceedings. The citation key is
% left untouched so existing citations keep working.
@inproceedings{1995University,
  author    = {Humphreys, Kevin and
               Gaizauskas, Robert J. and
               Azzam, Saliha and
               Huyck, Charles and
               Mitchell, Brian and
               Cunningham, Hamish and
               Wilks, Yorick},
  title     = {University of {Sheffield}: Description of the {LaSIE-II} system as used for {MUC-7}},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {1998},
}
% IsoQuest NetOwl system description for MUC-7. Company, product and evaluation
% names are brace-protected against recasing; the raw trademark glyph is
% replaced by the LaTeX text symbol so the entry stays ASCII.
@inproceedings{krupka1998isoquest,
  author    = {Krupka, George and
               Hausman, Kevin},
  title     = {{IsoQuest} Inc.: Description of the {NetOwl\texttrademark} Extractor System as Used for {MUC-7}},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {1998}
}
@inproceedings{DBLP:conf/muc/BlackRM98,
  author    = {Black, William J. and
               Rinaldi, Fabio and
               Mowatt, David},
  title     = {{FACILE:} Description of the {NE} System Used for {MUC-7}},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {1998},
}
% Eddy, hidden Markov models review. The abbreviated range 361-5 is written out
% with a double hyphen, the title's trailing period is removed (styles add their
% own punctuation) and the proper noun is protected.
@article{1996Hidden,
  author  = {Eddy, Sean R.},
  title   = {Hidden {Markov} models},
  journal = {Current Opinion in Structural Biology},
  volume  = {6},
  number  = {3},
  pages   = {361--365},
  year    = {1996},
}
% Lafferty et al., conditional random fields (ICML 2001). Only the venue string
% changes: it now starts with a capital letter like the other venue names here.
@inproceedings{lafferty2001conditional,
  author    = {Lafferty, John D. and
               McCallum, Andrew and
               Pereira, Fernando C. N.},
  title     = {Conditional Random Fields: Probabilistic Models for Segmenting and
               Labeling Sequence Data},
  pages     = {282--289},
  publisher = {Proceedings of the Eighteenth International Conference on Machine
               Learning},
  year      = {2001},
}
@book{kapur1989maximum,
  author    = {Kapur, Jagat Narain},
  title     = {Maximum-entropy models in science and engineering},
  publisher = {John Wiley \& Sons},
  year      = {1989}
}
% Hearst et al., support vector machines. Double-hyphen page range, periods
% after initials, and the umlaut in the last author's surname written as a
% BibTeX special character.
@article{1998Support,
  author  = {Hearst, Marti A. and
             Dumais, Susan T. and
             Osuna, Edgar and
             Platt, John and
             Sch{\"o}lkopf, Bernhard},
  title   = {Support vector machines},
  journal = {IEEE Intelligent Systems \& Their Applications},
  volume  = {13},
  number  = {4},
  pages   = {18--28},
  year    = {1998},
}
% Collobert et al., NLP (almost) from scratch. Double-hyphen page range; the
% accented given name uses the same LaTeX escape form as other entries in this file.
@article{2011Natural,
  author  = {Collobert, Ronan and
             Weston, Jason and
             Bottou, L{\'{e}}on and
             Karlen, Michael and
             Kavukcuoglu, Koray and
             Kuksa, Pavel},
  title   = {Natural Language Processing (almost) from Scratch},
  journal = {Journal of Machine Learning Research},
  volume  = {12},
  number  = {1},
  pages   = {2493--2537},
  year    = {2011},
}
% Manning, Schuetze and Raghavan, IR textbook. Publisher names are printed
% verbatim by styles, so the press name is capitalised here.
@book{manning2008introduction,
  author    = {Manning, Christopher D. and
               Sch{\"u}tze, Hinrich and
               Raghavan, Prabhakar},
  title     = {Introduction to information retrieval},
  publisher = {Cambridge University Press},
  year      = {2008}
}
% Berger et al., maximum entropy approach. Journal name spelled the same way as
% in the other Computational Linguistics entries of this file.
@article{berger1996maximum,
  author  = {Berger, Adam and
             Della Pietra, Stephen A. and
             Della Pietra, Vincent J.},
  title   = {A maximum entropy approach to natural language processing},
  journal = {Computational Linguistics},
  volume  = {22},
  number  = {1},
  pages   = {39--71},
  year    = {1996}
}
% Mitchell's Machine Learning textbook. The original recorded the publisher in
% the journal field of an article entry and misspelled it ("McCraw"); it is now a
% book entry with a publisher field.
% NOTE(review): the year is left as found -- verify against the edition cited.
@book{mitchell1996m,
  author    = {Mitchell, Tom},
  title     = {Machine Learning},
  publisher = {McGraw Hill},
  year      = {1996}
}
@inproceedings{DBLP:conf/acl/OchN02,
  author    = {Och, Franz Josef and
               Ney, Hermann},
  title     = {Discriminative Training and Maximum Entropy Models for Statistical
               Machine Translation},
  pages     = {295--302},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2002},
}
% Mohri, Pereira and Riley, WFST speech recognition chapter. An incollection
% entry needs the title of the containing book, which was missing.
% NOTE(review): booktitle supplied from the published handbook -- confirm.
@incollection{mohri2008speech,
  author    = {Mohri, Mehryar and
               Pereira, Fernando and
               Riley, Michael},
  title     = {Speech recognition with weighted finite-state transducers},
  booktitle = {Springer Handbook of Speech Processing},
  pages     = {559--584},
  publisher = {Springer},
  year      = {2008}
}
@article{bellman1966dynamic,
  author    = {Bellman, Richard},
  title     = {Dynamic programming},
  journal   = {Science},
  volume    = {153},
  number    = {3731},
  pages     = {34--37},
  publisher = {American Association for the Advancement of Science},
  year      = {1966}
}
%%%%% chapter 3------------------------------------------------------
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
......@@ -1647,7 +1472,6 @@
@inproceedings{DBLP:conf/wmt/Callison-BurchF07,
author = {Chris Callison-Burch and
Cameron S. Fordyce and
Philipp Koehn and
Christof Monz and
Josh Schroeder},
title = {(Meta-) Evaluation of Machine Translation},
......@@ -1657,7 +1481,6 @@
}
@inproceedings{DBLP:conf/wmt/Callison-BurchK12,
author = {Chris Callison-Burch and
Philipp Koehn and
Christof Monz and
Matt Post and
Radu Soricut and
......@@ -1681,7 +1504,6 @@
Barry Haddow and
Matthias Huck and
Chris Hokamp and
Philipp Koehn and
Varvara Logacheva and
Christof Monz and
Matteo Negri and
......@@ -2056,16 +1878,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2013}
}
@article{DBLP:journals/coling/FraserM07,
  author  = {Fraser, Alexander M. and
             Marcu, Daniel},
  title   = {Measuring Word Alignment Quality for Statistical Machine Translation},
  journal = {Computational Linguistics},
  volume  = {33},
  number  = {3},
  pages   = {293--303},
  year    = {2007}
}
@inproceedings{DBLP:conf/acl/DeNeroK07,
author = {John DeNero and
Dan Klein},
......@@ -2252,17 +2064,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2005},
}
@inproceedings{2018Non,
  author    = {Gu, Jiatao and
               Bradbury, James and
               Xiong, Caiming and
               Li, Victor O. K. and
               Socher, Richard},
  title     = {Non-Autoregressive Neural Machine Translation},
  publisher = {OpenReview.net},
  year      = {2018}
}
%%%%% chapter 6------------------------------------------------------
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
......@@ -2297,15 +2098,6 @@
publisher = {AAAI Press},
year = {2000}
}
@inproceedings{dyer2013a,
  author    = {Dyer, Chris and
               Chahuneau, Victor and
               Smith, Noah A.},
  title     = {A Simple, Fast, and Effective Reparameterization of {IBM} Model 2},
  pages     = {644--648},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2013}
}
@inproceedings{taskar2005a,
author = {Benjamin Taskar and
Simon Lacoste-Julien and
......@@ -2366,13 +2158,7 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2014}
}
@inproceedings{och2003minimum,
  author    = {Och, Franz Josef},
  title     = {Minimum Error Rate Training in Statistical Machine Translation},
  pages     = {160--167},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2003}
}
@article{powell1964an,
author = {M. J. D. Powell},
title = {An efficient method for finding the minimum of a function of several
......@@ -2605,7 +2391,6 @@
}
@inproceedings{DBLP:conf/acl/CollinsKK05,
author = {Michael Collins and
Philipp Koehn and
Ivona Kucerova},
title = {Clause Restructuring for Statistical Machine Translation},
pages = {531--540},
......@@ -2721,16 +2506,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2003}
}
@inproceedings{chiang2008online,
  author    = {Chiang, David and
               Marton, Yuval and
               Resnik, Philip},
  title     = {Online Large-Margin Training of Syntactic and Structural Translation
               Features},
  pages     = {224--233},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2008}
}
@inproceedings{Blunsom2008A,
author = {Phil Blunsom and
Trevor Cohn and
......@@ -2811,15 +2586,6 @@
publisher={University of Southern California},
year={2006},
}
% Zens and Ney, beam search for phrase-based SMT. The venue previously named a
% computer-architecture symposium; the citation key identifies the paper as an
% IWSLT paper, so the venue is corrected to that workshop.
@inproceedings{DBLP:conf/iwslt/ZensN08,
  author    = {Zens, Richard and
               Ney, Hermann},
  title     = {Improvements in dynamic programming beam search for phrase-based statistical
               machine translation},
  pages     = {198--205},
  publisher = {International Workshop on Spoken Language Translation},
  year      = {2008}
}
@inproceedings{DBLP:conf/emnlp/SchwenkCF07,
author = {Holger Schwenk and
Marta R. Costa-juss{\`{a}} and
......@@ -2968,13 +2734,6 @@
pages = {1159--1187},
year = {2012}
}
@inproceedings{chiang2005a,
  author    = {Chiang, David},
  title     = {A Hierarchical Phrase-Based Model for Statistical Machine Translation},
  pages     = {263--270},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2005}
}
@article{chiang2007hierarchical,
title={Hierarchical Phrase-Based Translation},
author ={Chiang David},
......@@ -3031,20 +2790,6 @@
year ={2006},
publisher ={Computationally Hard Problems \& Joint Inference in Speech \& Language Processing}
}
@inproceedings{galley2006scalable,
  author    = {Galley, Michel and
               Graehl, Jonathan and
               Knight, Kevin and
               Marcu, Daniel and
               DeNeefe, Steve and
               Wang, Wei and
               Thayer, Ignacio},
  title     = {Scalable Inference and Training of Context-Rich Syntactic Translation
               Models},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2006}
}
@inproceedings{galley2004s,
title ={What’s in a translation rule?},
author ={Galley, Michel and Hopkins, Mark and Knight, Kevin and Marcu, Daniel},
......@@ -3089,7 +2834,6 @@
}
@inproceedings{marcu2006spmt,
author = {Daniel Marcu and
Wei Wang and
Abdessamad Echihabi and
Kevin Knight},
title = {{SPMT:} Statistical Machine Translation with Syntactified Target Language
......@@ -3216,15 +2960,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2011}
}
@inproceedings{zhang2006synchronous,
  author    = {Zhang, Hao and
               Huang, Liang and
               Gildea, Daniel and
               Knight, Kevin},
  title     = {Synchronous Binarization for Machine Translation},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2006}
}
@inproceedings{DBLP:conf/acl/AlshawiBX97,
author = {Hiyan Alshawi and
Adam L. Buchsbaum and
......@@ -3304,7 +3039,6 @@
@inproceedings{DBLP:conf/emnlp/DeNeefeKWM07,
author = {Steve DeNeefe and
Kevin Knight and
Wei Wang and
Daniel Marcu},
title = {What Can Syntax-Based {MT} Learn from Phrase-Based MT?},
pages = {755--763},
......@@ -3319,30 +3053,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2008}
}
@inproceedings{DBLP:conf/acl/LiuLL06,
  author    = {Liu, Yang and
               Liu, Qun and
               Lin, Shouxun},
  title     = {Tree-to-String Alignment Template for Statistical Machine Translation},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2006}
}
@inproceedings{zollmann2006syntax,
  author    = {Zollmann, Andreas and
               Venugopal, Ashish},
  title     = {Syntax Augmented Machine Translation via Chart Parsing},
  pages     = {138--141},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2006}
}
@inproceedings{DBLP:conf/acl/MartonR08,
  author    = {Marton, Yuval and
               Resnik, Philip},
  title     = {Soft Syntactic Constraints for Hierarchical Phrased-Based Translation},
  pages     = {1003--1011},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2008}
}
@INPROCEEDINGS{Nesson06inductionof,
author = {Rebecca Nesson and Stuart M. Shieber and Alexander Rush},
title = {Induction of probabilistic synchronous tree-insertion grammars for machine translation},
......@@ -3355,15 +3065,6 @@
year = {2007},
publisher = {Machine Translation Summit}
}
@inproceedings{DBLP:conf/acl/LiuLL09,
  author    = {Liu, Yang and
               L{\"{u}}, Yajuan and
               Liu, Qun},
  title     = {Improving Tree-to-Tree Translation with Packed Forests},
  pages     = {558--566},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2009}
}
@inproceedings{DBLP:conf/emnlp/WangKM07,
author = {Wei Wang and
Kevin Knight and
......@@ -3391,14 +3092,6 @@
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2008}
}
@inproceedings{DBLP:conf/acl/ZhuX11,
  author    = {Zhu, Jingbo and
               Xiao, Tong},
  title     = {Improving Decoding Generalization for Tree-to-String Translation},
  pages     = {418--423},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2011}
}
@inproceedings{DBLP:conf/emnlp/ZhangZZ11,
author = {Jiajun Zhang and
Feifei Zhai and
......@@ -3783,11 +3476,6 @@
number = {1},
pages = {145--151},
year = {1999},
//url = {https://doi.org/10.1016/S0893-6080(98)00116-6},
//doi = {10.1016/S0893-6080(98)00116-6},
//timestamp = {Wed, 14 Nov 2018 10:30:22 +0100},
//biburl = {https://dblp.org/rec/journals/nn/Qian99.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{duchi2011adaptive,
......@@ -3799,10 +3487,6 @@
volume = {12},
pages = {2121--2159},
year = {2011},
//url = {http://dl.acm.org/citation.cfm?id=2021068},
//timestamp = {Wed, 10 Jul 2019 15:28:02 +0200},
//biburl = {https://dblp.org/rec/journals/jmlr/DuchiHS11.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{tieleman2012rmsprop,
......@@ -3818,23 +3502,15 @@
@inproceedings{kingma2014adam,
  author    = {Kingma, Diederik P. and
               Ba, Jimmy},
  //editor  = {Yoshua Bengio and
               Yann LeCun},
  title     = {Adam: {A} Method for Stochastic Optimization},
  booktitle = {3rd International Conference on Learning Representations, {ICLR} 2015,
               San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year      = {2015},
  //url       = {http://arxiv.org/abs/1412.6980},
  //timestamp = {Thu, 25 Jul 2019 14:25:37 +0200},
  //biburl    = {https://dblp.org/rec/journals/corr/KingmaB14.bib},
  //bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{ioffe2015batch,
author = {Sergey Ioffe and
Christian Szegedy},
//editor = {Francis R. Bach and
David M. Blei},
title = {Batch Normalization: Accelerating Deep Network Training by Reducing
Internal Covariate Shift},
booktitle = {Proceedings of the 32nd International Conference on Machine Learning,
......@@ -3844,10 +3520,6 @@
pages = {448--456},
publisher = {JMLR.org},
year = {2015},
//url = {http://proceedings.mlr.press/v37/ioffe15.html},
//timestamp = {Wed, 29 May 2019 08:41:45 +0200},
//biburl = {https://dblp.org/rec/conf/icml/IoffeS15.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{Ba2016LayerN,
......@@ -3858,30 +3530,6 @@
journal = {CoRR},
volume = {abs/1607.06450},
year = {2016},
//url = {http://arxiv.org/abs/1607.06450},
//archivePrefix = {arXiv},
//eprint = {1607.06450},
//timestamp = {Tue, 23 Jul 2019 17:33:23 +0200},
//biburl = {https://dblp.org/rec/journals/corr/BaKH16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/HeZRS15,
  author    = {He, Kaiming and
               Zhang, Xiangyu and
               Ren, Shaoqing and
               Sun, Jian},
  title     = {Deep Residual Learning for Image Recognition},
  booktitle = {2016 {IEEE} Conference on Computer Vision and Pattern Recognition,
               {CVPR} 2016, Las Vegas, NV, USA, June 27-30, 2016},
  pages     = {770--778},
  publisher = {{IEEE} Computer Society},
  year      = {2016},
  //url       = {https://doi.org/10.1109/CVPR.2016.90},
  //doi       = {10.1109/CVPR.2016.90},
  //timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
  //biburl    = {https://dblp.org/rec/conf/cvpr/HeZRS16.bib},
  //bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{mikolov2013distributed,
......@@ -3890,20 +3538,12 @@
Kai Chen and
Gregory S. Corrado and
Jeffrey Dean},
//editor = {Christopher J. C. Burges and
L{\'{e}}on Bottou and
Zoubin Ghahramani and
Kilian Q. Weinberger},
title = {Distributed Representations of Words and Phrases and their Compositionality},
booktitle = {Advances in Neural Information Processing Systems 26: 27th Annual
Conference on Neural Information Processing Systems 2013. Proceedings
of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
pages = {3111--3119},
year = {2013},
//url = {http://papers.nips.cc/paper/5021-distributed-representations-of-words-and-phrases-and-their-compositionality},
//timestamp = {Fri, 06 Mar 2020 17:00:12 +0100},
//biburl = {https://dblp.org/rec/conf/nips/MikolovSCCD13.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{guidotti2018survey,
......@@ -3919,39 +3559,23 @@
number = {5},
pages = {93:1--93:42},
year = {2019},
//url = {https://doi.org/10.1145/3236009},
//doi = {10.1145/3236009},
//timestamp = {Thu, 09 May 2019 16:06:21 +0200},
//biburl = {https://dblp.org/rec/journals/csur/GuidottiMRTGP19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{koh2017understanding,
  author    = {Koh, Pang Wei and
               Liang, Percy},
  //editor  = {Doina Precup and
               Yee Whye Teh},
  title     = {Understanding Black-box Predictions via Influence Functions},
  booktitle = {Proceedings of the 34th International Conference on Machine Learning,
               {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series    = {Proceedings of Machine Learning Research},
  volume    = {70},
  pages     = {1885--1894},
  publisher = {{PMLR}},
  year      = {2017},
  //url       = {http://proceedings.mlr.press/v70/koh17a.html},
  //timestamp = {Wed, 29 May 2019 08:41:45 +0200},
  //biburl    = {https://dblp.org/rec/conf/icml/KohL17.bib},
  //bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{arthur2016incorporating,
author = {Philip Arthur and
Graham Neubig and
Satoshi Nakamura},
//editor = {Jian Su and
Xavier Carreras and
Kevin Duh},
title = {Incorporating Discrete Translation Lexicons into Neural Machine Translation},
booktitle = {Proceedings of the 2016 Conference on Empirical Methods in Natural
Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4,
......@@ -3959,28 +3583,6 @@
pages = {1557--1567},
publisher = {The Association for Computational Linguistics},
year = {2016},
//url = {https://doi.org/10.18653/v1/d16-1162},
//doi = {10.18653/v1/d16-1162},
//timestamp = {Tue, 28 Jan 2020 10:28:31 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/ArthurNN16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): this citation key is also defined earlier in this file with the
% venue recorded differently; classic BibTeX reports a repeated entry, so one
% of the two definitions should be dropped.
@inproceedings{zollmann2006syntax,
  author    = {Zollmann, Andreas and
               Venugopal, Ashish},
  //editor  = {Philipp Koehn and
               Christof Monz},
  title     = {Syntax Augmented Machine Translation via Chart Parsing},
  booktitle = {Proceedings on the Workshop on Statistical Machine Translation, WMT@HLT-NAACL
               2006, New York City, NY, USA, June 8-9, 2006},
  pages     = {138--141},
  publisher = {Association for Computational Linguistics},
  year      = {2006},
  //url       = {https://www.aclweb.org/anthology/W06-3119/},
  //timestamp = {Fri, 13 Sep 2019 13:08:46 +0200},
  //biburl    = {https://dblp.org/rec/conf/wmt/ZollmannV06.bib},
  //bibsource = {dblp computer science bibliography, https://dblp.org}
}
@INPROCEEDINGS{charniak2003syntax,
......@@ -4001,11 +3603,6 @@
2: Short Papers},
publisher = {The Association for Computer Linguistics},
year = {2016},
//url = {https://doi.org/10.18653/v1/p16-2049},
//doi = {10.18653/v1/p16-2049},
//timestamp = {Tue, 28 Jan 2020 10:27:31 +0100},
//biburl = {https://dblp.org/rec/conf/acl/StahlbergHWB16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{plank2013embedding,
......@@ -4019,21 +3616,12 @@
pages = {1498--1507},
publisher = {The Association for Computer Linguistics},
year = {2013},
//url = {https://www.aclweb.org/anthology/P13-1147/},
//timestamp = {Mon, 19 Aug 2019 18:10:05 +0200},
//biburl = {https://dblp.org/rec/conf/acl/PlankM13.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{perozzi2014deepwalk,
author = {Bryan Perozzi and
Rami Al-Rfou and
Steven Skiena},
//editor = {Sofus A. Macskassy and
Claudia Perlich and
Jure Leskovec and
Wei Wang and
Rayid Ghani},
title = {DeepWalk: online learning of social representations},
booktitle = {The 20th {ACM} {SIGKDD} International Conference on Knowledge Discovery
and Data Mining, {KDD} '14, New York, NY, {USA} - August 24 - 27,
......@@ -4041,17 +3629,11 @@
pages = {701--710},
publisher = {{ACM}},
year = {2014},
//url = {https://doi.org/10.1145/2623330.2623732},
//doi = {10.1145/2623330.2623732},
//timestamp = {Sun, 02 Jun 2019 21:11:52 +0200},
//biburl = {https://dblp.org/rec/conf/kdd/PerozziAS14.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{collobert2011natural,
author = {Ronan Collobert and
Jason Weston and
L{\'{e}}on Bottou and
Michael Karlen and
Koray Kavukcuoglu and
Pavel P. Kuksa},
......@@ -4060,10 +3642,6 @@
volume = {12},
pages = {2493--2537},
year = {2011},
//url = {http://dl.acm.org/citation.cfm?id=2078186},
//timestamp = {Wed, 10 Jul 2019 15:28:44 +0200},
//biburl = {https://dblp.org/rec/journals/jmlr/CollobertWBKKK11.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{mccann2017learned,
......@@ -4071,23 +3649,12 @@
James Bradbury and
Caiming Xiong and
Richard Socher},
//editor = {Isabelle Guyon and
Ulrike von Luxburg and
Samy Bengio and
Hanna M. Wallach and
Rob Fergus and
S. V. N. Vishwanathan and
Roman Garnett},
title = {Learned in Translation: Contextualized Word Vectors},
booktitle = {Advances in Neural Information Processing Systems 30: Annual Conference
on Neural Information Processing Systems 2017, 4-9 December 2017,
Long Beach, CA, {USA}},
pages = {6294--6305},
year = {2017},
//url = {http://papers.nips.cc/paper/7209-learned-in-translation-contextualized-word-vectors},
//timestamp = {Fri, 06 Mar 2020 16:57:53 +0100},
//biburl = {https://dblp.org/rec/conf/nips/McCannBXS17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
%%%%% chapter 9------------------------------------------------------
......@@ -4110,16 +3677,9 @@
pages = {1370--1380},
//publisher = {The Association for Computer Linguistics},
year = {2014},
//url = {https://doi.org/10.3115/v1/p14-1129},
//doi = {10.3115/v1/p14-1129},
//timestamp = {Tue, 28 Jan 2020 10:27:56 +0100},
//biburl = {https://dblp.org/rec/conf/acl/DevlinZHLSM14.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Schwenk_continuousspace,
author = {Holger Schwenk},
//editor = {Martin Kay and
Christian Boitet},
title = {Continuous Space Translation Models for Phrase-Based Statistical Machine
Translation},
publisher = {{COLING} 2012, 24th International Conference on Computational Linguistics,
......@@ -4128,10 +3688,6 @@
pages = {1071--1080},
//publisher = {Indian Institute of Technology Bombay},
year = {2012},
//url = {https://www.aclweb.org/anthology/C12-2104/},
//timestamp = {Wed, 18 Sep 2019 12:15:53 +0200},
//biburl = {https://dblp.org/rec/conf/coling/Schwenk12.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{kalchbrenner-blunsom-2013-recurrent,
author = {Nal Kalchbrenner and
......@@ -4144,10 +3700,6 @@
pages = {1700--1709},
//publisher = {{ACL}},
year = {2013},
//url = {https://www.aclweb.org/anthology/D13-1176/},
//timestamp = {Fri, 13 Sep 2019 13:08:45 +0200},
//biburl = {https://dblp.org/rec/conf/emnlp/KalchbrennerB13.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{HochreiterThe,
author = {Sepp Hochreiter},
......@@ -4159,11 +3711,6 @@
number = {2},
pages = {107--116},
year = {1998},
//url = {https://doi.org/10.1142/S0218488598000094},
//doi = {10.1142/S0218488598000094},
//timestamp = {Wed, 14 Nov 2018 10:41:42 +0100},
//biburl = {https://dblp.org/rec/journals/ijufks/Hochreiter98.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{BENGIO1994Learning,
author ={Y. {Bengio} and P. {Simard} and P. {Frasconi}},
......@@ -4183,23 +3730,12 @@ pages ={157-166},
Aidan N. Gomez and
Lukasz Kaiser and
Illia Polosukhin},
//editor = {Isabelle Guyon and
Ulrike von Luxburg and
Samy Bengio and
Hanna M. Wallach and
Rob Fergus and
S. V. N. Vishwanathan and
Roman Garnett},
title = {Attention is All you Need},
publisher = {Advances in Neural Information Processing Systems 30: Annual Conference
on Neural Information Processing Systems 2017, 4-9 December 2017,
Long Beach, CA, {USA}},
pages = {5998--6008},
year = {2017},
//url = {http://papers.nips.cc/paper/7181-attention-is-all-you-need},
//timestamp = {Fri, 06 Mar 2020 17:00:11 +0100},
//biburl = {https://dblp.org/rec/conf/nips/VaswaniSPUJGKP17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{StahlbergNeural,
author = {Felix Stahlberg},
......@@ -4207,21 +3743,12 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1912.02047},
year = {2019},
//url = {http://arxiv.org/abs/1912.02047},
//archivePrefix = {arXiv},
//eprint = {1912.02047},
//timestamp = {Thu, 02 Jan 2020 18:08:18 +0100},
//biburl = {https://dblp.org/rec/journals/corr/abs-1912-02047.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Bentivogli2016NeuralVP,
author = {Luisa Bentivogli and
Arianna Bisazza and
Mauro Cettolo and
Marcello Federico},
//editor = {Jian Su and
Xavier Carreras and
Kevin Duh},
title = {Neural versus Phrase-Based Machine Translation Quality: a Case Study},
publisher = {Proceedings of the 2016 Conference on Empirical Methods in Natural
Language Processing, {EMNLP} 2016, Austin, Texas, USA, November 1-4,
......@@ -4229,11 +3756,6 @@ pages ={157-166},
pages = {257--267},
//publisher = {The Association for Computational Linguistics},
year = {2016},
//url = {https://doi.org/10.18653/v1/d16-1025},
//doi = {10.18653/v1/d16-1025},
//timestamp = {Tue, 28 Jan 2020 10:28:39 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/BentivogliBCF16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{Hassan2018AchievingHP,
author = {Hany Hassan and
......@@ -4264,12 +3786,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1803.05567},
year = {2018},
//url = {http://arxiv.org/abs/1803.05567},
//archivePrefix = {arXiv},
//eprint = {1803.05567},
//timestamp = {Mon, 13 Aug 2018 16:47:23 +0200},
//biburl = {https://dblp.org/rec/journals/corr/abs-1803-05567.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{WangLearning,
author = {Qiang Wang and
......@@ -4279,9 +3795,6 @@ pages ={157-166},
Changliang Li and
Derek F. Wong and
Lidia S. Chao},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {Learning Deep Transformer Models for Machine Translation},
publisher = {Proceedings of the 57th Conference of the Association for Computational
Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
......@@ -4289,11 +3802,6 @@ pages ={157-166},
pages = {1810--1822},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {https://doi.org/10.18653/v1/p19-1176},
//doi = {10.18653/v1/p19-1176},
//timestamp = {Tue, 28 Jan 2020 10:27:53 +0100},
//biburl = {https://dblp.org/rec/conf/acl/WangLXZLWC19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{Li2020NeuralMT,
author = {Yanyang Li and
......@@ -4305,12 +3813,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/2002.06546},
year = {2020},
//url = {https://arxiv.org/abs/2002.06546},
//archivePrefix = {arXiv},
//eprint = {2002.06546},
//timestamp = {Mon, 02 Mar 2020 16:46:06 +0100},
//biburl = {https://dblp.org/rec/journals/corr/abs-2002-06546.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{HochreiterLong,
author = {Hochreiter, Sepp and Schmidhuber, Jürgen},
......@@ -4320,7 +3822,6 @@ pages ={157-166},
title = {Long Short-term Memory},
volume = {9},
journal = {Neural computation},
//doi = {10.1162/neco.1997.9.8.1735}
}
@inproceedings{Cho2014Learning,
author = {Kyunghyun Cho and
......@@ -4330,9 +3831,6 @@ pages ={157-166},
Fethi Bougares and
Holger Schwenk and
Yoshua Bengio},
//editor = {Alessandro Moschitti and
Bo Pang and
Walter Daelemans},
title = {Learning Phrase Representations using {RNN} Encoder-Decoder for Statistical
Machine Translation},
publisher = {Proceedings of the 2014 Conference on Empirical Methods in Natural
......@@ -4341,37 +3839,24 @@ pages ={157-166},
pages = {1724--1734},
//publisher = {{ACL}},
year = {2014},
//url = {https://doi.org/10.3115/v1/d14-1179},
//doi = {10.3115/v1/d14-1179},
//timestamp = {Tue, 28 Jan 2020 10:28:17 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/ChoMGBBSB14.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Glorot and Bengio, AISTATS 2010 (proceedings name is stored in "publisher").
% Fields whose names start with "//" are disabled metadata: no standard style
% knows such field names, so BibTeX reads them and then ignores them.
@inproceedings{pmlr-v9-glorot10a,
  author      = {Xavier Glorot and Yoshua Bengio},
  title       = {Understanding the difficulty of training deep feedforward neural networks},
  publisher   = {Proceedings of the Thirteenth International Conference on Artificial
                 Intelligence and Statistics, {AISTATS} 2010, Chia Laguna Resort, Sardinia,
                 Italy, May 13-15, 2010},
  volume      = {9},
  pages       = {249--256},
  year        = {2010},
  //editor    = {Yee Whye Teh and D. Mike Titterington},
  //series    = {{JMLR} Proceedings},
  //publisher = {JMLR.org},
  //url       = {http://proceedings.mlr.press/v9/glorot10a.html},
  //timestamp = {Wed, 29 May 2019 08:41:47 +0200},
  //biburl    = {https://dblp.org/rec/journals/jmlr/GlorotB10.bib},
  //bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{xiao2017fast,
author = {Tong Xiao and
Jingbo Zhu and
Tongran Liu and
Chunliang Zhang},
//editor = {Carles Sierra},
title = {Fast Parallel Training of Neural Language Models},
publisher = {Proceedings of the Twenty-Sixth International Joint Conference on
Artificial Intelligence, {IJCAI} 2017, Melbourne, Australia, August
......@@ -4379,11 +3864,6 @@ pages ={157-166},
pages = {4193--4199},
//publisher = {ijcai.org},
year = {2017},
//url = {https://doi.org/10.24963/ijcai.2017/586},
//doi = {10.24963/ijcai.2017/586},
//timestamp = {Tue, 20 Aug 2019 16:17:12 +0200},
//biburl = {https://dblp.org/rec/conf/ijcai/XiaoZLZ17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Gu2017NonAutoregressiveNM,
author = {Jiatao Gu and
......@@ -4392,14 +3872,8 @@ pages ={157-166},
Victor O. K. Li and
Richard Socher},
title = {Non-Autoregressive Neural Machine Translation},
publisher = {6th International Conference on Learning Representations, {ICLR} 2018,
Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
//publisher = {OpenReview.net},
publisher = {International Conference on Learning Representations},
year = {2018},
//url = {https://openreview.net/forum?id=B1l8BtlCb},
//timestamp = {Thu, 25 Jul 2019 14:25:57 +0200},
//biburl = {https://dblp.org/rec/conf/iclr/Gu0XLS18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{li-etal-2018-simple,
author = {Yanyang Li and
......@@ -4408,8 +3882,6 @@ pages ={157-166},
Qiang Wang and
Changming Xu and
Jingbo Zhu},
//editor = {Iryna Gurevych and
Yusuke Miyao},
title = {A Simple and Effective Approach to Coverage-Aware Neural Machine Translation},
publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
......@@ -4417,11 +3889,6 @@ pages ={157-166},
pages = {292--297},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {https://www.aclweb.org/anthology/P18-2047/},
//doi = {10.18653/v1/P18-2047},
//timestamp = {Mon, 16 Sep 2019 13:46:41 +0200},
//biburl = {https://dblp.org/rec/conf/acl/LiXLWXZ18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{TuModeling,
author = {Zhaopeng Tu and
......@@ -4435,17 +3902,11 @@ pages ={157-166},
1: Long Papers},
//publisher = {The Association for Computer Linguistics},
year = {2016},
//url = {https://doi.org/10.18653/v1/p16-1008},
//doi = {10.18653/v1/p16-1008},
//timestamp = {Tue, 28 Jan 2020 10:27:13 +0100},
//biburl = {https://dblp.org/rec/conf/acl/TuLLLL16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/SennrichFCBHHJL17,
author = {Rico Sennrich and
Orhan Firat and
Kyunghyun Cho and
Alexandra Birch and
Barry Haddow and
Julian Hitschler and
Marcin Junczys-Dowmunt and
......@@ -4453,8 +3914,6 @@ pages ={157-166},
Antonio Valerio Miceli Barone and
Jozef Mokry and
Maria Nadejde},
//editor = {Andre Martins and
Anselmo Pe{\~{n}}as},
title = {Nematus: a Toolkit for Neural Machine Translation},
publisher = {Proceedings of the 15th Conference of the European Chapter of the
Association for Computational Linguistics, {EACL} 2017, Valencia,
......@@ -4462,18 +3921,10 @@ pages ={157-166},
pages = {65--68},
//publisher = {Association for Computational Linguistics},
year = {2017},
//url = {https://doi.org/10.18653/v1/e17-3017},
//doi = {10.18653/v1/e17-3017},
//timestamp = {Tue, 28 Jan 2020 10:31:12 +0100},
//biburl = {https://dblp.org/rec/conf/eacl/SennrichFCBHHJL17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/abs-1905-13324,
author = {Biao Zhang and
Rico Sennrich},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {A Lightweight Recurrent Network for Sequence Modeling},
publisher = {Proceedings of the 57th Conference of the Association for Computational
Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
......@@ -4481,11 +3932,6 @@ pages ={157-166},
pages = {1538--1548},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {https://doi.org/10.18653/v1/p19-1149},
//doi = {10.18653/v1/p19-1149},
//timestamp = {Tue, 28 Jan 2020 10:28:03 +0100},
//biburl = {https://dblp.org/rec/conf/acl/ZhangS19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{Lei2017TrainingRA,
author = {Tao Lei and
......@@ -4495,12 +3941,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1709.02755},
year = {2017},
//url = {http://arxiv.org/abs/1709.02755},
//archivePrefix = {arXiv},
//eprint = {1709.02755},
//timestamp = {Mon, 13 Aug 2018 16:46:29 +0200},
//biburl = {https://dblp.org/rec/journals/corr/abs-1709-02755.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Zhang2018SimplifyingNM,
author = {Biao Zhang and
......@@ -4508,10 +3948,6 @@ pages ={157-166},
Jinsong Su and
Qian Lin and
Huiji Zhang},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Simplifying Neural Machine Translation with Addition-Subtraction Twin-Gated
Recurrent Networks},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
......@@ -4519,10 +3955,6 @@ pages ={157-166},
pages = {4273--4283},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {https://www.aclweb.org/anthology/D18-1459/},
//timestamp = {Fri, 13 Sep 2019 13:08:45 +0200},
//biburl = {https://dblp.org/rec/conf/emnlp/ZhangXSLZ18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Liu_2019_CVPR,
author = {Shikun Liu and
......@@ -4534,50 +3966,23 @@ pages ={157-166},
pages = {1871--1880},
//publisher = {Computer Vision Foundation / {IEEE}},
year = {2019},
//url = {http://openaccess.thecvf.com/content\_CVPR\_2019/html/Liu\_End-To-End\_Multi-Task\_Learning\_With\_Attention\_CVPR\_2019\_paper.html},
//doi = {10.1109/CVPR.2019.00197},
//timestamp = {Mon, 20 Jan 2020 15:36:04 +0100},
//biburl = {https://dblp.org/rec/conf/cvpr/LiuJD19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Vazquez et al., RepL4NLP workshop 2019 (proceedings name is stored in "publisher").
% Fields whose names start with "//" are disabled metadata: no standard style
% knows such field names, so BibTeX reads them and then ignores them.
@inproceedings{DBLP:journals/corr/abs-1811-00498,
  author      = {Ra{\'{u}}l V{\'{a}}zquez and Alessandro Raganato and
                 J{\"{o}}rg Tiedemann and Mathias Creutz},
  title       = {Multilingual {NMT} with a Language-Independent Attention Bridge},
  publisher   = {Proceedings of the 4th Workshop on Representation Learning for NLP,
                 RepL4NLP@ACL 2019, Florence, Italy, August 2, 2019},
  pages       = {33--39},
  year        = {2019},
  //editor    = {Isabelle Augenstein and Spandana Gella and Sebastian Ruder and
                 Katharina Kann and Burcu Can and Johannes Welbl and
                 Alexis Conneau and Xiang Ren and Marek Rei},
  //publisher = {Association for Computational Linguistics},
  //url       = {https://doi.org/10.18653/v1/w19-4305},
  //doi       = {10.18653/v1/w19-4305},
  //timestamp = {Fri, 27 Mar 2020 08:52:29 +0100},
  //biburl    = {https://dblp.org/rec/conf/rep4nlp/VazquezRTC19.bib},
  //bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{MoradiInterrogating,
author = {Pooya Moradi and
Nishant Kambhatla and
Anoop Sarkar},
//editor = {Alexandra Birch and
Andrew M. Finch and
Hiroaki Hayashi and
Ioannis Konstas and
Thang Luong and
Graham Neubig and
Yusuke Oda and
Katsuhito Sudoh},
title = {Interrogating the Explanatory Power of Attention in Neural Machine
Translation},
publisher = {Proceedings of the 3rd Workshop on Neural Generation and Translation@EMNLP-IJCNLP
......@@ -4585,11 +3990,6 @@ pages ={157-166},
pages = {221--230},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {https://doi.org/10.18653/v1/D19-5624},
//doi = {10.18653/v1/D19-5624},
//timestamp = {Tue, 24 Mar 2020 15:04:09 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/MoradiKS19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{WangNeural,
author = {Xing Wang and
......@@ -4598,18 +3998,12 @@ pages ={157-166},
Hang Li and
Deyi Xiong and
Min Zhang},
//editor = {Satinder P. Singh and
Shaul Markovitch},
title = {Neural Machine Translation Advised by Statistical Machine Translation},
publisher = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
February 4-9, 2017, San Francisco, California, {USA}},
pages = {3330--3336},
//publisher = {{AAAI} Press},
year = {2017},
//url = {http://aaai.org/ocs/index.php/AAAI/AAAI17/paper/view/14451},
//timestamp = {Tue, 15 Jan 2019 11:48:13 +0100},
//biburl = {https://dblp.org/rec/conf/aaai/WangLTLXZ17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/abs-1905-09418,
author = {Elena Voita and
......@@ -4617,9 +4011,6 @@ pages ={157-166},
Fedor Moiseev and
Rico Sennrich and
Ivan Titov},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {Analyzing Multi-Head Self-Attention: Specialized Heads Do the Heavy
Lifting, the Rest Can Be Pruned},
publisher = {Proceedings of the 57th Conference of the Association for Computational
......@@ -4628,11 +4019,6 @@ pages ={157-166},
pages = {5797--5808},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {https://doi.org/10.18653/v1/p19-1580},
//doi = {10.18653/v1/p19-1580},
//timestamp = {Tue, 28 Jan 2020 10:27:29 +0100},
//biburl = {https://dblp.org/rec/conf/acl/VoitaTMST19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Xiao2019SharingAW,
author = {Tong Xiao and
......@@ -4640,7 +4026,6 @@ pages ={157-166},
Jingbo Zhu and
Zhengtao Yu and
Tongran Liu},
//editor = {Sarit Kraus},
title = {Sharing Attention Weights for Fast Transformer},
publisher = {Proceedings of the Twenty-Eighth International Joint Conference on
Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16,
......@@ -4648,11 +4033,6 @@ pages ={157-166},
pages = {5292--5298},
//publisher = {ijcai.org},
year = {2019},
//url = {https://doi.org/10.24963/ijcai.2019/735},
//doi = {10.24963/ijcai.2019/735},
//timestamp = {Tue, 20 Aug 2019 16:18:18 +0200},
//biburl = {https://dblp.org/rec/conf/ijcai/XiaoLZ0L19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Yang2017TowardsBH,
author = {Baosong Yang and
......@@ -4660,9 +4040,6 @@ pages ={157-166},
Tong Xiao and
Lidia S. Chao and
Jingbo Zhu},
//editor = {Martha Palmer and
Rebecca Hwa and
Sebastian Riedel},
title = {Towards Bidirectional Hierarchical Representations for Attention-based
Neural Machine Translation},
publisher = {Proceedings of the 2017 Conference on Empirical Methods in Natural
......@@ -4671,20 +4048,11 @@ pages ={157-166},
pages = {1432--1441},
//publisher = {Association for Computational Linguistics},
year = {2017},
//url = {https://doi.org/10.18653/v1/d17-1150},
//doi = {10.18653/v1/d17-1150},
//timestamp = {Tue, 28 Jan 2020 10:28:08 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/YangWXCZ17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Wang2019TreeTI,
author = {Yau-Shian Wang and
Hung-yi Lee and
Yun-Nung Chen},
//editor = {Kentaro Inui and
Jing Jiang and
Vincent Ng and
Xiaojun Wan},
title = {Tree Transformer: Integrating Tree Structures into Self-Attention},
publisher = {Proceedings of the 2019 Conference on Empirical Methods in Natural
Language Processing and the 9th International Joint Conference on
......@@ -4693,51 +4061,29 @@ pages ={157-166},
//publisher = {Association for Computational Linguistics},
pages = {1061--1070},
year = {2019},
//url = {https://doi.org/10.18653/v1/D19-1098},
//doi = {10.18653/v1/D19-1098},
//timestamp = {Thu, 12 Dec 2019 13:23:46 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/WangLC19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Gu, Shavarani and Sarkar, EMNLP 2018 (proceedings name is stored in "publisher").
% Fields whose names start with "//" are disabled metadata: no standard style
% knows such field names, so BibTeX reads them and then ignores them.
@inproceedings{DBLP:journals/corr/abs-1809-01854,
  author      = {Jetic Gu and Hassan S. Shavarani and Anoop Sarkar},
  title       = {Top-down Tree Structured Decoding with Syntactic Connections for Neural Machine Translation and Parsing},
  publisher   = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                 Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages       = {401--413},
  year        = {2018},
  //editor    = {Ellen Riloff and David Chiang and Julia Hockenmaier and Jun'ichi Tsujii},
  //publisher = {Association for Computational Linguistics},
  //url       = {https://doi.org/10.18653/v1/d18-1037},
  //doi       = {10.18653/v1/d18-1037},
  //timestamp = {Tue, 28 Jan 2020 10:28:48 +0100},
  //biburl    = {https://dblp.org/rec/conf/emnlp/GuSS18.bib},
  //bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Wang, Pham, Yin and Neubig, EMNLP 2018 (proceedings name is stored in "publisher").
% Fields whose names start with "//" are disabled metadata: no standard style
% knows such field names, so BibTeX reads them and then ignores them.
@inproceedings{DBLP:journals/corr/abs-1808-09374,
  author      = {Xinyi Wang and Hieu Pham and Pengcheng Yin and Graham Neubig},
  title       = {A Tree-based Decoder for Neural Machine Translation},
  publisher   = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                 Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages       = {4772--4777},
  year        = {2018},
  //editor    = {Ellen Riloff and David Chiang and Julia Hockenmaier and Jun'ichi Tsujii},
  //publisher = {Association for Computational Linguistics},
  //url       = {https://www.aclweb.org/anthology/D18-1509/},
  //timestamp = {Fri, 13 Sep 2019 13:08:45 +0200},
  //biburl    = {https://dblp.org/rec/conf/emnlp/WangPYN18.bib},
  //bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZhangZ16c,
author = {Jiajun Zhang and
......@@ -4746,12 +4092,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1610.07272},
year = {2016},
//url = {http://arxiv.org/abs/1610.07272},
//archivePrefix = {arXiv},
//eprint = {1610.07272},
//timestamp = {Mon, 13 Aug 2018 16:47:14 +0200},
//biburl = {https://dblp.org/rec/journals/corr/ZhangZ16c.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{Dai2019TransformerXLAL,
author = {Zihang Dai and
......@@ -4764,12 +4104,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1901.02860},
year = {2019},
//url = {http://arxiv.org/abs/1901.02860},
//archivePrefix = {arXiv},
//eprint = {1901.02860},
//timestamp = {Fri, 01 Feb 2019 13:39:59 +0100},
//biburl = {https://dblp.org/rec/journals/corr/abs-1901-02860.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{li-etal-2019-word,
author = {Xintong Li and
......@@ -4777,9 +4111,6 @@ pages ={157-166},
Lemao Liu and
Max Meng and
Shuming Shi},
//editor = {Anna Korhonen and
David R. Traum and
Llu{\'{\i}}s M{\`{a}}rquez},
title = {On the Word Alignment from Neural Machine Translation},
publisher = {Proceedings of the 57th Conference of the Association for Computational
Linguistics, {ACL} 2019, Florence, Italy, July 28- August 2, 2019,
......@@ -4787,11 +4118,6 @@ pages ={157-166},
pages = {1293--1303},
//publisher = {Association for Computational Linguistics},
year = {2019},
//url = {https://doi.org/10.18653/v1/p19-1124},
//doi = {10.18653/v1/p19-1124},
//timestamp = {Tue, 28 Jan 2020 10:27:51 +0100},
//biburl = {https://dblp.org/rec/conf/acl/LiLLMS19.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Werlen2018DocumentLevelNM,
......@@ -4799,10 +4125,6 @@ pages ={157-166},
Dhananjay Ram and
Nikolaos Pappas and
James Henderson},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Document-Level Neural Machine Translation with Hierarchical Attention
Networks},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
......@@ -4810,19 +4132,12 @@ pages ={157-166},
pages = {2947--2954},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {https://doi.org/10.18653/v1/d18-1325},
//doi = {10.18653/v1/d18-1325},
//timestamp = {Fri, 27 Mar 2020 08:46:30 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/WerlenRPH18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/abs-1805-10163,
author = {Elena Voita and
Pavel Serdyukov and
Rico Sennrich and
Ivan Titov},
//editor = {Iryna Gurevych and
Yusuke Miyao},
title = {Context-Aware Neural Machine Translation Learns Anaphora Resolution},
publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
......@@ -4830,11 +4145,6 @@ pages ={157-166},
pages = {1264--1274},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {https://www.aclweb.org/anthology/P18-1117/},
//doi = {10.18653/v1/P18-1117},
//timestamp = {Mon, 16 Sep 2019 13:46:41 +0200},
//biburl = {https://dblp.org/rec/conf/acl/TitovSSV18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-00532,
author = {Aishwarya Bhandare and
......@@ -4849,12 +4159,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1906.00532},
year = {2019},
//url = {http://arxiv.org/abs/1906.00532},
//archivePrefix = {arXiv},
//eprint = {1906.00532},
//timestamp = {Thu, 13 Jun 2019 13:36:00 +0200},
//biburl = {https://dblp.org/rec/journals/corr/abs-1906-00532.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Zhang2018SpeedingUN,
......@@ -4863,46 +4167,29 @@ pages ={157-166},
Yang Feng and
Lei Shen and
Qun Liu},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Speeding Up Neural Machine Translation Decoding by Cube Pruning},
publisher = {Proceedings of the 2018 Conference on Empirical Methods in Natural
Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
pages = {4284--4294},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {https://www.aclweb.org/anthology/D18-1460/},
//timestamp = {Fri, 29 Nov 2019 14:00:46 +0100},
//biburl = {https://dblp.org/rec/conf/emnlp/Zhang0FSL18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
% See, Luong and Manning, CoNLL 2016 (proceedings name is stored in "publisher").
% Fields whose names start with "//" are disabled metadata: no standard style
% knows such field names, so BibTeX reads them and then ignores them.
@inproceedings{DBLP:journals/corr/SeeLM16,
  author      = {Abigail See and Minh-Thang Luong and Christopher D. Manning},
  title       = {Compression of Neural Machine Translation Models via Pruning},
  publisher   = {Proceedings of the 20th {SIGNLL} Conference on Computational Natural
                 Language Learning, CoNLL 2016, Berlin, Germany, August 11-12, 2016},
  pages       = {291--301},
  year        = {2016},
  //editor    = {Yoav Goldberg and Stefan Riezler},
  //publisher = {{ACL}},
  //url       = {https://doi.org/10.18653/v1/k16-1029},
  //doi       = {10.18653/v1/k16-1029},
  //timestamp = {Tue, 28 Jan 2020 10:29:27 +0100},
  //biburl    = {https://dblp.org/rec/conf/conll/SeeLM16.bib},
  //bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/ChenLCL17,
author = {Yun Chen and
Yang Liu and
Yong Cheng and
Victor O. K. Li},
//editor = {Regina Barzilay and
Min-Yen Kan},
title = {A Teacher-Student Framework for Zero-Resource Neural Machine Translation},
publisher = {Proceedings of the 55th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume
......@@ -4910,11 +4197,6 @@ pages ={157-166},
pages = {1925--1935},
//publisher = {Association for Computational Linguistics},
year = {2017},
//url = {https://doi.org/10.18653/v1/P17-1176},
//doi = {10.18653/v1/P17-1176},
//timestamp = {Tue, 20 Aug 2019 11:59:05 +0200},
//biburl = {https://dblp.org/rec/conf/acl/ChenLCL17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{Hinton2015Distilling,
author = {Geoffrey E. Hinton and
......@@ -4924,12 +4206,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1503.02531},
year = {2015},
//url = {http://arxiv.org/abs/1503.02531},
//archivePrefix = {arXiv},
//eprint = {1503.02531},
//timestamp = {Mon, 13 Aug 2018 16:48:36 +0200},
//biburl = {https://dblp.org/rec/journals/corr/HintonVD15.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Ott2018ScalingNM,
......@@ -4953,8 +4229,6 @@ pages ={157-166},
year = "2016",
//address = "Austin, Texas",
//publisher = "Association for Computational Linguistics",
//url = "https://www.aclweb.org/anthology/D16-1139",
//doi = "10.18653/v1/D16-1139",
pages = "1317--1327",
}
......@@ -4982,18 +4256,11 @@ pages ={157-166},
Toulon, France, April 24-26, 2017, Conference Track Proceedings},
//publisher = {OpenReview.net},
year = {2017},
//url = {https://openreview.net/forum?id=BJC\_jUqxe},
//timestamp = {Thu, 25 Jul 2019 14:25:44 +0200},
//biburl = {https://dblp.org/rec/conf/iclr/LinFSYXZB17.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{Shaw2018SelfAttentionWR,
author = {Peter Shaw and
Jakob Uszkoreit and
Ashish Vaswani},
//editor = {Marilyn A. Walker and
Heng Ji and
Amanda Stent},
title = {Self-Attention with Relative Position Representations},
publisher = {Proceedings of the 2018 Conference of the North American Chapter of
the Association for Computational Linguistics: Human Language Technologies,
......@@ -5002,11 +4269,6 @@ pages ={157-166},
pages = {464--468},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {https://doi.org/10.18653/v1/n18-2074},
//doi = {10.18653/v1/n18-2074},
//timestamp = {Tue, 28 Jan 2020 10:30:17 +0100},
//biburl = {https://dblp.org/rec/conf/naacl/ShawUV18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/HeZRS15,
author = {Kaiming He and
......@@ -5019,26 +4281,6 @@ pages ={157-166},
pages = {770--778},
//publisher = {{IEEE} Computer Society},
year = {2016},
//url = {https://doi.org/10.1109/CVPR.2016.90},
//doi = {10.1109/CVPR.2016.90},
//timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
//biburl = {https://dblp.org/rec/conf/cvpr/HeZRS16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Ba, Kiros and Hinton (2016), recorded as a CoRR article with the arXiv
% identifier carried in "volume". Fields whose names start with "//" are
% disabled metadata: no standard style knows such field names, so BibTeX
% reads them and then ignores them.
@article{Ba2016LayerN,
  author          = {Lei Jimmy Ba and Jamie Ryan Kiros and Geoffrey E. Hinton},
  title           = {Layer Normalization},
  journal         = {CoRR},
  volume          = {abs/1607.06450},
  year            = {2016},
  //url           = {http://arxiv.org/abs/1607.06450},
  //archivePrefix = {arXiv},
  //eprint        = {1607.06450},
  //timestamp     = {Tue, 23 Jul 2019 17:33:23 +0200},
  //biburl        = {https://dblp.org/rec/journals/corr/BaKH16.bib},
  //bibsource     = {dblp computer science bibliography, https://dblp.org}
}
@article{JMLR:v15:srivastava14a,
author = {Nitish Srivastava and Geoffrey Hinton and Alex Krizhevsky and Ilya Sutskever and Ruslan Salakhutdinov},
......@@ -5047,7 +4289,6 @@ pages ={157-166},
year = {2014},
volume = {15},
pages = {1929-1958},
//url = {http://jmlr.org/papers/v15/srivastava14a.html}
}
@inproceedings{Szegedy_2016_CVPR,
author = {Christian Szegedy and
......@@ -5061,18 +4302,11 @@ pages ={157-166},
pages = {2818--2826},
//publisher = {{IEEE} Computer Society},
year = {2016},
//url = {https://doi.org/10.1109/CVPR.2016.308},
//doi = {10.1109/CVPR.2016.308},
//timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
//biburl = {https://dblp.org/rec/conf/cvpr/SzegedyVISW16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/abs-1805-00631,
author = {Biao Zhang and
Deyi Xiong and
Jinsong Su},
//editor = {Iryna Gurevych and
Yusuke Miyao},
title = {Accelerating Neural Transformer via an Average Attention Network},
publisher = {Proceedings of the 56th Annual Meeting of the Association for Computational
Linguistics, {ACL} 2018, Melbourne, Australia, July 15-20, 2018, Volume
......@@ -5080,11 +4314,6 @@ pages ={157-166},
pages = {1789--1798},
//publisher = {Association for Computational Linguistics},
year = {2018},
//url = {https://www.aclweb.org/anthology/P18-1166/},
//doi = {10.18653/v1/P18-1166},
//timestamp = {Mon, 16 Sep 2019 13:46:41 +0200},
//biburl = {https://dblp.org/rec/conf/acl/XiongZS18.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/CourbariauxB16,
author = {Matthieu Courbariaux and
......@@ -5094,12 +4323,6 @@ pages ={157-166},
journal = {CoRR},
volume = {abs/1602.02830},
year = {2016},
//url = {http://arxiv.org/abs/1602.02830},
//archivePrefix = {arXiv},
//eprint = {1602.02830},
//timestamp = {Mon, 13 Aug 2018 16:46:57 +0200},
//biburl = {https://dblp.org/rec/journals/corr/CourbariauxB16.bib},
//bibsource = {dblp computer science bibliography, https://dblp.org}
}
%%%%% chapter 12------------------------------------------------------
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论