Commit f7e614ad by 单韦乔

合并分支 'shanweiqiao' 到 'caorunzhe'

第一二章文献格式更新

查看合并请求 !135
parents bf599c01 24f46b04
......@@ -1051,7 +1051,7 @@ c_{\textrm{KN}}(\cdot) = \left\{\begin{array}{ll}
\vspace{0.5em}
\item 本章更多地关注了语言模型的基本问题和求解思路,但是基于$n$-gram的方法并不是语言建模的唯一方法。从现在自然语言处理的前沿看,端到端的深度学习方法在很多任务中都取得了领先的性能。语言模型同样可以使用这些方法\upcite{jing2019a},而且在近些年取得了巨大成功。例如,最早提出的前馈神经语言模型\upcite{bengio2003a}和后来的基于循环单元的语言模型\upcite{mikolov2010recurrent}、基于长短期记忆单元的语言模型\upcite{sundermeyer2012lstm}以及现在非常流行的Transformer\upcite{vaswani2017attention}。 关于神经语言模型的内容,会在{\chapternine}进行进一步介绍。
\vspace{0.5em}
\item 最后,本章结合语言模型的序列生成任务对搜索技术进行了介绍。类似地,机器翻译任务也需要从大量的翻译候选中快速寻找最优译文。因此在机器翻译任务中也使用了搜索方法,这个过程通常被称作{\small\bfnew{解码}}\index{解码}(Decoding)\index{Decoding}。例如,有研究者在基于词的翻译模型中尝试使用启发式搜索\upcite{DBLP:conf/acl/OchUN01,DBLP:conf/acl/WangW97,tillmann1997a}以及贪婪搜索方法\upcite{germann2001fast}\upcite{germann2003greedy},也有研究者研究基于短语的栈解码方法\upcite{Koehn2007Moses,DBLP:conf/amta/Koehn04}。此外,解码方法还包括有限状态机解码\upcite{bangalore2001a}\upcite{bangalore2000stochastic}以及基于语言学约束的解码\upcite{venugopal2007an,zollmann2007the,liu2006tree,galley2006scalable,chiang2005a}。相关内容将在{\chaptereight}和{\chapterfourteen} 进行介绍。
\item 最后,本章结合语言模型的序列生成任务对搜索技术进行了介绍。类似地,机器翻译任务也需要从大量的翻译候选中快速寻找最优译文。因此在机器翻译任务中也使用了搜索方法,这个过程通常被称作{\small\bfnew{解码}}\index{解码}(Decoding)\index{Decoding}。例如,有研究者在基于词的翻译模型中尝试使用启发式搜索\upcite{DBLP:conf/acl/OchUN01,DBLP:conf/acl/WangW97,tillmann1997a}以及贪婪搜索方法\upcite{germann2001fast}\upcite{germann2003greedy},也有研究者研究基于短语的栈解码方法\upcite{Koehn2007Moses,DBLP:conf/amta/Koehn04}。此外,解码方法还包括有限状态机解码\upcite{bangalore2001a}\upcite{DBLP:journals/mt/BangaloreR02}以及基于语言学约束的解码\upcite{venugopal2007an,zollmann2007the,liu2006tree,galley2006scalable,chiang2005a}。相关内容将在{\chaptereight}和{\chapterfourteen} 进行介绍。
\vspace{0.5em}
\end{itemize}
\end{adjustwidth}
......@@ -11,10 +11,10 @@
year={1983},
}
@article{2019cns,
@book{2019cns,
title={2019中国语言服务行业发展报告},
author={中国翻译协会},
journal={中国翻译协会},
publisher={中国翻译协会},
year={2019}
}
......@@ -74,8 +74,7 @@
author = {Satoshi Sato and
Makoto Nagao},
title = {Toward Memory-based Translation},
//booktitle = {13th International Conference on Computational Linguistics, {COLING}
1990, University of Helsinki, Finland, August 20-25, 1990},
publisher = {International Conference on Computational Linguistics},
pages = {247--252},
year = {1990}
}
......@@ -207,17 +206,10 @@
author = {Thang Luong and
Hieu Pham and
Christopher D. Manning},
//editor = {Llu{\'{\i}}s M{\`{a}}rquez and
Chris Callison$\dash$Burch and
Jian Su and
Daniele Pighin and
Yuval Marton},
title = {Effective Approaches to Attention-based Neural Machine Translation},
//booktitle = {Proceedings of the 2015 Conference on Empirical Methods in Natural
Language Processing, {EMNLP} 2015, Lisbon, Portugal, September 17-21,
2015},
publisher = {Conference on Empirical Methods in Natural
Language Processing},
pages = {1412--1421},
publisher = {The Association for Computational Linguistics},
year = {2015}
}
......@@ -227,15 +219,11 @@
David Grangier and
Denis Yarats and
Yann N. Dauphin},
//editor = {Doina Precup and
Yee Whye Teh},
title = {Convolutional Sequence to Sequence Learning},
//booktitle = {Proceedings of the 34th International Conference on Machine Learning,
{ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
publisher = {International Conference on Machine Learning},
series = {Proceedings of Machine Learning Research},
volume = {70},
pages = {1243--1252},
publisher = {{PMLR}},
year = {2017}
}
......@@ -243,11 +231,8 @@
author = {Dzmitry Bahdanau and
Kyunghyun Cho and
Yoshua Bengio},
//editor = {Yoshua Bengio and
Yann LeCun},
title = {Neural Machine Translation by Jointly Learning to Align and Translate},
//booktitle = {3rd International Conference on Learning Representations, {ICLR} 2015,
San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
publisher = {International Conference on Learning Representations},
year = {2015}
}
......@@ -255,15 +240,8 @@
author = {Ilya Sutskever and
Oriol Vinyals and
Quoc V. Le},
//editor = {Zoubin Ghahramani and
Max Welling and
Corinna Cortes and
Neil D. Lawrence and
Kilian Q. Weinberger},
title = {Sequence to Sequence Learning with Neural Networks},
//booktitle = {Advances in Neural Information Processing Systems 27: Annual Conference
on Neural Information Processing Systems 2014, December 8-13 2014,
Montreal, Quebec, Canada},
publisher = {Advances in Neural Information Processing Systems},
pages = {3104--3112},
year = {2014}
}
......@@ -274,7 +252,7 @@
publisher = {Cambridge University Press},
year = {2010}
}
%再看看
@article{DBLP:journals/corr/abs-1709-07809,
author = {Philipp Koehn},
title = {Neural Machine Translation},
......@@ -397,30 +375,24 @@
author = {Reinhard Kneser and
Hermann Ney},
title = {Improved backing-off for M-gram language modeling},
//booktitle = {1995 International Conference on Acoustics, Speech, and Signal Processing,
{ICASSP} '95, Detroit, Michigan, USA, May 08-12, 1995},
publisher = {International Conference on Acoustics, Speech, and Signal Processing},
pages = {181--184},
publisher = {{IEEE} Computer Society},
year = {1995}
}
@inproceedings{ney1991smoothing,
title={On smoothing techniques for bigram-based natural language modelling},
author={Ney, Hermann and Essen, Ute},
//booktitle={Acoustics, Speech, and Signal Processing, IEEE International Conference on},
publisher={International Conference on Acoustics, Speech, and Signal Processing},
pages={825--828},
year={1991},
organization={IEEE Computer Society}
//organization={IEEE Computer Society}
}
@inproceedings{stolcke2002srilm,
author = {Andreas Stolcke},
//editor = {John H. L. Hansen and
Bryan L. Pellom},
title = {{SRILM} - an extensible language modeling toolkit},
//booktitle = {7th International Conference on Spoken Language Processing, {ICSLP2002}
- {INTERSPEECH} 2002, Denver, Colorado, USA, September 16-20, 2002},
publisher = {{ISCA}},
publisher = {International Conference on Spoken Language Processing},
year = {2002}
}
......@@ -453,7 +425,7 @@
title = {Speech and language processing: an introduction to natural language
processing, computational linguistics, and speech recognition, 2nd
Edition},
series = {Prentice Hall series in artificial intelligence},
//series = {Prentice Hall series in artificial intelligence},
publisher = {Prentice Hall, Pearson Education International},
year = {2009}
}
......@@ -553,11 +525,8 @@
Mingbo Ma},
title = {When to Finish? Optimal Beam Search for Neural Text Generation (modulo
beam size)},
//booktitle = {Proceedings of the 2017 Conference on Empirical Methods in Natural
Language Processing, {EMNLP} 2017, Copenhagen, Denmark, September
9-11, 2017},
pages = {2134--2139},
publisher = {Association for Computational Linguistics},
publisher = {The Association for Computational Linguistics},
year = {2017}
}
......@@ -565,16 +534,10 @@
author = {Yilin Yang and
Liang Huang and
Mingbo Ma},
//editor = {Ellen Riloff and
David Chiang and
Julia Hockenmaier and
Jun'ichi Tsujii},
title = {Breaking the Beam Search Curse: {A} Study of (Re-)Scoring Methods
and Stopping Criteria for Neural Machine Translation},
//booktitle = {Proceedings of the 2018 Conference on Empirical Methods in Natural
Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
pages = {3054--3059},
publisher = {Association for Computational Linguistics},
publisher = {The Association for Computational Linguistics},
year = {2018}
}
......@@ -626,7 +589,7 @@
@inproceedings{kirchhoff2005improved,
title={Improved Language Modeling for Statistical Machine Translation},
author={Katrin {Kirchhoff} and Mei {Yang}},
//booktitle={Proceedings of the ACL Workshop on Building and Using Parallel Texts},
publisher={The Association for Computational Linguistics},
pages={125--128},
year={2005}
}
......@@ -634,7 +597,7 @@
@inproceedings{koehn2007factored,
title={Factored Translation Models},
author={Philipp {Koehn} and Hieu {Hoang}},
//booktitle={Proceedings of the 2007 Joint Conference on Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP-CoNLL)},
publisher = {The Association for Computational Linguistics},
pages={868--876},
year={2007}
}
......@@ -642,7 +605,7 @@
@inproceedings{sarikaya2007joint,
title={Joint Morphological-Lexical Language Modeling for Machine Translation},
author={Ruhi {Sarikaya} and Yonggang {Deng}},
//booktitle={Human Language Technologies 2007: The Conference of the North American Chapter of the Association for Computational Linguistics; Companion Volume, Short Papers},
publisher = {The Association for Computational Linguistics},
pages={145--148},
year={2007}
}
......@@ -650,7 +613,7 @@
@inproceedings{heafield2011kenlm,
title={KenLM: Faster and Smaller Language Model Queries},
author={Kenneth {Heafield}},
//booktitle={Proceedings of the Sixth Workshop on Statistical Machine Translation},
publisher = {The Association for Computational Linguistics},
pages={187--197},
year={2011}
}
......@@ -658,7 +621,7 @@
@inproceedings{federico2006how,
title={How Many Bits Are Needed To Store Probabilities for Phrase-Based Translation?},
author={Marcello {Federico} and Nicola {Bertoldi}},
//booktitle={Proceedings on the Workshop on Statistical Machine Translation},
publisher = {The Association for Computational Linguistics},
pages={94--101},
year={2006}
}
......@@ -666,7 +629,7 @@
@inproceedings{federico2007efficient,
title={Efficient Handling of N-gram Language Models for Statistical Machine Translation},
author={Marcello {Federico} and Mauro {Cettolo}},
//booktitle={Proceedings of the Second Workshop on Statistical Machine Translation},
publisher = {The Association for Computational Linguistics},
pages={88--95},
year={2007}
}
......@@ -674,7 +637,7 @@
@inproceedings{talbot2007randomised,
title={Randomised Language Modelling for Statistical Machine Translation},
author={David {Talbot} and Miles {Osborne}},
//booktitle={Proceedings of the 45th Annual Meeting of the Association of Computational Linguistics},
publisher = {The Association for Computational Linguistics},
pages={512--519},
year={2007}
}
......@@ -682,7 +645,7 @@
@inproceedings{talbot2007smoothed,
title={Smoothed Bloom Filter Language Models: Tera-Scale LMs on the Cheap},
author={David {Talbot} and Miles {Osborne}},
//booktitle={Proceedings of the 2007 Joint Conference on Empirical Methods in Natural Language Processing and Computational Natural Language Learning (EMNLP-CoNLL)},
publisher = {The Association for Computational Linguistics},
pages={468--476},
year={2007}
}
......@@ -710,30 +673,26 @@
Luk{\'{a}}s Burget and
Jan Cernock{\'{y}} and
Sanjeev Khudanpur},
//editor = {Takao Kobayashi and
Keikichi Hirose and
Satoshi Nakamura},
title = {Recurrent neural network based language model},
//booktitle = {{INTERSPEECH} 2010, 11th Annual Conference of the International Speech
Communication Association, Makuhari, Chiba, Japan, September 26-30,
2010},
pages = {1045--1048},
publisher = {{ISCA}},
publisher = {International Speech Communication Association},
year = {2010}
}
@inproceedings{sundermeyer2012lstm,
title={LSTM Neural Networks for Language Modeling.},
author={Martin {Sundermeyer} and Ralf {Schlüter} and Hermann {Ney}},
//booktitle={INTERSPEECH},
pages={194--197},
year={2012}
author = {Martin Sundermeyer and
Ralf Schl{\"{u}}ter and
Hermann Ney},
title = {{LSTM} Neural Networks for Language Modeling},
pages = {194--197},
publisher = {International Speech Communication Association},
year = {2012}
}
@inproceedings{vaswani2017attention,
title={Attention is All You Need},
author={Ashish {Vaswani} and Noam {Shazeer} and Niki {Parmar} and Jakob {Uszkoreit} and Llion {Jones} and Aidan N. {Gomez} and Lukasz {Kaiser} and Illia {Polosukhin}},
//booktitle={Proceedings of the 31st International Conference on Neural Information Processing Systems},
publisher={International Conference on Neural Information Processing},
pages={5998--6008},
year={2017}
}
......@@ -741,7 +700,7 @@
@inproceedings{tillmann1997a,
title={A DP-based Search Using Monotone Alignments in Statistical Translation},
author={Christoph {Tillmann} and Stephan {Vogel} and Hermann {Ney} and Alex {Zubiaga}},
//booktitle={Proceedings of the 35th Annual Meeting of the Association for Computational Linguistics},
publisher = {Morgan Kaufmann Publishers},
pages={289--296},
year={1997}
}
......@@ -749,16 +708,9 @@
@inproceedings{DBLP:conf/acl/WangW97,
author = {Ye$\dash$Yi Wang and
Alex Waibel},
//editor = {Philip R. Cohen and
Wolfgang Wahlster},
title = {Decoding Algorithm in Statistical Machine Translation},
//booktitle = {35th Annual Meeting of the Association for Computational Linguistics
and 8th Conference of the European Chapter of the Association for
Computational Linguistics, Proceedings of the Conference, 7-12 July
1997, Universidad Nacional de Educaci{\'{o}}n a Distancia (UNED),
Madrid, Spain},
pages = {366--372},
publisher = {Morgan Kaufmann Publishers / {ACL}},
publisher = {Morgan Kaufmann Publishers},
year = {1997}
}
......@@ -767,15 +719,15 @@
Nicola Ueffing and
Hermann Ney},
title = {An Efficient A* Search Algorithm for Statistical Machine Translation},
//booktitle = {Proceedings of the {ACL} Workshop on Data-Driven Methods in Machine
Translation, Toulouse, France, July 7, 2001},
publisher = {Proceedings of the {ACL} Workshop on Data-Driven Methods in Machine
Translation},
year = {2001}
}
@inproceedings{germann2001fast,
title={Fast Decoding and Optimal Decoding for Machine Translation},
author={Ulrich {Germann} and Michael {Jahr} and Kevin {Knight} and Daniel {Marcu} and Kenji {Yamada}},
//booktitle={Proceedings of 39th Annual Meeting of the Association for Computational Linguistics},
publisher = {Morgan Kaufmann Publishers},
pages={228--235},
year={2001}
}
......@@ -783,7 +735,7 @@
@inproceedings{germann2003greedy,
title={Greedy decoding for statistical machine translation in almost linear time},
author={Ulrich {Germann}},
//booktitle={NAACL '03 Proceedings of the 2003 Conference of the North American Chapter of the Association for Computational Linguistics on Human Language Technology - Volume 1},
publisher = {The Association for Computational Linguistics},
pages={1--8},
year={2003}
}
......@@ -803,25 +755,15 @@
Ondrej Bojar and
Alexandra Constantin and
Evan Herbst},
//editor = {John A. Carroll and
Antal van den Bosch and
Annie Zaenen},
title = {Moses: Open Source Toolkit for Statistical Machine Translation},
//booktitle = {{ACL} 2007, Proceedings of the 45th Annual Meeting of the Association
for Computational Linguistics, June 23-30, 2007, Prague, Czech Republic},
publisher = {The Association for Computational Linguistics},
year = {2007}
}
@inproceedings{DBLP:conf/amta/Koehn04,
author = {Philipp Koehn},
//editor = {Robert E. Frederking and
Kathryn Taylor},
title = {Pharaoh: {A} Beam Search Decoder for Phrase-Based Statistical Machine
Translation Models},
//booktitle = {Machine Translation: From Real Users to Research, 6th Conference of
the Association for Machine Translation in the Americas, {AMTA} 2004,
Washington, DC, USA, September 28-October 2, 2004, Proceedings},
series = {Lecture Notes in Computer Science},
volume = {3265},
pages = {115--124},
......@@ -832,23 +774,26 @@
@inproceedings{bangalore2001a,
title={A finite-state approach to machine translation},
author={S. {Bangalore} and G. {Riccardi}},
//booktitle={IEEE Workshop on Automatic Speech Recognition and Understanding, 2001. ASRU '01.},
publisher = {IEEE Workshop on Automatic Speech Recognition and Understanding},
pages={381--388},
year={2001}
}
@inproceedings{bangalore2000stochastic,
title={Stochastic finite-state models for spoken language machine translation},
author={Srinivas {Bangalore} and Giuseppe {Riccardi}},
//booktitle={NAACL-ANLP-EMTS '00 Proceedings of the 2000 NAACL-ANLP Workshop on Embedded machine translation systems - Volume 5},
pages={52--59},
year={2000}
@article{DBLP:journals/mt/BangaloreR02,
author = {Srinivas Bangalore and
Giuseppe Riccardi},
title = {Stochastic Finite-State Models for Spoken Language Machine Translation},
journal = {Machine Translation},
volume = {17},
number = {3},
pages = {165--184},
year = {2002}
}
@inproceedings{venugopal2007an,
title={An Efficient Two-Pass Approach to Synchronous-CFG Driven Statistical MT},
author={Ashish {Venugopal} and Andreas {Zollmann} and Stephan {Vogel}},
//booktitle={Human Language Technologies 2007: The Conference of the North American Chapter of the Association for Computational Linguistics; Proceedings of the Main Conference},
publisher = {The Association for Computational Linguistics},
pages={500--507},
year={2007}
}
......@@ -858,16 +803,10 @@
Ashish Venugopal and
Matthias Paulik and
Stephan Vogel},
//editor = {Chris Callison$\dash$Burch and
Philipp Koehn and
Cameron S. Fordyce and
Christof Monz},
title = {The Syntax Augmented {MT} {(SAMT)} System at the Shared Task for the
2007 {ACL} Workshop on Statistical Machine Translation},
//booktitle = {Proceedings of the Second Workshop on Statistical Machine Translation,
WMT@ACL 2007, Prague, Czech Republic, June 23, 2007},
pages = {216--219},
publisher = {Association for Computational Linguistics},
publisher = {The Association for Computational Linguistics},
year = {2007}
}
......@@ -875,13 +814,7 @@
author = {Yang Liu and
Qun Liu and
Shouxun Lin},
//editor = {Nicoletta Calzolari and
Claire Cardie and
Pierre Isabelle},
title = {Tree-to-String Alignment Template for Statistical Machine Translation},
//booktitle = {{ACL} 2006, 21st International Conference on Computational Linguistics
and 44th Annual Meeting of the Association for Computational Linguistics,
Proceedings of the Conference, Sydney, Australia, 17-21 July 2006},
publisher = {The Association for Computational Linguistics},
year = {2006}
}
......@@ -894,27 +827,15 @@
Steve DeNeefe and
Wei Wang and
Ignacio Thayer},
//editor = {Nicoletta Calzolari and
Claire Cardie and
Pierre Isabelle},
title = {Scalable Inference and Training of Context-Rich Syntactic Translation
Models},
//booktitle = {{ACL} 2006, 21st International Conference on Computational Linguistics
and 44th Annual Meeting of the Association for Computational Linguistics,
Proceedings of the Conference, Sydney, Australia, 17-21 July 2006},
publisher = {The Association for Computational Linguistics},
year = {2006}
}
@inproceedings{chiang2005a,
author = {David Chiang},
//editor = {Kevin Knight and
Hwee Tou Ng and
Kemal Oflazer},
title = {A Hierarchical Phrase-Based Model for Statistical Machine Translation},
//booktitle = {{ACL} 2005, 43rd Annual Meeting of the Association for Computational
Linguistics, Proceedings of the Conference, 25-30 June 2005, University
of Michigan, {USA}},
pages = {263--270},
publisher = {The Association for Computational Linguistics},
year = {2005}
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论