\parinterval 神经网络为解决自然语言处理问题提供了全新的思路。而所谓深度学习也是建立在多层神经网络结构之上的一系列模型和方法。本章从神经网络的基本概念到其在语言建模中的应用进行了概述。由于篇幅所限，这里无法覆盖所有神经网络和深度学习的相关内容，感兴趣的读者可以进一步阅读\textit{Neural Network Methods in Natural Language Processing}\cite{goldberg2017neural}和\textit{Deep Learning}\cite{Goodfellow-et-al-2016}。此外，也有一些研究方向值得关注：
title={Sentence-level MT evaluation without reference translations: Beyond language modeling},
...
...
@@ -1499,8 +1491,7 @@
volume={27},
number={3-4},
pages={171--192},
year={2013},
publisher={Springer}
year={2013}
}
@inproceedings{DBLP:conf/wmt/BiciciW14,
author = {Ergun Bi{\c{c}}ici and
...
...
@@ -1801,7 +1792,7 @@
% EAMT 2011 conference paper: the proceedings title goes in booktitle, the issuing body in publisher.
@inproceedings{popovic2011human,
  author    = {Popovi{\'c}, Maja and Burchardt, Aljoscha and others},
  title     = {From human to automatic error classification for machine translation output},
  booktitle = {Proceedings of the 15th Annual Conference of the European Association for Machine Translation},
  publisher = {European Association for Machine Translation},
  year      = {2011}
}
@article{DBLP:journals/mt/CostaLLCC15,
...
...
@@ -2219,6 +2210,7 @@ year = {2012}
}
% WMT19 shared-task system paper: it appears in conference proceedings, so it is an
% inproceedings entry with a booktitle (an article entry would require a journal field).
@inproceedings{kepler2019unbabel,
  author    = {Kepler, F{\'a}bio and Tr{\'e}nous, Jonay and Treviso, Marcos and Vera, Miguel and G{\'o}is, Ant{\'o}nio and Farajian, M. Amin and Lopes, Ant{\'o}nio V. and Martins, Andr{\'e} F. T.},
  title     = {Unbabel's Participation in the {WMT19} Translation Quality Estimation Shared Task},
  booktitle = {Proceedings of the Fourth Conference on Machine Translation (Volume 3: Shared Task Papers, Day 2)},
  pages     = {78--84},
  publisher = {Association for Computational Linguistics},
  year      = {2019}
}
...
...
@@ -2271,15 +2263,8 @@ year = {2012}
year={2000},
publisher={Pearson Education India}
}
@article{devlin2018bert,
title={Bert: Pre-training of deep bidirectional transformers for language understanding},
author={Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
title = {Faster Beam-Search Decoding for Phrasal Statistical Machine Translation},
publisher = {Machine Translation Summit XI},
...
...
@@ -3177,7 +3161,7 @@ year = {2012}
}
@inproceedings{DBLP:conf/naacl/ZettlemoyerM07,
author = {Luke S. Zettlemoyer and
Robert Moore},
Robert C. Moore},
title = {Selective Phrase Pair Extraction for Improved Statistical Machine
Translation},
pages = {209--212},
...
...
@@ -3393,7 +3377,7 @@ year = {2012}
% HLT-NAACL 2006 conference paper. The proceedings title belongs in booktitle only;
% publisher names the publishing body rather than repeating the venue.
@inproceedings{charniak2006multilevel,
  author    = {Charniak, Eugene and Johnson, Mark and Elsner, Micha and Austerweil, Joseph and Ellis, David and Haxton, Isaac and Hill, Catherine and Shrivaths, R. and Moore, Jeremy and Pozar, Michael and Vu, Theresa},
  title     = {Multilevel Coarse-to-Fine {PCFG} Parsing},
  booktitle = {Proceedings of the Human Language Technology Conference of the North American Chapter of the Association for Computational Linguistics},
  publisher = {Association for Computational Linguistics},
  pages     = {168--175},
  year      = {2006}
}
...
...
@@ -3769,9 +3753,9 @@ year = {2012}
% Workshop paper. Authors are separated with " and " (a comma between two names makes
% BibTeX read them as a single "Last, First" person); the workshop name is the booktitle.
@inproceedings{bangalore2001computing,
  author       = {Bangalore, Srinivas and Bordel, German and Riccardi, Giuseppe},
  title        = {Computing consensus translation from multiple machine translation systems},
  booktitle    = {IEEE Workshop on Automatic Speech Recognition and Understanding},
  pages        = {351--354},
  year         = {2001},
  organization = {The Institute of Electrical and Electronics Engineers}
}
@inproceedings{rosti2007combining,
author = {Antti-Veikko I. Rosti and
...
...
@@ -3809,7 +3793,7 @@ year = {2012}
Mei Yang and
Jianfeng Gao and
Patrick Nguyen and
Robert Moore},
Robert C. Moore},
title = {Indirect-HMM-based Hypothesis Alignment for Combining Outputs from