Commit 008ca909 by 曹润柘

合并分支 'caorunzhe' 到 'master'

Caorunzhe

查看合并请求 !678
parents 22f398e4 9557b055
...@@ -296,7 +296,11 @@ ...@@ -296,7 +296,11 @@
%---------------------------------------------------------------------------------------- %----------------------------------------------------------------------------------------
\subsection{对偶学习} \subsection{对偶学习}
\parinterval 对称,也许是人类最喜欢的美,其始终贯穿在整个人类文明的诞生与发展之中。古语“夫美者,上下、内外、大小、远近皆无害焉,故曰美”描述的即是这样的美。在人工智能的任务中,也存在着这样的对称结构,比如机器翻译中英译汉和汉译英、图像处理中的图像标注和图像生成以及语音处理中的语音识别和语音合成等。利用这些任务的对称性质(也称对偶性),可以使互为对偶的两个任务获得更有效的反馈,从而使对应的模型相互学习、相互提高。目前,对偶学习的思想已经广泛应用于自然语言处理、图像处理等领域,它不仅能够提升在有限双语资源下的翻译模型性能({\small\bfnew{有监督对偶学习}},Dual Supervised Learning\index{Dual Supervised Learning}\upcite{DBLP:conf/icml/XiaQCBYL17,DBLP:conf/acl/SuHC19,DBLP:journals/ejasmp/RadzikowskiNWY19},而且能够利用未标注的单语数据来进行学习({\small\bfnew{无监督对偶学习}},Dual Unsupervised Learning\index{Dual Unsupervised Learning}\upcite{qin2020dual,DBLP:conf/iccv/YiZTG17,DBLP:journals/access/DuRZH20}。下面将一一展开讨论。 \parinterval 对称,也许是人类最喜欢的美,其始终贯穿在整个人类文明的诞生与发展之中。古语“夫美者,上下、内外、大小、远近皆无害焉,故曰美”描述的即是这样的美。在人工智能的任务中,也存在着这样的对称结构,比如机器翻译中英译汉和汉译英、图像处理中的图像标注和图像生成以及语音处理中的语音识别和语音合成等。利用这些任务的对称性质(也称对偶性),可以使互为对偶的两个任务获得更有效的反馈,从而使对应的模型相互学习、相互提高。
目前,对偶学习的思想已经广泛应用于低资源机器翻译领域,它不仅能够提升在有限双语资源下的翻译模型性能({\small\bfnew{有监督对偶学习}},Dual Supervised Learning\index{Dual Supervised Learning})\upcite{DBLP:conf/icml/XiaQCBYL17,DBLP:conf/icml/XiaTTQYL18},而且能够利用未标注的单语数据来进行学习({\small\bfnew{无监督对偶学习}},Dual Unsupervised Learning\index{Dual Unsupervised Learning})\upcite{qin2020dual,DBLP:conf/nips/HeXQWYLM16,zhao2020dual}。下面将一一展开讨论。
%---------------------------------------------------------------------------------------- %----------------------------------------------------------------------------------------
% NEW SUB-SUB-SECTION % NEW SUB-SUB-SECTION
......
...@@ -6234,6 +6234,794 @@ author = {Yoshua Bengio and ...@@ -6234,6 +6234,794 @@ author = {Yoshua Bengio and
year={2020} year={2020}
} }
% Journal article (Machine Translation 29(3-4)): typed @article with the
% venue in `journal`, since @inproceedings cannot carry volume and number together.
@article{DBLP:journals/mt/EetemadiLTR15,
  author  = {Sauleh Eetemadi and
             William Lewis and
             Kristina Toutanova and
             Hayder Radha},
  title   = {Survey of data-selection methods in statistical machine translation},
  journal = {Machine Translation},
  volume  = {29},
  number  = {3-4},
  pages   = {189--223},
  year    = {2015}
}
@inproceedings{britz2017effective,
  author    = {Britz, Denny and
               Le, Quoc and
               Pryzant, Reid},
  title     = {Effective domain mixing for neural machine translation},
  publisher = {Proceedings of the Second Conference on Machine Translation},
  pages     = {118--126},
  year      = {2017}
}
@inproceedings{DBLP:conf/emnlp/AxelrodHG11,
  author    = {Axelrod, Amittai and He, Xiaodong and Gao, Jianfeng},
  title     = {Domain Adaptation via Pseudo In-Domain Data Selection},
  publisher = {Conference on Empirical Methods in Natural Language Processing},
  pages     = {355--362},
  year      = {2011}
}
% WMT 2015 workshop paper (see the conf/wmt key); venue is named the same
% way as the other WMT entries in this file.
@inproceedings{DBLP:conf/wmt/AxelrodRHO15,
  author    = {Amittai Axelrod and
               Philip Resnik and
               Xiaodong He and
               Mari Ostendorf},
  title     = {Data Selection With Fewer Words},
  pages     = {58--65},
  publisher = {Proceedings of the Tenth Workshop on Statistical Machine Translation},
  year      = {2015}
}
@inproceedings{DBLP:conf/emnlp/WangULCS17,
  author    = {Wang, Rui and Utiyama, Masao and Liu, Lemao and
               Chen, Kehai and Sumita, Eiichiro},
  title     = {Instance Weighting for Neural Machine Translation Domain Adaptation},
  publisher = {Conference on Empirical Methods in Natural Language Processing},
  pages     = {1482--1488},
  year      = {2017}
}
@inproceedings{DBLP:conf/iwslt/MansourWN11,
  author    = {Mansour, Saab and Wuebker, Joern and Ney, Hermann},
  title     = {Combining translation and language model scoring for domain-specific data filtering},
  publisher = {International Workshop on Spoken Language Translation},
  pages     = {222--229},
  year      = {2011}
}
@inproceedings{DBLP:conf/conll/ChenH16,
  author    = {Chen, Boxing and Huang, Fei},
  title     = {Semi-supervised Convolutional Networks for Translation Adaptation with Tiny Amount of In-domain Data},
  publisher = {The SIGNLL Conference on Computational Natural Language Learning},
  pages     = {314--323},
  year      = {2016}
}
@inproceedings{chen2016bilingual,
  author    = {Chen, Boxing and
               Kuhn, Roland and
               Foster, George and
               Cherry, Colin and
               Huang, Fei},
  title     = {Bilingual methods for adaptive training data selection for machine translation},
  publisher = {Association for Machine Translation in the Americas},
  pages     = {93--103},
  year      = {2016}
}
@inproceedings{DBLP:conf/aclnmt/ChenCFL17,
  author    = {Chen, Boxing and Cherry, Colin and
               Foster, George F. and Larkin, Samuel},
  title     = {Cost Weighting for Neural Machine Translation Domain Adaptation},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  pages     = {40--46},
  year      = {2017}
}
@inproceedings{DBLP:conf/wmt/DumaM17,
  author    = {Duma, Mirela-Stefania and Menzel, Wolfgang},
  title     = {Automatic Threshold Detection for Data Selection in Machine Translation},
  publisher = {Proceedings of the Second Conference on Machine Translation},
  pages     = {483--488},
  year      = {2017}
}
@inproceedings{DBLP:conf/wmt/BiciciY11,
  author    = {Bi{\c{c}}ici, Ergun and Yuret, Deniz},
  title     = {Instance Selection for Machine Translation using Feature Decay Algorithms},
  publisher = {Proceedings of the Sixth Workshop on Statistical Machine Translation},
  pages     = {272--283},
  year      = {2011}
}
@inproceedings{poncelas2018feature,
  author    = {Poncelas, Alberto and
               Maillette de Buy Wenniger, Gideon and
               Way, Andy},
  title     = {Feature decay algorithms for neural machine translation},
  publisher = {European Association for Machine Translation},
  year      = {2018}
}
@inproceedings{DBLP:conf/acl/SotoSPW20,
  author    = {Soto, Xabier and Shterionov, Dimitar Sht. and
               Poncelas, Alberto and Way, Andy},
  title     = {Selecting Backtranslated Data from Multiple Sources for Improved Neural Machine Translation},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  pages     = {3898--3908},
  year      = {2020}
}
% CoRR preprint, typed like the other CoRR @article entry in this file.
% The compound surname uses the comma form so it parses the same way as in
% poncelas2018feature ("Maillette de Buy Wenniger, Gideon").
@article{DBLP:journals/corr/abs-1811-03039,
  author  = {Poncelas, Alberto and
             Maillette de Buy Wenniger, Gideon and
             Way, Andy},
  title   = {Data Selection with Feature Decay Algorithms Using an Approximated
             Target Side},
  journal = {CoRR},
  volume  = {abs/1811.03039},
  year    = {2018}
}
@inproceedings{DBLP:conf/emnlp/WeesBM17,
  author    = {van der Wees, Marlies and Bisazza, Arianna and Monz, Christof},
  title     = {Dynamic Data Selection for Neural Machine Translation},
  publisher = {Conference on Empirical Methods in Natural Language Processing},
  pages     = {1400--1410},
  year      = {2017}
}
@inproceedings{DBLP:conf/wmt/WangWHNC18,
  author    = {Wang, Wei and Watanabe, Taro and Hughes, Macduff and
               Nakagawa, Tetsuji and Chelba, Ciprian},
  title     = {Denoising Neural Machine Translation Training with Trusted Data and Online Data Selection},
  publisher = {Proceedings of the Third Conference on Machine Translation},
  pages     = {133--143},
  year      = {2018}
}
@inproceedings{DBLP:conf/acl/WangUS18,
  author    = {Wang, Rui and Utiyama, Masao and Sumita, Eiichiro},
  title     = {Dynamic Sentence Sampling for Efficient Training of Neural Machine Translation},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  pages     = {298--304},
  year      = {2018}
}
@inproceedings{DBLP:conf/aclnmt/KhayrallahK18,
  author    = {Khayrallah, Huda and Koehn, Philipp},
  title     = {On the Impact of Various Types of Noise on Neural Machine Translation},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  pages     = {74--83},
  year      = {2018}
}
@inproceedings{DBLP:conf/coling/FormigaF12,
  author    = {Formiga, Llu{\'{\i}}s and Fonollosa, Jos{\'{e}} A. R.},
  title     = {Dealing with Input Noise in Statistical Machine Translation},
  publisher = {International Conference on Computational Linguistics},
  pages     = {319--328},
  year      = {2012}
}
@inproceedings{DBLP:conf/acl/CuiZLLZ13,
  author    = {Cui, Lei and Zhang, Dongdong and Liu, Shujie and
               Li, Mu and Zhou, Ming},
  title     = {Bilingual Data Cleaning for {SMT} using Graph-based Random Walk},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  pages     = {340--345},
  year      = {2013}
}
@phdthesis{DBLP:phd/dnb/Mediani17,
  author = {Mediani, Mohammed},
  title  = {Learning from Noisy Data in Statistical Machine Translation},
  school = {Karlsruhe Institute of Technology, Germany},
  year   = {2017}
}
% MT Summit paper; "Machine Translation" alone is the name of the journal
% cited elsewhere in this file. The acronym in the title is brace-protected.
@inproceedings{rarrick2011mt,
  title     = {{MT} detection in web-scraped parallel corpora},
  author    = {Rarrick, Spencer and Quirk, Chris and Lewis, Will},
  publisher = {Machine Translation Summit},
  pages     = {422--430},
  year      = {2011}
}
% MT Summit paper; "Machine Translation" alone is the name of the journal
% cited elsewhere in this file.
@inproceedings{taghipour2011parallel,
  title     = {Parallel corpus refinement as an outlier detection algorithm},
  author    = {Taghipour, Kaveh and Khadivi, Shahram and Xu, Jia},
  publisher = {Machine Translation Summit},
  pages     = {414--421},
  year      = {2011}
}
@inproceedings{Xu2017ZipporahAF,
  author    = {Xu, Hainan and Koehn, Philipp},
  title     = {Zipporah: a Fast and Scalable Data Cleaning System for Noisy Web-Crawled Parallel Corpora},
  booktitle = {Conference on Empirical Methods in Natural Language Processing},
  year      = {2017}
}
@inproceedings{DBLP:conf/aclnmt/CarpuatVN17,
  author    = {Carpuat, Marine and Vyas, Yogarshi and Niu, Xing},
  title     = {Detecting Cross-Lingual Semantic Divergence for Neural Machine Translation},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  pages     = {69--79},
  year      = {2017}
}
@inproceedings{DBLP:conf/naacl/VyasNC18,
  author    = {Vyas, Yogarshi and Niu, Xing and Carpuat, Marine},
  title     = {Identifying Semantic Divergences in Parallel Text without Annotations},
  publisher = {Annual Conference of the North American Chapter of the Association for Computational Linguistics},
  pages     = {1503--1515},
  year      = {2018}
}
% The quoted phrase in the title uses TeX quote ligatures (`` and ''); a
% straight " would typeset as a closing quote on both sides.
@inproceedings{DBLP:conf/acl/WangCC19,
  author    = {Wei Wang and
               Isaac Caswell and
               Ciprian Chelba},
  title     = {Dynamically Composing Domain-Data Selection with Clean-Data Selection
               by ``Co-Curricular Learning'' for Neural Machine Translation},
  pages     = {1282--1292},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2019}
}
@inproceedings{DBLP:conf/emnlp/SettlesC08,
  author    = {Settles, Burr and Craven, Mark},
  title     = {An Analysis of Active Learning Strategies for Sequence Labeling Tasks},
  publisher = {Conference on Empirical Methods in Natural Language Processing},
  pages     = {1070--1079},
  year      = {2008}
}
% The exported placeholder values (volume 20, number 0, pages 0) are left
% out so they are not printed; TODO: add the real page range once confirmed.
@inproceedings{campbell2000query,
  title     = {Query learning with large margin classifiers},
  author    = {Campbell, Colin and Cristianini, Nello and Smola, Alex and others},
  publisher = {International Conference on Machine Learning},
  year      = {2000}
}
@inproceedings{DBLP:conf/icml/SchohnC00,
  author    = {Schohn, Greg and Cohn, David},
  title     = {Less is More: Active Learning with Support Vector Machines},
  publisher = {International Conference on Machine Learning},
  pages     = {839--846},
  year      = {2000}
}
@inproceedings{DBLP:conf/colt/SeungOS92,
  author    = {Seung, H. Sebastian and Opper, Manfred and Sompolinsky, Haim},
  title     = {Query by Committee},
  publisher = {Conference on Computational Learning Theory},
  pages     = {287--294},
  year      = {1992}
}
% Textbook entry: @book takes the publishing house in `publisher` (it has
% no `journal` field).
@book{mitchell1996m,
  title     = {Machine Learning},
  author    = {Mitchell, Tom},
  publisher = {McGraw Hill},
  year      = {1996}
}
@inproceedings{DBLP:conf/icml/AbeM98,
  author    = {Abe, Naoki and Mamitsuka, Hiroshi},
  title     = {Query Learning Strategies Using Boosting and Bagging},
  publisher = {International Conference on Machine Learning},
  pages     = {1--9},
  year      = {1998}
}
% The citation key keeps its exported spelling so existing \cite commands
% still resolve; the author surnames are McCallum and Nigam (the trailing
% "zy"/"y" in the export were footnote markers). {EM} is brace-protected.
@inproceedings{mccallumzy1998employing,
  title     = {Employing {EM} and pool-based active learning for text classification},
  author    = {McCallum, Andrew Kachites and Nigam, Kamal},
  publisher = {International Conference on Machine Learning},
  pages     = {359--367},
  year      = {1998}
}
@inproceedings{DBLP:conf/cvpr/DalalT05,
  author    = {Dalal, Navneet and Triggs, Bill},
  title     = {Histograms of Oriented Gradients for Human Detection},
  publisher = {{IEEE} Conference on Computer Vision and Pattern Recognition},
  pages     = {886--893},
  year      = {2005}
}
% Journal article (Proceedings of the IEEE 86(11)): typed @article with the
% venue in `journal`; page range uses the BibTeX en-dash form (--).
@article{726791,
  author  = {Yann {LeCun} and Leon {Bottou} and Yoshua {Bengio} and Patrick {Haffner}},
  title   = {Gradient-based learning applied to document recognition},
  journal = {Proceedings of the {IEEE}},
  volume  = {86},
  number  = {11},
  pages   = {2278--2324},
  year    = {1998}
}
% {SAS} is brace-protected so sentence-casing styles keep the acronym.
@book{atkinson2007optimum,
  title     = {Optimum experimental designs, with {SAS}},
  author    = {Atkinson, Anthony and Donev, Alexander and Tobias, Randall and others},
  volume    = {34},
  year      = {2007},
  publisher = {Oxford University Press}
}
@inproceedings{DBLP:journals/jmlr/JiH12,
  author    = {Ji, Ming and Han, Jiawei},
  title     = {A Variance Minimization Criterion to Active Learning on Graphs},
  publisher = {International Conference on Artificial Intelligence and Statistics},
  series    = {{JMLR} Proceedings},
  volume    = {22},
  pages     = {556--564},
  year      = {2012}
}
@article{DBLP:journals/corr/ZhuB17,
  author  = {Zhu, Jia-Jie and Bento, Jos{\'{e}}},
  title   = {Generative Adversarial Active Learning},
  journal = {CoRR},
  volume  = {abs/1702.07956},
  year    = {2017}
}
@inproceedings{DBLP:conf/iccv/HuijserG17,
  author    = {Huijser, Miriam W. and van Gemert, Jan C.},
  title     = {Active Decision Boundary Annotation with Deep Generative Models},
  publisher = {{IEEE} International Conference on Computer Vision},
  pages     = {5296--5305},
  year      = {2017}
}
@inproceedings{DBLP:conf/wacv/0007T20,
  author    = {Mayer, Christoph and Timofte, Radu},
  title     = {Adversarial Sampling for Active Learning},
  publisher = {{IEEE} Winter Conference on Applications of Computer Vision},
  pages     = {3060--3068},
  year      = {2020}
}
@inproceedings{DBLP:conf/acl/JeanCMB15,
  author    = {Jean, S{\'{e}}bastien and Cho, KyungHyun and
               Memisevic, Roland and Bengio, Yoshua},
  title     = {On Using Very Large Target Vocabulary for Neural Machine Translation},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  pages     = {1--10},
  year      = {2015}
}
% arXiv preprint (arXiv:1503.03535), recorded like the other CoRR @article
% entry in this file. Authors use the "Last, First" form: without the comma
% BibTeX reads the last word of each name as the surname.
@article{2015OnGulcehre,
  title   = {On Using Monolingual Corpora in Neural Machine Translation},
  author  = {Gulcehre, Caglar and
             Firat, Orhan and
             Xu, Kelvin and
             Cho, Kyunghyun and
             Barrault, Loic and
             Lin, Huei Chi and
             Bougares, Fethi and
             Schwenk, Holger and
             Bengio, Yoshua},
  journal = {CoRR},
  volume  = {abs/1503.03535},
  year    = {2015}
}
@inproceedings{Sennrich2016ImprovingNM,
  author    = {Sennrich, Rico and Haddow, Barry and Birch, Alexandra},
  title     = {Improving Neural Machine Translation Models with Monolingual Data},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  year      = {2016}
}
@inproceedings{DBLP:conf/aaai/Zhang0LZC18,
  author    = {Zhang, Zhirui and Liu, Shujie and Li, Mu and
               Zhou, Ming and Chen, Enhong},
  title     = {Joint Training for Neural Machine Translation Models with Monolingual Data},
  publisher = {AAAI Conference on Artificial Intelligence},
  pages     = {555--562},
  year      = {2018}
}
@inproceedings{hoang2018iterative,
  author    = {Hoang, Vu Cong Duy and
               Koehn, Philipp and
               Haffari, Gholamreza and
               Cohn, Trevor},
  title     = {Iterative back-translation for neural machine translation},
  publisher = {Proceedings of the 2nd Workshop on Neural Machine Translation and Generation},
  pages     = {18--24},
  year      = {2018}
}
% MT Summit paper (see the conf/mtsummit key); "Machine Translation" alone
% is the name of the journal cited elsewhere in this file.
@inproceedings{DBLP:conf/mtsummit/ImankulovaDFI19,
  author    = {Aizhan Imankulova and
               Raj Dabre and
               Atsushi Fujita and
               Kenji Imamura},
  title     = {Exploiting Out-of-Domain Parallel Data through Multilingual Transfer
               Learning for Low-Resource Neural Machine Translation},
  pages     = {128--139},
  publisher = {Machine Translation Summit},
  year      = {2019}
}
@inproceedings{DBLP:conf/emnlp/CurreyH19,
  author    = {Currey, Anna and Heafield, Kenneth},
  title     = {Zero-Resource Neural Machine Translation with Monolingual Pivot Data},
  publisher = {Conference on Empirical Methods in Natural Language Processing},
  pages     = {99--107},
  year      = {2019}
}
% EMNLP 2019 paper (see the conf/emnlp key); venue is named the same way as
% the other EMNLP entries in this file.
@inproceedings{DBLP:conf/emnlp/KimPPKN19,
  author    = {Yunsu Kim and
               Petre Petrov and
               Pavel Petrushkov and
               Shahram Khadivi and
               Hermann Ney},
  title     = {Pivot-based Transfer Learning for Neural Machine Translation between
               Non-English Languages},
  pages     = {866--876},
  publisher = {Conference on Empirical Methods in Natural Language Processing},
  year      = {2019}
}
@inproceedings{DBLP:conf/iclr/LampleCDR18,
  author    = {Lample, Guillaume and Conneau, Alexis and
               Denoyer, Ludovic and Ranzato, Marc'Aurelio},
  title     = {Unsupervised Machine Translation Using Monolingual Corpora Only},
  publisher = {International Conference on Learning Representations},
  year      = {2018}
}
@inproceedings{DBLP:conf/iclr/ArtetxeLAC18,
  author    = {Artetxe, Mikel and Labaka, Gorka and
               Agirre, Eneko and Cho, Kyunghyun},
  title     = {Unsupervised Neural Machine Translation},
  publisher = {International Conference on Learning Representations},
  year      = {2018}
}
%下面的publisher再看看
@inproceedings{DBLP:conf/conll/LiuBH18,
  author    = {Liu, Ming and Buntine, Wray L. and Haffari, Gholamreza},
  title     = {Learning to Actively Learn Neural Machine Translation},
  publisher = {The SIGNLL Conference on Computational Natural Language Learning},
  pages     = {334--344},
  year      = {2018}
}
@inproceedings{DBLP:conf/emnlp/ZhaoZZZ20,
  author    = {Zhao, Yuekai and Zhang, Haoran and
               Zhou, Shuchang and Zhang, Zhihua},
  title     = {Active Learning Approaches to Enhancing Neural Machine Translation: An Empirical Study},
  publisher = {Conference on Empirical Methods in Natural Language Processing},
  pages     = {1796--1806},
  year      = {2020}
}
@inproceedings{Peris2018ActiveLF,
  author    = {Peris, {\'A}lvaro and Casacuberta, Francisco},
  title     = {Active Learning for Interactive Neural Machine Translation of Data Streams},
  publisher = {The SIGNLL Conference on Computational Natural Language Learning},
  pages     = {151--160},
  year      = {2018}
}
% Journal article (see the journals/pbml key): typed @article with the
% venue in `journal`.
@article{DBLP:journals/pbml/TurchiNFF17,
  author  = {Marco Turchi and
             Matteo Negri and
             M. Amin Farajian and
             Marcello Federico},
  title   = {Continuous Learning from Human Post-Edits for Neural Machine Translation},
  journal = {The Prague Bulletin of Mathematical Linguistics},
  volume  = {108},
  pages   = {233--244},
  year    = {2017}
}
% Journal article (see the journals/csl key): typed @article with the venue
% in `journal`; the ampersand in the journal name is escaped for LaTeX.
@article{DBLP:journals/csl/PerisC19,
  author  = {{\'{A}}lvaro Peris and
             Francisco Casacuberta},
  title   = {Online learning for effort reduction in interactive neural machine
             translation},
  journal = {Computer Speech {\&} Language},
  volume  = {58},
  pages   = {98--126},
  year    = {2019}
}
% {CurriculumNet} is brace-protected so sentence-casing styles keep its
% internal capital.
@inproceedings{DBLP:conf/eccv/GuoHZZDSH18,
  author    = {Sheng Guo and
               Weilin Huang and
               Haozhi Zhang and
               Chenfan Zhuang and
               Dengke Dong and
               Matthew R. Scott and
               Dinglong Huang},
  title     = {{CurriculumNet}: Weakly Supervised Learning from Large-Scale Web Images},
  series    = {Lecture Notes in Computer Science},
  volume    = {11214},
  pages     = {139--154},
  publisher = {European Conference on Computer Vision},
  year      = {2018}
}
@inproceedings{DBLP:conf/mm/JiangMMH14,
  author    = {Jiang, Lu and Meng, Deyu and
               Mitamura, Teruko and Hauptmann, Alexander G.},
  title     = {Easy Samples First: Self-paced Reranking for Zero-Example Multimedia Search},
  publisher = {ACM International Conference on Multimedia},
  pages     = {547--556},
  year      = {2014}
}
%下面的publisher再看看
% NAACL venue is spelled the same way as in the other NAACL entries of this
% file, so the conference name is consistent across the bibliography.
@inproceedings{DBLP:conf/naacl/PlataniosSNPM19,
  author    = {Emmanouil Antonios Platanios and
               Otilia Stretcu and
               Graham Neubig and
               Barnab{\'{a}}s P{\'{o}}czos and
               Tom M. Mitchell},
  title     = {Competence-based Curriculum Learning for Neural Machine Translation},
  pages     = {1162--1172},
  publisher = {Annual Conference of the North American Chapter of the Association for Computational Linguistics},
  year      = {2019}
}
@inproceedings{DBLP:conf/acl/TayWLFPYRHZ19,
  author    = {Tay, Yi and Wang, Shuohang and Luu, Anh Tuan and
               Fu, Jie and Phan, Minh C. and Yuan, Xingdi and
               Rao, Jinfeng and Hui, Siu Cheung and Zhang, Aston},
  title     = {Simple and Effective Curriculum Pointer-Generator Networks for Reading Comprehension over Long Narratives},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  pages     = {4922--4931},
  year      = {2019}
}
@inproceedings{DBLP:conf/icml/GuoCZZ0HT20,
  author    = {Guo, Yong and Chen, Yaofo and Zheng, Yin and
               Zhao, Peilin and Chen, Jian and
               Huang, Junzhou and Tan, Mingkui},
  title     = {Breaking the Curse of Space Explosion: Towards Efficient {NAS} with Curriculum Search},
  publisher = {International Conference on Machine Learning},
  series    = {Proceedings of Machine Learning Research},
  volume    = {119},
  pages     = {3822--3831},
  year      = {2020}
}
@inproceedings{DBLP:conf/ranlp/KocmiB17,
  author    = {Kocmi, Tom and Bojar, Ondrej},
  title     = {Curriculum Learning and Minibatch Bucketing in Neural Machine Translation},
  publisher = {International Conference Recent Advances in Natural Language Processing},
  pages     = {379--386},
  year      = {2017}
}
@inproceedings{DBLP:conf/naacl/ZhangSKMCD19,
  author    = {Zhang, Xuan and Shapiro, Pamela and Kumar, Gaurav and
               McNamee, Paul and Carpuat, Marine and Duh, Kevin},
  title     = {Curriculum Learning for Domain Adaptation in Neural Machine Translation},
  publisher = {Annual Conference of the North American Chapter of the Association for Computational Linguistics},
  pages     = {1903--1915},
  year      = {2019}
}
% arXiv preprint: recorded as @article with the arXiv identifier in
% `journal`, the same form as the zhao2020dual entry in this file.
@article{zhang2018empirical,
  title   = {An empirical exploration of curriculum learning for neural machine translation},
  author  = {Zhang, Xuan and Kumar, Gaurav and Khayrallah, Huda and Murray, Kenton and Gwinnup, Jeremy and Martindale, Marianna J and McNamee, Paul and Duh, Kevin and Carpuat, Marine},
  journal = {arXiv preprint arXiv:1811.00739},
  year    = {2018}
}
% COLING venue is spelled the same way as in the conf/coling/FormigaF12
% entry, so the conference name is consistent across the bibliography.
@inproceedings{DBLP:conf/coling/XuHJFWHJXZ20,
  author    = {Chen Xu and
               Bojie Hu and
               Yufan Jiang and
               Kai Feng and
               Zeyang Wang and
               Shen Huang and
               Qi Ju and
               Tong Xiao and
               Jingbo Zhu},
  title     = {Dynamic Curriculum Learning for Low-Resource Neural Machine Translation},
  pages     = {3977--3989},
  publisher = {International Conference on Computational Linguistics},
  year      = {2020}
}
@inproceedings{DBLP:conf/acl/ZhouYWWC20,
  author    = {Zhou, Yikai and Yang, Baosong and Wong, Derek F. and
               Wan, Yu and Chao, Lidia S.},
  title     = {Uncertainty-Aware Curriculum Learning for Neural Machine Translation},
  publisher = {Annual Meeting of the Association for Computational Linguistics},
  pages     = {6934--6944},
  year      = {2020}
}
@inproceedings{DBLP:conf/aaai/ZhaoWNW20,
  author    = {Zhao, Mingjun and Wu, Haijiang and
               Niu, Di and Wang, Xiaoli},
  title     = {Reinforced Curriculum Learning on Pre-Trained Neural Machine Translation Models},
  publisher = {AAAI Conference on Artificial Intelligence},
  pages     = {9652--9659},
  year      = {2020}
}
% {IEEE} is brace-protected, matching the other IEEE venue names in this file.
@inproceedings{DBLP:conf/cvpr/PentinaSL15,
  author    = {Anastasia Pentina and
               Viktoriia Sharmanska and
               Christoph H. Lampert},
  title     = {Curriculum learning of multiple tasks},
  pages     = {5492--5500},
  publisher = {{IEEE} Conference on Computer Vision and Pattern Recognition},
  year      = {2015}
}
% {IEEE} is brace-protected, matching the other IEEE venue names in this file.
@inproceedings{DBLP:conf/iccvw/SarafianosGNK17,
  author    = {Nikolaos Sarafianos and
               Theodore Giannakopoulos and
               Christophoros Nikou and
               Ioannis A. Kakadiaris},
  title     = {Curriculum Learning for Multi-task Classification of Visual Attributes},
  pages     = {2608--2615},
  publisher = {{IEEE} International Conference on Computer Vision},
  year      = {2017}
}
@inproceedings{DBLP:conf/nips/ChangLM17,
  author    = {Chang, Haw-Shiuan and Learned-Miller, Erik G. and McCallum, Andrew},
  title     = {Active Bias: Training More Accurate Neural Networks by Emphasizing High Variance Samples},
  publisher = {Conference and Workshop on Neural Information Processing Systems},
  pages     = {1002--1012},
  year      = {2017}
}
%ieee加{
% Journal article (IEEE TPAMI 40(12)): typed @article with the venue in
% `journal`, since @inproceedings cannot carry volume and number together.
% {IEEE} is brace-protected like the other IEEE venue names in this file.
@article{DBLP:journals/pami/LiH18a,
  author  = {Zhizhong Li and
             Derek Hoiem},
  title   = {Learning without Forgetting},
  journal = {{IEEE} Transactions on Pattern Analysis and Machine Intelligence},
  volume  = {40},
  number  = {12},
  pages   = {2935--2947},
  year    = {2018}
}
% arXiv preprint: recorded as @article with the arXiv identifier in
% `journal`, the same form as the zhao2020dual entry in this file.
@article{rusu2016progressive,
  title   = {Progressive neural networks},
  author  = {Rusu, Andrei A and Rabinowitz, Neil C and Desjardins, Guillaume and Soyer, Hubert and Kirkpatrick, James and Kavukcuoglu, Koray and Pascanu, Razvan and Hadsell, Raia},
  journal = {arXiv preprint arXiv:1606.04671},
  year    = {2016}
}
% CoRR preprint, typed like the other CoRR @article entry in this file.
% {PathNet} is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/FernandoBBZHRPW17,
  author  = {Chrisantha Fernando and
             Dylan Banarse and
             Charles Blundell and
             Yori Zwols and
             David Ha and
             Andrei A. Rusu and
             Alexander Pritzel and
             Daan Wierstra},
  title   = {{PathNet}: Evolution Channels Gradient Descent in Super Neural Networks},
  journal = {CoRR},
  volume  = {abs/1701.08734},
  year    = {2017}
}
% NAACL 2019 paper (see the conf/naacl key); venue is named the same way as
% the other NAACL entries in this file.
@inproceedings{DBLP:conf/naacl/ThompsonGKDK19,
  author    = {Brian Thompson and
               Jeremy Gwinnup and
               Huda Khayrallah and
               Kevin Duh and
               Philipp Koehn},
  title     = {Overcoming Catastrophic Forgetting During Domain Adaptation of Neural
               Machine Translation},
  pages     = {2062--2068},
  publisher = {Annual Conference of the North American Chapter of the Association for Computational Linguistics},
  year      = {2019}
}
% COLING venue is spelled the same way as in the conf/coling/FormigaF12
% entry, so the conference name is consistent across the bibliography.
@inproceedings{DBLP:conf/coling/GuF20,
  author    = {Shuhao Gu and
               Yang Feng},
  title     = {Investigating Catastrophic Forgetting During Continual Training for
               Neural Machine Translation},
  pages     = {4315--4326},
  publisher = {International Conference on Computational Linguistics},
  year      = {2020}
}
%%%%% chapter 13------------------------------------------------------ %%%%% chapter 13------------------------------------------------------
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
...@@ -12309,6 +13097,42 @@ author = {Zhuang Liu and ...@@ -12309,6 +13097,42 @@ author = {Zhuang Liu and
volume = {abs/1910.01108}, volume = {abs/1910.01108},
year = {2019} year = {2019}
} }
@inproceedings{DBLP:conf/icml/XiaTTQYL18,
  author    = {Xia, Yingce and Tan, Xu and Tian, Fei and
               Qin, Tao and Yu, Nenghai and Liu, Tie-Yan},
  title     = {Model-Level Dual Learning},
  publisher = {International Conference on Machine Learning},
  series    = {Proceedings of Machine Learning Research},
  volume    = {80},
  pages     = {5379--5388},
  year      = {2018}
}
@inproceedings{DBLP:conf/nips/HeXQWYLM16,
  author    = {He, Di and Xia, Yingce and Qin, Tao and Wang, Liwei and
               Yu, Nenghai and Liu, Tie{-}Yan and Ma, Wei{-}Ying},
  title     = {Dual Learning for Machine Translation},
  publisher = {Conference and Workshop on Neural Information Processing Systems},
  pages     = {820--828},
  year      = {2016}
}
@article{zhao2020dual,
  author  = {Zhao, Zhibing and
             Xia, Yingce and
             Qin, Tao and
             Xia, Lirong and
             Liu, Tie-Yan},
  title   = {Dual Learning: Theoretical Study and an Algorithmic Extension},
  journal = {arXiv preprint arXiv:2005.08238},
  year    = {2020}
}
%%%%% chapter 16------------------------------------------------------ %%%%% chapter 16------------------------------------------------------
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论