@@ -6046,120 +6042,141 @@ author = {Yoshua Bengio and
...
@@ -6046,120 +6042,141 @@ author = {Yoshua Bengio and
@inproceedings{ElMaghraby2018EnhancingTF,
@inproceedings{ElMaghraby2018EnhancingTF,
title={Enhancing Translation from English to Arabic Using Two-Phase Decoder Translation},
title={Enhancing Translation from English to Arabic Using Two-Phase Decoder Translation},
author={Ayah ElMaghraby and Ahmed Rafea},
author={Ayah ElMaghraby and Ahmed Rafea},
booktitle={IntelliSys},
pages = {539--549},
year={2018}
publisher = {Intelligent Systems and Applications},
year = {2018}
}
}
@inproceedings{Geng2018AdaptiveMD,
@inproceedings{Geng2018AdaptiveMD,
title={Adaptive Multi-pass Decoder for Neural Machine Translation},
title={Adaptive Multi-pass Decoder for Neural Machine Translation},
author={X. Geng and X. Feng and B. Qin and T. Liu},
author={Xinwei Geng and
booktitle={EMNLP},
Xiaocheng Feng and
Bing Qin and
Ting Liu},
publisher ={Conference on Empirical Methods in Natural Language Processing},
pages={523--532},
year={2018}
year={2018}
}
}
@article{Lee2018DeterministicNN,
@article{Lee2018DeterministicNN,
title={Deterministic Non-Autoregressive Neural Sequence Modeling by Iterative Refinement},
title={Deterministic Non-Autoregressive Neural Sequence Modeling by Iterative Refinement},
author={Jason Lee and Elman Mansimov and Kyunghyun Cho},
author={Jason Lee and Elman Mansimov and Kyunghyun Cho},
journal={ArXiv},
pages = {1173--1182},
year={2018},
publisher = {Conference on Empirical Methods in Natural Language Processing},
volume={abs/1802.06901}
year = {2018}
}
}
@inproceedings{Gu2019LevenshteinT,
@inproceedings{Gu2019LevenshteinT,
title={Levenshtein Transformer},
title={Levenshtein Transformer},
author={Jiatao Gu and Changhan Wang and Jake Zhao},
author={Jiatao Gu and Changhan Wang and Jake Zhao},
booktitle={NeurIPS},
publisher = {Conference and Workshop on Neural Information Processing Systems},
year={2019}
pages = {11179--11189},
year = {2019},
}
}
@inproceedings{Guo2020JointlyMS,
@inproceedings{Guo2020JointlyMS,
title={Jointly Masked Sequence-to-Sequence Model for Non-Autoregressive Neural Machine Translation},
title={Jointly Masked Sequence-to-Sequence Model for Non-Autoregressive Neural Machine Translation},
author={Junliang Guo and Linli Xu and E. Chen},
author={Junliang Guo and Linli Xu and Enhong Chen},
booktitle={ACL},
pages = {376--385},
year={2020}
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2020}
}
}
@article{Stahlberg2018AnOS,
@article{Stahlberg2018AnOS,
title={An Operation Sequence Model for Explainable Neural Machine Translation},
title={An Operation Sequence Model for Explainable Neural Machine Translation},
author={Felix Stahlberg and Danielle Saunders and B. Byrne},
author={Felix Stahlberg and Danielle Saunders and Bill Byrne},
journal={ArXiv},
pages = {175--186},
year={2018},
publisher = {Conference on Empirical Methods in Natural Language Processing},
volume={abs/1808.09688}
year = {2018}
}
}
@inproceedings{Stern2019InsertionTF,
@inproceedings{Stern2019InsertionTF,
title={Insertion Transformer: Flexible Sequence Generation via Insertion Operations},
title={Insertion Transformer: Flexible Sequence Generation via Insertion Operations},
author={Mitchell Stern and William Chan and J. Kiros and Jakob Uszkoreit},
author={Mitchell Stern and William Chan and Jamie Kiros and Jakob Uszkoreit},
booktitle={ICML},
publisher={International Conference on Machine Learning},
pages={5976--5985},
year={2019}
year={2019}
}
}
@article{stling2017NeuralMT,
@article{stling2017NeuralMT,
title={Neural machine translation for low-resource languages},
title={Neural machine translation for low-resource languages},
author={Robert {\"O}stling and J. Tiedemann},
author={Robert {\"O}stling and J{\"{o}}rg Tiedemann},
journal={ArXiv},
journal={CoRR},
year={2017},
year={2017},
volume={abs/1708.05729}
volume={abs/1708.05729}
}
}
@article{Kikuchi2016ControllingOL,
@article{Kikuchi2016ControllingOL,
title={Controlling Output Length in Neural Encoder-Decoders},
title={Controlling Output Length in Neural Encoder-Decoders},
author={Yuta Kikuchi and Graham Neubig and Ryohei Sasano and H. Takamura and M. Okumura},
author={Yuta Kikuchi and
journal={ArXiv},
Graham Neubig and
year={2016},
Ryohei Sasano and
volume={abs/1609.09552}
Hiroya Takamura and
Manabu Okumura},
pages = {1328--1338},
publisher = {Conference on Empirical Methods in Natural Language Processing},
year = {2016}
}
}
@inproceedings{Takase2019PositionalET,
@inproceedings{Takase2019PositionalET,
title={Positional Encoding to Control Output Sequence Length},
title={Positional Encoding to Control Output Sequence Length},
author={S. Takase and N. Okazaki},
author={Sho Takase and
booktitle={NAACL-HLT},
Naoaki Okazaki},
publisher={Annual Conference of the North American Chapter of the Association for Computational Linguistics},
pages={3999--4004},
year={2019}
year={2019}
}
}
@inproceedings{Murray2018CorrectingLB,
@inproceedings{Murray2018CorrectingLB,
title={Correcting Length Bias in Neural Machine Translation},
title={Correcting Length Bias in Neural Machine Translation},
author={Kenton Murray and David Chiang},
author={Kenton Murray and David Chiang},
booktitle={WMT},
pages = {212--223},
year={2018}
publisher = {Annual Meeting of the Association for Computational Linguistics},
year = {2018}
}
}
@article{Sountsov2016LengthBI,
@article{Sountsov2016LengthBI,
title={Length bias in Encoder Decoder Models and a Case for Global Conditioning},
title={Length bias in Encoder Decoder Models and a Case for Global Conditioning},
author={Pavel Sountsov and Sunita Sarawagi},
author={Pavel Sountsov and Sunita Sarawagi},
journal={ArXiv},
pages = {1516--1525},
year={2016},
publisher = {Conference on Empirical Methods in Natural Language Processing},
volume={abs/1606.03402}
year = {2016}
}
}
@inproceedings{Jean2015MontrealNM,
@inproceedings{Jean2015MontrealNM,
title={Montreal Neural Machine Translation Systems for WMT'15},
title={Montreal Neural Machine Translation Systems for WMT'15},
author={S. Jean and Orhan Firat and Kyunghyun Cho and R. Memisevic and Yoshua Bengio},
author={S{\'{e}}bastien Jean and
booktitle={WMT@EMNLP},
Orhan Firat and
Kyunghyun Cho and
Roland Memisevic and
Yoshua Bengio},
publisher={Conference on Empirical Methods in Natural Language Processing},
pages={134--140},
year={2015}
year={2015}
}
}
@inproceedings{Yang2018OtemUtemOA,
@inproceedings{Yang2018OtemUtemOA,
title={Otem{\&}Utem: Over- and Under-Translation Evaluation Metric for NMT},
title={Otem{\&}Utem: Over- and Under-Translation Evaluation Metric for NMT},
author={J. Yang and Biao Zhang and Yue Qin and Xiangwen Zhang and Q. Lin and Jinsong Su},
author={Jing Yang and
booktitle={NLPCC},
Biao Zhang and
Yue Qin and
Xiangwen Zhang and
Qian Lin and
Jinsong Su},
publisher={CCF International Conference on Natural Language Processing and Chinese Computing},
pages={291--302},
year={2018}
year={2018}
}
}
@inproceedings{Mi2016CoverageEM,
@inproceedings{Mi2016CoverageEM,
title={Coverage Embedding Models for Neural Machine Translation},
title={Coverage Embedding Models for Neural Machine Translation},
author={Haitao Mi and B. Sankaran and Z. Wang and Abe Ittycheriah},
author={Haitao Mi and
booktitle={EMNLP},
Baskaran Sankaran and
year={2016}
Zhiguo Wang and
}
Abe Ittycheriah},
pages = {955--960},
@article{Kazimi2017CoverageFC,
publisher = {Conference on Empirical Methods in Natural Language Processing},
title={Coverage for Character Based Neural Machine Translation},
year = {2016}
author={M. Kazimi and Marta R. Costa-juss{\`a}},
journal={Proces. del Leng. Natural},
year={2017},
volume={59},
pages={99-106}
}
}
@inproceedings{DBLP:conf/emnlp/HuangZM17,
@inproceedings{DBLP:conf/emnlp/HuangZM17,
...
@@ -6176,7 +6193,8 @@ author = {Yoshua Bengio and
...
@@ -6176,7 +6193,8 @@ author = {Yoshua Bengio and
@inproceedings{Wiseman2016SequencetoSequenceLA,
@inproceedings{Wiseman2016SequencetoSequenceLA,
title={Sequence-to-Sequence Learning as Beam-Search Optimization},
title={Sequence-to-Sequence Learning as Beam-Search Optimization},
author={Sam Wiseman and Alexander M. Rush},
author={Sam Wiseman and Alexander M. Rush},
booktitle={EMNLP},
publisher={Conference on Empirical Methods in Natural Language Processing},
pages={1296--1306},
year={2016}
year={2016}
}
}
...
@@ -6193,10 +6211,12 @@ author = {Yoshua Bengio and
...
@@ -6193,10 +6211,12 @@ author = {Yoshua Bengio and
@article{Ma2019LearningTS,
@article{Ma2019LearningTS,
title={Learning to Stop in Structured Prediction for Neural Machine Translation},
title={Learning to Stop in Structured Prediction for Neural Machine Translation},
author={M. Ma and Renjie Zheng and Liang Huang},
author={Mingbo Ma and
journal={ArXiv},
Renjie Zheng and
year={2019},
Liang Huang},
volume={abs/1904.01032}
pages = {1884--1889},
publisher = { Annual Conference of the North American Chapter of the Association for Computational Linguistics},
year = {2019}
}
}
@inproceedings{KleinOpenNMT,
@inproceedings{KleinOpenNMT,
...
@@ -6220,119 +6240,153 @@ author = {Yoshua Bengio and
...
@@ -6220,119 +6240,153 @@ author = {Yoshua Bengio and
year = {2015}
year = {2015}
}
}
@inproceedings{Eisner2011LearningST,
title={Learning Speed-Accuracy Tradeoffs in Nondeterministic Inference Algorithms},
author={J. Eisner and Hal Daum{\'e}},
year={2011}
}
@inproceedings{Jiang2012LearnedPF,
@inproceedings{Jiang2012LearnedPF,
title={Learned Prioritization for Trading Off Accuracy and Speed},
title={Learned Prioritization for Trading Off Accuracy and Speed},
author={J. Jiang and Adam R. Teichert and Hal Daum{\'e} and J. Eisner},
author={Jiarong Jiang and Adam R. Teichert and Hal Daum{\'e} and Jason Eisner},
booktitle={NIPS},
publisher={Conference and Workshop on Neural Information Processing Systems},
year={2012}
pages={1340--1348},
year= {2012}
}
}
@inproceedings{Zheng2020OpportunisticDW,
@inproceedings{Zheng2020OpportunisticDW,
title={Opportunistic Decoding with Timely Correction for Simultaneous Translation},
title={Opportunistic Decoding with Timely Correction for Simultaneous Translation},
author={Renjie Zheng and M. Ma and Baigong Zheng and Kaibo Liu and Liang Huang},
author={Renjie Zheng and
booktitle={ACL},
Mingbo Ma and
Baigong Zheng and
Kaibo Liu and
Liang Huang},
publisher={Annual Meeting of the Association for Computational Linguistics},
pages={437--442},
year={2020}
year={2020}
}
}
@inproceedings{Ma2019STACLST,
@inproceedings{Ma2019STACLST,
title={STACL: Simultaneous Translation with Implicit Anticipation and Controllable Latency using Prefix-to-Prefix Framework},
title={STACL: Simultaneous Translation with Implicit Anticipation and Controllable Latency using Prefix-to-Prefix Framework},
author={M. Ma and L. Huang and Hao Xiong and Renjie Zheng and Kaibo Liu and Baigong Zheng and Chuanqiang Zhang and Zhongjun He and Hairong Liu and X. Li and H. Wu and Haifeng Wang},
author={Mingbo Ma and
booktitle={ACL},
Liang Huang and
Hao Xiong and
Renjie Zheng and
Kaibo Liu and
Baigong Zheng and
Chuanqiang Zhang and
Zhongjun He and
Hairong Liu and
Xing Li and
Hua Wu and
Haifeng Wang},
publisher={Annual Meeting of the Association for Computational Linguistics},
pages={3025--3036},
year={2019}
year={2019}
}
}
@inproceedings{Gimpel2013ASE,
@inproceedings{Gimpel2013ASE,
title={A Systematic Exploration of Diversity in Machine Translation},
title={A Systematic Exploration of Diversity in Machine Translation},
author={Kevin Gimpel and Dhruv Batra and Chris Dyer and Gregory Shakhnarovich},
author={Kevin Gimpel and Dhruv Batra and Chris Dyer and Gregory Shakhnarovich},
booktitle={EMNLP},
publisher={Conference on Empirical Methods in Natural Language Processing},
pages={1100--1111},
year={2013}
year={2013}
}
}
@article{Li2016MutualIA,
@article{Li2016MutualIA,
title={Mutual Information and Diverse Decoding Improve Neural Machine Translation},
title={Mutual Information and Diverse Decoding Improve Neural Machine Translation},
author={J. Li and Dan Jurafsky},
author={Jiwei Li and Dan Jurafsky},
journal={ArXiv},
journal={CoRR},
year={2016},
year={2016},
volume={abs/1601.00372}
volume={abs/1601.00372}
}
}
@inproceedings{Li2016ADO,
@inproceedings{Li2016ADO,
title={A Diversity-Promoting Objective Function for Neural Conversation Models},
title={A Diversity-Promoting Objective Function for Neural Conversation Models},
author={J. Li and Michel Galley and Chris Brockett and Jianfeng Gao and W. Dolan},
author={Jiwei Li and
booktitle={HLT-NAACL},
Michel Galley and
Chris Brockett and
Jianfeng Gao and
Bill Dolan},
publisher={Annual Conference of the North American Chapter of the Association for Computational Linguistics},
pages={110--119},
year={2016}
year={2016}
}
}
@inproceedings{He2018SequenceTS,
@inproceedings{He2018SequenceTS,
title={Sequence to Sequence Mixture Model for Diverse Machine Translation},
title={Sequence to Sequence Mixture Model for Diverse Machine Translation},
author={Xuanli He and Gholamreza Haffari and Mohammad Norouzi},
author={Xuanli He and Gholamreza Haffari and Mohammad Norouzi},
booktitle={CoNLL},
pages = {583--592},
year={2018}
publisher = {International Conference on Computational Linguistics},
year = {2018}
}
}
@article{Shen2019MixtureMF,
@article{Shen2019MixtureMF,
title={Mixture Models for Diverse Machine Translation: Tricks of the Trade},
title={Mixture Models for Diverse Machine Translation: Tricks of the Trade},
author={Tianxiao Shen and Myle Ott and M. Auli and Marc'Aurelio Ranzato},
author={Tianxiao Shen and Myle Ott and Michael Auli and Marc'Aurelio Ranzato},
journal={ArXiv},
pages = {5719--5728},
year={2019},
publisher = {International Conference on Machine Learning},
volume={abs/1902.07816}
year = {2019},
}
}
@article{Wu2020GeneratingDT,
@article{Wu2020GeneratingDT,
title={Generating Diverse Translation from Model Distribution with Dropout},
title={Generating Diverse Translation from Model Distribution with Dropout},
author={Xuanfu Wu and Yang Feng and Chenze Shao},
author={Xuanfu Wu and Yang Feng and Chenze Shao},
journal={ArXiv},
pages={1088--1097},
year={2020},
publisher={Annual Meeting of the Association for Computational Linguistics},
volume={abs/2010.08178}
year={2020}
}
}
@inproceedings{Sun2020GeneratingDT,
@inproceedings{Sun2020GeneratingDT,
title={Generating Diverse Translation by Manipulating Multi-Head Attention},
title={Generating Diverse Translation by Manipulating Multi-Head Attention},
author={Zewei Sun and Shujian Huang and Hao-Ran Wei and Xin-Yu Dai and Jiajun Chen},
author={Zewei Sun and Shujian Huang and Hao Ran Wei and Xin Yu Dai and Jiajun Chen},
booktitle={AAAI},
publisher={AAAI Conference on Artificial Intelligence},
pages={8976--8983},
year={2020}
year={2020}
}
}
@article{Vijayakumar2016DiverseBS,
@article{Vijayakumar2016DiverseBS,
title={Diverse Beam Search: Decoding Diverse Solutions from Neural Sequence Models},
title={Diverse Beam Search: Decoding Diverse Solutions from Neural Sequence Models},
author={Ashwin K. Vijayakumar and Michael Cogswell and R. R. Selvaraju and Q. Sun and Stefan Lee and David J. Crandall and Dhruv Batra},
author={Ashwin K. Vijayakumar and
journal={ArXiv},
Michael Cogswell and
Ramprasaath R. Selvaraju and
Qing Sun and
Stefan Lee and
David J. Crandall and
Dhruv Batra},
journal={CoRR},
year={2016},
year={2016},
volume={abs/1610.02424}
volume={abs/1610.02424}
}
}
@inproceedings{Liu2014SearchAwareTF,
@inproceedings{Liu2014SearchAwareTF,
title={Search-Aware Tuning for Machine Translation},
title={Search-Aware Tuning for Machine Translation},
author={L. Liu and Liang Huang},
author={Lemao Liu and
booktitle={EMNLP},
Liang Huang},
publisher={Conference on Empirical Methods in Natural Language Processing},
pages={1942--1952},
year={2014}
year={2014}
}
}
@inproceedings{Yu2013MaxViolationPA,
@inproceedings{Yu2013MaxViolationPA,
title={Max-Violation Perceptron and Forced Decoding for Scalable MT Training},
title={Max-Violation Perceptron and Forced Decoding for Scalable MT Training},
author={Heng Yu and Liang Huang and Haitao Mi and Kai Zhao},
author={Heng Yu and Liang Huang and Haitao Mi and Kai Zhao},
booktitle={EMNLP},
publisher={Conference on Empirical Methods in Natural Language Processing},
pages={1112--1123},
year={2013}
year={2013}
}
}
@inproceedings{Stahlberg2019OnNS,
@inproceedings{Stahlberg2019OnNS,
title={On NMT Search Errors and Model Errors: Cat Got Your Tongue?},
title={On NMT Search Errors and Model Errors: Cat Got Your Tongue?},
author={Felix Stahlberg and
author={Felix Stahlberg and
B. Byrne},
Bill Byrne},
booktitle={EMNLP/IJCNLP},
publisher={Conference on Empirical Methods in Natural Language Processing},
pages={3354--3360},
year={2019}
year={2019}
}
}
@inproceedings{Niehues2017AnalyzingNM,
@inproceedings{Niehues2017AnalyzingNM,
title={Analyzing Neural MT Search and Model Performance},
title={Analyzing Neural MT Search and Model Performance},
author={J. Niehues and Eunah Cho and Thanh-Le Ha and Alexander H. Waibel},
author={Jan Niehues and
booktitle={NMT@ACL},
Eunah Cho and
Thanh-Le Ha and
Alex Waibel},
pages={11--17},
publisher={Annual Meeting of the Association for Computational Linguistics},
year={2017}
year={2017}
}
}
...
@@ -6347,26 +6401,31 @@ author = {Yoshua Bengio and
...
@@ -6347,26 +6401,31 @@ author = {Yoshua Bengio and
@article{Ranzato2016SequenceLT,
@article{Ranzato2016SequenceLT,
title={Sequence Level Training with Recurrent Neural Networks},
title={Sequence Level Training with Recurrent Neural Networks},
author={Marc'Aurelio Ranzato and S. Chopra and M. Auli and W. Zaremba},
author={Marc'Aurelio Ranzato and
journal={CoRR},
Sumit Chopra and
year={2016},
Michael Auli and
volume={abs/1511.06732}
Wojciech Zaremba},
publisher={International Conference on Learning Representations},
year={2016}
}
}
@article{Bengio2015ScheduledSF,
@article{Bengio2015ScheduledSF,
title={Scheduled Sampling for Sequence Prediction with Recurrent Neural Networks},
title={Scheduled Sampling for Sequence Prediction with Recurrent Neural Networks},
author={S. Bengio and Oriol Vinyals and Navdeep Jaitly and Noam Shazeer},
author={Samy Bengio and
journal={ArXiv},
Oriol Vinyals and
year={2015},
Navdeep Jaitly and
volume={abs/1506.03099}
Noam Shazeer},
booktitle = {Conference and Workshop on Neural Information Processing Systems},
pages = {1171--1179},
year = {2015}
}
}
@article{Zhang2019BridgingTG,
@article{Zhang2019BridgingTG,
title={Bridging the Gap between Training and Inference for Neural Machine Translation},
title={Bridging the Gap between Training and Inference for Neural Machine Translation},
author={Wen Zhang and Y. Feng and Fandong Meng and Di You and Qun Liu},
author={Wen Zhang and Yang Feng and Fandong Meng and Di You and Qun Liu},
journal={ArXiv},
pages = {4334--4343},
year={2019},
publisher = {Annual Meeting of the Association for Computational Linguistics},
volume={abs/1906.02448}
year = {2019}
}
}
@inproceedings{DBLP:conf/acl/ShenCHHWSL16,
@inproceedings{DBLP:conf/acl/ShenCHHWSL16,
...
@@ -6382,15 +6441,6 @@ author = {Yoshua Bengio and
...
@@ -6382,15 +6441,6 @@ author = {Yoshua Bengio and
year = {2016},
year = {2016},
}
}
@article{Gage1994ANA,
title={A new algorithm for data compression},
author={P. Gage},
journal={The C Users Journal archive},
year={1994},
volume={12},
pages={23-38}
}
@inproceedings{DBLP:conf/acl/SennrichHB16a,
@inproceedings{DBLP:conf/acl/SennrichHB16a,
author = {Rico Sennrich and
author = {Rico Sennrich and
Barry Haddow and
Barry Haddow and
...
@@ -6434,26 +6484,31 @@ author = {Yoshua Bengio and
...
@@ -6434,26 +6484,31 @@ author = {Yoshua Bengio and
@article{Narang2017BlockSparseRN,
@article{Narang2017BlockSparseRN,
title={Block-Sparse Recurrent Neural Networks},
title={Block-Sparse Recurrent Neural Networks},
author={Sharan Narang and Eric Undersander and G. Diamos},
author={Sharan Narang and Eric Undersander and Gregory Diamos},
journal={ArXiv},
journal={CoRR},
year={2017},
year={2017},
volume={abs/1711.02782}
volume={abs/1711.02782}
}
}
@article{Gale2019TheSO,
@article{Gale2019TheSO,
title={The State of Sparsity in Deep Neural Networks},
title={The State of Sparsity in Deep Neural Networks},
author={T. Gale and E. Elsen and Sara Hooker},
author={Trevor Gale and
journal={ArXiv},
Erich Elsen and
Sara Hooker},
journal={CoRR},
year={2019},
year={2019},
volume={abs/1902.09574}
volume={abs/1902.09574}
}
}
@article{Michel2019AreSH,
@article{Michel2019AreSH,
title={Are Sixteen Heads Really Better than One?},
title={Are Sixteen Heads Really Better than One?},
author={Paul Michel and Omer Levy and Graham Neubig},
author = {Paul Michel and
journal={ArXiv},
Omer Levy and
year={2019},
Graham Neubig},
volume={abs/1905.10650}
title = {Are Sixteen Heads Really Better than One?},
publisher = {Conference and Workshop on Neural Information Processing Systems},
pages = {14014--14024},
year = {2019}
}
}
@inproceedings{DBLP:journals/corr/abs-1905-09418,
@inproceedings{DBLP:journals/corr/abs-1905-09418,
...
@@ -6481,17 +6536,11 @@ author = {Yoshua Bengio and
...
@@ -6481,17 +6536,11 @@ author = {Yoshua Bengio and
@article{Katharopoulos2020TransformersAR,
@article{Katharopoulos2020TransformersAR,
title={Transformers are RNNs: Fast Autoregressive Transformers with Linear Attention},
title={Transformers are RNNs: Fast Autoregressive Transformers with Linear Attention},
author={Angelos Katharopoulos and Apoorv Vyas and Nikolaos Pappas and Franccois Fleuret},
author={Angelos Katharopoulos and Apoorv Vyas and Nikolaos Pappas and Franccois Fleuret},
journal={ArXiv},
journal={CoRR},
year={2020},
year={2020},
volume={abs/2006.16236}
volume={abs/2006.16236}
}
}
@inproceedings{Beal2003VariationalAF,
title={Variational algorithms for approximate Bayesian inference},
author={M. Beal},
year={2003}
}
@article{xiao2011language,
@article{xiao2011language,
title ={Language Modeling for Syntax-Based Machine Translation Using Tree Substitution Grammars: A Case Study on Chinese-English Translation},
title ={Language Modeling for Syntax-Based Machine Translation Using Tree Substitution Grammars: A Case Study on Chinese-English Translation},
author ={Xiao, Tong and Zhu, Jingbo and Zhu, Muhua},
author ={Xiao, Tong and Zhu, Jingbo and Zhu, Muhua},
...
@@ -6504,33 +6553,40 @@ author = {Yoshua Bengio and
...
@@ -6504,33 +6553,40 @@ author = {Yoshua Bengio and
@inproceedings{Li2009VariationalDF,
@inproceedings{Li2009VariationalDF,
title={Variational Decoding for Statistical Machine Translation},
title={Variational Decoding for Statistical Machine Translation},
author={Zhifei Li and J. Eisner and S. Khudanpur},
author={Zhifei Li and
booktitle={ACL/IJCNLP},
Jason Eisner and
Sanjeev Khudanpur},
publisher={Annual Meeting of the Association for Computational Linguistics},
pages={593--601},
year={2009}
year={2009}
}
}
@article{Bastings2019ModelingLS,
@article{Bastings2019ModelingLS,
title={Modeling Latent Sentence Structure in Neural Machine Translation},
title={Modeling Latent Sentence Structure in Neural Machine Translation},
author={Jasmijn Bastings and W. Aziz and Ivan Titov and K. Sima'an},
author={Jasmijn Bastings and
journal={ArXiv},
Wilker Aziz and
year={2019},
Ivan Titov and
volume={abs/1901.06436}
Khalil Sima'an},
journal = {CoRR},
volume = {abs/1901.06436},
year = {2019}
}
}
@article{Shah2018GenerativeNM,
@article{Shah2018GenerativeNM,
title={Generative Neural Machine Translation},
title={Generative Neural Machine Translation},
author={Harshil Shah and D. Barber},
author={Harshil Shah and
journal={ArXiv},
David Barber},
year={2018},
publisher={Conference and Workshop on Neural Information Processing Systems},
publisher={Conference and Workshop on Neural Information Processing Systems},
pages={4565--4573},
year={2016}
year={2016}
}
}
@article{Duan2017OneShotIL,
@article{Duan2017OneShotIL,
title={One-Shot Imitation Learning},
title={One-Shot Imitation Learning},
author={Yan Duan and Marcin Andrychowicz and Bradly C. Stadie and Jonathan Ho and J. Schneider and Ilya Sutskever and P. Abbeel and W. Zaremba},
author={Yan Duan and Marcin Andrychowicz and Bradly C. Stadie and Jonathan Ho and Jonas Schneider and Ilya Sutskever and Pieter Abbeel and Wojciech Zaremba},