王屹超17参考文献

66b1bf87 · 孟霞 · 2a570810 · 66b1bf87
Commit 66b1bf87 authored Dec 19, 2020 by 孟霞
--- a/bibliography.bib
+++ b/bibliography.bib
@@ -12890,6 +12890,761 @@ author    = {Zhuang Liu and
  publisher={电子工业出版社},
  year={2020}
 }
+%%%%%%%%%%%%%%%%%王屹超部分，孟霞加%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
+% Lin et al. (2020): dynamic context-guided capsule network for multimodal machine translation.
+@inproceedings{DBLP:conf/mm/LinMSYYGZL20,
+  author    = {Huan Lin and
+               Fandong Meng and
+               Jinsong Su and
+               Yongjing Yin and
+               Zhengyuan Yang and
+               Yubin Ge and
+               Jie Zhou and
+               Jiebo Luo},
+  title     = {Dynamic Context-guided Capsule Network for Multimodal Machine Translation},
+  pages     = {1320--1329},
+  publisher = {ACM Multimedia},
+  year      = {2020}
+}
+
+% Specia et al. (2016): shared task on multimodal MT and crosslingual image description.
+% The conf/wmt key identifies the venue as the Conference on Machine Translation.
+@inproceedings{DBLP:conf/wmt/SpeciaFSE16,
+  author    = {Lucia Specia and
+               Stella Frank and
+               Khalil Sima'an and
+               Desmond Elliott},
+  title     = {A Shared Task on Multimodal Machine Translation and Crosslingual Image
+               Description},
+  pages     = {543--553},
+  publisher = {Conference on Machine Translation},
+  year      = {2016}
+}
+
+% Elliott et al. (2017): findings of the second shared task on multimodal MT.
+% The conf/wmt key identifies the venue as the Conference on Machine Translation.
+@inproceedings{DBLP:conf/wmt/ElliottFBBS17,
+  author    = {Desmond Elliott and
+               Stella Frank and
+               Lo{\"{\i}}c Barrault and
+               Fethi Bougares and
+               Lucia Specia},
+  title     = {Findings of the Second Shared Task on Multimodal Machine Translation
+               and Multilingual Image Description},
+  pages     = {215--233},
+  publisher = {Conference on Machine Translation},
+  year      = {2017}
+}
+
+% Barrault et al. (2018): findings of the third shared task on multimodal MT.
+% The conf/wmt key identifies the venue as the Conference on Machine Translation.
+@inproceedings{DBLP:conf/wmt/BarraultBSLEF18,
+  author    = {Lo{\"{\i}}c Barrault and
+               Fethi Bougares and
+               Lucia Specia and
+               Chiraag Lala and
+               Desmond Elliott and
+               Stella Frank},
+  title     = {Findings of the Third Shared Task on Multimodal Machine Translation},
+  pages     = {304--323},
+  publisher = {Conference on Machine Translation},
+  year      = {2018}
+}
+
+% Caglayan et al. (2017): LIUM-CVC submissions for the WMT17 multimodal translation task.
+% The conf/wmt key identifies the venue as the Conference on Machine Translation.
+@inproceedings{DBLP:conf/wmt/CaglayanABGBBMH17,
+  author    = {Ozan Caglayan and
+               Walid Aransa and
+               Adrien Bardet and
+               Mercedes Garc{\'{\i}}a{-}Mart{\'{\i}}nez and
+               Fethi Bougares and
+               Lo{\"{\i}}c Barrault and
+               Marc Masana and
+               Luis Herranz and
+               Joost van de Weijer},
+  title     = {{LIUM-CVC} Submissions for {WMT17} Multimodal Translation Task},
+  pages     = {432--439},
+  publisher = {Conference on Machine Translation},
+  year      = {2017}
+}
+
+% Libovicky et al. (2016): CUNI system for WMT16 post-editing and multimodal translation.
+% The conf/wmt key identifies the venue as the Conference on Machine Translation.
+@inproceedings{DBLP:conf/wmt/LibovickyHTBP16,
+  author    = {Jindrich Libovick{\'{y}} and
+               Jindrich Helcl and
+               Marek Tlust{\'{y}} and
+               Ondrej Bojar and
+               Pavel Pecina},
+  title     = {{CUNI} System for {WMT16} Automatic Post-Editing and Multimodal Translation
+               Tasks},
+  pages     = {646--654},
+  publisher = {Conference on Machine Translation},
+  year      = {2016}
+}
+
+% Calixto and Liu (2017): global visual features in attention-based NMT.
+@inproceedings{DBLP:conf/emnlp/CalixtoL17,
+  author    = {Calixto, Iacer and
+               Liu, Qun},
+  title     = {Incorporating Global Visual Features into Attention-based Neural Machine Translation},
+  publisher = {Conference on Empirical Methods in Natural Language Processing},
+  pages     = {992--1003},
+  year      = {2017}
+}
+
+% Huang et al. (2016): attention-based multimodal neural machine translation.
+% The conf/wmt key identifies the venue as the Conference on Machine Translation.
+@inproceedings{DBLP:conf/wmt/HuangLSOD16,
+  author    = {Po{-}Yao Huang and
+               Frederick Liu and
+               Sz{-}Rung Shiang and
+               Jean Oh and
+               Chris Dyer},
+  title     = {Attention-based Multimodal Neural Machine Translation},
+  pages     = {639--645},
+  publisher = {Conference on Machine Translation},
+  year      = {2016}
+}
+
+% Elliott, Frank and Hasler (2015): multilingual image description with neural sequence models.
+% arXiv preprint, recorded in the same CoRR + abs/<id> form as the other preprints in this file.
+@article{Elliott2015MultilingualID,
+  author    = {Desmond Elliott and
+               Stella Frank and
+               Eva Hasler},
+  title     = {Multilingual Image Description with Neural Sequence Models},
+  journal   = {CoRR},
+  volume    = {abs/1510.04709},
+  year      = {2015}
+}
+
+% Madhyastha, Wang and Specia (2017): object posterior predictions for multimodal MT.
+% The conf/wmt key identifies the venue as the Conference on Machine Translation.
+% The system name in the title is braced so sentence-casing styles keep its capitals.
+@inproceedings{DBLP:conf/wmt/MadhyasthaWS17,
+  author    = {Pranava Swaroop Madhyastha and
+               Josiah Wang and
+               Lucia Specia},
+  title     = {{Sheffield} {MultiMT}: Using Object Posterior Predictions for Multimodal
+               Machine Translation},
+  pages     = {470--476},
+  publisher = {Conference on Machine Translation},
+  year      = {2017}
+}
+
+% Caglayan, Barrault and Bougares (2016): multimodal attention for NMT (preprint).
+@article{DBLP:journals/corr/CaglayanBB16,
+  author    = {Caglayan, Ozan and
+               Barrault, Lo{\"{\i}}c and
+               Bougares, Fethi},
+  title     = {Multimodal Attention for Neural Machine Translation},
+  journal   = {CoRR},
+  volume    = {abs/1609.03976},
+  year      = {2016}
+}
+
+% Calixto, Liu and Campbell (2017): doubly-attentive decoder for multi-modal NMT.
+@inproceedings{DBLP:conf/acl/CalixtoLC17,
+  author    = {Calixto, Iacer and
+               Liu, Qun and
+               Campbell, Nick},
+  title     = {Doubly-Attentive Decoder for Multi-modal Neural Machine Translation},
+  publisher = {Annual Meeting of the Association for Computational Linguistics},
+  pages     = {1913--1924},
+  year      = {2017}
+}
+
+% Delbrouck and Dupont (2017): multimodal compact bilinear pooling for multimodal NMT (preprint).
+@article{DBLP:journals/corr/DelbrouckD17,
+  author    = {Delbrouck, Jean{-}Benoit and
+               Dupont, St{\'{e}}phane},
+  title     = {Multimodal Compact Bilinear Pooling for Multimodal Neural Machine Translation},
+  journal   = {CoRR},
+  volume    = {abs/1703.08084},
+  year      = {2017}
+}
+
+% Libovicky and Helcl (2017): attention strategies for multi-source sequence-to-sequence learning.
+@inproceedings{DBLP:conf/acl/LibovickyH17,
+  author    = {Libovick{\'{y}}, Jindrich and
+               Helcl, Jindrich},
+  title     = {Attention Strategies for Multi-Source Sequence-to-Sequence Learning},
+  publisher = {Annual Meeting of the Association for Computational Linguistics},
+  pages     = {196--202},
+  year      = {2017}
+}
+
+% Delbrouck and Dupont (2017): modulating and attending the source image during encoding (preprint).
+@article{DBLP:journals/corr/abs-1712-03449,
+  author    = {Delbrouck, Jean{-}Benoit and
+               Dupont, St{\'{e}}phane},
+  title     = {Modulating and attending the source image during encoding improves Multimodal Translation},
+  journal   = {CoRR},
+  volume    = {abs/1712.03449},
+  year      = {2017}
+}
+
+% Arslan, Fishel and Anbarjafari (2018): doubly attentive Transformer machine translation (preprint).
+@article{DBLP:journals/corr/abs-1807-11605,
+  author    = {Arslan, Hasan Sait and
+               Fishel, Mark and
+               Anbarjafari, Gholamreza},
+  title     = {Doubly Attentive Transformer Machine Translation},
+  journal   = {CoRR},
+  volume    = {abs/1807.11605},
+  year      = {2018}
+}
+
+% Helcl, Libovicky and Varis (2018): CUNI system for the WMT18 multimodal translation task.
+% The conf/wmt key identifies the venue as the Conference on Machine Translation.
+@inproceedings{DBLP:conf/wmt/HelclLV18,
+  author    = {Jindrich Helcl and
+               Jindrich Libovick{\'{y}} and
+               Dusan Varis},
+  title     = {{CUNI} System for the {WMT18} Multimodal Translation Task},
+  pages     = {616--623},
+  publisher = {Conference on Machine Translation},
+  year      = {2018}
+}
+
+% Elliott and Kadar (2017): imagination improves multimodal translation.
+@inproceedings{DBLP:conf/ijcnlp/ElliottK17,
+  author    = {Elliott, Desmond and
+               K{\'{a}}d{\'{a}}r, {\'{A}}kos},
+  title     = {Imagination Improves Multimodal Translation},
+  publisher = {International Joint Conference on Natural Language Processing},
+  pages     = {130--141},
+  year      = {2017}
+}
+
+% Zhou et al. (2018): visual attention grounding model for multimodal MT.
+@inproceedings{DBLP:conf/emnlp/ZhouCLY18,
+  author    = {Zhou, Mingyang and
+               Cheng, Runxiang and
+               Lee, Yong Jae and
+               Yu, Zhou},
+  title     = {A Visual Attention Grounding Neural Model for Multimodal Machine Translation},
+  publisher = {Conference on Empirical Methods in Natural Language Processing},
+  pages     = {3643--3653},
+  year      = {2018}
+}
+
+% Calixto, Rios and Aziz (2019): latent variable model for multi-modal translation.
+@inproceedings{DBLP:conf/acl/CalixtoRA19,
+  author    = {Calixto, Iacer and
+               Rios, Miguel and
+               Aziz, Wilker},
+  title     = {Latent Variable Model for Multi-modal Translation},
+  publisher = {Annual Meeting of the Association for Computational Linguistics},
+  pages     = {6392--6405},
+  year      = {2019}
+}
+
+% Yin et al. (2020): graph-based multi-modal fusion encoder for NMT.
+@inproceedings{DBLP:conf/acl/YinMSZYZL20,
+  author    = {Yin, Yongjing and
+               Meng, Fandong and
+               Su, Jinsong and
+               Zhou, Chulun and
+               Yang, Zhengyuan and
+               Zhou, Jie and
+               Luo, Jiebo},
+  title     = {A Novel Graph-based Multi-modal Fusion Encoder for Neural Machine Translation},
+  publisher = {Annual Meeting of the Association for Computational Linguistics},
+  pages     = {3025--3035},
+  year      = {2020}
+}
+
+% Removed a second, identical definition of DBLP:journals/corr/abs-1712-03449
+% (Delbrouck and Dupont, 2017). The key is already defined earlier in this file,
+% and BibTeX reports a repeated-entry error when a key is defined twice.
+
+% Yao and Wan (2020): multimodal Transformer for multimodal MT.
+@inproceedings{DBLP:conf/acl/YaoW20,
+  author    = {Yao, Shaowei and
+               Wan, Xiaojun},
+  title     = {Multimodal Transformer for Multimodal Machine Translation},
+  publisher = {Annual Meeting of the Association for Computational Linguistics},
+  pages     = {4346--4350},
+  year      = {2020}
+}
+
+% Lu et al. (2016): hierarchical question-image co-attention for visual question answering.
+% NOTE(review): this entry names the venue in booktitle, whereas the neighbouring
+% conference entries put it in publisher -- confirm which the bibliography style expects.
+@inproceedings{DBLP:conf/nips/LuYBP16,
+  author    = {Lu, Jiasen and
+               Yang, Jianwei and
+               Batra, Dhruv and
+               Parikh, Devi},
+  title     = {Hierarchical Question-Image Co-Attention for Visual Question Answering},
+  booktitle = {Conference on Neural Information Processing Systems},
+  pages     = {289--297},
+  year      = {2016}
+}
+
+% Vinyals et al. (2015): Show and Tell neural image caption generator.
+@inproceedings{DBLP:conf/cvpr/VinyalsTBE15,
+  author    = {Vinyals, Oriol and
+               Toshev, Alexander and
+               Bengio, Samy and
+               Erhan, Dumitru},
+  title     = {Show and tell: {A} neural image caption generator},
+  publisher = {IEEE Conference on Computer Vision and Pattern Recognition},
+  pages     = {3156--3164},
+  year      = {2015}
+}
+
+% Xu et al. (2015): Show, Attend and Tell -- image captioning with visual attention.
+@inproceedings{DBLP:conf/icml/XuBKCCSZB15,
+  author    = {Xu, Kelvin and
+               Ba, Jimmy and
+               Kiros, Ryan and
+               Cho, Kyunghyun and
+               Courville, Aaron C. and
+               Salakhutdinov, Ruslan and
+               Zemel, Richard S. and
+               Bengio, Yoshua},
+  title     = {Show, Attend and Tell: Neural Image Caption Generation with Visual Attention},
+  publisher = {International Conference on Machine Learning},
+  volume    = {37},
+  pages     = {2048--2057},
+  year      = {2015}
+}
+
+% You et al. (2016): image captioning with semantic attention.
+@inproceedings{DBLP:conf/cvpr/YouJWFL16,
+  author    = {You, Quanzeng and
+               Jin, Hailin and
+               Wang, Zhaowen and
+               Fang, Chen and
+               Luo, Jiebo},
+  title     = {Image Captioning with Semantic Attention},
+  publisher = {IEEE Conference on Computer Vision and Pattern Recognition},
+  pages     = {4651--4659},
+  year      = {2016}
+}
+
+% Chen et al. (2017): SCA-CNN, spatial and channel-wise attention for image captioning.
+@inproceedings{DBLP:conf/cvpr/ChenZXNSLC17,
+  author    = {Chen, Long and
+               Zhang, Hanwang and
+               Xiao, Jun and
+               Nie, Liqiang and
+               Shao, Jian and
+               Liu, Wei and
+               Chua, Tat{-}Seng},
+  title     = {{SCA-CNN:} Spatial and Channel-Wise Attention in Convolutional Networks for Image Captioning},
+  publisher = {IEEE Conference on Computer Vision and Pattern Recognition},
+  pages     = {6298--6306},
+  year      = {2017}
+}
+
+% Fu et al. (2017): image captioning with region-based attention and scene-specific contexts.
+@article{DBLP:journals/pami/FuJCSZ17,
+  author    = {Fu, Kun and
+               Jin, Junqi and
+               Cui, Runpeng and
+               Sha, Fei and
+               Zhang, Changshui},
+  title     = {Aligning Where to See and What to Tell: Image Captioning with Region-Based Attention and Scene-Specific Contexts},
+  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
+  volume    = {39},
+  number    = {12},
+  pages     = {2321--2334},
+  year      = {2017}
+}
+
+% Yao et al. (2018): exploring visual relationships for image captioning.
+@inproceedings{DBLP:conf/eccv/YaoPLM18,
+  author    = {Yao, Ting and
+               Pan, Yingwei and
+               Li, Yehao and
+               Mei, Tao},
+  title     = {Exploring Visual Relationship for Image Captioning},
+  publisher = {European Conference on Computer Vision},
+  series    = {Lecture Notes in Computer Science},
+  volume    = {11218},
+  pages     = {711--727},
+  year      = {2018}
+}
+
+% Liu et al. (2017): MAT, a multimodal attentive translator for image captioning.
+@inproceedings{DBLP:conf/ijcai/LiuSWWY17,
+  author    = {Liu, Chang and
+               Sun, Fuchun and
+               Wang, Changhu and
+               Wang, Feng and
+               Yuille, Alan L.},
+  title     = {{MAT:} {A} Multimodal Attentive Translator for Image Captioning},
+  publisher = {International Joint Conference on Artificial Intelligence},
+  pages     = {4033--4039},
+  year      = {2017}
+}
+
+% Ren et al. (2017): Faster R-CNN object detection with region proposal networks.
+@article{DBLP:journals/pami/RenHG017,
+  author    = {Ren, Shaoqing and
+               He, Kaiming and
+               Girshick, Ross B. and
+               Sun, Jian},
+  title     = {Faster {R-CNN:} Towards Real-Time Object Detection with Region Proposal Networks},
+  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
+  volume    = {39},
+  number    = {6},
+  pages     = {1137--1149},
+  year      = {2017}
+}
+
+% Redmon and Farhadi (2018): YOLOv3 (preprint).
+% The model name is braced so sentence-casing styles do not lowercase it.
+@article{DBLP:journals/corr/abs-1804-02767,
+  author    = {Joseph Redmon and
+               Ali Farhadi},
+  title     = {{YOLOv3}: An Incremental Improvement},
+  journal   = {CoRR},
+  volume    = {abs/1804.02767},
+  year      = {2018}
+}
+
+% Bochkovskiy, Wang and Liao (2020): YOLOv4 (preprint).
+% The model name is braced so sentence-casing styles do not lowercase it.
+@article{DBLP:journals/corr/abs-2004-10934,
+  author    = {Alexey Bochkovskiy and
+               Chien{-}Yao Wang and
+               Hong{-}Yuan Mark Liao},
+  title     = {{YOLOv4}: Optimal Speed and Accuracy of Object Detection},
+  journal   = {CoRR},
+  volume    = {abs/2004.10934},
+  year      = {2020}
+}
+
+% Lu et al. (2017): adaptive attention via a visual sentinel for image captioning.
+@inproceedings{DBLP:conf/cvpr/LuXPS17,
+  author    = {Lu, Jiasen and
+               Xiong, Caiming and
+               Parikh, Devi and
+               Socher, Richard},
+  title     = {Knowing When to Look: Adaptive Attention via a Visual Sentinel for Image Captioning},
+  publisher = {IEEE Conference on Computer Vision and Pattern Recognition},
+  pages     = {3242--3250},
+  year      = {2017}
+}
+
+% Anderson et al. (2018): bottom-up and top-down attention for captioning and VQA.
+@inproceedings{DBLP:conf/cvpr/00010BT0GZ18,
+  author    = {Anderson, Peter and
+               He, Xiaodong and
+               Buehler, Chris and
+               Teney, Damien and
+               Johnson, Mark and
+               Gould, Stephen and
+               Zhang, Lei},
+  title     = {Bottom-Up and Top-Down Attention for Image Captioning and Visual Question Answering},
+  publisher = {IEEE Conference on Computer Vision and Pattern Recognition},
+  pages     = {6077--6086},
+  year      = {2018}
+}
+
+% Zhou et al. (2017): image captioning with text-conditional attention.
+@inproceedings{DBLP:conf/mm/ZhouXKC17,
+  author    = {Zhou, Luowei and
+               Xu, Chenliang and
+               Koch, Parker A. and
+               Corso, Jason J.},
+  title     = {Watch What You Just Said: Image Captioning with Text-Conditional Attention},
+  publisher = {ACM Multimedia},
+  pages     = {305--313},
+  year      = {2017}
+}
+
+% Fang et al. (2018): looking deeper and transferring attention for image captioning.
+% Journal title corrected: it is "Multimedia Tools and Applications".
+@article{DBLP:journals/mta/FangWCT18,
+  author    = {Fang Fang and
+               Hanli Wang and
+               Yihao Chen and
+               Pengjie Tang},
+  title     = {Looking deeper and transferring attention for image captioning},
+  journal   = {Multimedia Tools and Applications},
+  volume    = {77},
+  number    = {23},
+  pages     = {31159--31175},
+  year      = {2018}
+}
+
+% Aneja, Deshpande and Schwing (2018): convolutional image captioning.
+@inproceedings{DBLP:conf/cvpr/AnejaDS18,
+  author    = {Aneja, Jyoti and
+               Deshpande, Aditya and
+               Schwing, Alexander G.},
+  title     = {Convolutional Image Captioning},
+  publisher = {IEEE Conference on Computer Vision and Pattern Recognition},
+  pages     = {5561--5570},
+  year      = {2018}
+}
+
+% Wang and Chan (2018): CNN+CNN convolutional decoders for image captioning (preprint).
+@article{DBLP:journals/corr/abs-1805-09019,
+  author    = {Wang, Qingzhong and
+               Chan, Antoni B.},
+  title     = {{CNN+CNN:} Convolutional Decoders for Image Captioning},
+  journal   = {CoRR},
+  volume    = {abs/1805.09019},
+  year      = {2018}
+}
+
+% Dai, Ye and Lin (2018): rethinking the form of latent states in image captioning.
+@inproceedings{DBLP:conf/eccv/DaiYL18,
+  author    = {Dai, Bo and
+               Ye, Deming and
+               Lin, Dahua},
+  title     = {Rethinking the Form of Latent States in Image Captioning},
+  publisher = {European Conference on Computer Vision},
+  volume    = {11209},
+  pages     = {294--310},
+  year      = {2018}
+}
+
+% Antol et al. (2015): VQA, visual question answering.
+@inproceedings{DBLP:conf/iccv/AntolALMBZP15,
+  author    = {Antol, Stanislaw and
+               Agrawal, Aishwarya and
+               Lu, Jiasen and
+               Mitchell, Margaret and
+               Batra, Dhruv and
+               Zitnick, C. Lawrence and
+               Parikh, Devi},
+  title     = {{VQA:} Visual Question Answering},
+  publisher = {International Conference on Computer Vision},
+  pages     = {2425--2433},
+  year      = {2015}
+}
+
+% Carion et al. (2020): end-to-end object detection with Transformers.
+@inproceedings{DBLP:conf/eccv/CarionMSUKZ20,
+  author    = {Carion, Nicolas and
+               Massa, Francisco and
+               Synnaeve, Gabriel and
+               Usunier, Nicolas and
+               Kirillov, Alexander and
+               Zagoruyko, Sergey},
+  title     = {End-to-End Object Detection with Transformers},
+  publisher = {European Conference on Computer Vision},
+  volume    = {12346},
+  pages     = {213--229},
+  year      = {2020}
+}
+
+% Removed a second, identical definition of DBLP:conf/acl/YaoW20 (Yao and Wan, 2020).
+% The key is already defined earlier in this file, and BibTeX reports a
+% repeated-entry error when a key is defined twice.
+
+% Yu et al. (2020): multimodal Transformer with multi-view visual representation for captioning.
+@article{DBLP:journals/tcsv/YuLYH20,
+  author    = {Yu, Jun and
+               Li, Jing and
+               Yu, Zhou and
+               Huang, Qingming},
+  title     = {Multimodal Transformer With Multi-View Visual Representation for Image Captioning},
+  journal   = {IEEE Transactions on Circuits and Systems for Video Technology},
+  volume    = {30},
+  number    = {12},
+  pages     = {4467--4480},
+  year      = {2020}
+}
+
+% Zhong et al. (2020): self-adaptive neural module Transformer for visual question answering.
+% The page range now uses the BibTeX double hyphen.
+% NOTE(review): the first author is written family-name-first ("Zhong, Huasong") on the
+% assumption that Zhong is the surname -- confirm against the published paper.
+@article{Huasong2020SelfAdaptiveNM,
+  author    = {Zhong, Huasong and
+               Jingyuan Chen and
+               Chen Shen and
+               Hanwang Zhang and
+               Jianqiang Huang and
+               Xian-Sheng Hua},
+  title     = {Self-Adaptive Neural Module Transformer for Visual Question Answering},
+  journal   = {IEEE Transactions on Multimedia},
+  pages     = {1--1},
+  year      = {2020}
+}
+
+% Gokhale et al. (2020): MUTANT training paradigm for out-of-distribution generalization in VQA.
+@inproceedings{DBLP:conf/emnlp/GokhaleBBY20,
+  author    = {Gokhale, Tejas and
+               Banerjee, Pratyay and
+               Baral, Chitta and
+               Yang, Yezhou},
+  title     = {{MUTANT:} {A} Training Paradigm for Out-of-Distribution Generalization in Visual Question Answering},
+  publisher = {Conference on Empirical Methods in Natural Language Processing},
+  pages     = {878--892},
+  year      = {2020}
+}
+
+% Tang et al. (2020): semantic equivalent adversarial data augmentation for VQA.
+@inproceedings{DBLP:conf/eccv/Tang0ZWY20,
+  author    = {Ruixue Tang and
+               Chao Ma and
+               Wei Emma Zhang and
+               Qi Wu and
+               Xiaokang Yang},
+  title     = {Semantic Equivalent Adversarial Data Augmentation for Visual Question
+               Answering},
+  volume    = {12364},
+  pages     = {437--453},
+  publisher = {European Conference on Computer Vision},
+  year      = {2020}
+}
+
+% Li et al. (2020): Oscar, object-semantics aligned pre-training for vision-language tasks.
+% The model name is braced so sentence-casing styles keep its capital.
+@inproceedings{DBLP:conf/eccv/Li0LZHZWH0WCG20,
+  author    = {Xiujun Li and
+               Xi Yin and
+               Chunyuan Li and
+               Pengchuan Zhang and
+               Xiaowei Hu and
+               Lei Zhang and
+               Lijuan Wang and
+               Houdong Hu and
+               Li Dong and
+               Furu Wei and
+               Yejin Choi and
+               Jianfeng Gao},
+  title     = {{Oscar}: Object-Semantics Aligned Pre-training for Vision-Language Tasks},
+  volume    = {12375},
+  pages     = {121--137},
+  publisher = {European Conference on Computer Vision},
+  year      = {2020}
+}
+
+% Zhou et al. (2020): unified vision-language pre-training for captioning and VQA.
+@inproceedings{DBLP:conf/aaai/ZhouPZHCG20,
+  author    = {Zhou, Luowei and
+               Palangi, Hamid and
+               Zhang, Lei and
+               Hu, Houdong and
+               Corso, Jason J. and
+               Gao, Jianfeng},
+  title     = {Unified Vision-Language Pre-Training for Image Captioning and {VQA}},
+  publisher = {AAAI Conference on Artificial Intelligence},
+  pages     = {13041--13049},
+  year      = {2020}
+}
+
+% Su et al. (2020): VL-BERT, pre-training of generic visual-linguistic representations.
+@inproceedings{DBLP:conf/iclr/SuZCLLWD20,
+  author    = {Su, Weijie and
+               Zhu, Xizhou and
+               Cao, Yue and
+               Li, Bin and
+               Lu, Lewei and
+               Wei, Furu and
+               Dai, Jifeng},
+  title     = {{VL-BERT:} Pre-training of Generic Visual-Linguistic Representations},
+  publisher = {International Conference on Learning Representations},
+  year      = {2020}
+}
+
+% Goodfellow et al. (2014): generative adversarial nets.
+@inproceedings{DBLP:conf/nips/GoodfellowPMXWOCB14,
+  author    = {Goodfellow, Ian J. and
+               Pouget{-}Abadie, Jean and
+               Mirza, Mehdi and
+               Xu, Bing and
+               Warde{-}Farley, David and
+               Ozair, Sherjil and
+               Courville, Aaron C. and
+               Bengio, Yoshua},
+  title     = {Generative Adversarial Nets},
+  publisher = {Conference on Neural Information Processing Systems},
+  pages     = {2672--2680},
+  year      = {2014}
+}
+
+% Zhu et al. (2017): toward multimodal image-to-image translation.
+@inproceedings{DBLP:conf/nips/ZhuZPDEWS17,
+  author    = {Zhu, Jun{-}Yan and
+               Zhang, Richard and
+               Pathak, Deepak and
+               Darrell, Trevor and
+               Efros, Alexei A. and
+               Wang, Oliver and
+               Shechtman, Eli},
+  title     = {Toward Multimodal Image-to-Image Translation},
+  publisher = {Conference on Neural Information Processing Systems},
+  pages     = {465--476},
+  year      = {2017}
+}
+
+% Emami et al. (2019): SPA-GAN, spatial attention GAN for image-to-image translation (preprint).
+@article{DBLP:journals/corr/abs-1908-06616,
+  author    = {Emami, Hajar and
+               Aliabadi, Majid Moradi and
+               Dong, Ming and
+               Chinnam, Ratna Babu},
+  title     = {{SPA-GAN:} Spatial Attention {GAN} for Image-to-Image Translation},
+  journal   = {CoRR},
+  volume    = {abs/1908.06616},
+  year      = {2019}
+}
+
+% Xiong, Wang and Gao (2019): consistent embedded GAN for image-to-image translation.
+% Journal corrected: the journals/access key and the volume/page data belong to IEEE Access.
+@article{DBLP:journals/access/XiongWG19,
+  author    = {Feng Xiong and
+               Qianqian Wang and
+               Quanxue Gao},
+  title     = {Consistent Embedded {GAN} for Image-to-Image Translation},
+  journal   = {{IEEE} Access},
+  volume    = {7},
+  pages     = {126651--126661},
+  year      = {2019}
+}
+
+% Zhu et al. (2017): unpaired image-to-image translation with cycle-consistent adversarial networks.
+@inproceedings{DBLP:conf/iccv/ZhuPIE17,
+  author    = {Zhu, Jun{-}Yan and
+               Park, Taesung and
+               Isola, Phillip and
+               Efros, Alexei A.},
+  title     = {Unpaired Image-to-Image Translation Using Cycle-Consistent Adversarial Networks},
+  publisher = {International Conference on Computer Vision},
+  pages     = {2242--2251},
+  year      = {2017}
+}
+
+% Yi et al. (2017): DualGAN, unsupervised dual learning for image-to-image translation.
+% The model name is braced so sentence-casing styles do not lowercase it.
+@inproceedings{DBLP:conf/iccv/YiZTG17,
+  author    = {Zili Yi and
+               Hao (Richard) Zhang and
+               Ping Tan and
+               Minglun Gong},
+  title     = {{DualGAN}: Unsupervised Dual Learning for Image-to-Image Translation},
+  pages     = {2868--2876},
+  publisher = {International Conference on Computer Vision},
+  year      = {2017}
+}
+
+% Liu, Breuel and Kautz (2017): unsupervised image-to-image translation networks.
+@inproceedings{DBLP:conf/nips/LiuBK17,
+  author    = {Liu, Ming{-}Yu and
+               Breuel, Thomas and
+               Kautz, Jan},
+  title     = {Unsupervised Image-to-Image Translation Networks},
+  publisher = {Conference on Neural Information Processing Systems},
+  pages     = {700--708},
+  year      = {2017}
+}
+
+% Isola et al. (2017): image-to-image translation with conditional adversarial networks.
+@inproceedings{DBLP:conf/cvpr/IsolaZZE17,
+  author    = {Isola, Phillip and
+               Zhu, Jun{-}Yan and
+               Zhou, Tinghui and
+               Efros, Alexei A.},
+  title     = {Image-to-Image Translation with Conditional Adversarial Networks},
+  publisher = {IEEE Conference on Computer Vision and Pattern Recognition},
+  pages     = {5967--5976},
+  year      = {2017}
+}
+
+% Reed et al. (2016): generative adversarial text-to-image synthesis.
+@inproceedings{DBLP:conf/icml/ReedAYLSL16,
+  author    = {Reed, Scott E. and
+               Akata, Zeynep and
+               Yan, Xinchen and
+               Logeswaran, Lajanugen and
+               Schiele, Bernt and
+               Lee, Honglak},
+  title     = {Generative Adversarial Text to Image Synthesis},
+  publisher = {International Conference on Machine Learning},
+  volume    = {48},
+  pages     = {1060--1069},
+  year      = {2016}
+}
+
+% Dash et al. (2017): TAC-GAN, text-conditioned auxiliary classifier GAN (preprint).
+@article{DBLP:journals/corr/DashGALA17,
+  author    = {Dash, Ayushman and
+               Gamboa, John Cristian Borges and
+               Ahmed, Sheraz and
+               Liwicki, Marcus and
+               Afzal, Muhammad Zeshan},
+  title     = {{TAC-GAN} - Text Conditioned Auxiliary Classifier Generative Adversarial Network},
+  journal   = {CoRR},
+  volume    = {abs/1703.06412},
+  year      = {2017}
+}
+
+% Reed et al. (2016): learning what and where to draw.
+@inproceedings{DBLP:conf/nips/ReedAMTSL16,
+  author    = {Reed, Scott E. and
+               Akata, Zeynep and
+               Mohan, Santosh and
+               Tenka, Samuel and
+               Schiele, Bernt and
+               Lee, Honglak},
+  title     = {Learning What and Where to Draw},
+  publisher = {Conference on Neural Information Processing Systems},
+  pages     = {217--225},
+  year      = {2016}
+}
+
+% Zhang, Xie and Yang (2018): text-to-image synthesis with a hierarchically-nested adversarial network.
+@inproceedings{DBLP:conf/cvpr/ZhangXY18,
+  author    = {Zhang, Zizhao and
+               Xie, Yuanpu and
+               Yang, Lin},
+  title     = {Photographic Text-to-Image Synthesis With a Hierarchically-Nested Adversarial Network},
+  publisher = {IEEE Conference on Computer Vision and Pattern Recognition},
+  pages     = {6199--6208},
+  year      = {2018}
+}
+
 %%%%% chapter 17------------------------------------------------------
 %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%