Last active
November 10, 2017 08:11
-
-
Save iaalm/5e80800f1159546fecf68cfc4b2b684e to your computer and use it in GitHub Desktop.
SimonBibtex
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
@article{kadir2001saliency,
  author    = {Kadir, Timor and Brady, Michael},
  title     = {Saliency, scale and image description},
  journal   = {International Journal of Computer Vision},
  volume    = {45},
  number    = {2},
  pages     = {83--105},
  publisher = {Springer},
  year      = {2001}
}
@inproceedings{ren2015exploring,
  author    = {Ren, Mengye and Kiros, Ryan and Zemel, Richard},
  title     = {Exploring models and data for image question answering},
  booktitle = {Proceedings of Advances in Neural Information Processing Systems},
  pages     = {2953--2961},
  month     = dec,
  year      = {2015}
}
@inproceedings{malinowski2015ask,
  author    = {Malinowski, Mateusz and Rohrbach, Marcus and Fritz, Mario},
  title     = {Ask your neurons: A neural-based approach to answering questions about images},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision},
  pages     = {1--9},
  month     = dec,
  year      = {2015}
}
@inproceedings{malinowski2014multi,
  author    = {Malinowski, Mateusz and Fritz, Mario},
  title     = {A multi-world approach to question answering about real-world scenes based on uncertain input},
  booktitle = {Proceedings of Advances in Neural Information Processing Systems},
  pages     = {1682--1690},
  month     = dec,
  year      = {2014}
}
@inproceedings{luong2015effective,
  author    = {Luong, Minh-Thang and Pham, Hieu and Manning, Christopher D},
  title     = {Effective approaches to attention-based neural machine translation},
  booktitle = {Proceedings of the Conference on Empirical Methods in Natural Language Processing},
  month     = sep,
  year      = {2015}
}
@inproceedings{antol2015vqa,
  author    = {Antol, Stanislaw and Agrawal, Aishwarya and Lu, Jiasen and Mitchell, Margaret and Batra, Dhruv and Zitnick, C. Lawrence and Parikh, Devi},
  title     = {{VQA}: Visual question answering},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision},
  pages     = {2425--2433},
  month     = dec,
  year      = {2015}
}
@inproceedings{kuznetsova2013generalizing,
  author       = {Kuznetsova, Polina and Ordonez, Vicente and Berg, Alexander C and Berg, Tamara L and Choi, Yejin},
  title        = {Generalizing Image Captions for Image-Text Parallel Corpus},
  booktitle    = {Proceedings of the 51st Annual Meeting of the Association for Computational Linguistics},
  pages        = {790--796},
  organization = {Association for Computational Linguistics},
  month        = aug,
  year         = {2013}
}
@inproceedings{kuznetsova2012collective,
  author       = {Kuznetsova, Polina and Ordonez, Vicente and Berg, Alexander C and Berg, Tamara L and Choi, Yejin},
  title        = {Collective generation of natural image descriptions},
  booktitle    = {Proceedings of the 50th Annual Meeting of the Association for Computational Linguistics},
  volume       = {1},
  pages        = {359--368},
  organization = {Association for Computational Linguistics},
  month        = jul,
  year         = {2012}
}
@article{kulkarni2013babytalk,
  author    = {Kulkarni, Girish and Premraj, Visruth and Ordonez, Vicente and Dhar, Sagnik and Li, Siming and Choi, Yejin and Berg, Alexander C and Berg, Tamara L},
  title     = {{BabyTalk}: Understanding and generating simple image descriptions},
  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume    = {35},
  number    = {12},
  pages     = {2891--2903},
  publisher = {IEEE},
  year      = {2013}
}
@inproceedings{farhadi2010every,
  author       = {Farhadi, Ali and Hejrati, Mohsen and Sadeghi, Mohammad Amin and Young, Peter and Rashtchian, Cyrus and Hockenmaier, Julia and Forsyth, David},
  title        = {Every picture tells a story: Generating sentences from images},
  booktitle    = {Proceedings of the European Conference on Computer Vision},
  pages        = {15--29},
  organization = {Springer},
  month        = sep,
  year         = {2010}
}
@inproceedings{lin2004automatic,
  author       = {Lin, Chin-Yew and Och, Franz Josef},
  title        = {Automatic evaluation of machine translation quality using longest common subsequence and skip-bigram statistics},
  booktitle    = {Proceedings of the 42nd Annual Meeting on Association for Computational Linguistics},
  pages        = {605--612},
  organization = {Association for Computational Linguistics},
  month        = jul,
  year         = {2004}
}
@inproceedings{ma2015learning,
  author    = {Ma, Lin and Lu, Zhengdong and Li, Hang},
  title     = {Learning to answer questions from image using convolutional neural network},
  booktitle = {Proceedings of Association for the Advancement of Artificial Intelligence Conference},
  pages     = {3567--3573},
  month     = feb,
  year      = {2016}
}
@inproceedings{wu2015value,
  author    = {Wu, Qi and Shen, Chunhua and Liu, Lingqiao and Dick, Anthony and van den Hengel, Anton},
  title     = {What value do explicit high level concepts have in vision to language problems?},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {203--212},
  month     = jun,
  year      = {2016}
}
@inproceedings{karpathy2015deep,
  author    = {Karpathy, Andrej and Fei-Fei, Li},
  title     = {Deep visual-semantic alignments for generating image descriptions},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {3128--3137},
  month     = jun,
  year      = {2015}
}
@inproceedings{vinyals2015show,
  author    = {Vinyals, Oriol and Toshev, Alexander and Bengio, Samy and Erhan, Dumitru},
  title     = {Show and tell: A neural image caption generator},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {3156--3164},
  month     = jun,
  year      = {2015}
}
@inproceedings{fang2015captions,
  author    = {Fang, Hao and Gupta, Saurabh and Iandola, Forrest and Srivastava, Rupesh K and Deng, Li and Doll{\'a}r, Piotr and Gao, Jianfeng and He, Xiaodong and Mitchell, Margaret and Platt, John C and others},
  title     = {From captions to visual concepts and back},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {1473--1482},
  year      = {2015}
}
@inproceedings{xu2015show,
  author    = {Xu, Kelvin and Ba, Jimmy Lei and Kiros, Ryan and Cho, Kyunghyun and Courville, Aaron and Salakhutdinov, Ruslan and Zemel, Richard S and Bengio, Yoshua},
  title     = {Show, Attend and Tell: Neural Image Caption Generation with Visual Attention},
  booktitle = {Proceedings of the International Conference on Machine Learning},
  pages     = {2048--2057},
  month     = jul,
  year      = {2015}
}
@article{ferreira2007introduction,
  author    = {Ferreira, Fernanda and Tanenhaus, Michael K},
  title     = {Introduction to the special issue on language--vision interactions},
  journal   = {Journal of Memory and Language},
  volume    = {57},
  number    = {4},
  pages     = {455--459},
  publisher = {Elsevier},
  year      = {2007}
}
@incollection{nuallain1994investigation,
  author    = {{\'O} Nuall{\'a}in, Se{\'a}n and Smith, Arnold G},
  title     = {An investigation into the common semantics of language and vision},
  booktitle = {Integration of Natural Language and Vision Processing},
  pages     = {21--30},
  publisher = {Springer},
  year      = {1994}
}
@article{rosch1976basic,
  author    = {Rosch, Eleanor and Mervis, Carolyn B and Gray, Wayne D and Johnson, David M and Boyes-Braem, Penny},
  title     = {Basic objects in natural categories},
  journal   = {Cognitive Psychology},
  volume    = {8},
  number    = {3},
  pages     = {382--439},
  publisher = {Elsevier},
  year      = {1976}
}
@inproceedings{vreeswijk2012all,
  author       = {Vreeswijk, Daan T. J. and Snoek, Cees G. M. and van de Sande, Koen E. A. and Smeulders, Arnold W. M.},
  title        = {All vehicles are cars: Subclass preferences in container concepts},
  booktitle    = {Proceedings of the 2nd ACM International Conference on Multimedia Retrieval},
  pages        = {8},
  organization = {ACM},
  year         = {2012}
}
@inproceedings{mettes2016imagenet,
  author       = {Mettes, Pascal and Koelma, Dennis C and Snoek, Cees G. M.},
  title        = {The {ImageNet} shuffle: Reorganized pre-training for video event detection},
  booktitle    = {Proceedings of the ACM International Conference on Multimedia Retrieval},
  pages        = {175--182},
  organization = {ACM},
  year         = {2016}
}
@inproceedings{deselaers2011visual,
  author       = {Deselaers, Thomas and Ferrari, Vittorio},
  title        = {Visual and semantic similarity in {ImageNet}},
  booktitle    = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages        = {1777--1784},
  organization = {IEEE},
  year         = {2011}
}
@inproceedings{szegedy2015going,
  author    = {Szegedy, Christian and Liu, Wei and Jia, Yangqing and Sermanet, Pierre and Reed, Scott and Anguelov, Dragomir and Erhan, Dumitru and Vanhoucke, Vincent and Rabinovich, Andrew},
  title     = {Going deeper with convolutions},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {1--9},
  month     = jun,
  year      = {2015}
}
@inproceedings{bahdanau2014neural,
  author    = {Bahdanau, Dzmitry and Cho, Kyunghyun and Bengio, Yoshua},
  title     = {Neural machine translation by jointly learning to align and translate},
  booktitle = {Proceedings of the International Conference on Learning Representations},
  month     = may,
  year      = {2015}
}
@article{russakovsky2015imagenet,
  author    = {Russakovsky, Olga and Deng, Jia and Su, Hao and Krause, Jonathan and Satheesh, Sanjeev and Ma, Sean and Huang, Zhiheng and Karpathy, Andrej and Khosla, Aditya and Bernstein, Michael and others},
  title     = {{ImageNet} large scale visual recognition challenge},
  journal   = {International Journal of Computer Vision},
  volume    = {115},
  number    = {3},
  pages     = {211--252},
  publisher = {Springer},
  year      = {2015}
}
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {770--778},
  year      = {2016}
}
@inproceedings{krizhevsky2012imagenet,
  author    = {Krizhevsky, Alex and Sutskever, Ilya and Hinton, Geoffrey E},
  title     = {{ImageNet} classification with deep convolutional neural networks},
  booktitle = {Proceedings of Advances in Neural Information Processing Systems},
  pages     = {1097--1105},
  year      = {2012}
}
@article{chen2015microsoft,
  author        = {Chen, Xinlei and Fang, Hao and Lin, Tsung-Yi and Vedantam, Ramakrishna and Gupta, Saurabh and Doll{\'a}r, Piotr and Zitnick, C Lawrence},
  title         = {Microsoft {COCO} captions: Data collection and evaluation server},
  journal       = {arXiv preprint arXiv:1504.00325},
  eprint        = {1504.00325},
  archiveprefix = {arXiv},
  year          = {2015}
}
@inproceedings{lin2014microsoft,
  author    = {Lin, Tsung-Yi and Maire, Michael and Belongie, Serge and Hays, James and Perona, Pietro and Ramanan, Deva and Doll{\'a}r, Piotr and Zitnick, C Lawrence},
  title     = {Microsoft {COCO}: Common objects in context},
  booktitle = {Proceedings of the European Conference on Computer Vision},
  pages     = {740--755},
  month     = sep,
  year      = {2014}
}
@inproceedings{eiselt2013two,
  author    = {Eiselt, Andreas and Figueroa, Alejandro},
  title     = {A Two-Step Named Entity Recognizer for Open-Domain Search Queries},
  booktitle = {Proceedings of the International Joint Conference on Natural Language Processing},
  pages     = {829--833},
  year      = {2013}
}
@inproceedings{vedantam2015cider,
  author    = {Vedantam, Ramakrishna and Zitnick, C. Lawrence and Parikh, Devi},
  title     = {{CIDEr}: Consensus-based image description evaluation},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {4566--4575},
  month     = jun,
  year      = {2015}
}
@inproceedings{papineni2002bleu,
  author    = {Papineni, Kishore and Roukos, Salim and Ward, Todd and Zhu, Wei-Jing},
  title     = {{BLEU}: a method for automatic evaluation of machine translation},
  booktitle = {Proceedings of the 40th Annual Meeting on Association for Computational Linguistics},
  pages     = {311--318},
  month     = jul,
  year      = {2002}
}
@article{banerjee2005meteor,
  author        = {Lavie, Alon and Denkowski, Michael J.},
  title         = {The {Meteor} metric for automatic evaluation of machine translation},
  journal       = {Machine Translation},
  volume        = {23},
  pages         = {105--115},
  month         = sep,
  year          = {2009},
  internal-note = {NOTE(review): the key says banerjee2005 but the fields describe Lavie and Denkowski 2009; key kept unchanged so existing citations still resolve}
}
@article{hodosh2013framing,
  author  = {Hodosh, Micah and Young, Peter and Hockenmaier, Julia},
  title   = {Framing image description as a ranking task: Data, models and evaluation metrics},
  journal = {Journal of Artificial Intelligence Research},
  volume  = {47},
  pages   = {853--899},
  month   = aug,
  year    = {2013}
}
@inproceedings{kiros2014multimodal,
  author    = {Kiros, Ryan and Salakhutdinov, Ruslan and Zemel, Richard S},
  title     = {Multimodal Neural Language Models},
  booktitle = {Proceedings of the International Conference on Machine Learning},
  volume    = {14},
  pages     = {595--603},
  month     = jun,
  year      = {2014}
}
@inproceedings{donahue2015long,
  author    = {Donahue, Jeffrey and Hendricks, Lisa Anne and Guadarrama, Sergio and Rohrbach, Marcus and Venugopalan, Subhashini and Saenko, Kate and Darrell, Trevor},
  title     = {Long-term recurrent convolutional networks for visual recognition and description},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {2625--2634},
  year      = {2015}
}
@inproceedings{mao2014deep,
  author    = {Mao, Junhua and Xu, Wei and Yang, Yi and Wang, Jiang and Huang, Zhiheng and Yuille, Alan},
  title     = {Deep captioning with multimodal recurrent neural networks (m-{RNN})},
  booktitle = {Proceedings of the International Conference on Learning Representations},
  month     = may,
  year      = {2015}
}
@inproceedings{jia2015guiding,
  author    = {Jia, Xu and Gavves, Efstratios and Fernando, Basura and Tuytelaars, Tinne},
  title     = {Guiding the long-short term memory model for image caption generation},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision},
  pages     = {2407--2415},
  year      = {2015}
}
@article{jin2015aligning,
  author        = {Jin, Junqi and Fu, Kun and Cui, Runpeng and Sha, Fei and Zhang, Changshui},
  title         = {Aligning Where to See and What to Tell: Image Captioning with Region-based Attention and Scene-specific Contexts},
  journal       = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume        = {PP},
  number        = {99},
  pages         = {1--1},
  year          = {2016},
  internal-note = {NOTE(review): volume PP, number 99 and pages 1--1 look like early-access placeholders; confirm against the final published issue}
}
@inproceedings{wu2016image,
  author    = {Wu, Qi and Shen, Chunhua and van den Hengel, Anton and Wang, Peng and Dick, Anthony},
  title     = {Ask Me Anything: Free-form Visual Question Answering Based on Knowledge from External Sources},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {4622--4630},
  month     = jun,
  year      = {2016}
}
@inproceedings{RefCap,
  author    = {Ren, Zhou and Wang, Xiaoyu and Zhang, Ning and Lv, Xutao and Li, Li-Jia},
  title     = {Deep Reinforcement Learning-based Image Captioning with Embedding Reward},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {290--298},
  month     = jul,
  year      = {2017}
}
@inproceedings{GLA,
  author    = {Li, Linghui and Tang, Sheng and Deng, Lixi and Zhang, Yongdong and Tian, Qi},
  title     = {Image Caption with Global-Local Attention},
  booktitle = {Proceedings of Association for the Advancement of Artificial Intelligence Conference},
  pages     = {4133--4139},
  month     = feb,
  year      = {2017}
}
@inproceedings{vonAhn,
  title     = {Labeling Images with a Computer Game},
  author    = {von Ahn, Luis and Dabbish, Laura},
  booktitle = {Proceedings of the SIGCHI Conference on Human Factors in Computing Systems},
  pages     = {319--326},
  year      = {2004}
}
@inproceedings{Cole2002PrinciplesOC,
  author    = {Cole, Michael and Quinn, N. and Rosch, Eleanor and Glick, Joseph and Sinclair, Hermina},
  title     = {Principles of Categorization},
  booktitle = {Cognition and categorization},
  pages     = {189--206},
  year      = {2002}
}
@article{Mareschal2000ACA,
  author  = {Mareschal, Denis and French, Robert M. and Quinn, Paul C.},
  title   = {A connectionist account of asymmetric category learning in early infancy},
  journal = {Developmental Psychology},
  volume  = {36},
  number  = {5},
  pages   = {635--645},
  year    = {2000}
}
@inproceedings{densecap,
  author    = {Johnson, Justin and Karpathy, Andrej and Fei-Fei, Li},
  title     = {{DenseCap}: Fully Convolutional Localization Networks for Dense Captioning},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {4565--4574},
  month     = jun,
  year      = {2016}
}
@inproceedings{finegained,
  author    = {Krause, Jonathan and Jin, Hailin and Yang, Jianchao and Fei-Fei, Li},
  title     = {Fine-Grained Recognition without Part Annotations},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
  pages     = {5546--5555},
  month     = jun,
  year      = {2015}
}
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment