@inproceedings{8f06f2cc794d4bee8793edd1f6776d99,
title = "Generating diverse and meaningful captions: Unsupervised specificity optimization for image captioning",
abstract = "Image Captioning is a task that requires models to acquire a multimodal understanding of the world and to express this understanding in natural language text. While the state-of-the-art for this task has rapidly improved in terms of n-gram metrics, these models tend to output the same generic captions for similar images. In this work, we address this limitation and train a model that generates more diverse and specific captions through an unsupervised training approach that incorporates a learning signal from an Image Retrieval model. We summarize previous results and improve the state-of-the-art on caption diversity and novelty. We make our source code publicly available online (https://github.com/AnnikaLindh/Diverse_and_Specific_Image_Captioning).",
keywords = "Computer vision, Contrastive learning, Deep learning, Diversity, Image captioning, Image retrieval, MS COCO, Machine learning, Multimodal training, Natural language generation, Natural language processing, Neural networks, Specificity",
author = "Annika Lindh and Ross, {Robert J.} and Abhijit Mahalunkar and Giancarlo Salton and Kelleher, {John D.}",
note = "Publisher Copyright: {\textcopyright} Springer Nature Switzerland AG 2018.; 27th International Conference on Artificial Neural Networks, ICANN 2018 ; Conference date: 04-10-2018 Through 07-10-2018",
year = "2018",
doi = "10.1007/978-3-030-01418-6_18",
language = "English",
isbn = "9783030014179",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "176--187",
editor = "Vera Kurkova and Barbara Hammer and Yannis Manolopoulos and Lazaros Iliadis and Ilias Maglogiannis",
booktitle = "Artificial Neural Networks and Machine Learning – ICANN 2018 - 27th International Conference on Artificial Neural Networks, 2018, Proceedings",
address = "Germany",
}