@inproceedings{0e4e9111993d4572aa5c2fc2bdfa2729,
title = "SentiCap: Generating image descriptions with sentiments",
abstract = "The recent progress on image recognition and language modeling is making automatic description of image content a reality. However, stylized, non-factual aspects of the written description are missing from the current systems. One such style is descriptions with emotions, which is commonplace in everyday communication, and influences decision-making and interpersonal relationships. We design a system to describe an image with emotions, and present a model that automatically generates captions with positive or negative sentiments. We propose a novel switching recurrent neural network with word-level regularization, which is able to produce emotional image captions using only 2000+ training sentences containing sentiments. We evaluate the captions with different automatic and crowd-sourcing metrics. Our model compares favourably in common quality metrics for image captioning. In 84.6\% of cases the generated positive captions were judged as being at least as descriptive as the factual captions. Of these positive captions 88\% were confirmed by the crowd-sourced workers as having the appropriate sentiment.",
author = "Alexander Mathews and Lexing Xie and Xuming He",
note = "Publisher Copyright: {\textcopyright} Copyright 2016, Association for the Advancement of Artificial Intelligence (www.aaai.org). All rights reserved.; 30th AAAI Conference on Artificial Intelligence, AAAI 2016 ; Conference date: 12-02-2016 Through 17-02-2016",
year = "2016",
language = "English",
series = "30th AAAI Conference on Artificial Intelligence, AAAI 2016",
publisher = "AAAI Press",
pages = "3574--3580",
booktitle = "30th AAAI Conference on Artificial Intelligence, AAAI 2016",
}