@inproceedings{678cad2b0c35445d80e21216d81b7209,
title = "Learning goal-oriented visual dialog agents: Imitating and surpassing analytic experts",
abstract = "This paper tackles the problem of learning a questioner in the goal-oriented visual dialog task. Several previous works adopt model-free reinforcement learning. Most pretrain the model from a finite set of human-generated data. We argue that using limited demonstrations to kick-start the questioner is insufficient due to the large policy search space. Inspired by a recently proposed information theoretic approach, we develop two analytic experts to serve as a source of high-quality demonstrations for imitation learning. We then take advantage of reinforcement learning to refine the model towards the goal-oriented objective. Experimental results on the GuessWhat?! dataset show that our method has the combined merits of imitation and reinforcement learning, achieving the state-of-the-art performance.",
keywords = "Goal oriented visual dialog, Imitation learning, Reinforcement learning",
author = "Chang, {Yen Wei} and Wen-Hsiao Peng",
year = "2019",
month = jul,
day = "1",
doi = "10.1109/ICME.2019.00096",
language = "English",
series = "Proceedings - IEEE International Conference on Multimedia and Expo",
publisher = "IEEE Computer Society",
pages = "520--525",
booktitle = "Proceedings - 2019 IEEE International Conference on Multimedia and Expo, ICME 2019",
address = "United States",
note = "2019 IEEE International Conference on Multimedia and Expo, ICME 2019 ; Conference date: 08-07-2019 Through 12-07-2019",
}