% EUSIPCO 2020 conference paper (Chien, Liao, El Naqa). The citation key is kept
% unchanged so existing \cite commands still resolve.
% Author names use the unambiguous "Last, First" form; "El Naqa" is a compound surname.
% Copyright boilerplate is stored in the non-standard `copyright` field, which
% standard styles ignore, so it no longer prints as part of the reference.
@inproceedings{864f550569d24e2fb6f066578104a726,
  author    = {Chien, Jen-Tzung and Liao, Wei Lin and El Naqa, Issam},
  title     = {Exploring state transition uncertainty in variational reinforcement learning},
  booktitle = {28th European Signal Processing Conference, {EUSIPCO} 2020 - Proceedings},
  series    = {European Signal Processing Conference},
  publisher = {European Signal Processing Conference, EUSIPCO},
  pages     = {1527--1531},
  year      = {2021},
  month     = jan,
  day       = {24},
  doi       = {10.23919/Eusipco47968.2020.9287440},
  language  = {English},
  keywords  = {Machine learning, Reward optimization},
  abstract  = {Model-free agent in reinforcement learning (RL) generally performs well but inefficient in training process with sparse data. A practical solution is to incorporate a model-based module in model-free agent. State transition can be learned to make desirable prediction of next state based on current state and action at each time step. This paper presents a new learning representation for variational RL by introducing the so-called transition uncertainty critic based on the variational encoder-decoder network where the uncertainty of structured state transition is encoded in a model-based agent. In particular, an action-gating mechanism is carried out to learn and decode the trajectory of actions and state transitions in latent variable space. The transition uncertainty maximizing exploration (TUME) is performed according to the entropy search by using the intrinsic reward based on the uncertainty measure corresponding to different states and actions. A dedicate latent variable model with a penalty using the bias of state-action value is developed. Experiments on Cart Pole and dialogue system show that the proposed TUME considerably performs better than the other exploration methods for reinforcement learning.},
  note      = {28th European Signal Processing Conference, EUSIPCO 2020; Conference date: 24-08-2020 through 28-08-2020},
  copyright = {Publisher Copyright: {\textcopyright} 2021 European Signal Processing Conference, EUSIPCO. All rights reserved. Copyright: Copyright 2021 Elsevier B.V., All rights reserved.},
}