@inproceedings{713b4d1de7d84e5b87ae07bf90a052e4,
title = "Log-linear dialog manager",
abstract = "We design a log-linear probabilistic model for solving the dialog management task. In both planning and learning we optimize the same objective function: the expected reward. Rather than performing full policy optimization, we perform on-line estimation of the optimal action as a belief-propagation inference step. We employ context-free grammars to describe our variable spaces, which enables us to define rich features. To scale our approach to large variable spaces, we use particle belief propagation. Experiments show that the model is able to choose system actions that yield a high expected reward, outperforming its POMDP-like log-linear counterpart and a hand-crafted rule-based system.",
keywords = "Dialog Manager, Log-linear Model, POMDP",
author = "Hao Tang and Shinji Watanabe and Marks, {Tim K.} and Hershey, {John R.}",
year = "2014",
doi = "10.1109/ICASSP.2014.6854371",
language = "English",
isbn = "9781479928927",
series = "ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "4092--4096",
booktitle = "2014 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2014",
note = "2014 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2014 ; Conference date: 04-05-2014 Through 09-05-2014",
}