@inproceedings{0d3db53fb5754ff89e596d6fd4e549de,
title = "Logistic Markov decision processes",
abstract = "User modeling in advertising and recommendation has typically focused on myopic predictors of user responses. In this work, we consider the long-term decision problem associated with user interaction. We propose a concise specification of long-term interaction dynamics by combining factored dynamic Bayesian networks with logistic predictors of user responses, allowing state-of-the-art prediction models to be seamlessly extended. We show how to solve such models at scale by providing a constraint generation approach for approximate linear programming that overcomes the variable coupling and nonlinearity induced by the logistic regression predictor. The efficacy of the approach is demonstrated on advertising domains with up to 254 states and 239 actions.",
author = "Martin Mladenov and Ofer Meshi and Craig Boutilier and Gal Elidan and Dale Schuurmans and Tyler Lu",
year = "2017",
doi = "10.24963/ijcai.2017/346",
language = "אנגלית",
series = "IJCAI International Joint Conference on Artificial Intelligence",
publisher = "International Joint Conferences on Artificial Intelligence",
pages = "2486--2493",
editor = "Carles Sierra",
booktitle = "26th International Joint Conference on Artificial Intelligence, IJCAI 2017",
note = "26th International Joint Conference on Artificial Intelligence, IJCAI 2017 ; Conference date: 19-08-2017 Through 25-08-2017",
}