The game of Jeopardy! features four types of strategic decision-making: 1) Daily Double wagering; 2) Final Jeopardy! wagering; 3) selecting the next square when in control of the board; and 4) deciding whether to attempt to answer, i.e., buzz in. Strategies that properly account for the game state and future event probabilities can yield a huge boost in overall winning chances, when compared with simple rule-of-thumb strategies. In this paper, we present an approach to developing and testing components to make said strategy decisions, founded upon development of reasonably faithful simulation models of the players and the Jeopardy! game environment. We describe machine learning and Monte Carlo methods used in simulations to optimize the respective strategy algorithms. Application of these methods yielded superhuman game strategies for IBM Watson that significantly enhanced its overall competitive record.
%0 Journal Article
%1 TesauroGondekEtAl12ibmjrd
%A Tesauro, G.
%A Gondek, D. C.
%A Lenchner, J.
%A Fan, J.
%A Prager, J. M.
%D 2012
%J IBM Journal of Research and Development
%K 01801 ieee paper ibm ai answer application optimize zzz.iui
%N 3/4
%P 16:1--16:11
%R 10.1147/JRD.2012.2188931
%T Simulation, Learning, and Optimization Techniques in Watson's Game Strategies
%V 56
%X The game of Jeopardy! features four types of strategic decision-making: 1) Daily Double wagering; 2) Final Jeopardy! wagering; 3) selecting the next square when in control of the board; and 4) deciding whether to attempt to answer, i.e., buzz in. Strategies that properly account for the game state and future event probabilities can yield a huge boost in overall winning chances, when compared with simple rule-of-thumb strategies. In this paper, we present an approach to developing and testing components to make said strategy decisions, founded upon development of reasonably faithful simulation models of the players and the Jeopardy! game environment. We describe machine learning and Monte Carlo methods used in simulations to optimize the respective strategy algorithms. Application of these methods yielded superhuman game strategies for IBM Watson that significantly enhanced its overall competitive record.
@article{TesauroGondekEtAl12ibmjrd,
abstract = {The game of Jeopardy! features four types of strategic decision-making: 1) Daily Double wagering; 2) Final Jeopardy! wagering; 3) selecting the next square when in control of the board; and 4) deciding whether to attempt to answer, i.e., buzz in. Strategies that properly account for the game state and future event probabilities can yield a huge boost in overall winning chances, when compared with simple rule-of-thumb strategies. In this paper, we present an approach to developing and testing components to make said strategy decisions, founded upon development of reasonably faithful simulation models of the players and the Jeopardy! game environment. We describe machine learning and Monte Carlo methods used in simulations to optimize the respective strategy algorithms. Application of these methods yielded superhuman game strategies for IBM Watson that significantly enhanced its overall competitive record.},
added-at = {2017-11-13T14:45:01.000+0100},
author = {Tesauro, G. and Gondek, D. C. and Lenchner, J. and Fan, J. and Prager, J. M.},
biburl = {https://www.bibsonomy.org/bibtex/2d48d7c79c44031c8e47d5204c6bb219a/flint63},
doi = {10.1147/JRD.2012.2188931},
file = {IEEE Digital Library:2012/TesauroGondekEtAl12ibmjrd.pdf:PDF},
groups = {public},
interhash = {2ca184935be87a2d053865f0afad067a},
intrahash = {d48d7c79c44031c8e47d5204c6bb219a},
issn = {0018-8646},
journal = {IBM Journal of Research and Development},
keywords = {01801 ieee paper ibm ai answer application optimize zzz.iui},
number = {3/4},
pages = {16:1--16:11},
timestamp = {2018-04-16T11:49:44.000+0200},
title = {Simulation, Learning, and Optimization Techniques in {Watson}'s Game Strategies},
username = {flint63},
volume = 56,
year = 2012
}