<?xml version="1.0"?>
<!-- name="generator" content="blosxom/2.0" -->
<!DOCTYPE rss PUBLIC "-//Netscape Communications//DTD RSS 0.91//EN" "http://my.netscape.com/publish/formats/rss-0.91.dtd">

<rss version="0.91">
  <channel>
    <title>Notebooks   </title>
    <link>http://bactra.org/notebooks</link>
    <description>Cosma's Notebooks</description>
    <language>en</language>

  <item>
    <title>Learning in Games</title>
    <link>http://bactra.org/notebooks/2009/11/21#learning-games</link>
    <description>
&lt;P&gt;See also
	&lt;a href=&quot;collective-cognition.html&quot;&gt;Collective Cognition&lt;/a&gt;;
	&lt;a href=&quot;evol-econ.html&quot;&gt;Evolutionary Economics&lt;/a&gt;;
	&lt;a href=&quot;learning-inference-induction.html&quot;&gt;Machine Learning, Statistical Inference and Induction&lt;/a&gt;;
	the &lt;a href=&quot;minority-game.html&quot;&gt;Minority Game&lt;/a&gt;;
	&lt;a href=&quot;sequential-decisions.html&quot;&gt;Sequential Decisions Under
Uncertainty&lt;/a&gt;;
	&lt;a href=&quot;universal-prediction.html&quot;&gt;Universal Prediction Algorithms&lt;/A&gt;

&lt;ul&gt;Recommended:
	&lt;li&gt;Jenna Bednar and Scott Page, &quot;Games Theory and Culture&quot; [&lt;a
href=&quot;http://www-personal.umich.edu/~jbednar/papers.htm#culturepaper&quot;&gt;PDF&lt;/a&gt;]
	&lt;li&gt;Nicolo Cesa-Bianchi and Gabor Lugosi, &lt;citE&gt;Prediction, Learning,
and Games&lt;/cite&gt; [&lt;a href=&quot;../weblog/algae-2008-07.html#prediction&quot;&gt;Mini-review&lt;/a&gt;]
	&lt;li&gt;Dean P. Foster and H. Peyton Young, &quot;Learning, hypothesis testing,
and Nash equilibrium,&quot; &lt;cite&gt;Games and Economic
Behavior&lt;/cite&gt; &lt;strong&gt;45&lt;/strong&gt; (2003): 73--96 [&lt;a
href=&quot;http://gosset.wharton.upenn.edu/~foster/research/nash.pdf&quot;&gt;pdf&lt;/a&gt;]
	&lt;li&gt;Herbert Gintis, &lt;cite&gt;Game Theory Evolving: A Problem-Centered
Introduction to Modeling Strategic Interaction&lt;/cite&gt;
	&lt;li&gt;Ariel Rubinstein, &lt;cite&gt;Modeling Bounded Rationality&lt;/cite&gt; [&lt;a
href=&quot;../reviews/modeling-bounded-rationality/&quot;&gt;Review: &lt;em&gt;O docta
simplicitas!&lt;/em&gt;&lt;/a&gt;]
	&lt;li&gt;Larry Samuelson (no relation of &lt;em&gt;the&lt;/em&gt; Samuelson),
&lt;cite&gt;Evolutionary Games and Equilibrium Selection&lt;/cite&gt;
	&lt;li&gt;Jos&amp;eacute; M. Vidal and Edmund H. Durfee, &quot;Predicting the Expected
Behavior of Agents That Learn About Agents: The CLRI Framework,&quot; &lt;a
href=&quot;http://arxiv.org/abs/cs.MA/0001008&quot;&gt;cs.MA/0001008&lt;/a&gt;
	&lt;li&gt;H. Peyton Young, &lt;cite&gt;Individual Strategy and Social Structure: An
Evolutionary Theory of Institutions&lt;/cite&gt; [&lt;a
href=&quot;../reviews/young-strategy-and-structure/&quot;&gt;Review: A Myopic (and Sometimes
Blind) Eye on the Main Chance, or, the Origins of Custom&lt;/a&gt;]
	&lt;/ul&gt;

&lt;ul&gt;To read:
	&lt;li&gt;Jacob Abernethy, Alekh Agarwal, Peter L. Bartlett, Alexander Rakhlin, &quot;A Stochastic View of Optimal Regret through Minimax Duality&quot;, &lt;a href=&quot;http://arxiv.org/abs/0903.5328&quot;&gt;arxiv:0903.5328&lt;/a&gt;
	&lt;li&gt;James Bergin and Barton L. Lipman, 1996, &quot;Evolution with
State-Dependent Mutations,&quot; &lt;cite&gt;Econometrica&lt;/cite&gt; &lt;strong&gt;64&lt;/strong&gt;
(1996): 943--956
	&lt;li&gt;Andreas Blume, &quot;A Learning-Efficiency Explanation of Structure in
Language&quot;, &lt;a href=&quot;http://dx.doi.org/10.1007/s11238-005-0280-1&quot;&gt;&lt;cite&gt;Theory
and Decision&lt;/cite&gt; &lt;strong&gt;57&lt;/strong&gt; (2004): 265--285&lt;/a&gt;
	&lt;li&gt;Lawrence E. Blume and David Easley
		&lt;ul&gt;
		&lt;li&gt;&quot;If You're So Smart, Why Aren't You Rich?  Belief Selection
in Complete and Incomplete Markets,&quot; SFI Working Paper 01-06-031
		&lt;li&gt;&quot;Optimality and Natural Selection in Markets,&quot; &lt;a
href=&quot;http://www.santafe.edu/sfi/publications/Abstracts/98-09-082abs.html&quot;&gt;SFI
Working Paper 98-09-0 82&lt;/a&gt;
		&lt;/ul&gt;
	&lt;li&gt;Oliver Board, &quot;Dynamic interactive epistemology&quot;, &lt;a
href=&quot;http://dx.doi.org/10.1016/j.geb.2003.10.006&quot;&gt;&lt;cite&gt;Games and
Economic Behavior&lt;/cite&gt; &lt;strong&gt;49&lt;/strong&gt; (2004): 49--80&lt;/a&gt;
	&lt;li&gt;Christophe Chamley, &lt;cite&gt;Rational Herds: Economic Models of Social
Learning&lt;/cite&gt;
	&lt;li&gt;Emilio De Santis and Carlo Marinelli, &quot;Stochastic games with
infinitely many interacting
agents&quot;, &lt;a href=&quot;http://arxiv.org/abs/math.PR/0505608&quot;&gt;math.PR/0505608&lt;/a&gt;
[Sounds very cool: &quot;study a class of infinite-horizon non-zero-sum
non-cooperative stochastic games with infinitely many interacting agents using
ideas of statistical mechanics.... in the general case of asymmetric
interactions, the existence of a strategy that allows any player to eliminate
losses after a finite random time.  In the special case of symmetric
interactions ... as time goes to infinity, the game converges to a Nash
equilibrium. Moreover, assuming that all agents adopt the same strategy, using
arguments related to those leading to perfect simulation algorithms, spatial
mixing and ergodicity are proved ... ergodicity [implies] ``fixation'',
i.e. that players will adopt a constant strategy after a finite
time. ... related to zero-temperature Glauber dynamics on random graphs of
possibly infinite volume.&quot;]
	&lt;li&gt;Pradeep Dubey and Ori Haimanko, &quot;Learning with Perfect
Information&quot;, &lt;a
href=&quot;http://dx.doi.org/10.1016/S0899-8256(03)00127-1&quot;&gt;&lt;cite&gt;Games and Economic
Behavior&lt;/cite&gt; &lt;strong&gt;46&lt;/strong&gt; (2004): 304--324&lt;/a&gt;
	&lt;li&gt;Jim Engle-Warnick, William J. McCausland and John H. Miller,
&quot;The Ghost in the Machine: Inferring Machine-Based Strategies from
Observed Behavior&quot; [i.e., inferring stochastic transducers from data; hence
the inclusion here]
	&lt;li&gt;Anders Eriksson and Kristian Lindgren, &quot;A simple model of cognitive
processing in repeated
games&quot;, &lt;a href=&quot;http://arxiv.org/abs/q-bio.PE/0608015&quot;&gt;q-bio.PE/0608015&lt;/a&gt;
	&lt;li&gt;Fudenberg and Levine, &lt;cite&gt;The Theory of Learning in Games&lt;/cite&gt;
	&lt;li&gt;Douglas Gale and Hamid Sabourian, &quot;Complexity and Competition&quot;,
&lt;a
href=&quot;http://dx.doi.org/10.1111/j.1468-0262.2005.00595.x&quot;&gt;&lt;cite&gt;Econometrica&lt;/cite&gt; &lt;strong&gt;73&lt;/strong&gt;
(2005): 739--769&lt;/a&gt; [&quot;Extensive-form market games typically have a large
number of noncompetitive equilibria. In this paper, we argue that the
complexity of noncompetitive behavior provides a justification for competitive
equilibrium in the sense that if rational agents have an aversion to complexity
(at the margin), then maximizing behavior will result in simple behavioral
rules and hence in a competitive outcome. For this purpose, we use a class of
extensive-form dynamic matching and bargaining games with a finite number of
agents. In particular, we consider markets with heterogeneous buyers and
sellers and deterministic, exogenous, sequential matching rules, although the
results can be extended to other matching processes. If the complexity costs of
implementing strategies enter players' preferences lexicographically with the
standard payoff, then every equilibrium strategy profile induces a competitive
outcome.&quot;]
	&lt;li&gt;Val E. Lambson and Daniel A. Probst, &quot;Learning by Matching
Patterns&quot;, &lt;a
href=&quot;http://dx.doi.org/10.1016/S0899-8256(03)00125-8&quot;&gt;&lt;cite&gt;Games and Economic
Behavior&lt;/cite&gt; &lt;strong&gt;46&lt;/strong&gt; (2004): 398--409&lt;/a&gt;
	&lt;li&gt;Jacek Miekisz
		&lt;ul&gt;
		&lt;li&gt;&quot;Statistical mechanics of spatial evolutionary games&quot;, &lt;a
href=&quot;http://arxiv.org/abs/cond-mat/0210094&quot;&gt;cond-mat/0210094&lt;/a&gt;
		&lt;li&gt;&quot;Stochastic stability in spatial games&quot;, &lt;a
href=&quot;http://arxiv.org/abs/cond-mat/0409647&quot;&gt;cond-mat/0409647&lt;/a&gt; = &lt;cite&gt;Journal of Statistical Physics&lt;/cite&gt; &lt;strong&gt;117&lt;/strong&gt; (2004): 99--110
		&lt;li&gt;&quot;Long-run behavior of games with many players&quot;, &lt;a
href=&quot;http://arxiv.org/abs/cond-mat/0409742&quot;&gt;cond-mat/0409742&lt;/a&gt;
		&lt;/ul&gt;
	&lt;li&gt;Gillies Pag&amp;egrave;s, &quot;A two armed bandit type problem
revisited&quot;, &lt;a href=&quot;http://arxiv.org/abs/math.PR/0502182&quot;&gt;math.PR/0502182&lt;/a&gt;
	&lt;li&gt;Liviu Panait, Karl Tuyls, Sean Luke, &quot;Theoretical Advantages of
Lenient Learners: An Evolutionary Game Theoretic Perspective&quot;,
&lt;a href=&quot;http://jmlr.csail.mit.edu/papers/v9/panait08a.html&quot;&gt;&lt;cite&gt;Journal of
Machine Learning Research&lt;/cite&gt; &lt;strong&gt;9&lt;/strong&gt; (2008): 423--457&lt;/a&gt;
	&lt;li&gt;Mark Stegeman and Paul Rhode, &quot;Stochastic Darwinian equilibria in
small and large populations&quot;, &lt;a
href=&quot;http://dx.doi.org/10.1016/j.geb.2003.10.005&quot;&gt;&lt;cite&gt;Games and Economic
Behavior&lt;/cite&gt; &lt;strong&gt;49&lt;/strong&gt; (2004): 171--214&lt;/a&gt;
	&lt;li&gt;Jos&amp;eacute; M. Vidal, &lt;cite&gt;Computational Agents That Learn About
Agents: Algorithms for Their Design and a Predictive Theory of Their
Behavior&lt;/cite&gt; [Ph.D. thesis, U. Michigan, 1998;
&lt;a href=&quot;http://jmvidal.ece.sc.edu/papers/diss/&quot;&gt;on-line&lt;/a&gt;]
	&lt;/ul&gt;
</description>
  </item>
  </channel>
</rss>