% Journal commentary by Hilbe and Traulsen, Physics of Life Reviews, volume 19 (2016).
@article{1200,
  author       = {Hilbe, Christian and Traulsen, Arne},
  journal      = {Physics of Life Reviews},
  pages        = {29--31},
  publisher    = {Elsevier},
  title        = {{Only the combination of mathematics and agent based simulations can leverage the full potential of evolutionary modeling: Comment on “Evolutionary game theory using agent-based methods” by C. Adami, J. Schossau and A. Hintze}},
  doi          = {10.1016/j.plrev.2016.10.004},
  volume       = {19},
  year         = {2016},
}

% Conference paper by Pandey and Chatterjee, ACM CSCW proceedings (2016).
% NOTE(review): the export carried number = Februar-2016, a German month-year
% string rather than an issue number; it is recorded as month = feb instead.
% The volume value 26 may be the day of that same date -- confirm against the
% publisher record and drop it if so.
@inproceedings{1245,
  abstract     = {To facilitate collaboration in massive online classrooms, instructors must make many decisions. For instance, the following parameters need to be decided when designing a peer-feedback system where students review each others' essays: the number of students each student must provide feedback to, an algorithm to map feedback providers to receivers, constraints that ensure students do not become free-riders (receiving feedback but not providing it), the best times to receive feedback to improve learning etc. While instructors can answer these questions by running experiments or invoking past experience, game-theoretic models with data from online learning platforms can identify better initial designs for further improvements. As an example, we explore the design space of a peer feedback system by modeling it using game theory. Our simulations show that incentivizing students to provide feedback requires the value obtained from receiving a feedback to exceed the cost of providing it by a large factor (greater than 7). Furthermore, hiding feedback from low-effort students incentivizes them to provide more feedback.},
  author       = {Pandey, Vineet and Chatterjee, Krishnendu},
  booktitle    = {Proceedings of the ACM Conference on Computer Supported Cooperative Work},
  location     = {San Francisco, CA, USA},
  month        = feb,
  pages        = {365--368},
  publisher    = {ACM},
  title        = {{Game-theoretic models identify useful principles for peer collaboration in online learning platforms}},
  doi          = {10.1145/2818052.2869122},
  volume       = {26},
  year         = {2016},
}

% Conference paper by Brázdil, Forejt, Kučera and Novotny, LIPIcs volume 59 (2016).
% NOTE(review): booktitle and series were missing from the export and have been
% filled in from the proceedings identified by the DOI -- confirm the exact
% wording against the publisher record.
@inproceedings{1325,
  abstract     = {We study graphs and two-player games in which rewards are assigned to states, and the goal of the players is to satisfy or dissatisfy certain property of the generated outcome, given as a mean payoff property. Since the notion of mean-payoff does not reflect possible fluctuations from the mean-payoff along a run, we propose definitions and algorithms for capturing the stability of the system, and give algorithms for deciding if a given mean payoff and stability objective can be ensured in the system.},
  author       = {Brázdil, Tomáš and Forejt, Vojtěch and Kučera, Antonín and Novotny, Petr},
  booktitle    = {27th International Conference on Concurrency Theory (CONCUR 2016)},
  location     = {Quebec City, Canada},
  publisher    = {Schloss Dagstuhl - Leibniz-Zentrum für Informatik},
  series       = {Leibniz International Proceedings in Informatics (LIPIcs)},
  title        = {{Stability in graphs and games}},
  doi          = {10.4230/LIPIcs.CONCUR.2016.10},
  volume       = {59},
  year         = {2016},
}

% Conference paper by Chatterjee and Chmelik, ICAPS proceedings, AAAI Press (2016).
% NOTE(review): the exported volume value 2016-January looked like a database
% date label rather than a volume number and has been dropped -- confirm.
@inproceedings{1324,
  abstract     = {DEC-POMDPs extend POMDPs to a multi-agent setting, where several agents operate in an uncertain environment independently to achieve a joint objective. DEC-POMDPs have been studied with finite-horizon and infinite-horizon discounted-sum objectives, and there exist solvers both for exact and approximate solutions. In this work we consider Goal-DEC-POMDPs, where given a set of target states, the objective is to ensure that the target set is reached with minimal cost. We consider the indefinite-horizon (infinite-horizon with either discounted-sum, or undiscounted-sum, where absorbing goal states have zero-cost) problem. We present a new and novel method to solve the problem that extends methods for finite-horizon DEC-POMDPs and the RTDP-Bel approach for POMDPs. We present experimental results on several examples, and show that our approach presents promising results.},
  author       = {Chatterjee, Krishnendu and Chmelik, Martin},
  booktitle    = {Proceedings of the Twenty-Sixth International Conference on Automated Planning and Scheduling},
  location     = {London, United Kingdom},
  pages        = {88--96},
  publisher    = {AAAI Press},
  title        = {{Indefinite-horizon reachability in Goal-DEC-POMDPs}},
  year         = {2016},
}

% Conference paper by Brázdil, Chatterjee, Chmelik, Gupta and Novotny, AAMAS proceedings (2016).
@inproceedings{1327,
  abstract     = {We consider partially observable Markov decision processes (POMDPs) with a set of target states and positive integer costs associated with every transition. The traditional optimization objective (stochastic shortest path) asks to minimize the expected total cost until the target set is reached. We extend the traditional framework of POMDPs to model energy consumption, which represents a hard constraint. The energy levels may increase and decrease with transitions, and the hard constraint requires that the energy level must remain positive in all steps till the target is reached. First, we present a novel algorithm for solving POMDPs with energy levels, developing on existing POMDP solvers and using RTDP as its main method. Our second contribution is related to policy representation. For larger POMDP instances the policies computed by existing solvers are too large to be understandable. We present an automated procedure based on machine learning techniques that automatically extracts important decisions of the policy allowing us to compute succinct human readable policies. Finally, we show experimentally that our algorithm performs well and computes succinct policies on a number of POMDP instances from the literature that were naturally enhanced with energy levels.},
  author       = {Brázdil, Tomáš and Chatterjee, Krishnendu and Chmelik, Martin and Gupta, Anchit and Novotny, Petr},
  booktitle    = {Proceedings of the 15th International Conference on Autonomous Agents and Multiagent Systems},
  location     = {Singapore},
  pages        = {1465--1466},
  publisher    = {ACM},
  title        = {{Stochastic shortest path with energy constraints in POMDPs}},
  year         = {2016},
}