% Bibliography database: multi-agent systems, traffic-light control and
% reinforcement learning references.
%
% Conventions used in this file:
%   - one field per line, brace-delimited values, authors in "Last, First" form;
%   - citation keys are kept exactly as they were (including historical
%     misspellings) so that existing citations keep resolving;
%   - acronyms and proper nouns in titles are brace-protected so that styles
%     applying sentence casing do not lowercase them.

% ---------------------------------------------------------------------------
% Multi-agent systems
% ---------------------------------------------------------------------------

% The "key" field is only a sorting/label fallback; it is kept because it was
% present in the original record.
@book{wooldridge,
  author    = {Wooldridge, Michael},
  title     = {Multi Agent Systems},
  publisher = {MIT Press},
  month     = mar,
  year      = {2005},
  key       = {wooldridge},
}

% Conference contribution: the venue belongs in "booktitle", not "journal".
@inproceedings{1_rmm_bayes_learning,
  author    = {Ou, H. and Zhang, W. and Xu, X.},
  title     = {Urban traffic multi-agent system based on {RMM} and {Bayesian} learning},
  booktitle = {American Control Conference},
  year      = {2002},
}

% NOTE(review): the venue name does not say whether this is a journal or a
% proceedings volume; left as an article until confirmed.
@article{2_int_a_in_dec,
  author  = {Ferreira, E. D. and Subrahmanian, E. and Manstetten, D.},
  title   = {Intelligent agents in decentralized traffic control},
  journal = {Intelligent Transportation Systems},
  year    = {2001},
}

% NOTE(review): the "journal" value is the name of an organisation; confirm the
% actual publication title.
@article{3_i_traff_light_c,
  author  = {Wiering, M. and {Van Veenen}, J. and Vreeken, J. and Koopman, A.},
  title   = {Intelligent traffic light control},
  journal = {European Research Consortium for Informatics and Mathematics},
  year    = {2003},
}

% Conference contribution: the venue belongs in "booktitle", not "journal".
@inproceedings{4_rmm_formalization,
  author    = {Gmytrasiewicz, P. J. and Durfee, E. H.},
  title     = {A rigorous, operational formalization of recursive modeling},
  booktitle = {First International Conference on Multiagent Systems},
  year      = {1995},
}

% Accents are written as brace-wrapped special characters so that classic
% BibTeX sorts and cases them as single letters.
% NOTE(review): "NewAuthor2" looks like a placeholder rather than a real author
% name; it is preserved here unchanged. Confirm against the publication.
@article{5_bayes_learn,
  author  = {Nagy, I. and Nedoma, P. and Ettler, P. and Pavelkov{\'a}, L. and NewAuthor2},
  title   = {O bayesovsk{\'e}m u{\v{c}}en{\'i}},
  journal = {Automa},
  year    = {2002},
}

% ---------------------------------------------------------------------------
% Reinforcement learning and dynamic programming
% ---------------------------------------------------------------------------

@article{learning_to_predict,
  author  = {Sutton, R. S.},
  title   = {Learning to predict by the methods of temporal differences},
  journal = {Machine Learning},
  year    = {1988},
}

% The original record named a publisher in the "journal" field; recorded as a
% book with that publisher.
@book{dynamic_programming,
  author    = {Bellman, R.},
  title     = {Dynamic programming},
  publisher = {Princeton University Press},
  year      = {1957},
}

% Thesis: the entry type supplies the "Master's thesis" label, so only the
% institution is stored in "school".
@mastersthesis{tlc_using_sarsa,
  author = {Thorpe, T.},
  title  = {Vehicle traffic light control using {SARSA}},
  school = {Department of Computer Science, Colorado State University},
  year   = {1997},
}

% Thesis: the entry type supplies the "PhD thesis" label. The citation key
% keeps its historical spelling on purpose.
@phdthesis{leraning_from_delayed_rewards,
  author = {Watkins, C. J. C. H.},
  title  = {Learning from Delayed Rewards},
  school = {King's College, Cambridge, England},
  year   = {1989},
}

@article{q_learning,
  author  = {Watkins, C. J. C. H. and Dayan, P.},
  title   = {{Q-learning}},
  journal = {Machine Learning},
  year    = {1992},
}