% This file was created with JabRef 2.7b.
% Encoding: UTF-8
---|
| 3 | |
---|
% Anderson and Moore, "Optimal Control: Linear Quadratic Methods" (1990).
% Filed as a BOOK: the publisher and its city used to be packed into the
% journal field of an ARTICLE entry, and the two authors were separated by
% a comma, which BibTeX reads as a single malformed name.
@BOOK{7_lq_methods,
  author    = {Anderson, B. D. O. and Moore, J. B.},
  title     = {Optimal Control: Linear Quadratic Methods},
  publisher = {Prentice Hall},
  address   = {Englewood Cliffs, NJ},
  year      = {1990},
  owner     = {jabu},
  timestamp = {2011.11.24}
}
---|
| 12 | |
---|
% Bellman, "Dynamic Programming" (1957).
% Filed as a BOOK: the publisher name was previously stored in the journal
% field of an ARTICLE entry.
@BOOK{dynamic_programming,
  author    = {Bellman, R.},
  title     = {Dynamic Programming},
  publisher = {Princeton University Press},
  year      = {1957}
}
---|
| 19 | |
---|
% Ferreira, Subrahmanian and Manstetten (2001), decentralized traffic control
% with intelligent agents.
% Initials are now space-separated ("E. D.") so abbreviating styles keep both.
% NOTE(review): the journal value may actually be a conference proceedings
% title - confirm, and if so switch to an INPROCEEDINGS entry with booktitle.
@ARTICLE{2_int_a_in_dec,
  author  = {Ferreira, E. D. and Subrahmanian, E. and Manstetten, D.},
  title   = {Intelligent agents in decentralized traffic control},
  journal = {Intelligent Transportation Systems},
  year    = {2001}
}
---|
| 26 | |
---|
% Gmytrasiewicz and Durfee (1995), formalization of recursive modeling.
% Filed as INPROCEEDINGS: the venue is a conference, so it belongs in
% booktitle rather than journal. A stray leading space was also dropped.
@INPROCEEDINGS{4_rmm_formalization,
  author    = {Gmytrasiewicz, P. J. and Durfee, E. H.},
  title     = {A rigorous, operational formalization of recursive modeling},
  booktitle = {First International Conference on Multiagent Systems},
  year      = {1995}
}
---|
| 33 | |
---|
% Nagy et al. (2002), Czech-language article on Bayesian learning in Automa.
% The author list used to end with the editor placeholder "NewAuthor2"; it is
% replaced by "and others" so no bogus name is printed.
% NOTE(review): confirm the missing co-author against the article and replace
% "and others" with the real name.
% Accented letters are wrapped as BibTeX special characters, and the accented
% i uses the dotless form so the accent does not sit on top of the dot.
@ARTICLE{5_bayes_learn,
  author  = {Nagy, I. and Nedoma, P. and Ettler, P. and Pavelkov{\'a}, L. and others},
  title   = {O bayesovsk{\'e}m u{\v{c}}en{\'\i}},
  journal = {Automa},
  year    = {2002}
}
---|
| 40 | |
---|
% Ou, Zhang and Xu (2002), urban traffic multi-agent system using RMM and
% Bayesian learning.
% Filed as INPROCEEDINGS: the venue is a conference, so it belongs in
% booktitle. The acronym and the proper noun in the title are brace-protected
% so sentence-casing styles do not lowercase them.
@INPROCEEDINGS{1_rmm_bayes_learning,
  author    = {Ou, H. and Zhang, W. and Xu, X.},
  title     = {Urban traffic multi-agent system based on {RMM} and {Bayesian} learning},
  booktitle = {American Control Conference},
  year      = {2002}
}
---|
| 47 | |
---|
% Pecherkova, Dunik and Flidr (2008), joint state and parameter estimation
% for a traffic system.
% Names were written "Surname Initial" without a comma, which BibTeX parses
% with the initial as the surname; they now use the "Last, First" form.
% The title was split by a blank line and is joined onto one line.
% NOTE(review): the third author has no given name or initial here - add it.
% NOTE(review): the journal value may be a book title (chapter in an edited
% volume) - confirm, and if so use INCOLLECTION with booktitle and publisher.
@ARTICLE{17_fronta,
  author    = {Pecherkov{\'a}, P. and Dun{\'\i}k, J. and Fl{\'\i}dr},
  title     = {Modelling and Simultaneous Estimation of State and Parameters of Traffic System},
  journal   = {Robotics, Automation and Control},
  year      = {2008},
  owner     = {jabu},
  timestamp = {2011.12.31}
}
---|
| 58 | |
---|
% Sutton (1988), temporal-difference learning, in Machine Learning.
% Title typo fixed: "didffrences" now reads "differences".
% NOTE(review): volume, number and pages are not recorded - add when known.
@ARTICLE{learning_to_predict,
  author  = {Sutton, R. S.},
  title   = {Learning to predict by the methods of temporal differences},
  journal = {Machine Learning},
  year    = {1988}
}
---|
| 65 | |
---|
% Thorpe (1997), master's thesis on traffic light control using SARSA.
% Filed as MASTERSTHESIS: the thesis type and school were previously packed
% into the journal field, with a non-ASCII apostrophe, of an ARTICLE entry.
% Title fixed: "controlusing" now reads "control using", and the acronym is
% brace-protected against lowercasing.
@MASTERSTHESIS{tlc_using_sarsa,
  author = {Thorpe, T.},
  title  = {Vehicle traffic light control using {SARSA}},
  school = {Department of Computer Science, Colorado State University},
  year   = {1997}
}
---|
| 72 | |
---|
% Dinopoulou, Diakaki and Papageorgiou (2005), applications of the TUC urban
% traffic control strategy.
% Authors were separated by commas, which BibTeX reads as one malformed name;
% they are now joined with "and" in "Last, First" form.
% The acronym TUC is brace-protected against lowercasing.
@ARTICLE{6_tuc_lq,
  author    = {Dinopoulou, Vaya and Diakaki, Christina and Papageorgiou, Markos},
  title     = {Applications of the urban traffic control strategy {TUC}},
  journal   = {European Journal of Operational Research},
  year      = {2005},
  owner     = {jabu},
  timestamp = {2011.11.24}
}
---|
| 81 | |
---|
% Watkins (1989), PhD thesis on learning from delayed rewards.
% Filed as PHDTHESIS: the thesis type, college and location were previously
% packed into the journal field of an ARTICLE entry.
% Title typo fixed: "Leraning" now reads "Learning".
% The citation key keeps its original misspelling on purpose, so existing
% citations of this entry continue to resolve.
@PHDTHESIS{leraning_from_delayed_rewards,
  author  = {Watkins, C. J. C. H.},
  title   = {Learning from Delayed Rewards},
  school  = {King's College},
  address = {Cambridge, England},
  year    = {1989}
}
---|
| 88 | |
---|
% Watkins and Dayan (1992), Q-learning, in Machine Learning.
% Title typo fixed: "Q-leraning" now reads "Q-learning". The letter Q is
% brace-protected so sentence-casing styles keep it uppercase.
% NOTE(review): volume, number and pages are not recorded - add when known.
@ARTICLE{q_learning,
  author  = {Watkins, C. J. C. H. and Dayan, P.},
  title   = {{Q}-learning},
  journal = {Machine Learning},
  year    = {1992}
}
---|
| 95 | |
---|
% Wiering, Van Veenen, Vreeken and Koopman (2003), intelligent traffic light
% control. The braces around "Van Veenen" keep the two words together as one
% surname.
% NOTE(review): the journal value looks like an organization name rather than
% a periodical title - confirm the actual publication name.
@ARTICLE{3_i_traff_light_c,
  author  = {M. Wiering and J. {Van Veenen} and J. Vreeken and A. Koopman},
  title   = {Intelligent traffic light control},
  journal = {European Research Consortium for Informatics and Mathematics},
  year    = {2003}
}
---|
| 102 | |
---|
% Wooldridge, "Multi Agent Systems" (MIT Press, March 2005).
% Fields are listed author-first; month uses the predefined three-letter
% macro, unquoted. The key field repeats the citation key as a sort/label
% fallback.
@BOOK{wooldridge,
  author    = {Michael Wooldridge},
  title     = {Multi Agent Systems},
  publisher = {MIT Press},
  year      = {2005},
  month     = mar,
  key       = {wooldridge}
}
---|