iBet uBet web content aggregator. Adding the entire web to your favor.
iBet uBet web content aggregator. Adding the entire web to your favor.



Link to original content: https://api.crossref.org/works/10.1142/S0219525902000535
{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,6,1]],"date-time":"2024-06-01T22:30:46Z","timestamp":1717281046701},"reference-count":15,"publisher":"World Scientific Pub Co Pte Lt","issue":"01","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Advs. Complex Syst."],"published-print":{"date-parts":[[2002,3]]},"abstract":" A population of agents plays a stochastic dynamic game wherein there is an underlying state process with a Markovian dynamics that also affects their costs. A learning mechanism is proposed which takes into account intertemporal effects and incorporates an explicit process of expectation formation. The agents use this scheme to update their mixed strategies incrementally. The asymptotic behavior of this scheme is captured by an associated ordinary differential equation. Both the formulation and the analysis of the scheme draw upon the theory of reinforcement learning in artificial intelligence. <\/jats:p>","DOI":"10.1142\/s0219525902000535","type":"journal-article","created":{"date-parts":[[2002,7,27]],"date-time":"2002-07-27T11:07:52Z","timestamp":1027768072000},"page":"55-72","source":"Crossref","is-referenced-by-count":15,"title":["REINFORCEMENT LEARNING IN MARKOVIAN EVOLUTIONARY GAMES"],"prefix":"10.1142","volume":"05","author":[{"given":"V. S.","family":"BORKAR","sequence":"first","affiliation":[{"name":"School of Technology and Computer Science, Tata Institute of Fundamental Research, Homi Bhabha Road, Mumbai 400005, India"}]}],"member":"219","published-online":{"date-parts":[[2011,11,20]]},"reference":[{"key":"p_1","doi-asserted-by":"publisher","DOI":"10.1109\/TSMC.1983.6313077"},{"key":"p_3","doi-asserted-by":"publisher","DOI":"10.1006\/game.1999.0717"},{"key":"p_4","doi-asserted-by":"publisher","DOI":"10.1023\/A:1026463628355"},{"key":"p_8","doi-asserted-by":"publisher","DOI":"10.1006\/jeth.1997.2319"},{"key":"p_9","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6911(97)90015-3"},{"key":"p_10","first-page":"155","author":"Borkar V. S.","year":"1998","journal-title":"Physica D125"},{"key":"p_13","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007518724497"},{"key":"p_14","doi-asserted-by":"publisher","DOI":"10.2307\/1426945"},{"key":"p_15","doi-asserted-by":"publisher","DOI":"10.1006\/game.1993.1021"},{"key":"p_20","doi-asserted-by":"publisher","DOI":"10.1016\/0022-0396(81)90038-3"},{"key":"p_22","doi-asserted-by":"publisher","DOI":"10.1137\/S036301299731669X"},{"key":"p_23","doi-asserted-by":"publisher","DOI":"10.1016\/S1389-0417(01)00015-8"},{"key":"p_25","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177729586"},{"key":"p_33","doi-asserted-by":"publisher","DOI":"10.1023\/A:1007514623589"},{"key":"p_35","doi-asserted-by":"publisher","DOI":"10.1142\/S0219525901000188"}],"container-title":["Advances in Complex Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.worldscientific.com\/doi\/pdf\/10.1142\/S0219525902000535","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,8,6]],"date-time":"2019-08-06T20:28:40Z","timestamp":1565123320000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.worldscientific.com\/doi\/abs\/10.1142\/S0219525902000535"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2002,3]]},"references-count":15,"journal-issue":{"issue":"01","published-online":{"date-parts":[[2011,11,20]]},"published-print":{"date-parts":[[2002,3]]}},"alternative-id":["10.1142\/S0219525902000535"],"URL":"http:\/\/dx.doi.org\/10.1142\/s0219525902000535","relation":{},"ISSN":["0219-5259","1793-6802"],"issn-type":[{"value":"0219-5259","type":"print"},{"value":"1793-6802","type":"electronic"}],"subject":[],"published":{"date-parts":[[2002,3]]}}}