iBet uBet web content aggregator. Adding the entire web to your favor.
iBet uBet web content aggregator. Adding the entire web to your favor.



Link to original content: https://api.crossref.org/works/10.1145/3331453.3360975
{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T20:49:08Z","timestamp":1730321348827,"version":"3.28.0"},"publisher-location":"New York, NY, USA","reference-count":17,"publisher":"ACM","license":[{"start":{"date-parts":[[2019,10,22]],"date-time":"2019-10-22T00:00:00Z","timestamp":1571702400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2019,10,22]]},"DOI":"10.1145\/3331453.3360975","type":"proceedings-article","created":{"date-parts":[[2019,10,21]],"date-time":"2019-10-21T13:34:22Z","timestamp":1571664862000},"page":"1-6","update-policy":"http:\/\/dx.doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Competitive Evolution Multi-Agent Deep Reinforcement Learning"],"prefix":"10.1145","author":[{"given":"Wenhong","family":"Zhou","sequence":"first","affiliation":[{"name":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"}]},{"given":"Yiting","family":"Chen","sequence":"additional","affiliation":[{"name":"College of Intelligence Science and Technology,National University of Defense Technology, Changsha, China"}]},{"given":"Jie","family":"Li","sequence":"additional","affiliation":[{"name":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"}]}],"member":"320","published-online":{"date-parts":[[2019,10,22]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.5555\/3237383.3237908"},{"volume-title":"W Liu and J Pan","year":"2018","author":"Fan T","key":"e_1_3_2_1_2_1","unstructured":"T Fan , P Long , W Liu and J Pan ( 2018 ). Fully Distributed Multi-Robot Collision Avoidance via Deep Reinforcement Learning for Safe and Efficient Navigation in Complex Scenarios. arXiv Prepr . arXiv1808.04099. T Fan, P Long, W Liu and J Pan (2018). Fully Distributed Multi-Robot Collision Avoidance via Deep Reinforcement Learning for Safe and Efficient Navigation in Complex Scenarios. arXiv Prepr. arXiv1808.04099."},{"volume-title":"J Wang and Y Yu","year":"2017","author":"Zheng L","key":"e_1_3_2_1_3_1","unstructured":"L Zheng , J Yang , H Cai , W Zhang , J Wang and Y Yu ( 2017 ). MAgent: A Many-Agent Reinforcement Learning Platform for Artificial Collective Intelligence. arXiv Prepr . arXiv1712.00600. L Zheng, J Yang, H Cai, W Zhang, J Wang and Y Yu (2017). MAgent: A Many-Agent Reinforcement Learning Platform for Artificial Collective Intelligence. arXiv Prepr. arXiv1712.00600."},{"volume-title":"Proc. 35th Int. Conf. Mach. Learn.","year":"2018","author":"Yang Y","key":"e_1_3_2_1_4_1","unstructured":"Y Yang , R Luo , M Li , M Zhou , W Zhang and J. Wang ( 2018 ). Mean Field Multi-Agent Reinforcement Learning . Proc. 35th Int. Conf. Mach. Learn. Y Yang, R Luo, M Li, M Zhou, W Zhang and J. Wang (2018). Mean Field Multi-Agent Reinforcement Learning. Proc. 35th Int. Conf. Mach. Learn."},{"volume-title":"V Kumar and A Ribeiro","year":"2018","author":"Khan A","key":"e_1_3_2_1_5_1","unstructured":"A Khan , C Zhang , D D Lee , V Kumar and A Ribeiro ( 2018 ). Scalable Centralized Deep Multi-Agent Reinforcement Learning via Policy Gradients. Arxiv 1805.08776. A Khan, C Zhang, D D Lee, V Kumar and A Ribeiro (2018). Scalable Centralized Deep Multi-Agent Reinforcement Learning via Policy Gradients. Arxiv 1805.08776."},{"first-page":"1","volume-title":"Towards Designing Optimal Reward Functions in Multi-Agent Reinforcement Learning Problems. 2018 IEEE Jt. Conf. Neural Networks","author":"da Silva C.","key":"e_1_3_2_1_6_1","unstructured":"Ricardo Grunitzki, Bruno C. da Silva , Ana L. C. Bazzan and Jorge C. Chamby-Diaz (2018) . Towards Designing Optimal Reward Functions in Multi-Agent Reinforcement Learning Problems. 2018 IEEE Jt. Conf. Neural Networks , pp. 1 -- 8 . Ricardo Grunitzki, Bruno C. da Silva, Ana L. C. Bazzan and Jorge C. Chamby-Diaz (2018). Towards Designing Optimal Reward Functions in Multi-Agent Reinforcement Learning Problems. 2018 IEEE Jt. Conf. Neural Networks, pp. 1--8."},{"volume-title":"Deep Reinforcement Learning from Self-Play in Imperfect-Information Games. arXiv Prepr. arXiv1603.01121","year":"2016","author":"Heinrich J","key":"e_1_3_2_1_7_1","unstructured":"J Heinrich and D Silver ( 2016 ). Deep Reinforcement Learning from Self-Play in Imperfect-Information Games. arXiv Prepr. arXiv1603.01121 . J Heinrich and D Silver (2016). Deep Reinforcement Learning from Self-Play in Imperfect-Information Games. arXiv Prepr. arXiv1603.01121."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10115-018-1234-6"},{"issue":"1","key":"e_1_3_2_1_9_1","first-page":"77","article-title":"Cooperative Learning in a Competitive Environment: Classroom Applications","volume":"19","author":"Attle S.","year":"2007","unstructured":"S. Attle and B. Baker ( 2007 ). \" Cooperative Learning in a Competitive Environment: Classroom Applications ,\" Int. J. Teach. Learn. High. Educ. , vol. 19 , no. 1 , pp. 77 -- 83 . S. Attle and B. Baker (2007). \"Cooperative Learning in a Competitive Environment: Classroom Applications,\" Int. J. Teach. Learn. High. Educ., vol. 19, no. 1, pp. 77--83.","journal-title":"Int. J. Teach. Learn. High. Educ."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/CIG.2008.5035657"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1145\/1102351.1102372"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-33509-4_12"},{"key":"e_1_3_2_1_13_1","first-page":"57","article-title":"Self-Play and Using an Expert to Learn to Play Backgammon with Temporal Difference Learning","volume":"2","author":"Wiering M A","year":"2010","unstructured":"M A Wiering ( 2010 ). Self-Play and Using an Expert to Learn to Play Backgammon with Temporal Difference Learning . J. Intell. Learn. Syst. Appl. , vol. 2 , pp. 57 -- 68 . M A Wiering (2010). Self-Play and Using an Expert to Learn to Play Backgammon with Temporal Difference Learning. J. Intell. Learn. Syst. Appl., vol. 2, pp. 57--68.","journal-title":"J. Intell. Learn. Syst. Appl."},{"key":"e_1_3_2_1_14_1","first-page":"1","volume-title":"ICLR","volume":"2","author":"Bansal T","year":"2018","unstructured":"T Bansal , J Pachocki , S Sidor , I Sutskever and I Mordatch ( 2018 ). Emergent Complexity via Multi-Agent Competition . ICLR 2018, vol. 2 , pp. 1 -- 12 . T Bansal, J Pachocki, S Sidor, I Sutskever and I Mordatch (2018). Emergent Complexity via Multi-Agent Competition. ICLR 2018, vol. 2, pp. 1--12."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1038\/nature14236"},{"key":"e_1_3_2_1_16_1","first-page":"173","volume-title":"Y Zhang and X Duan","author":"Chen W","year":"2016","unstructured":"W Chen , M Zhang , Y Zhang and X Duan ( 2016 ). Exploiting meta features for dependency parsing and part-of-speech tagging. Artif. Intell ., 230(September 2015), pp. 173 -- 191 . W Chen, M Zhang, Y Zhang and X Duan (2016). Exploiting meta features for dependency parsing and part-of-speech tagging. Artif. Intell., 230(September 2015), pp. 173--191."},{"key":"e_1_3_2_1_17_1","unstructured":"M Jaderberg etal (2017). Population Based Training of Neural Networks. arXiv Prepr. arXiv1711.0984. M Jaderberg et al. (2017). Population Based Training of Neural Networks. arXiv Prepr. arXiv1711.0984."}],"event":{"name":"CSAE 2019: The 3rd International Conference on Computer Science and Application Engineering","acronym":"CSAE 2019","location":"Sanya China"},"container-title":["Proceedings of the 3rd International Conference on Computer Science and Application Engineering"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3331453.3360975","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,14]],"date-time":"2023-01-14T19:59:05Z","timestamp":1673726345000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3331453.3360975"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,10,22]]},"references-count":17,"alternative-id":["10.1145\/3331453.3360975","10.1145\/3331453"],"URL":"https:\/\/doi.org\/10.1145\/3331453.3360975","relation":{},"subject":[],"published":{"date-parts":[[2019,10,22]]},"assertion":[{"value":"2019-10-22","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}