<?xml version="1.0" encoding="UTF-8"?><xml><records><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Matthew E. Taylor</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author><author><style face="normal" font="default" size="100%">Pascal Poupart</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Decentralized Mean Field Games</style></title><secondary-title><style face="normal" font="default" size="100%">AAAI Conference on Artificial Intelligence (2022), Vancouver, BC, Canada</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2022</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://arxiv.org/pdf/2112.09099.pdf</style></url></web-urls></urls><publisher><style face="normal" font="default" size="100%">AAAI press</style></publisher><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>17</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Matthew E. 
Taylor</style></author><author><style face="normal" font="default" size="100%">Kate Larson</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Multi-Agent Advisor Q-Learning</style></title><secondary-title><style face="normal" font="default" size="100%">Journal of Artificial Intelligence Research (JAIR)</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2022</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://jair.org/index.php/jair/article/view/13445/26794</style></url></web-urls></urls><volume><style face="normal" font="default" size="100%">74</style></volume><pages><style face="normal" font="default" size="100%">1-74</style></pages><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Volodymyr Tkachuk</style></author><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Matthew E Taylor</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">The Effect of Q-function Reuse on the Total Regret of Tabular, Model-Free, Reinforcement Learning</style></title><secondary-title><style face="normal" font="default" size="100%">International Conference on Autonomous Agents and Multi-Agent Systems (AAMAS 2021), London, UK - Adaptive Learning Agents Workshop</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2021</style></year></dates><urls><web-urls><url><style face="normal" font="default" 
size="100%">https://arxiv.org/pdf/2103.04416.pdf</style></url></web-urls></urls><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Ken Ming Lee</style></author><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Investigation of Independent Reinforcement Learning Algorithms in Multi-Agent Environments</style></title><secondary-title><style face="normal" font="default" size="100%">Neural Information Processing Systems (NeurIPS) - Deep Reinforcement Learning workshop</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2021</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://arxiv.org/pdf/2111.01100.pdf</style></url></web-urls></urls><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Matthew E. 
Taylor</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author><author><style face="normal" font="default" size="100%">Pascal Poupart</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Partially Observable Mean Field Reinforcement Learning</style></title><secondary-title><style face="normal" font="default" size="100%">International Conference on Autonomous Agents and Multi-Agent Systems (AAMAS 2021), London, UK</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2021</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://arxiv.org/pdf/2012.15791.pdf</style></url></web-urls></urls><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sushrut Bhalla</style></author><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Deep Multi Agent Reinforcement Learning for Autonomous Driving</style></title><secondary-title><style face="normal" font="default" size="100%">Canadian AI </style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2020</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://link.springer.com/chapter/10.1007/978-3-030-47358-7_7</style></url></web-urls></urls><publisher><style face="normal" font="default" size="100%">Springer LNCS</style></publisher><language><style face="normal" font="default" size="100%">eng</style></language><notes><style face="normal" font="default" 
size="100%">Best paper award - Nominee</style></notes></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sai Krishna Gottipati</style></author><author><style face="normal" font="default" size="100%">Yashaswi Pathak</style></author><author><style face="normal" font="default" size="100%">Rohan Nuttall</style></author><author><style face="normal" font="default" size="100%">Sahir</style></author><author><style face="normal" font="default" size="100%">Raviteja Chunduru</style></author><author><style face="normal" font="default" size="100%">Ahmed Touati</style></author><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Matthew E. Taylor</style></author><author><style face="normal" font="default" size="100%">Sarath Chandar</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Maximum Reward Formulation In Reinforcement Learning</style></title><secondary-title><style face="normal" font="default" size="100%">Deep Reinforcement Learning Workshop</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2020</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://arxiv.org/pdf/2010.03744.pdf</style></url></web-urls></urls><publisher><style face="normal" font="default" size="100%">NeurIPS 2020</style></publisher><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Pascal 
Poupart</style></author><author><style face="normal" font="default" size="100%">Matthew E. Taylor</style></author><author><style face="normal" font="default" size="100%">Nidhi Hegde</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Multi Type Mean Field Reinforcement Learning</style></title><secondary-title><style face="normal" font="default" size="100%">International Conference on Autonomous Agents and Multi agent Systems (AAMAS 2020), Auckland, New Zealand</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2020</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://arxiv.org/pdf/2002.02513.pdf</style></url></web-urls></urls><publisher><style face="normal" font="default" size="100%">IFAAMAS</style></publisher><pub-location><style face="normal" font="default" size="100%">AAMAS 2020, Auckland, New Zealand</style></pub-location><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>13</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Piyush Jain</style></author><author><style face="normal" font="default" size="100%">Sean C P Coogan</style></author><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author><author><style face="normal" font="default" size="100%">Steve Taylor</style></author><author><style face="normal" font="default" size="100%">Mike D Flannigan</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">A review of machine learning applications in wildfire science and management</style></title><secondary-title><style face="normal" font="default" size="100%">Environmental 
Reviews</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2020</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://arxiv.org/pdf/2003.00646.pdf</style></url></web-urls></urls><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sushrut Bhalla</style></author><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Learning Multi-Agent Communication with Reinforcement Learning</style></title><secondary-title><style face="normal" font="default" size="100%">Conference on Reinforcement Learning and Decision Making</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2019</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">http://rldm.org/papers/abstracts.pdf</style></url></web-urls></urls><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Pascal Poupart</style></author><author><style face="normal" font="default" size="100%">Matt Taylor</style></author><author><style face="normal" font="default" size="100%">Nidhi Hegde</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Multi Type Mean Field Reinforcement 
Learning</style></title><secondary-title><style face="normal" font="default" size="100%">Conference on Reinforcement Learning and Decision Making</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2019</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">http://rldm.org/papers/abstracts.pdf</style></url></web-urls></urls><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sushrut Bhalla</style></author><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Training Cooperative Agents for Multi-Agent Reinforcement Learning</style></title><secondary-title><style face="normal" font="default" size="100%">International Conference on Autonomous Agents and Multiagent Systems (AAMAS 2019), Montreal, Canada</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2019</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">http://www.ifaamas.org/Proceedings/aamas2019/pdfs/p1826.pdf</style></url></web-urls></urls><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Combining 
MCTS and A3C for Prediction of Spatially Spreading Processes in Forest Wildfire Setting</style></title><secondary-title><style face="normal" font="default" size="100%">31st Canadian Conference on Artificial Intelligence, Toronto</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2018</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://link.springer.com/chapter/10.1007/978-3-319-89656-4_28</style></url></web-urls></urls><publisher><style face="normal" font="default" size="100%">Springer</style></publisher><pages><style face="normal" font="default" size="100%">285-291</style></pages><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">A Complementary Approach to Improve WildFire Prediction Systems.</style></title><secondary-title><style face="normal" font="default" size="100%">Neural Information Processing Systems (AI for social good workshop)</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2018</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://aiforsocialgood.github.io/2018/pdfs/track1/37_aisg_neurips2018.pdf</style></url></web-urls></urls><pub-location><style face="normal" font="default" size="100%">NeurIPS</style></pub-location><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style 
face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Benyamin Ghojogh</style></author><author><style face="normal" font="default" size="100%">Jaspreet Singh Sambee</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Decision Assist For Self-Driving Cars</style></title><secondary-title><style face="normal" font="default" size="100%">31st Canadian Conference on Artificial Intelligence, Toronto</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2018</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://link.springer.com/chapter/10.1007/978-3-319-89656-4_44</style></url></web-urls></urls><publisher><style face="normal" font="default" size="100%">Springer</style></publisher><pages><style face="normal" font="default" size="100%">381 - 387</style></pages><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>32</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Reinforcement Learning for Determining Spread Dynamics of Spatially Spreading Processes with Emphasis on Forest Fires</style></title><secondary-title><style face="normal" font="default" size="100%">Electrical and Computer Engineering, University of Waterloo</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2018</style></year></dates><urls><web-urls><url><style face="normal" font="default" 
size="100%">http://hdl.handle.net/10012/13148</style></url></web-urls></urls><language><style face="normal" font="default" size="100%">eng</style></language><work-type><style face="normal" font="default" size="100%">Masters</style></work-type></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>17</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Using Spatial Reinforcement Learning to Build Forest Wildfire Dynamics Models from Satellite Images</style></title><secondary-title><style face="normal" font="default" size="100%">Journal of Frontiers in ICT- Environmental Informatics</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2018</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://www.frontiersin.org/articles/10.3389/fict.2018.00006/full?&amp;utm_source=Email_to_authors_&amp;utm_medium=Email&amp;utm_content=T1_11.5e1_author&amp;utm_campaign=Email_publication&amp;field=&amp;journalName=Frontiers_in_ICT&amp;id=334036</style></url></web-urls></urls><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Mark Crowley</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Learning Forest Wildfire Dynamics from Satellite Images using Reinforcement Learning</style></title><secondary-title><style face="normal" font="default" 
size="100%">Conference on Reinforcement Learning and Decision Making</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2017</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">http://www.princeton.edu/~ndaw/RLDM17ExtendedAbstracts.pdf</style></url></web-urls></urls><pub-location><style face="normal" font="default" size="100%">Conference on Reinforcement Learning and Decision Making, Ann Arbor, MI, USA</style></pub-location><pages><style face="normal" font="default" size="100%">244-248</style></pages><language><style face="normal" font="default" size="100%">eng</style></language></record><record><source-app name="Biblio" version="7.x">Drupal-Biblio</source-app><ref-type>47</ref-type><contributors><authors><author><style face="normal" font="default" size="100%">Sriram Ganapathi Subramanian</style></author><author><style face="normal" font="default" size="100%">Amrith Ganesh. P</style></author></authors></contributors><titles><title><style face="normal" font="default" size="100%">Spatial Decision Support System for Industrial Robots</style></title><secondary-title><style face="normal" font="default" size="100%">Innovations in Marine Electrical and Electronics Engineering</style></secondary-title></titles><dates><year><style  face="normal" font="default" size="100%">2015</style></year></dates><urls><web-urls><url><style face="normal" font="default" size="100%">https://uwaterloo.ca/scholar/sites/ca.scholar/files/s2ganapa/files/paper29.pdf</style></url></web-urls></urls><pub-location><style face="normal" font="default" size="100%">International Conference on Innovations in Marine Electrical and Electronics Engineering, Chennai, Tamil Nadu, India</style></pub-location><language><style face="normal" font="default" size="100%">eng</style></language></record></records></xml>