BibTeX records: Peter Stone

download as .bib file

% AAAI 2024 paper. The booktitle names the co-located symposium as EAAI 2024, matching the 2024 dates and year of this record.
@inproceedings{DBLP:conf/aaai/KnoxHABDSN24,
  author     = {Knox, W. Bradley and
                Hatgis{-}Kessell, Stephane and
                Adalgeirsson, Sigurdur O. and
                Booth, Serena and
                Dragan, Anca D. and
                Stone, Peter and
                Niekum, Scott},
  editor     = {Wooldridge, Michael J. and
                Dy, Jennifer G. and
                Natarajan, Sriraam},
  title      = {Learning Optimal Advantage from Preferences and Mistaking It for Reward},
  booktitle  = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024,
                Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024,
                Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024,
                February 20-27, 2024, Vancouver, Canada},
  pages      = {10066--10073},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i9.28870},
  doi        = {10.1609/AAAI.V38I9.28870},
  timestamp  = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/KnoxHABDSN24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2024 paper. The booktitle names the co-located symposium as EAAI 2024, matching the 2024 dates and year of this record.
@inproceedings{DBLP:conf/aaai/WangWXZS24,
  author     = {Wang, Zizhao and
                Wang, Caroline and
                Xiao, Xuesu and
                Zhu, Yuke and
                Stone, Peter},
  editor     = {Wooldridge, Michael J. and
                Dy, Jennifer G. and
                Natarajan, Sriraam},
  title      = {Building Minimal and Reusable Causal State Abstractions for Reinforcement Learning},
  booktitle  = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024,
                Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024,
                Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024,
                February 20-27, 2024, Vancouver, Canada},
  pages      = {15778--15786},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i14.29507},
  doi        = {10.1609/AAAI.V38I14.29507},
  timestamp  = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/WangWXZS24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2024 paper. The booktitle names the co-located symposium as EAAI 2024, matching the 2024 dates and year of this record.
@inproceedings{DBLP:conf/aaai/RahmanCS24,
  author     = {Rahman, Muhammad and
                Cui, Jiaxun and
                Stone, Peter},
  editor     = {Wooldridge, Michael J. and
                Dy, Jennifer G. and
                Natarajan, Sriraam},
  title      = {Minimum Coverage Sets for Training Robust Ad Hoc Teamwork Agents},
  booktitle  = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024,
                Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024,
                Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024,
                February 20-27, 2024, Vancouver, Canada},
  pages      = {17523--17530},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i16.29702},
  doi        = {10.1609/AAAI.V38I16.29702},
  timestamp  = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/RahmanCS24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2024 abstract reprint. The booktitle names the co-located symposium as EAAI 2024, matching the 2024 dates and year of this record.
@inproceedings{DBLP:conf/aaai/KnoxABSS24,
  author     = {Knox, W. Bradley and
                Allievi, Alessandro and
                Banzhaf, Holger and
                Schmitt, Felix and
                Stone, Peter},
  editor     = {Wooldridge, Michael J. and
                Dy, Jennifer G. and
                Natarajan, Sriraam},
  title      = {Reward (Mis)design for Autonomous Driving (Abstract Reprint)},
  booktitle  = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024,
                Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024,
                Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024,
                February 20-27, 2024, Vancouver, Canada},
  pages      = {22702},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i20.30602},
  doi        = {10.1609/AAAI.V38I20.30602},
  timestamp  = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/KnoxABSS24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The method name t-DGR is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2401-02576,
  author     = {Yue, William and
                Liu, Bo and
                Stone, Peter},
  title      = {{t-DGR}: {A} Trajectory-Based Deep Generative Replay Method for Continual Learning in Decision Making},
  journal    = {CoRR},
  volume     = {abs/2401.02576},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.02576},
  doi        = {10.48550/ARXIV.2401.02576},
  eprinttype = {arXiv},
  eprint     = {2401.02576},
  timestamp  = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-02576.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-12497,
  author     = {Wang, Zizhao and
                Wang, Caroline and
                Xiao, Xuesu and
                Zhu, Yuke and
                Stone, Peter},
  title      = {Building Minimal and Reusable Causal State Abstractions for Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2401.12497},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.12497},
  doi        = {10.48550/ARXIV.2401.12497},
  eprinttype = {arXiv},
  eprint     = {2401.12497},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-12497.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2403-01636,
  author     = {Xu, Ziping and
                Xu, Zifan and
                Jiang, Runxuan and
                Stone, Peter and
                Tewari, Ambuj},
  title      = {Sample Efficient Myopic Exploration Through Multitask Reinforcement Learning with Diverse Tasks},
  journal    = {CoRR},
  volume     = {abs/2403.01636},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.01636},
  doi        = {10.48550/ARXIV.2403.01636},
  eprinttype = {arXiv},
  eprint     = {2403.01636},
  timestamp  = {Wed, 10 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-01636.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The abbreviation 3D is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2403-03848,
  author     = {Xu, Zifan and
                Raj, Amir Hossain and
                Xiao, Xuesu and
                Stone, Peter},
  title      = {Dexterous Legged Locomotion in Confined {3D} Spaces with Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2403.03848},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.03848},
  doi        = {10.48550/ARXIV.2403.03848},
  eprinttype = {arXiv},
  eprint     = {2403.03848},
  timestamp  = {Wed, 03 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-03848.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The system name TeleMoMa is brace-protected so sentence-casing styles keep its inner capitals.
@article{DBLP:journals/corr/abs-2403-07869,
  author     = {Dass, Shivin and
                Ai, Wensi and
                Jiang, Yuqian and
                Singh, Samik and
                Hu, Jiaheng and
                Zhang, Ruohan and
                Stone, Peter and
                Abbatematteo, Ben and
                Mart{\'{\i}}n{-}Mart{\'{\i}}n, Roberto},
  title      = {{TeleMoMa}: {A} Modular and Versatile Teleoperation System for Mobile Manipulation},
  journal    = {CoRR},
  volume     = {abs/2403.07869},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.07869},
  doi        = {10.48550/ARXIV.2403.07869},
  eprinttype = {arXiv},
  eprint     = {2403.07869},
  timestamp  = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-07869.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2403-11940,
  author     = {Levine, Alexander and
                Stone, Peter and
                Zhang, Amy},
  title      = {Multistep Inverse Is Not All You Need},
  journal    = {CoRR},
  volume     = {abs/2403.11940},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.11940},
  doi        = {10.48550/ARXIV.2403.11940},
  eprinttype = {arXiv},
  eprint     = {2403.11940},
  timestamp  = {Mon, 08 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-11940.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The method name Dyna-LfLH is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2403-17231,
  author     = {Ghani, Saad Abdul and
                Wang, Zizhao and
                Stone, Peter and
                Xiao, Xuesu},
  title      = {{Dyna-LfLH}: Learning Agile Navigation in Dynamic Environments from Learned Hallucination},
  journal    = {CoRR},
  volume     = {abs/2403.17231},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.17231},
  doi        = {10.48550/ARXIV.2403.17231},
  eprinttype = {arXiv},
  eprint     = {2403.17231},
  timestamp  = {Wed, 10 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-17231.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/KnoxABSS23,
  author     = {Knox, W. Bradley and
                Allievi, Alessandro and
                Banzhaf, Holger and
                Schmitt, Felix and
                Stone, Peter},
  title      = {Reward (Mis)design for autonomous driving},
  journal    = {Artif. Intell.},
  volume     = {316},
  pages      = {103829},
  year       = {2023},
  url        = {https://doi.org/10.1016/j.artint.2022.103829},
  doi        = {10.1016/J.ARTINT.2022.103829},
  timestamp  = {Sat, 13 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ai/KnoxABSS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/arobots/ZhangASTSZ23,
  author     = {Zhang, Xiaohan and
                Amiri, Saeid and
                Sinapov, Jivko and
                Thomason, Jesse and
                Stone, Peter and
                Zhang, Shiqi},
  title      = {Multimodal embodied attribute learning by robots for object-centric action policies},
  journal    = {Auton. Robots},
  volume     = {47},
  number     = {5},
  pages      = {505--528},
  year       = {2023},
  url        = {https://doi.org/10.1007/s10514-023-10098-5},
  doi        = {10.1007/S10514-023-10098-5},
  timestamp  = {Thu, 31 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/arobots/ZhangASTSZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/BakerNAAABBBBDDDDEFGHIKKKKKLLLMMNPPR23,
  author     = {Baker, Megan M. and
                New, Alexander and
                Aguilar{-}Simon, Mario and
                Al{-}Halah, Ziad and
                Arnold, S{\'{e}}bastien M. R. and
                Ben{-}Iwhiwhu, Eseoghene and
                Brna, Andrew P. and
                Brooks, Ethan and
                Brown, Ryan C. and
                Daniels, Zachary and
                Daram, Anurag Reddy and
                Delattre, Fabien and
                Dellana, Ryan and
                Eaton, Eric and
                Fu, Haotian and
                Grauman, Kristen and
                Hostetler, Jesse and
                Iqbal, Shariq and
                Kent, Cassandra and
                Ketz, Nicholas and
                Kolouri, Soheil and
                Konidaris, George and
                Kudithipudi, Dhireesha and
                Learned{-}Miller, Erik G. and
                Lee, Seungwon and
                Littman, Michael and
                Madireddy, Sandeep and
                Mendez, Jorge A. and
                Nguyen, Eric Q. and
                Piatko, Christine D. and
                Pilly, Praveen K. and
                Raghavan, Aswin and
                Rahman, Abrar and
                Ramakrishnan, Santhosh Kumar and
                Ratzlaff, Neale and
                Soltoggio, Andrea and
                Stone, Peter and
                Sur, Indranil and
                Tang, Zhipeng and
                Tiwari, Saket and
                Vedder, Kyle and
                Wang, Felix and
                Xu, Zifan and
                Yanguas{-}Gil, Angel and
                Yedidsion, Harel and
                Yu, Shangqun and
                Vallabha, Gautam K.},
  title      = {A domain-agnostic approach for characterization of lifelong learning systems},
  journal    = {Neural Networks},
  volume     = {160},
  pages      = {274--296},
  year       = {2023},
  url        = {https://doi.org/10.1016/j.neunet.2023.01.007},
  doi        = {10.1016/J.NEUNET.2023.01.007},
  timestamp  = {Mon, 09 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/nn/BakerNAAABBBBDDDDEFGHIKKKKKLLLMMNPPR23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ram/XiaoXWSGRBMCBR23,
  author     = {Xiao, Xuesu and
                Xu, Zifan and
                Warnell, Garrett and
                Stone, Peter and
                Guinjoan, Ferran Gebelli and
                Rodrigues, R{\^{o}}mulo T. and
                Bruyninckx, Herman and
                Mandala, Hanjaya and
                Christmann, Guilherme and
                Blanco{-}Claraco, Jos{\'{e}} Luis and
                Rai, Shravan Somashekara},
  title      = {Autonomous Ground Navigation in Highly Constrained Spaces: Lessons Learned From the Second {BARN} Challenge at {ICRA} 2023 [Competitions]},
  journal    = {{IEEE} Robotics Autom. Mag.},
  volume     = {30},
  number     = {4},
  pages      = {91--97},
  year       = {2023},
  url        = {https://doi.org/10.1109/MRA.2023.3322920},
  doi        = {10.1109/MRA.2023.3322920},
  timestamp  = {Sat, 13 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ram/XiaoXWSGRBMCBR23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/BoothKSNSA23,
  author     = {Booth, Serena and
                Knox, W. Bradley and
                Shah, Julie and
                Niekum, Scott and
                Stone, Peter and
                Allievi, Alessandro},
  editor     = {Williams, Brian and
                Chen, Yiling and
                Neville, Jennifer},
  title      = {The Perils of Trial-and-Error Reward Design: Misdesign through Overfitting and Invalid Task Specifications},
  booktitle  = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI} 2023,
                Thirty-Fifth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2023,
                Thirteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2023,
                Washington, DC, USA, February 7-14, 2023},
  pages      = {5920--5929},
  publisher  = {{AAAI} Press},
  year       = {2023},
  url        = {https://doi.org/10.1609/aaai.v37i5.25733},
  doi        = {10.1609/AAAI.V37I5.25733},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/BoothKSNSA23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/0042F0S23,
  author     = {Liu, Bo and
                Feng, Yihao and
                Liu, Qiang and
                Stone, Peter},
  editor     = {Williams, Brian and
                Chen, Yiling and
                Neville, Jennifer},
  title      = {Metric Residual Network for Sample Efficient Goal-Conditioned Reinforcement Learning},
  booktitle  = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI} 2023,
                Thirty-Fifth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2023,
                Thirteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2023,
                Washington, DC, USA, February 7-14, 2023},
  pages      = {8799--8806},
  publisher  = {{AAAI} Press},
  year       = {2023},
  url        = {https://doi.org/10.1609/aaai.v37i7.26058},
  doi        = {10.1609/AAAI.V37I7.26058},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/0042F0S23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2023 paper. The letters DM in the method name are brace-protected so sentence-casing styles do not lowercase the M.
@inproceedings{DBLP:conf/aaai/WangDLS23,
  author     = {Wang, Caroline and
                Durugkar, Ishan and
                Liebman, Elad and
                Stone, Peter},
  editor     = {Williams, Brian and
                Chen, Yiling and
                Neville, Jennifer},
  title      = {{DM}{\({^2}\)}: Decentralized Multi-Agent Reinforcement Learning via Distribution Matching},
  booktitle  = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI} 2023,
                Thirty-Fifth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2023,
                Thirteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2023,
                Washington, DC, USA, February 7-14, 2023},
  pages      = {11699--11707},
  publisher  = {{AAAI} Press},
  year       = {2023},
  url        = {https://doi.org/10.1609/aaai.v37i10.26382},
  doi        = {10.1609/AAAI.V37I10.26382},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/WangDLS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aips/BajajSS23,
  author     = {Bajaj, Vaibhav and
                Sharon, Guni and
                Stone, Peter},
  editor     = {Koenig, Sven and
                Stern, Roni and
                Vallati, Mauro},
  title      = {Task Phasing: Automated Curriculum Learning from Demonstrations},
  booktitle  = {Proceedings of the Thirty-Third International Conference on
                Automated Planning and Scheduling,
                July 8-13, 2023, Prague, Czech Republic},
  pages      = {542--550},
  publisher  = {{AAAI} Press},
  year       = {2023},
  url        = {https://doi.org/10.1609/icaps.v33i1.27235},
  doi        = {10.1609/ICAPS.V33I1.27235},
  timestamp  = {Wed, 20 Sep 2023 11:58:30 +0200},
  biburl     = {https://dblp.org/rec/conf/aips/BajajSS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/WangWS23,
  author     = {Wang, Caroline and
                Warnell, Garrett and
                Stone, Peter},
  editor     = {Agmon, Noa and
                An, Bo and
                Ricci, Alessandro and
                Yeoh, William},
  title      = {D-Shape: Demonstration-Shaped Reinforcement Learning via Goal-Conditioning},
  booktitle  = {Proceedings of the 2023 International Conference on
                Autonomous Agents and Multiagent Systems, {AAMAS} 2023,
                London, United Kingdom, 29 May 2023 - 2 June 2023},
  pages      = {1267--1275},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://dl.acm.org/doi/10.5555/3545946.3598772},
  doi        = {10.5555/3545946.3598772},
  timestamp  = {Tue, 23 May 2023 14:27:14 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/WangWS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/ShperbergLS23,
  author     = {Shperberg, Shahaf S. and
                Liu, Bo and
                Stone, Peter},
  editor     = {Agmon, Noa and
                An, Bo and
                Ricci, Alessandro and
                Yeoh, William},
  title      = {Relaxed Exploration Constrained Reinforcement Learning},
  booktitle  = {Proceedings of the 2023 International Conference on
                Autonomous Agents and Multiagent Systems, {AAMAS} 2023,
                London, United Kingdom, 29 May 2023 - 2 June 2023},
  pages      = {2821--2823},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://dl.acm.org/doi/10.5555/3545946.3599090},
  doi        = {10.5555/3545946.3599090},
  timestamp  = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/atal/ShperbergLS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/collas/XuZSMJLS23,
  author     = {Xu, Zifan and
                Zhang, Yulin and
                Shperberg, Shahaf S. and
                Mirsky, Reuth and
                Jiang, Yuqian and
                Liu, Bo and
                Stone, Peter},
  editor     = {Chandar, Sarath and
                Pascanu, Razvan and
                Sedghi, Hanie and
                Precup, Doina},
  title      = {Model-Based Meta Automatic Curriculum Learning},
  booktitle  = {Conference on Lifelong Learning Agents, 22-25 August 2023,
                McGill University, Montr{\'{e}}al, Qu{\'{e}}bec, Canada},
  series     = {Proceedings of Machine Learning Research},
  volume     = {232},
  pages      = {846--860},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v232/xu23a.html},
  timestamp  = {Tue, 20 Feb 2024 13:52:18 +0100},
  biburl     = {https://dblp.org/rec/conf/collas/XuZSMJLS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/KarnanYFWBS23,
  author     = {Karnan, Haresh and
                Yang, Elvin and
                Farkash, Daniel and
                Warnell, Garrett and
                Biswas, Joydeep and
                Stone, Peter},
  editor     = {Tan, Jie and
                Toussaint, Marc and
                Darvish, Kourosh},
  title      = {{STERLING:} Self-Supervised Terrain Representation Learning from Unconstrained Robot Experience},
  booktitle  = {Conference on Robot Learning, CoRL 2023,
                6-9 November 2023, Atlanta, GA, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {229},
  pages      = {2393--2413},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v229/karnan23a.html},
  timestamp  = {Tue, 20 Feb 2024 12:11:46 +0100},
  biburl     = {https://dblp.org/rec/conf/corl/KarnanYFWBS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRL 2023 paper. The abbreviation 3D is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/corl/Zhu0SZ23,
  author     = {Zhu, Yifeng and
                Jiang, Zhenyu and
                Stone, Peter and
                Zhu, Yuke},
  editor     = {Tan, Jie and
                Toussaint, Marc and
                Darvish, Kourosh},
  title      = {Learning Generalizable Manipulation Policies with Object-Centric {3D} Representations},
  booktitle  = {Conference on Robot Learning, CoRL 2023,
                6-9 November 2023, Atlanta, GA, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {229},
  pages      = {3418--3433},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v229/zhu23b.html},
  timestamp  = {Tue, 20 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/corl/Zhu0SZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/humanoids/MannemMSM23,
  author     = {Mannem, Swathi and
                Macke, William and
                Stone, Peter and
                Mirsky, Reuth},
  title      = {Exploring the Cost of Interruptions in Human-Robot Teaming},
  booktitle  = {22nd {IEEE-RAS} International Conference on Humanoid Robots,
                Humanoids 2023, Austin, TX, USA, December 12-14, 2023},
  pages      = {1--8},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/Humanoids57100.2023.10375236},
  doi        = {10.1109/HUMANOIDS57100.2023.10375236},
  timestamp  = {Tue, 09 Jan 2024 15:27:05 +0100},
  biburl     = {https://dblp.org/rec/conf/humanoids/MannemMSM23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/CuiYLLSLLS0T23,
  author     = {Cui, Jiaxun and
                Yang, Xiaomeng and
                Luo, Mulong and
                Lee, Geunbae and
                Stone, Peter and
                Lee, Hsien{-}Hsin S. and
                Lee, Benjamin and
                Suh, G. Edward and
                Xiong, Wenjie and
                Tian, Yuandong},
  title      = {{MACTA:} {A} Multi-agent Reinforcement Learning Approach for Cache Timing Attacks and Detection},
  booktitle  = {The Eleventh International Conference on Learning Representations,
                {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/pdf?id=CDlHZ78-Xzi},
  timestamp  = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/CuiYLLSLLS0T23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/XuLXNS23,
  author     = {Xu, Zifan and
                Liu, Bo and
                Xiao, Xuesu and
                Nair, Anirudh and
                Stone, Peter},
  title      = {Benchmarking Reinforcement Learning Techniques for Autonomous Navigation},
  booktitle  = {{IEEE} International Conference on Robotics and Automation,
                {ICRA} 2023, London, UK, May 29 - June 2, 2023},
  pages      = {9224--9230},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/ICRA48891.2023.10160583},
  doi        = {10.1109/ICRA48891.2023.10160583},
  timestamp  = {Tue, 08 Aug 2023 10:24:29 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/XuLXNS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/ParkXWYS23,
  author     = {Park, Jin Soo and
                Xiao, Xuesu and
                Warnell, Garrett and
                Yedidsion, Harel and
                Stone, Peter},
  title      = {Learning Perceptual Hallucination for Multi-Robot Navigation in Narrow Hallways},
  booktitle  = {{IEEE} International Conference on Robotics and Automation,
                {ICRA} 2023, London, UK, May 29 - June 2, 2023},
  pages      = {10033--10039},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/ICRA48891.2023.10161327},
  doi        = {10.1109/ICRA48891.2023.10161327},
  timestamp  = {Tue, 08 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/ParkXWYS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2023 paper. The booktitle gives the full proceedings title instead of the bare acronym, and the publisher is stated, in line with the other IEEE conference records in this file.
@inproceedings{DBLP:conf/iros/0002ZDJZS023,
  author     = {Zhang, Xiaohan and
                Zhu, Yifeng and
                Ding, Yan and
                Jiang, Yuqian and
                Zhu, Yuke and
                Stone, Peter and
                Zhang, Shiqi},
  title      = {Symbolic State Space Optimization for Long Horizon Mobile Manipulation Planning},
  booktitle  = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                {IROS} 2023, Detroit, MI, USA, October 1-5, 2023},
  pages      = {866--872},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/IROS55552.2023.10342224},
  doi        = {10.1109/IROS55552.2023.10342224},
  timestamp  = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iros/0002ZDJZS023.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2023 paper. The booktitle gives the full proceedings title instead of the bare acronym, and the publisher is stated, in line with the other IEEE conference records in this file.
@inproceedings{DBLP:conf/iros/GhonasgiMHSD23,
  author     = {Ghonasgi, Keya and
                Mirsky, Reuth and
                Haith, Adrian M. and
                Stone, Peter and
                Deshpande, Ashish D.},
  title      = {A Novel Control Law for Multi-Joint Human-Robot Interaction Tasks While Maintaining Postural Coordination},
  booktitle  = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                {IROS} 2023, Detroit, MI, USA, October 1-5, 2023},
  pages      = {6110--6116},
  publisher  = {{IEEE}},
  year       = {2023},
  url        = {https://doi.org/10.1109/IROS55552.2023.10342501},
  doi        = {10.1109/IROS55552.2023.10342501},
  timestamp  = {Fri, 05 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iros/GhonasgiMHSD23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/AgarwalDSZ23,
  author     = {Agarwal, Siddhant and
                Durugkar, Ishan and
                Stone, Peter and
                Zhang, Amy},
  editor     = {Oh, Alice and
                Naumann, Tristan and
                Globerson, Amir and
                Saenko, Kate and
                Hardt, Moritz and
                Levine, Sergey},
  title      = {f-Policy Gradients: {A} General Framework for Goal-Conditioned {RL} using f-Divergences},
  booktitle  = {Advances in Neural Information Processing Systems 36:
                Annual Conference on Neural Information Processing Systems 2023,
                NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/27f4d95417bb722201597bf4d67cbacc-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/AgarwalDSZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LiuFSL23,
  author     = {Liu, Bo and
                Feng, Yihao and
                Stone, Peter and
                Liu, Qiang},
  editor     = {Oh, Alice and
                Naumann, Tristan and
                Globerson, Amir and
                Saenko, Kate and
                Hardt, Moritz and
                Levine, Sergey},
  title      = {{FAMO:} Fast Adaptive Multitask Optimization},
  booktitle  = {Advances in Neural Information Processing Systems 36:
                Annual Conference on Neural Information Processing Systems 2023,
                NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/b2fe1ee8d936ac08dd26f2ff58986c8f-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LiuFSL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% LIBERO, NeurIPS 2023 proceedings paper (Datasets and Benchmarks, per the URL). arXiv preprint with the same title and authors: DBLP:journals/corr/abs-2306-03310.
@inproceedings{DBLP:conf/nips/LiuZGFLZS23,
  author     = {Liu, Bo and
                Zhu, Yifeng and
                Gao, Chongkai and
                Feng, Yihao and
                Liu, Qiang and
                Zhu, Yuke and
                Stone, Peter},
  editor     = {Oh, Alice and
                Naumann, Tristan and
                Globerson, Amir and
                Saenko, Kate and
                Hardt, Moritz and
                Levine, Sergey},
  title      = {{LIBERO:} Benchmarking Knowledge Transfer for Lifelong Robot Learning},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/8c3c666820ea055a77726d66fc7d447f-Abstract-Datasets\_and\_Benchmarks.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LiuZGFLZS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ELDEN, NeurIPS 2023 proceedings paper. An arXiv record with the same title is DBLP:journals/corr/abs-2310-08702.
@inproceedings{DBLP:conf/nips/WangHSM23,
  author     = {Wang, Zizhao and
                Hu, Jiaheng and
                Stone, Peter and
                Mart{\'{\i}}n{-}Mart{\'{\i}}n, Roberto},
  editor     = {Oh, Alice and
                Naumann, Tristan and
                Globerson, Amir and
                Saenko, Kate and
                Hardt, Moritz and
                Levine, Sergey},
  title      = {{ELDEN:} Exploration via Local Dependencies},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/31ed129feae64a7e44a15b148c15558d-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/WangHSM23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% RSS 2023 (Robotics: Science and Systems XIX) paper. arXiv preprint with the same title and authors: DBLP:journals/corr/abs-2305-04866.
@inproceedings{DBLP:conf/rss/HuSM23,
  author     = {Hu, Jiaheng and
                Stone, Peter and
                Mart{\'{\i}}n{-}Mart{\'{\i}}n, Roberto},
  editor     = {Bekris, Kostas E. and
                Hauser, Kris and
                Herbert, Sylvia L. and
                Yu, Jingjin},
  title      = {Causal Policy Gradient for Whole-Body Mobile Manipulation},
  booktitle  = {Robotics: Science and Systems XIX, Daegu, Republic of Korea, July 10-14, 2023},
  year       = {2023},
  url        = {https://doi.org/10.15607/RSS.2023.XIX.049},
  doi        = {10.15607/RSS.2023.XIX.049},
  timestamp  = {Thu, 20 Jul 2023 14:53:22 +0200},
  biburl     = {https://dblp.org/rec/conf/rss/HuSM23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% RSS 2023 (Robotics: Science and Systems XIX) paper. arXiv preprint with the same title and authors: DBLP:journals/corr/abs-2305-10395.
@inproceedings{DBLP:conf/rss/SungS23,
  author     = {Sung, Yoonchang and
                Stone, Peter},
  editor     = {Bekris, Kostas E. and
                Hauser, Kris and
                Herbert, Sylvia L. and
                Yu, Jingjin},
  title      = {Motion Planning (In)feasibility Detection using a Prior Roadmap via Path and Cut Search},
  booktitle  = {Robotics: Science and Systems XIX, Daegu, Republic of Korea, July 10-14, 2023},
  year       = {2023},
  url        = {https://doi.org/10.15607/RSS.2023.XIX.060},
  doi        = {10.15607/RSS.2023.XIX.060},
  timestamp  = {Thu, 20 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/rss/SungS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% TAS 2023 (ACM) paper. The quoted phrase in the title uses TeX quote ligatures (``...'');
% a straight ASCII double quote would typeset as a closing quote on both sides.
@inproceedings{DBLP:conf/tas/HauserCCHWDGEKH23,
  author       = {Elliott Hauser and
                  Yao{-}Cheng Chan and
                  Parth Chonkar and
                  Geethika Hemkumar and
                  Huihai Wang and
                  Daksh Dua and
                  Shikhar Gupta and
                  Efren Mendoza Enriquez and
                  Tiffany Kao and
                  Justin W. Hart and
                  Reuth Mirsky and
                  Joydeep Biswas and
                  Junfeng Jiao and
                  Peter Stone},
  title        = {``What's That Robot Doing Here?'': Perceptions Of Incidental
                  Encounters With Autonomous Quadruped Robots},
  booktitle    = {Proceedings of the First International Symposium on Trustworthy Autonomous
                  Systems, {TAS} 2023, Edinburgh, United Kingdom, July 11-12, 2023},
  pages        = {12:1--12:15},
  publisher    = {{ACM}},
  year         = {2023},
  url          = {https://doi.org/10.1145/3597512.3599707},
  doi          = {10.1145/3597512.3599707},
  timestamp    = {Fri, 21 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/tas/HauserCCHWDGEKH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% UAI 2023 paper (Proceedings of Machine Learning Research, volume 216). arXiv preprint with the same title and authors: DBLP:journals/corr/abs-2306-07372.
@inproceedings{DBLP:conf/uai/Morrill0HWS23,
  author     = {Morrill, Dustin and
                Walsh, Thomas J. and
                Hernandez, Daniel and
                Wurman, Peter R. and
                Stone, Peter},
  editor     = {Evans, Robin J. and
                Shpitser, Ilya},
  title      = {Composing Efficient, Robust Tests for Policy Selection},
  booktitle  = {Uncertainty in Artificial Intelligence, {UAI} 2023, July 31 - 4 August 2023, Pittsburgh, PA, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {216},
  pages      = {1456--1466},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v216/morrill23a.html},
  timestamp  = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl     = {https://dblp.org/rec/conf/uai/Morrill0HWS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2301.07799 (CoRR), 2023; 47 authors listed.
@article{DBLP:journals/corr/abs-2301-07799,
  author     = {Baker, Megan M. and
                New, Alexander and
                Aguilar{-}Simon, Mario and
                Al{-}Halah, Ziad and
                Arnold, S{\'{e}}bastien M. R. and
                Ben{-}Iwhiwhu, Eseoghene and
                Brna, Andrew P. and
                Brooks, Ethan and
                Brown, Ryan C. and
                Daniels, Zachary and
                Daram, Anurag Reddy and
                Delattre, Fabien and
                Dellana, Ryan and
                Eaton, Eric and
                Fu, Haotian and
                Grauman, Kristen and
                Hostetler, Jesse and
                Iqbal, Shariq and
                Kent, Cassandra and
                Ketz, Nicholas and
                Kolouri, Soheil and
                Konidaris, George Dimitri and
                Kudithipudi, Dhireesha and
                Learned{-}Miller, Erik G. and
                Lee, Seungwon and
                Littman, Michael and
                Madireddy, Sandeep and
                Mendez, Jorge A. and
                Nguyen, Eric Q. and
                Piatko, Christine D. and
                Pilly, Praveen K. and
                Raghavan, Aswin and
                Rahman, Abrar and
                Ramakrishnan, Santhosh Kumar and
                Ratzlaff, Neale and
                Soltoggio, Andrea and
                Stone, Peter and
                Sur, Indranil and
                Tang, Zhipeng and
                Tiwari, Saket and
                Vedder, Kyle and
                Wang, Felix and
                Xu, Zifan and
                Yanguas{-}Gil, Angel and
                Yedidsion, Harel and
                Yu, Shangqun and
                Vallabha, Gautam K.},
  title      = {A Domain-Agnostic Approach for Characterization of Lifelong Learning Systems},
  journal    = {CoRR},
  volume     = {abs/2301.07799},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.07799},
  doi        = {10.48550/ARXIV.2301.07799},
  eprinttype = {arXiv},
  eprint     = {2301.07799},
  timestamp  = {Mon, 09 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-07799.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2304.11477 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2304-11477,
  author     = {Liu, Bo and
                Jiang, Yuqian and
                Zhang, Xiaohan and
                Liu, Qiang and
                Zhang, Shiqi and
                Biswas, Joydeep and
                Stone, Peter},
  title      = {{LLM+P:} Empowering Large Language Models with Optimal Planning Proficiency},
  journal    = {CoRR},
  volume     = {abs/2304.11477},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.11477},
  doi        = {10.48550/ARXIV.2304.11477},
  eprinttype = {arXiv},
  eprint     = {2304.11477},
  timestamp  = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-11477.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2305.04866 (CoRR). Same title and authors as the RSS 2023 record DBLP:conf/rss/HuSM23.
@article{DBLP:journals/corr/abs-2305-04866,
  author     = {Hu, Jiaheng and
                Stone, Peter and
                Mart{\'{\i}}n{-}Mart{\'{\i}}n, Roberto},
  title      = {Causal Policy Gradient for Whole-Body Mobile Manipulation},
  journal    = {CoRR},
  volume     = {abs/2305.04866},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.04866},
  doi        = {10.48550/ARXIV.2305.04866},
  eprinttype = {arXiv},
  eprint     = {2305.04866},
  timestamp  = {Fri, 12 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-04866.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2305.10395 (CoRR). Same title and authors as the RSS 2023 record DBLP:conf/rss/SungS23.
@article{DBLP:journals/corr/abs-2305-10395,
  author     = {Sung, Yoonchang and
                Stone, Peter},
  title      = {Motion Planning (In)feasibility Detection using a Prior Roadmap via Path and Cut Search},
  journal    = {CoRR},
  volume     = {abs/2305.10395},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.10395},
  doi        = {10.48550/ARXIV.2305.10395},
  eprinttype = {arXiv},
  eprint     = {2305.10395},
  timestamp  = {Wed, 24 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-10395.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2306.03310 (CoRR). Same title and authors as the NeurIPS 2023 record DBLP:conf/nips/LiuZGFLZS23.
@article{DBLP:journals/corr/abs-2306-03310,
  author     = {Liu, Bo and
                Zhu, Yifeng and
                Gao, Chongkai and
                Feng, Yihao and
                Liu, Qiang and
                Zhu, Yuke and
                Stone, Peter},
  title      = {{LIBERO:} Benchmarking Knowledge Transfer for Lifelong Robot Learning},
  journal    = {CoRR},
  volume     = {abs/2306.03310},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.03310},
  doi        = {10.48550/ARXIV.2306.03310},
  eprinttype = {arXiv},
  eprint     = {2306.03310},
  timestamp  = {Mon, 31 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-03310.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2306.03792 (CoRR). Same title and authors as the NeurIPS 2023 record DBLP:conf/nips/LiuFSL23.
@article{DBLP:journals/corr/abs-2306-03792,
  author     = {Liu, Bo and
                Feng, Yihao and
                Stone, Peter and
                Liu, Qiang},
  title      = {{FAMO:} Fast Adaptive Multitask Optimization},
  journal    = {CoRR},
  volume     = {abs/2306.03792},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.03792},
  doi        = {10.48550/ARXIV.2306.03792},
  eprinttype = {arXiv},
  eprint     = {2306.03792},
  timestamp  = {Mon, 31 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-03792.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2306.07372 (CoRR). Same title and authors as the UAI 2023 record DBLP:conf/uai/Morrill0HWS23.
@article{DBLP:journals/corr/abs-2306-07372,
  author     = {Morrill, Dustin and
                Walsh, Thomas J. and
                Hernandez, Daniel and
                Wurman, Peter R. and
                Stone, Peter},
  title      = {Composing Efficient, Robust Tests for Policy Selection},
  journal    = {CoRR},
  volume     = {abs/2306.07372},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.07372},
  doi        = {10.48550/ARXIV.2306.07372},
  eprinttype = {arXiv},
  eprint     = {2306.07372},
  timestamp  = {Sat, 17 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-07372.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2306.16740 (CoRR), 2023. The final author uses the hyphenated, accented
% spelling found in the other records of this file, so the surname parses as a single unit.
@article{DBLP:journals/corr/abs-2306-16740,
  author       = {Anthony G. Francis and
                  Claudia P{\'{e}}rez{-}D'Arpino and
                  Chengshu Li and
                  Fei Xia and
                  Alexandre Alahi and
                  Rachid Alami and
                  Aniket Bera and
                  Abhijat Biswas and
                  Joydeep Biswas and
                  Rohan Chandra and
                  Hao{-}Tien Lewis Chiang and
                  Michael Everett and
                  Sehoon Ha and
                  Justin W. Hart and
                  Jonathan P. How and
                  Haresh Karnan and
                  Tsang{-}Wei Edward Lee and
                  Luis J. Manso and
                  Reuth Mirsky and
                  S{\"{o}}ren Pirk and
                  Phani{-}Teja Singamaneni and
                  Peter Stone and
                  Ada V. Taylor and
                  Peter Trautman and
                  Nathan Tsoi and
                  Marynel V{\'{a}}zquez and
                  Xuesu Xiao and
                  Peng Xu and
                  Naoki Yokoyama and
                  Alexander Toshev and
                  Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n},
  title        = {Principles and Guidelines for Evaluating Social Robot Navigation Algorithms},
  journal      = {CoRR},
  volume       = {abs/2306.16740},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.16740},
  doi          = {10.48550/ARXIV.2306.16740},
  eprinttype   = {arXiv},
  eprint       = {2306.16740},
  timestamp    = {Mon, 03 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-16740.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2307.11889 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2307-11889,
  author     = {Zhang, Xiaohan and
                Zhu, Yifeng and
                Ding, Yan and
                Jiang, Yuqian and
                Zhu, Yuke and
                Stone, Peter and
                Zhang, Shiqi},
  title      = {Symbolic State Space Optimization for Long Horizon Mobile Manipulation Planning},
  journal    = {CoRR},
  volume     = {abs/2307.11889},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.11889},
  doi        = {10.48550/ARXIV.2307.11889},
  eprinttype = {arXiv},
  eprint     = {2307.11889},
  timestamp  = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-11889.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2308.03205 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2308-03205,
  author     = {Xiao, Xuesu and
                Xu, Zifan and
                Warnell, Garrett and
                Stone, Peter and
                Guinjoan, Ferran Gebelli and
                Rodrigues, R{\^{o}}mulo T. and
                Bruyninckx, Herman and
                Mandala, Hanjaya and
                Christmann, Guilherme and
                Blanco{-}Claraco, Jos{\'{e}} Luis and
                Rai, Shravan Somashekara},
  title      = {Autonomous Ground Navigation in Highly Constrained Spaces: Lessons learned from The 2nd {BARN} Challenge at {ICRA} 2023},
  journal    = {CoRR},
  volume     = {abs/2308.03205},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.03205},
  doi        = {10.48550/ARXIV.2308.03205},
  eprinttype = {arXiv},
  eprint     = {2308.03205},
  timestamp  = {Mon, 21 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-03205.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2308.09595 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2308-09595,
  author     = {Rahman, Arrasy and
                Cui, Jiaxun and
                Stone, Peter},
  title      = {Minimum Coverage Sets for Training Robust Ad Hoc Teamwork Agents},
  journal    = {CoRR},
  volume     = {abs/2308.09595},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.09595},
  doi        = {10.48550/ARXIV.2308.09595},
  eprinttype = {arXiv},
  eprint     = {2308.09595},
  timestamp  = {Fri, 25 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-09595.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2308.10966 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2308-10966,
  author     = {Chandra, Rohan and
                Zinage, Vrushabh and
                Bakolas, Efstathios and
                Biswas, Joydeep and
                Stone, Peter},
  title      = {Decentralized Multi-Robot Social Navigation in Constrained Environments via Game-Theoretic Control Barrier Functions},
  journal    = {CoRR},
  volume     = {abs/2308.10966},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.10966},
  doi        = {10.48550/ARXIV.2308.10966},
  eprinttype = {arXiv},
  eprint     = {2308.10966},
  timestamp  = {Wed, 30 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-10966.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2308.14269 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2308-14269,
  author     = {Liebman, Elad and
                Stone, Peter},
  title      = {Utilizing Mood-Inducing Background Music in Human-Robot Interaction},
  journal    = {CoRR},
  volume     = {abs/2308.14269},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.14269},
  doi        = {10.48550/ARXIV.2308.14269},
  eprinttype = {arXiv},
  eprint     = {2308.14269},
  timestamp  = {Fri, 01 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-14269.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2309.08897 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2309-08897,
  author     = {Sung, Yoonchang and
                Shome, Rahul and
                Stone, Peter},
  title      = {Asynchronous Task Plan Refinement for Multi-Robot Task and Motion Planning},
  journal    = {CoRR},
  volume     = {abs/2309.08897},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.08897},
  doi        = {10.48550/ARXIV.2309.08897},
  eprinttype = {arXiv},
  eprint     = {2309.08897},
  timestamp  = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-08897.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2309.09912 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2309-09912,
  author     = {Karnan, Haresh and
                Yang, Elvin and
                Warnell, Garrett and
                Biswas, Joydeep and
                Stone, Peter},
  title      = {Wait, That Feels Familiar: Learning to Extrapolate Human Preferences for Preference Aligned Path Planning},
  journal    = {CoRR},
  volume     = {abs/2309.09912},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.09912},
  doi        = {10.48550/ARXIV.2309.09912},
  eprinttype = {arXiv},
  eprint     = {2309.09912},
  timestamp  = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-09912.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2309.13466 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2309-13466,
  author     = {Raj, Amir Hossain and
                Hu, Zichao and
                Karnan, Haresh and
                Chandra, Rohan and
                Payandeh, Amirreza and
                Mao, Luisa and
                Stone, Peter and
                Biswas, Joydeep and
                Xiao, Xuesu},
  title      = {Targeted Learning: {A} Hybrid Approach to Social Robot Navigation},
  journal    = {CoRR},
  volume     = {abs/2309.13466},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.13466},
  doi        = {10.48550/ARXIV.2309.13466},
  eprinttype = {arXiv},
  eprint     = {2309.13466},
  timestamp  = {Wed, 27 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-13466.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2309.15302 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2309-15302,
  author     = {Karnan, Haresh and
                Yang, Elvin and
                Farkash, Daniel and
                Warnell, Garrett and
                Biswas, Joydeep and
                Stone, Peter},
  title      = {Self-Supervised Terrain Representation Learning from Unconstrained Robot Experience},
  journal    = {CoRR},
  volume     = {abs/2309.15302},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.15302},
  doi        = {10.48550/ARXIV.2309.15302},
  eprinttype = {arXiv},
  eprint     = {2309.15302},
  timestamp  = {Tue, 17 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-15302.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2310.02456 (CoRR). The AAAI 2024 record DBLP:conf/aaai/KnoxHABDSN24 lists the same authors; its title differs only in the capitalisation of "It".
@article{DBLP:journals/corr/abs-2310-02456,
  author     = {Knox, W. Bradley and
                Hatgis{-}Kessell, Stephane and
                Adalgeirsson, Sigurdur O. and
                Booth, Serena and
                Dragan, Anca D. and
                Stone, Peter and
                Niekum, Scott},
  title      = {Learning Optimal Advantage from Preferences and Mistaking it for Reward},
  journal    = {CoRR},
  volume     = {abs/2310.02456},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02456},
  doi        = {10.48550/ARXIV.2310.02456},
  eprinttype = {arXiv},
  eprint     = {2310.02456},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02456.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2310.06303 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2310-06303,
  author     = {Stark, Carson and
                Chun, Bohkyung and
                Charleston, Casey and
                Ravi, Varsha and
                Pabon, Luis and
                Sunkari, Surya and
                Mohan, Tarun and
                Stone, Peter and
                Hart, Justin W.},
  title      = {Dobby: {A} Conversational Service Robot Driven by {GPT-4}},
  journal    = {CoRR},
  volume     = {abs/2310.06303},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.06303},
  doi        = {10.48550/ARXIV.2310.06303},
  eprinttype = {arXiv},
  eprint     = {2310.06303},
  timestamp  = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-06303.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2310.06794 (CoRR); cf. the NeurIPS 2023 record conf/nips/AgarwalDSZ23, whose title differs only by the hyphen in Goal-Conditioned.
@article{DBLP:journals/corr/abs-2310-06794,
  author     = {Agarwal, Siddhant and
                Durugkar, Ishan and
                Stone, Peter and
                Zhang, Amy},
  title      = {f-Policy Gradients: {A} General Framework for Goal Conditioned {RL} using f-Divergences},
  journal    = {CoRR},
  volume     = {abs/2310.06794},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.06794},
  doi        = {10.48550/ARXIV.2310.06794},
  eprinttype = {arXiv},
  eprint     = {2310.06794},
  timestamp  = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-06794.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2310.08702 (CoRR). Same title as the NeurIPS 2023 record DBLP:conf/nips/WangHSM23.
% NOTE(review): the first two authors appear in the opposite order in that record; confirm against the arXiv listing.
@article{DBLP:journals/corr/abs-2310-08702,
  author       = {Jiaheng Hu and
                  Zizhao Wang and
                  Peter Stone and
                  Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n},
  title        = {{ELDEN:} Exploration via Local Dependencies},
  journal      = {CoRR},
  volume       = {abs/2310.08702},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.08702},
  doi          = {10.48550/ARXIV.2310.08702},
  eprinttype   = {arXiv},
  eprint       = {2310.08702},
  timestamp    = {Wed, 25 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-08702.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2310.14386 (CoRR), 2023. {3D} is brace-protected so sentence-casing styles do not render it as "3d".
@article{DBLP:journals/corr/abs-2310-14386,
  author       = {Yifeng Zhu and
                  Zhenyu Jiang and
                  Peter Stone and
                  Yuke Zhu},
  title        = {Learning Generalizable Manipulation Policies with Object-Centric {3D}
                  Representations},
  journal      = {CoRR},
  volume       = {abs/2310.14386},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.14386},
  doi          = {10.48550/ARXIV.2310.14386},
  eprinttype   = {arXiv},
  eprint       = {2310.14386},
  timestamp    = {Mon, 30 Oct 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-14386.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2311.00785 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2311-00785,
  author     = {Mannem, Swathi and
                Macke, William and
                Stone, Peter and
                Mirsky, Reuth},
  title      = {Exploring the Cost of Interruptions in Human-Robot Teaming},
  journal    = {CoRR},
  volume     = {abs/2311.00785},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.00785},
  doi        = {10.48550/ARXIV.2311.00785},
  eprinttype = {arXiv},
  eprint     = {2311.00785},
  timestamp  = {Tue, 07 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-00785.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2311.08783 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2311-08783,
  author     = {Paster, Sveta and
                Rogers, Kantwon and
                Briggs, Gordon and
                Stone, Peter and
                Mirsky, Reuth},
  title      = {{ICRA} Roboethics Challenge 2023: Intelligent Disobedience in an Elderly Care Home},
  journal    = {CoRR},
  volume     = {abs/2311.08783},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.08783},
  doi        = {10.48550/ARXIV.2311.08783},
  eprinttype = {arXiv},
  eprint     = {2311.08783},
  timestamp  = {Tue, 21 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-08783.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2312.04684 (CoRR), 2023.
@article{DBLP:journals/corr/abs-2312-04684,
  author     = {Xu, Zifan and
                Wang, Haozhu and
                Bespalov, Dmitriy and
                Stone, Peter and
                Qi, Yanjun},
  title      = {Latent Skill Discovery for Chain-of-Thought Reasoning},
  journal    = {CoRR},
  volume     = {abs/2312.04684},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2312.04684},
  doi        = {10.48550/ARXIV.2312.04684},
  eprinttype = {arXiv},
  eprint     = {2312.04684},
  timestamp  = {Wed, 03 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2312-04684.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, Auton. Robots 46(5), 2022.
@article{DBLP:journals/arobots/XiaoLWS22,
  author     = {Xiao, Xuesu and
                Liu, Bo and
                Warnell, Garrett and
                Stone, Peter},
  title      = {Motion planning and control for mobile robot navigation using machine learning: a survey},
  journal    = {Auton. Robots},
  volume     = {46},
  number     = {5},
  pages      = {569--597},
  year       = {2022},
  url        = {https://doi.org/10.1007/s10514-022-10039-8},
  doi        = {10.1007/S10514-022-10039-8},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/arobots/XiaoLWS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, IEEE Intell. Syst. 37(3), 2022.
@article{DBLP:journals/expert/WurmanSS22,
  author     = {Wurman, Peter R. and
                Stone, Peter and
                Spranger, Michael},
  title      = {Challenges and Opportunities of Applying Reinforcement Learning to Autonomous Racing},
  journal    = {{IEEE} Intell. Syst.},
  volume     = {37},
  number     = {3},
  pages      = {20--23},
  year       = {2022},
  url        = {https://doi.org/10.1109/MIS.2022.3184427},
  doi        = {10.1109/MIS.2022.3184427},
  timestamp  = {Mon, 08 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/expert/WurmanSS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, Oper. Res. 70(1), 2022.
@article{DBLP:journals/ior/AlbertCLS22,
  author     = {Albert, Michael and
                Conitzer, Vincent and
                Lopomo, Giuseppe and
                Stone, Peter},
  title      = {Mechanism Design for Correlated Valuations: Efficient Methods for Revenue Maximization},
  journal    = {Oper. Res.},
  volume     = {70},
  number     = {1},
  pages      = {562--584},
  year       = {2022},
  url        = {https://doi.org/10.1287/opre.2020.2092},
  doi        = {10.1287/OPRE.2020.2092},
  timestamp  = {Wed, 23 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ior/AlbertCLS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, Nature 602(7896), 2022. The journal is given by its full one-word title, and
% the proper noun {Gran Turismo} is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/nature/WurmanBKMS0CDE022,
  author       = {Peter R. Wurman and
                  Samuel Barrett and
                  Kenta Kawamoto and
                  James MacGlashan and
                  Kaushik Subramanian and
                  Thomas J. Walsh and
                  Roberto Capobianco and
                  Alisa Devlic and
                  Franziska Eckert and
                  Florian Fuchs and
                  Leilani Gilpin and
                  Piyush Khandelwal and
                  Varun Kompella and
                  HaoChih Lin and
                  Patrick MacAlpine and
                  Declan Oller and
                  Takuma Seno and
                  Craig Sherstan and
                  Michael D. Thomure and
                  Houmehr Aghabozorgi and
                  Leon Barrett and
                  Rory Douglas and
                  Dion Whitehead and
                  Peter D{\"{u}}rr and
                  Peter Stone and
                  Michael Spranger and
                  Hiroaki Kitano},
  title        = {Outracing champion {Gran Turismo} drivers with deep reinforcement learning},
  journal      = {Nature},
  volume       = {602},
  number       = {7896},
  pages        = {223--228},
  year         = {2022},
  url          = {https://doi.org/10.1038/s41586-021-04357-7},
  doi          = {10.1038/S41586-021-04357-7},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nature/WurmanBKMS0CDE022.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 34, issue 3, pages 1687--1712, 2022.
% The journal is stored under its full name so the bibliography style (not the
% database) decides whether to abbreviate it.
@article{DBLP:journals/nca/DuWGST22,
  author       = {Yunshu Du and
                  Garrett Warnell and
                  Assefaw H. Gebremedhin and
                  Peter Stone and
                  Matthew E. Taylor},
  title        = {Lucid dreaming for experience replay: refreshing past states with
                  the current policy},
  journal      = {Neural Computing and Applications},
  volume       = {34},
  number       = {3},
  pages        = {1687--1712},
  year         = {2022},
  url          = {https://doi.org/10.1007/s00521-021-06104-5},
  doi          = {10.1007/S00521-021-06104-5},
  timestamp    = {Wed, 23 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nca/DuWGST22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 7, issue 2, pages 4126--4133, 2022.
% The journal is stored under its full name; "IEEE" stays brace-protected.
@article{DBLP:journals/ral/ZhuSZ22,
  author       = {Yifeng Zhu and
                  Peter Stone and
                  Yuke Zhu},
  title        = {Bottom-Up Skill Discovery From Unsegmented Demonstrations for Long-Horizon
                  Robot Manipulation},
  journal      = {{IEEE} Robotics and Automation Letters},
  volume       = {7},
  number       = {2},
  pages        = {4126--4133},
  year         = {2022},
  url          = {https://doi.org/10.1109/LRA.2022.3146589},
  doi          = {10.1109/LRA.2022.3146589},
  timestamp    = {Fri, 01 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ral/ZhuSZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 7, issue 4, pages 11807--11814, 2022.
% "CompliAnt" is brace-protected because its internal capital would otherwise
% be lowercased by sentence-casing styles; the journal name is spelled out.
@article{DBLP:journals/ral/KarnanNXWPTHBS22,
  author       = {Haresh Karnan and
                  Anirudh Nair and
                  Xuesu Xiao and
                  Garrett Warnell and
                  S{\"{o}}ren Pirk and
                  Alexander Toshev and
                  Justin W. Hart and
                  Joydeep Biswas and
                  Peter Stone},
  title        = {Socially {CompliAnt} Navigation Dataset {(SCAND):} {A} Large-Scale Dataset
                  of Demonstrations for Social Navigation},
  journal      = {{IEEE} Robotics and Automation Letters},
  volume       = {7},
  number       = {4},
  pages        = {11807--11814},
  year         = {2022},
  url          = {https://doi.org/10.1109/LRA.2022.3184025},
  doi          = {10.1109/LRA.2022.3184025},
  timestamp    = {Mon, 05 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ral/KarnanNXWPTHBS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Magazine article, volume 29, issue 4, pages 148--156, 2022.
% The journal is stored under its full name; the ampersand is escaped for LaTeX.
@article{DBLP:journals/ram/XiaoXWSWSZRWKBM22,
  author       = {Xuesu Xiao and
                  Zifan Xu and
                  Zizhao Wang and
                  Yunlong Song and
                  Garrett Warnell and
                  Peter Stone and
                  Tingnan Zhang and
                  Shravan Ravi and
                  Gary Wang and
                  Haresh Karnan and
                  Joydeep Biswas and
                  Nicholas Mohammad and
                  Lauren Bramblett and
                  Rahul Peddi and
                  Nicola Bezzo and
                  Zhanteng Xie and
                  Philip M. Dames},
  title        = {Autonomous Ground Navigation in Highly Constrained Spaces: Lessons
                  Learned From the Benchmark Autonomous Robot Navigation Challenge at
                  {ICRA} 2022 [Competitions]},
  journal      = {{IEEE} Robotics \& Automation Magazine},
  volume       = {29},
  number       = {4},
  pages        = {148--156},
  year         = {2022},
  url          = {https://doi.org/10.1109/MRA.2022.3213466},
  doi          = {10.1109/MRA.2022.3213466},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ram/XiaoXWSWSZRWKBM22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 154, 2022. The pages field holds the article number
% 104132 (no page range is given). The journal is stored under its full name.
@article{DBLP:journals/ras/XiaoWXLWDNS22,
  author       = {Xuesu Xiao and
                  Zizhao Wang and
                  Zifan Xu and
                  Bo Liu and
                  Garrett Warnell and
                  Gauraang Dhamankar and
                  Anirudh Nair and
                  Peter Stone},
  title        = {{APPL:} Adaptive Planner Parameter Learning},
  journal      = {Robotics and Autonomous Systems},
  volume       = {154},
  pages        = {104132},
  year         = {2022},
  url          = {https://doi.org/10.1016/j.robot.2022.104132},
  doi          = {10.1016/J.ROBOT.2022.104132},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ras/XiaoWXLWDNS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoLLAs 2022 paper; PMLR volume 199, pages 231--242.
@inproceedings{DBLP:conf/collas/Shperberg0AS22,
  author = {Shahaf S. Shperberg and Bo Liu and Alessandro Allievi and Peter Stone},
  editor = {Sarath Chandar and Razvan Pascanu and Doina Precup},
  title = {A Rule-based Shield: Accumulating Safety Rules from Catastrophic
           Action Effects},
  booktitle = {Conference on Lifelong Learning Agents, CoLLAs 2022,
               22-24 August 2022, McGill University, Montr{\'{e}}al,
               Qu{\'{e}}bec, Canada},
  series = {Proceedings of Machine Learning Research},
  volume = {199},
  pages = {231--242},
  publisher = {{PMLR}},
  year = {2022},
  url = {https://proceedings.mlr.press/v199/shperberg22a.html},
  timestamp = {Fri, 17 Feb 2023 16:29:10 +0100},
  biburl = {https://dblp.org/rec/conf/collas/Shperberg0AS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoLLAs 2022 paper; PMLR volume 199, pages 243--254.
% Same title and authors as the arXiv entry DBLP:journals/corr/abs-2203-12817.
@inproceedings{DBLP:conf/collas/LiuLS22,
  author = {Bo Liu and Qiang Liu and Peter Stone},
  editor = {Sarath Chandar and Razvan Pascanu and Doina Precup},
  title = {Continual Learning and Private Unlearning},
  booktitle = {Conference on Lifelong Learning Agents, CoLLAs 2022,
               22-24 August 2022, McGill University, Montr{\'{e}}al,
               Qu{\'{e}}bec, Canada},
  series = {Proceedings of Machine Learning Research},
  volume = {199},
  pages = {243--254},
  publisher = {{PMLR}},
  year = {2022},
  url = {https://proceedings.mlr.press/v199/liu22a.html},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/collas/LiuLS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRL 2022 paper; PMLR volume 205, pages 1199--1210.
@inproceedings{DBLP:conf/corl/ZhuJSZ22,
  author = {Yifeng Zhu and Abhishek Joshi and Peter Stone and Yuke Zhu},
  editor = {Karen Liu and Dana Kulic and Jeffrey Ichnowski},
  title = {{VIOLA:} Object-Centric Imitation Learning for Vision-Based
           Robot Manipulation},
  booktitle = {Conference on Robot Learning, CoRL 2022, 14-18 December 2022,
               Auckland, New Zealand},
  series = {Proceedings of Machine Learning Research},
  volume = {205},
  pages = {1199--1210},
  publisher = {{PMLR}},
  year = {2022},
  url = {https://proceedings.mlr.press/v205/zhu23a.html},
  timestamp = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/corl/ZhuJSZ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRL 2022 paper; PMLR volume 205, pages 2115--2124.
@inproceedings{DBLP:conf/corl/SungWS22,
  author = {Yoonchang Sung and Zizhao Wang and Peter Stone},
  editor = {Karen Liu and Dana Kulic and Jeffrey Ichnowski},
  title = {Learning to Correct Mistakes: Backjumping in Long-Horizon Task
           and Motion Planning},
  booktitle = {Conference on Robot Learning, CoRL 2022, 14-18 December 2022,
               Auckland, New Zealand},
  series = {Proceedings of Machine Learning Research},
  volume = {205},
  pages = {2115--2124},
  publisher = {{PMLR}},
  year = {2022},
  url = {https://proceedings.mlr.press/v205/sung23a.html},
  timestamp = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/corl/SungWS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2022 paper, pages 17231--17241.
% The system name is brace-protected so sentence-casing styles cannot alter it;
% the arXiv entry DBLP:journals/corr/abs-2205-02222 already braces the same name.
@inproceedings{DBLP:conf/cvpr/CuiQ0SZ22,
  author       = {Jiaxun Cui and
                  Hang Qiu and
                  Dian Chen and
                  Peter Stone and
                  Yuke Zhu},
  title        = {{Coopernaut:} End-to-End Driving with Cooperative Perception for Networked
                  Vehicles},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2022, New Orleans, LA, USA, June 18-24, 2022},
  pages        = {17231--17241},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/CVPR52688.2022.01674},
  doi          = {10.1109/CVPR52688.2022.01674},
  timestamp    = {Mon, 13 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/CuiQ0SZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% e-Energy '22 paper, pages 442--443.
@inproceedings{DBLP:conf/eenergy/Nweye0LS22,
  author = {Kingsley Nweye and Zolt{\'{a}}n Nagy and Bo Liu and Peter Stone},
  editor = {Sebastian Lehnhoff and David E. Irwin and Dan Wang},
  title = {Offline training of multi-agent reinforcement agents for
           grid-interactive buildings control},
  booktitle = {e-Energy '22: The Thirteenth {ACM} International Conference on
               Future Energy Systems, Virtual Event, 28 June 2022 - 1 July 2022},
  pages = {442--443},
  publisher = {{ACM}},
  year = {2022},
  url = {https://doi.org/10.1145/3538637.3538752},
  doi = {10.1145/3538637.3538752},
  timestamp = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/eenergy/Nweye0LS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% EUMAS 2022 paper; Lecture Notes in Computer Science volume 13442, pages 275--293.
% The underscore in url/doi is kept LaTeX-escaped exactly as exported.
@inproceedings{DBLP:conf/eumas/MirskyCRFMSSA22,
  author = {Reuth Mirsky and Ignacio Carlucho and Arrasy Rahman and
            Elliot Fosong and William Macke and Mohan Sridharan and
            Peter Stone and Stefano V. Albrecht},
  editor = {Dorothea Baumeister and J{\"{o}}rg Rothe},
  title = {A Survey of Ad Hoc Teamwork Research},
  booktitle = {Multi-Agent Systems - 19th European Conference, {EUMAS} 2022,
               D{\"{u}}sseldorf, Germany, September 14-16, 2022, Proceedings},
  series = {Lecture Notes in Computer Science},
  volume = {13442},
  pages = {275--293},
  publisher = {Springer},
  year = {2022},
  url = {https://doi.org/10.1007/978-3-031-20614-6\_16},
  doi = {10.1007/978-3-031-20614-6\_16},
  timestamp = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/eumas/MirskyCRFMSSA22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% GECCO '22 paper, pages 721--729.
% Same authors and (up to capitalisation) the same title as the arXiv entry
% DBLP:journals/corr/abs-2204-04817.
@inproceedings{DBLP:conf/gecco/KumarLMS22,
  author = {Akarsh Kumar and Bo Liu and Risto Miikkulainen and Peter Stone},
  editor = {Jonathan E. Fieldsend and Markus Wagner},
  title = {Effective mutation rate adaptation through group elite selection},
  booktitle = {{GECCO} '22: Genetic and Evolutionary Computation Conference,
               Boston, Massachusetts, USA, July 9 - 13, 2022},
  pages = {721--729},
  publisher = {{ACM}},
  year = {2022},
  url = {https://doi.org/10.1145/3512290.3528706},
  doi = {10.1145/3512290.3528706},
  timestamp = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/gecco/KumarLMS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2022 paper; PMLR volume 162, pages 23151--23180.
% Same title and authors as the arXiv entry DBLP:journals/corr/abs-2206-13452.
@inproceedings{DBLP:conf/icml/WangXXZS22,
  author = {Zizhao Wang and Xuesu Xiao and Zifan Xu and Yuke Zhu and Peter Stone},
  editor = {Kamalika Chaudhuri and Stefanie Jegelka and Le Song and
            Csaba Szepesv{\'{a}}ri and Gang Niu and Sivan Sabato},
  title = {Causal Dynamics Learning for Task-Independent State Abstraction},
  booktitle = {International Conference on Machine Learning, {ICML} 2022,
               17-23 July 2022, Baltimore, Maryland, {USA}},
  series = {Proceedings of Machine Learning Research},
  volume = {162},
  pages = {23151--23180},
  publisher = {{PMLR}},
  year = {2022},
  url = {https://proceedings.mlr.press/v162/wang22ae.html},
  timestamp = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl = {https://dblp.org/rec/conf/icml/WangXXZS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2022 paper, pages 1925--1931.
% Same title and authors as the arXiv entry DBLP:journals/corr/abs-2202-10667.
@inproceedings{DBLP:conf/icra/ZhangZDZS022,
  author = {Xiaohan Zhang and Yifeng Zhu and Yan Ding and Yuke Zhu and
            Peter Stone and Shiqi Zhang},
  title = {Visually Grounded Task and Motion Planning for Mobile Manipulation},
  booktitle = {2022 International Conference on Robotics and Automation,
               {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages = {1925--1931},
  publisher = {{IEEE}},
  year = {2022},
  url = {https://doi.org/10.1109/ICRA46639.2022.9812055},
  doi = {10.1109/ICRA46639.2022.9812055},
  timestamp = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/icra/ZhangZDZS022.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2022 paper, pages 2452--2458.
@inproceedings{DBLP:conf/icra/KarnanTWS22,
  author = {Haresh Karnan and Faraz Torabi and Garrett Warnell and Peter Stone},
  title = {Adversarial Imitation Learning from Video Using a State Observer},
  booktitle = {2022 International Conference on Robotics and Automation,
               {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages = {2452--2458},
  publisher = {{IEEE}},
  year = {2022},
  url = {https://doi.org/10.1109/ICRA46639.2022.9811570},
  doi = {10.1109/ICRA46639.2022.9811570},
  timestamp = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icra/KarnanTWS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2022 paper, pages 2482--2488.
@inproceedings{DBLP:conf/icra/HudsonWTS22,
  author = {Eddy Hudson and Garrett Warnell and Faraz Torabi and Peter Stone},
  title = {Skeletal Feature Compensation for Imitation Learning with
           Embodiment Mismatch},
  booktitle = {2022 International Conference on Robotics and Automation,
               {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages = {2482--2488},
  publisher = {{IEEE}},
  year = {2022},
  url = {https://doi.org/10.1109/ICRA46639.2022.9812127},
  doi = {10.1109/ICRA46639.2022.9812127},
  timestamp = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icra/HudsonWTS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2022 paper, pages 2497--2503.
@inproceedings{DBLP:conf/icra/KarnanWXS22,
  author = {Haresh Karnan and Garrett Warnell and Xuesu Xiao and Peter Stone},
  title = {{VOILA:} Visual-Observation-Only Imitation Learning for
           Autonomous Navigation},
  booktitle = {2022 International Conference on Robotics and Automation,
               {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages = {2497--2503},
  publisher = {{IEEE}},
  year = {2022},
  url = {https://doi.org/10.1109/ICRA46639.2022.9812316},
  doi = {10.1109/ICRA46639.2022.9812316},
  timestamp = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icra/KarnanWXS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2022 paper, pages 3437--3443.
% The editor is written in "Last, First" form: in "First Last" order BibTeX
% treats only the final capitalised word as the surname, which would split
% the two-word surname "De Raedt".
@inproceedings{DBLP:conf/ijcai/SokarMMPS22,
  author       = {Ghada Sokar and
                  Elena Mocanu and
                  Decebal Constantin Mocanu and
                  Mykola Pechenizkiy and
                  Peter Stone},
  editor       = {De Raedt, Luc},
  title        = {Dynamic Sparse Training for Deep Reinforcement Learning},
  booktitle    = {Proceedings of the Thirty-First International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2022, Vienna, Austria, 23-29 July
                  2022},
  pages        = {3437--3443},
  publisher    = {ijcai.org},
  year         = {2022},
  url          = {https://doi.org/10.24963/ijcai.2022/477},
  doi          = {10.24963/IJCAI.2022/477},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcai/SokarMMPS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2022 paper, pages 3294--3301.
% Same title and authors as the arXiv entry DBLP:journals/corr/abs-2203-15983.
@inproceedings{DBLP:conf/iros/KarnanSARXWSB22,
  author = {Haresh Karnan and Kavan Singh Sikand and Pranav Atreya and
            Sadegh Rabiee and Xuesu Xiao and Garrett Warnell and
            Peter Stone and Joydeep Biswas},
  title = {{VI-IKD:} High-Speed Accurate Off-Road Navigation using Learned
           Visual-Inertial Inverse Kinodynamics},
  booktitle = {{IEEE/RSJ} International Conference on Intelligent Robots and
               Systems, {IROS} 2022, Kyoto, Japan, October 23-27, 2022},
  pages = {3294--3301},
  publisher = {{IEEE}},
  year = {2022},
  url = {https://doi.org/10.1109/IROS47612.2022.9982060},
  doi = {10.1109/IROS47612.2022.9982060},
  timestamp = {Tue, 03 Jan 2023 14:18:21 +0100},
  biburl = {https://dblp.org/rec/conf/iros/KarnanSARXWSB22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2022 paper, pages 10734--10739.
@inproceedings{DBLP:conf/iros/GhonasgiMHSD22,
  author = {Keya Ghonasgi and Reuth Mirsky and Adrian M. Haith and
            Peter Stone and Ashish D. Deshpande},
  title = {Quantifying Changes in Kinematic Behavior of a Human-Exoskeleton
           Interactive System},
  booktitle = {{IEEE/RSJ} International Conference on Intelligent Robots and
               Systems, {IROS} 2022, Kyoto, Japan, October 23-27, 2022},
  pages = {10734--10739},
  publisher = {{IEEE}},
  year = {2022},
  url = {https://doi.org/10.1109/IROS47612.2022.9981032},
  doi = {10.1109/IROS47612.2022.9981032},
  timestamp = {Tue, 03 Jan 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/iros/GhonasgiMHSD22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper (no pages or publisher are recorded for this entry).
% Editors are stored with full given names so the style decides whether to
% abbreviate them; the acronym "BOME!" is brace-protected against
% sentence-casing. NOTE(review): expanded editor names should be checked
% against the proceedings front matter.
@inproceedings{DBLP:conf/nips/LiuYWSL22,
  author       = {Bo Liu and
                  Mao Ye and
                  Stephen Wright and
                  Peter Stone and
                  Qiang Liu},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {{BOME!} Bilevel Optimization Made Easy: {A} Simple First-Order Approach},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/6dddcff5b115b40c998a08fbd1cea4d7-Abstract-Conference.html},
  timestamp    = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/LiuYWSL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper (no pages or publisher are recorded for this entry).
% Editors are stored with full given names so the style decides whether to
% abbreviate them. NOTE(review): expanded editor names should be checked
% against the proceedings front matter.
@inproceedings{DBLP:conf/nips/MacGlashanADSSW22,
  author       = {James MacGlashan and
                  Evan Archer and
                  Alisa Devlic and
                  Takuma Seno and
                  Craig Sherstan and
                  Peter R. Wurman and
                  Peter Stone},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Value Function Decomposition for Iterative Design of Reinforcement
                  Learning Agents},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/4eb2c0adafbe71269f3a772c130f9e53-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/MacGlashanADSSW22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% RoboCup 2022 paper; Lecture Notes in Computer Science volume 13561, pages 62--74.
% The underscore in url/doi is kept LaTeX-escaped exactly as exported.
@inproceedings{DBLP:conf/robocup/NarayanaswamiTD22,
  author = {Sai Kiran Narayanaswami and Mauricio Tec and Ishan Durugkar and
            Siddharth Desai and Bharath Masetty and Sanmit Narvekar and
            Peter Stone},
  editor = {Amy Eguchi and Nuno Lau and Maike Paetzel{-}Pr{\"{u}}smann and
            Thanapat Wanichanon},
  title = {Towards a Real-Time, Low-Resource, End-to-End Object Detection
           Pipeline for Robot Soccer},
  booktitle = {RoboCup 2022: - Robot World Cup {XXV} [Bangkok, Thailand,
               July 11-17, 2022]},
  series = {Lecture Notes in Computer Science},
  volume = {13561},
  pages = {62--74},
  publisher = {Springer},
  year = {2022},
  url = {https://doi.org/10.1007/978-3-031-28469-4\_6},
  doi = {10.1007/978-3-031-28469-4\_6},
  timestamp = {Wed, 24 May 2023 15:08:30 +0200},
  biburl = {https://dblp.org/rec/conf/robocup/NarayanaswamiTD22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SSRR 2022 paper, pages 347--352.
% "DynaBARN" is brace-protected because sentence-casing styles would otherwise
% lowercase its internal capitals.
@inproceedings{DBLP:conf/ssrr/NairJHXLXS22,
  author       = {Anirudh Nair and
                  Fulin Jiang and
                  Kang Hou and
                  Zifan Xu and
                  Shuozhe Li and
                  Xuesu Xiao and
                  Peter Stone},
  title        = {{DynaBARN:} Benchmarking Metric Ground Navigation in Dynamic Environments},
  booktitle    = {{IEEE} International Symposium on Safety, Security, and Rescue Robotics,
                  {SSRR} 2022, Sevilla, Spain, November 8-10, 2022},
  pages        = {347--352},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/SSRR56537.2022.10018758},
  doi          = {10.1109/SSRR56537.2022.10018758},
  timestamp    = {Wed, 08 Feb 2023 22:09:23 +0100},
  biburl       = {https://dblp.org/rec/conf/ssrr/NairJHXLXS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.00243 (CoRR).
% Presumably the preprint of DBLP:conf/icra/KarnanTWS22: same four authors and
% the same title apart from capitalisation, but a different author order.
@article{DBLP:journals/corr/abs-2202-00243,
  author = {Haresh Karnan and Garrett Warnell and Faraz Torabi and Peter Stone},
  title = {Adversarial Imitation Learning from Video using a State Observer},
  journal = {CoRR},
  volume = {abs/2202.00243},
  year = {2022},
  url = {https://arxiv.org/abs/2202.00243},
  eprinttype = {arXiv},
  eprint = {2202.00243},
  timestamp = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2202-00243.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.09516 (CoRR).
@article{DBLP:journals/corr/abs-2202-09516,
  author = {Shahaf S. Shperberg and Bo Liu and Peter Stone},
  title = {Learning a Shield from Catastrophic Action Effects: Never Repeat
           the Same Mistake},
  journal = {CoRR},
  volume = {abs/2202.09516},
  year = {2022},
  url = {https://arxiv.org/abs/2202.09516},
  eprinttype = {arXiv},
  eprint = {2202.09516},
  timestamp = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2202-09516.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.10450 (CoRR).
% Same author list as DBLP:conf/eumas/MirskyCRFMSSA22, but with a longer title;
% presumably related -- confirm before treating them as one work.
@article{DBLP:journals/corr/abs-2202-10450,
  author = {Reuth Mirsky and Ignacio Carlucho and Arrasy Rahman and
            Elliot Fosong and William Macke and Mohan Sridharan and
            Peter Stone and Stefano V. Albrecht},
  title = {A Survey of Ad Hoc Teamwork: Definitions, Methods, and Open Problems},
  journal = {CoRR},
  volume = {abs/2202.10450},
  year = {2022},
  url = {https://arxiv.org/abs/2202.10450},
  eprinttype = {arXiv},
  eprint = {2202.10450},
  timestamp = {Wed, 02 Mar 2022 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2202-10450.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.10667 (CoRR).
% Same title and authors as the ICRA 2022 entry DBLP:conf/icra/ZhangZDZS022.
@article{DBLP:journals/corr/abs-2202-10667,
  author = {Xiaohan Zhang and Yifeng Zhu and Yan Ding and Yuke Zhu and
            Peter Stone and Shiqi Zhang},
  title = {Visually Grounded Task and Motion Planning for Mobile Manipulation},
  journal = {CoRR},
  volume = {abs/2202.10667},
  year = {2022},
  url = {https://arxiv.org/abs/2202.10667},
  eprinttype = {arXiv},
  eprint = {2202.10667},
  timestamp = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2202-10667.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.12817 (CoRR).
% Same title and authors as the CoLLAs 2022 entry DBLP:conf/collas/LiuLS22.
@article{DBLP:journals/corr/abs-2203-12817,
  author = {Bo Liu and Qiang Liu and Peter Stone},
  title = {Continual Learning and Private Unlearning},
  journal = {CoRR},
  volume = {abs/2203.12817},
  year = {2022},
  url = {https://doi.org/10.48550/arXiv.2203.12817},
  doi = {10.48550/ARXIV.2203.12817},
  eprinttype = {arXiv},
  eprint = {2203.12817},
  timestamp = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2203-12817.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.15041 (CoRR).
% Same authors and (up to capitalisation) the same title as the journal entry
% DBLP:journals/ral/KarnanNXWPTHBS22.
@article{DBLP:journals/corr/abs-2203-15041,
  author = {Haresh Karnan and Anirudh Nair and Xuesu Xiao and
            Garrett Warnell and S{\"{o}}ren Pirk and Alexander Toshev and
            Justin W. Hart and Joydeep Biswas and Peter Stone},
  title = {Socially Compliant Navigation Dataset {(SCAND):} {A} Large-Scale
           Dataset of Demonstrations for Social Navigation},
  journal = {CoRR},
  volume = {abs/2203.15041},
  year = {2022},
  url = {https://doi.org/10.48550/arXiv.2203.15041},
  doi = {10.48550/ARXIV.2203.15041},
  eprinttype = {arXiv},
  eprint = {2203.15041},
  timestamp = {Mon, 28 Nov 2022 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2203-15041.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.15983 (CoRR).
% Same title and authors as the IROS 2022 entry DBLP:conf/iros/KarnanSARXWSB22.
@article{DBLP:journals/corr/abs-2203-15983,
  author = {Haresh Karnan and Kavan Singh Sikand and Pranav Atreya and
            Sadegh Rabiee and Xuesu Xiao and Garrett Warnell and
            Peter Stone and Joydeep Biswas},
  title = {{VI-IKD:} High-Speed Accurate Off-Road Navigation using Learned
           Visual-Inertial Inverse Kinodynamics},
  journal = {CoRR},
  volume = {abs/2203.15983},
  year = {2022},
  url = {https://doi.org/10.48550/arXiv.2203.15983},
  doi = {10.48550/ARXIV.2203.15983},
  eprinttype = {arXiv},
  eprint = {2203.15983},
  timestamp = {Mon, 04 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2203-15983.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.04817 (CoRR).
% Same authors and (up to capitalisation) the same title as the GECCO '22 entry
% DBLP:conf/gecco/KumarLMS22.
@article{DBLP:journals/corr/abs-2204-04817,
  author = {Akarsh Kumar and Bo Liu and Risto Miikkulainen and Peter Stone},
  title = {Effective Mutation Rate Adaptation through Group Elite Selection},
  journal = {CoRR},
  volume = {abs/2204.04817},
  year = {2022},
  url = {https://doi.org/10.48550/arXiv.2204.04817},
  doi = {10.48550/ARXIV.2204.04817},
  eprinttype = {arXiv},
  eprint = {2204.04817},
  timestamp = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2204-04817.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.02222 (CoRR).
% Same authors and (up to capitalisation) the same title as the CVPR 2022 entry
% DBLP:conf/cvpr/CuiQ0SZ22.
@article{DBLP:journals/corr/abs-2205-02222,
  author = {Jiaxun Cui and Hang Qiu and Dian Chen and Peter Stone and Yuke Zhu},
  title = {{COOPERNAUT:} End-to-End Driving with Cooperative Perception for
           Networked Vehicles},
  journal = {CoRR},
  volume = {abs/2205.02222},
  year = {2022},
  url = {https://doi.org/10.48550/arXiv.2205.02222},
  doi = {10.48550/ARXIV.2205.02222},
  eprinttype = {arXiv},
  eprint = {2205.02222},
  timestamp = {Mon, 13 Nov 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2205-02222.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.00233 (CoRR).
% The leading "DM" plus its superscript is wrapped in one brace group so
% sentence-casing styles cannot turn it into "Dm"; the eprinttype line is
% re-aligned with the other fields.
@article{DBLP:journals/corr/abs-2206-00233,
  author       = {Caroline Wang and
                  Ishan Durugkar and
                  Elad Liebman and
                  Peter Stone},
  title        = {{DM\({}^{\mbox{2}}\):} Distributed Multi-Agent Reinforcement Learning
                  for Distribution Matching},
  journal      = {CoRR},
  volume       = {abs/2206.00233},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.00233},
  doi          = {10.48550/ARXIV.2206.00233},
  eprinttype   = {arXiv},
  eprint       = {2206.00233},
  timestamp    = {Mon, 13 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-00233.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.02231 (CoRR).
@article{DBLP:journals/corr/abs-2206-02231,
  author = {W. Bradley Knox and Stephane Hatgis{-}Kessell and Serena Booth and
            Scott Niekum and Peter Stone and Alessandro Allievi},
  title = {Models of human preference for learning reward functions},
  journal = {CoRR},
  volume = {abs/2206.02231},
  year = {2022},
  url = {https://doi.org/10.48550/arXiv.2206.02231},
  doi = {10.48550/ARXIV.2206.02231},
  eprinttype = {arXiv},
  eprint = {2206.02231},
  timestamp = {Mon, 13 Jun 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2206-02231.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.08487 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2206-08487,
  author       = {Atreya, Pranav and
                  Karnan, Haresh and
                  Sikand, Kavan Singh and
                  Xiao, Xuesu and
                  Warnell, Garrett and
                  Rabiee, Sadegh and
                  Stone, Peter and
                  Biswas, Joydeep},
  title        = {High-Speed Accurate Robot Control using Learned Forward Kinodynamics
                  and Non-linear Least Squares Optimization},
  journal      = {CoRR},
  volume       = {abs/2206.08487},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.08487},
  doi          = {10.48550/ARXIV.2206.08487},
  eprinttype   = {arXiv},
  eprint       = {2206.08487},
  timestamp    = {Tue, 21 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-08487.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.13452 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2206-13452,
  author       = {Wang, Zizhao and
                  Xiao, Xuesu and
                  Xu, Zifan and
                  Zhu, Yuke and
                  Stone, Peter},
  title        = {Causal Dynamics Learning for Task-Independent State Abstraction},
  journal      = {CoRR},
  volume       = {abs/2206.13452},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.13452},
  doi          = {10.48550/ARXIV.2206.13452},
  eprinttype   = {arXiv},
  eprint       = {2206.13452},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-13452.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.13901 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2206-13901,
  author       = {MacGlashan, James and
                  Archer, Evan and
                  Devlic, Alisa and
                  Seno, Takuma and
                  Sherstan, Craig and
                  Wurman, Peter R. and
                  Stone, Peter},
  title        = {Value Function Decomposition for Iterative Design of Reinforcement
                  Learning Agents},
  journal      = {CoRR},
  volume       = {abs/2206.13901},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.13901},
  doi          = {10.48550/ARXIV.2206.13901},
  eprinttype   = {arXiv},
  eprint       = {2206.13901},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-13901.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2208.08133 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2208-08133,
  author       = {Liu, Bo and
                  Feng, Yihao and
                  Liu, Qiang and
                  Stone, Peter},
  title        = {Metric Residual Networks for Sample Efficient Goal-conditioned Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2208.08133},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.08133},
  doi          = {10.48550/ARXIV.2208.08133},
  eprinttype   = {arXiv},
  eprint       = {2208.08133},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-08133.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2208.10473 (CoRR, 2022). The event name "The BARN Challenge" is
% brace-protected as a whole so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2208-10473,
  author       = {Xiao, Xuesu and
                  Xu, Zifan and
                  Wang, Zizhao and
                  Song, Yunlong and
                  Warnell, Garrett and
                  Stone, Peter and
                  Zhang, Tingnan and
                  Ravi, Shravan and
                  Wang, Gary and
                  Karnan, Haresh and
                  Biswas, Joydeep and
                  Mohammad, Nicholas and
                  Bramblett, Lauren and
                  Peddi, Rahul and
                  Bezzo, Nicola and
                  Xie, Zhanteng and
                  Dames, Philip M.},
  title        = {Autonomous Ground Navigation in Highly Constrained Spaces: Lessons
                  learned from {The BARN Challenge} at {ICRA} 2022},
  journal      = {CoRR},
  volume       = {abs/2208.10473},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.10473},
  doi          = {10.48550/ARXIV.2208.10473},
  eprinttype   = {arXiv},
  eprint       = {2208.10473},
  timestamp    = {Mon, 29 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-10473.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.08709 (CoRR, 2022). The acronym BOME is brace-protected so
% sentence-casing bibliography styles do not render it as "Bome".
@article{DBLP:journals/corr/abs-2209-08709,
  author       = {Ye, Mao and
                  Liu, Bo and
                  Wright, Stephen and
                  Stone, Peter and
                  Liu, Qiang},
  title        = {{BOME!} Bilevel Optimization Made Easy: {A} Simple First-Order Approach},
  journal      = {CoRR},
  volume       = {abs/2209.08709},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.08709},
  doi          = {10.48550/ARXIV.2209.08709},
  eprinttype   = {arXiv},
  eprint       = {2209.08709},
  timestamp    = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-08709.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.13641 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2209-13641,
  author       = {Park, Jin Soo and
                  Xiao, Xuesu and
                  Warnell, Garrett and
                  Yedidsion, Harel and
                  Stone, Peter},
  title        = {Learning Perceptual Hallucination for Multi-Robot Navigation in Narrow
                  Hallways},
  journal      = {CoRR},
  volume       = {abs/2209.13641},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.13641},
  doi          = {10.48550/ARXIV.2209.13641},
  eprinttype   = {arXiv},
  eprint       = {2209.13641},
  timestamp    = {Thu, 06 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-13641.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.04839 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2210-04839,
  author       = {Xu, Zifan and
                  Liu, Bo and
                  Xiao, Xuesu and
                  Nair, Anirudh and
                  Stone, Peter},
  title        = {Benchmarking Reinforcement Learning Techniques for Autonomous Navigation},
  journal      = {CoRR},
  volume       = {abs/2210.04839},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.04839},
  doi          = {10.48550/ARXIV.2210.04839},
  eprinttype   = {arXiv},
  eprint       = {2210.04839},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-04839.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.04852 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2210-04852,
  author       = {Xu, Zifan and
                  Nair, Anirudh and
                  Xiao, Xuesu and
                  Stone, Peter},
  title        = {Learning Real-world Autonomous Navigation by Self-Supervised Environment
                  Synthesis},
  journal      = {CoRR},
  volume       = {abs/2210.04852},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.04852},
  doi          = {10.48550/ARXIV.2210.04852},
  eprinttype   = {arXiv},
  eprint       = {2210.04852},
  timestamp    = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-04852.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.10999 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2210-10999,
  author       = {Bajaj, Vaibhav and
                  Sharon, Guni and
                  Stone, Peter},
  title        = {Task Phasing: Automated Curriculum Learning from Demonstrations},
  journal      = {CoRR},
  volume       = {abs/2210.10999},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.10999},
  doi          = {10.48550/ARXIV.2210.10999},
  eprinttype   = {arXiv},
  eprint       = {2210.10999},
  timestamp    = {Tue, 25 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-10999.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.11339 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2210-11339,
  author       = {Zhu, Yifeng and
                  Joshi, Abhishek and
                  Stone, Peter and
                  Zhu, Yuke},
  title        = {{VIOLA:} Imitation Learning for Vision-Based Manipulation with Object
                  Proposal Priors},
  journal      = {CoRR},
  volume       = {abs/2210.11339},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.11339},
  doi          = {10.48550/ARXIV.2210.11339},
  eprinttype   = {arXiv},
  eprint       = {2210.11339},
  timestamp    = {Tue, 25 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-11339.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.14428 (CoRR, 2022). The method name D-Shape is brace-protected
% so sentence-casing bibliography styles do not render it as "D-shape".
@article{DBLP:journals/corr/abs-2210-14428,
  author       = {Wang, Caroline and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {{D-Shape}: Demonstration-Shaped Reinforcement Learning via Goal Conditioning},
  journal      = {CoRR},
  volume       = {abs/2210.14428},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.14428},
  doi          = {10.48550/ARXIV.2210.14428},
  eprinttype   = {arXiv},
  eprint       = {2210.14428},
  timestamp    = {Mon, 31 Oct 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-14428.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.00576 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2211-00576,
  author       = {Kompella, Varun and
                  Walsh, Thomas and
                  Barrett, Samuel and
                  Wurman, Peter R. and
                  Stone, Peter},
  title        = {Event Tables for Efficient Experience Replay},
  journal      = {CoRR},
  volume       = {abs/2211.00576},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.00576},
  doi          = {10.48550/ARXIV.2211.00576},
  eprinttype   = {arXiv},
  eprint       = {2211.00576},
  timestamp    = {Tue, 15 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-00576.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.04005 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2211-04005,
  author       = {Hudson, Eddy and
                  Durugkar, Ishan and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {{ABC:} Adversarial Behavioral Cloning for Offline Mode-Seeking Imitation
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2211.04005},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.04005},
  doi          = {10.48550/ARXIV.2211.04005},
  eprinttype   = {arXiv},
  eprint       = {2211.04005},
  timestamp    = {Wed, 09 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-04005.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.06318 (CoRR, 2022). The study name in the subtitle is
% brace-protected so sentence-casing styles keep its capitalisation.
% NOTE(review): treats "One Hundred Year Study on Artificial Intelligence" as a
% proper name - confirm this matches the intended rendering.
@article{DBLP:journals/corr/abs-2211-06318,
  author       = {Stone, Peter and
                  Brooks, Rodney and
                  Brynjolfsson, Erik and
                  Calo, Ryan and
                  Etzioni, Oren and
                  Hager, Greg and
                  Hirschberg, Julia and
                  Kalyanakrishnan, Shivaram and
                  Kamar, Ece and
                  Kraus, Sarit and
                  Leyton{-}Brown, Kevin and
                  Parkes, David C. and
                  Press, William H. and
                  Saxenian, AnnaLee and
                  Shah, Julie and
                  Tambe, Milind and
                  Teller, Astro},
  title        = {Artificial Intelligence and Life in 2030: The {One Hundred Year Study
                  on Artificial Intelligence}},
  journal      = {CoRR},
  volume       = {abs/2211.06318},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.06318},
  doi          = {10.48550/ARXIV.2211.06318},
  eprinttype   = {arXiv},
  eprint       = {2211.06318},
  timestamp    = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-06318.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.07847 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2211-07847,
  author       = {Sung, Yoonchang and
                  Wang, Zizhao and
                  Stone, Peter},
  title        = {Learning to Correct Mistakes: Backjumping in Long-Horizon Task and
                  Motion Planning},
  journal      = {CoRR},
  volume       = {abs/2211.07847},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.07847},
  doi          = {10.48550/ARXIV.2211.07847},
  eprinttype   = {arXiv},
  eprint       = {2211.07847},
  timestamp    = {Wed, 23 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-07847.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.08302 (CoRR, 2022).
@article{DBLP:journals/corr/abs-2212-08302,
  author       = {Radi, Hager and
                  Hanna, Josiah P. and
                  Stone, Peter and
                  Taylor, Matthew E.},
  title        = {Safe Evaluation For Offline Learning: Are We Ready To Deploy?},
  journal      = {CoRR},
  volume       = {abs/2212.08302},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.08302},
  doi          = {10.48550/ARXIV.2212.08302},
  eprinttype   = {arXiv},
  eprint       = {2212.08302},
  timestamp    = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-08302.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Auton. Agents Multi Agent Syst. 35(2), 2021.
@article{DBLP:journals/aamas/ZhangTWS21,
  author       = {Zhang, Ruohan and
                  Torabi, Faraz and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Recent advances in leveraging human guidance for sequential decision-making
                  tasks},
  journal      = {Auton. Agents Multi Agent Syst.},
  volume       = {35},
  number       = {2},
  pages        = {31},
  year         = {2021},
  url          = {https://doi.org/10.1007/s10458-021-09514-w},
  doi          = {10.1007/S10458-021-09514-W},
  timestamp    = {Thu, 29 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aamas/ZhangTWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: J. Artif. Intell. Res. 71, 2021. The proper noun Markov is
% brace-protected so sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/jair/CapobiancoKASJF21,
  author       = {Capobianco, Roberto and
                  Kompella, Varun and
                  Ault, James and
                  Sharon, Guni and
                  Jong, Stacy and
                  Fox, Spencer J. and
                  Meyers, Lauren Ancel and
                  Wurman, Peter R. and
                  Stone, Peter},
  title        = {Agent-Based {Markov} Modeling for Improved {COVID-19} Mitigation Policies},
  journal      = {J. Artif. Intell. Res.},
  volume       = {71},
  pages        = {953--992},
  year         = {2021},
  url          = {https://doi.org/10.1613/jair.1.12632},
  doi          = {10.1613/JAIR.1.12632},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jair/CapobiancoKASJF21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Mach. Learn. 110(6), 2021.
@article{DBLP:journals/ml/HannaNS21,
  author       = {Hanna, Josiah P. and
                  Niekum, Scott and
                  Stone, Peter},
  title        = {Importance sampling in reinforcement learning with an estimated behavior
                  policy},
  journal      = {Mach. Learn.},
  volume       = {110},
  number       = {6},
  pages        = {1267--1317},
  year         = {2021},
  url          = {https://doi.org/10.1007/s10994-020-05938-9},
  doi          = {10.1007/S10994-020-05938-9},
  timestamp    = {Thu, 05 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ml/HannaNS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Mach. Learn. 110(9), 2021.
@article{DBLP:journals/ml/HannaDKWS21,
  author       = {Hanna, Josiah P. and
                  Desai, Siddharth and
                  Karnan, Haresh and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Grounded action transformation for sim-to-real reinforcement learning},
  journal      = {Mach. Learn.},
  volume       = {110},
  number       = {9},
  pages        = {2469--2499},
  year         = {2021},
  url          = {https://doi.org/10.1007/s10994-021-05982-z},
  doi          = {10.1007/S10994-021-05982-Z},
  timestamp    = {Thu, 16 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ml/HannaDKWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Robotics Autom. Lett. 6(2), 2021.
@article{DBLP:journals/ral/LiuXS21,
  author       = {Liu, Bo and
                  Xiao, Xuesu and
                  Stone, Peter},
  title        = {A Lifelong Learning Approach to Mobile Robot Navigation},
  journal      = {{IEEE} Robotics Autom. Lett.},
  volume       = {6},
  number       = {2},
  pages        = {1090--1096},
  year         = {2021},
  url          = {https://doi.org/10.1109/LRA.2021.3056373},
  doi          = {10.1109/LRA.2021.3056373},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ral/LiuXS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Robotics Autom. Lett. 6(2), 2021.
@article{DBLP:journals/ral/XiaoLWS21,
  author       = {Xiao, Xuesu and
                  Liu, Bo and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Toward Agile Maneuvers in Highly Constrained Spaces: Learning From
                  Hallucination},
  journal      = {{IEEE} Robotics Autom. Lett.},
  volume       = {6},
  number       = {2},
  pages        = {1503--1510},
  year         = {2021},
  url          = {https://doi.org/10.1109/LRA.2021.3058927},
  doi          = {10.1109/LRA.2021.3058927},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ral/XiaoLWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Robotics Autom. Lett. 6(3), 2021.
@article{DBLP:journals/ral/XiaoBS21,
  author       = {Xiao, Xuesu and
                  Biswas, Joydeep and
                  Stone, Peter},
  title        = {Learning Inverse Kinodynamics for Accurate High-Speed Off-Road Navigation
                  on Unstructured Terrain},
  journal      = {{IEEE} Robotics Autom. Lett.},
  volume       = {6},
  number       = {3},
  pages        = {6054--6060},
  year         = {2021},
  url          = {https://doi.org/10.1109/LRA.2021.3090023},
  doi          = {10.1109/LRA.2021.3090023},
  timestamp    = {Tue, 13 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ral/XiaoBS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Robotics Autom. Lett. 6(4), 2021.
@article{DBLP:journals/ral/WangXWS21,
  author       = {Wang, Zizhao and
                  Xiao, Xuesu and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {{APPLE:} Adaptive Planner Parameter Learning From Evaluative Feedback},
  journal      = {{IEEE} Robotics Autom. Lett.},
  volume       = {6},
  number       = {4},
  pages        = {7744--7749},
  year         = {2021},
  url          = {https://doi.org/10.1109/lra.2021.3100940},
  doi          = {10.1109/LRA.2021.3100940},
  timestamp    = {Thu, 13 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ral/WangXWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Magazine article: IEEE Robotics Autom. Mag. 28(4), 2021. The name RoboCup is
% brace-protected so sentence-casing styles do not render it as "Robocup".
@article{DBLP:journals/ram/StoneITZ21,
  author       = {Stone, Peter and
                  Iocchi, Luca and
                  Tonidandel, Flavio and
                  Zhou, Changjiu},
  title        = {{RoboCup} 2021 Worldwide: {A} Successful Robotics Competition During
                  a Pandemic [Competitions]},
  journal      = {{IEEE} Robotics Autom. Mag.},
  volume       = {28},
  number       = {4},
  pages        = {114--119},
  year         = {2021},
  url          = {https://doi.org/10.1109/MRA.2021.3117413},
  doi          = {10.1109/MRA.2021.3117413},
  timestamp    = {Wed, 15 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ram/StoneITZ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Autom. Control. 66(4), 2021. The acronym MDPs is
% brace-protected so sentence-casing bibliography styles do not render it as "mdps".
@article{DBLP:journals/tac/KoppelWSSR21,
  author       = {Koppel, Alec and
                  Warnell, Garrett and
                  Stump, Ethan and
                  Stone, Peter and
                  Ribeiro, Alejandro},
  title        = {Policy Evaluation in Continuous {MDPs} With Efficient Kernelized Gradient
                  Temporal Difference},
  journal      = {{IEEE} Trans. Autom. Control.},
  volume       = {66},
  number       = {4},
  pages        = {1856--1863},
  year         = {2021},
  url          = {https://doi.org/10.1109/TAC.2020.3029315},
  doi          = {10.1109/TAC.2020.3029315},
  timestamp    = {Wed, 07 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/KoppelWSSR21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: AAAI 2021, pp. 5939--5947.
@inproceedings{DBLP:conf/aaai/JiangWS21,
  author       = {Jiang, Yu{-}Sian and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Goal Blending for Responsive Shared Autonomy in a Navigating Vehicle},
  booktitle    = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2021, Thirty-Third Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9,
                  2021},
  pages        = {5939--5947},
  publisher    = {{AAAI} Press},
  year         = {2021},
  url          = {https://doi.org/10.1609/aaai.v35i7.16742},
  doi          = {10.1609/AAAI.V35I7.16742},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/JiangWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: AAAI 2021, pp. 7995--8003.
@inproceedings{DBLP:conf/aaai/JiangB0STS21,
  author       = {Jiang, Yuqian and
                  Bharadwaj, Suda and
                  Wu, Bo and
                  Shah, Rishi and
                  Topcu, Ufuk and
                  Stone, Peter},
  title        = {Temporal-Logic-Based Reward Shaping for Continuing Reinforcement Learning
                  Tasks},
  booktitle    = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2021, Thirty-Third Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9,
                  2021},
  pages        = {7995--8003},
  publisher    = {{AAAI} Press},
  year         = {2021},
  url          = {https://doi.org/10.1609/aaai.v35i9.16975},
  doi          = {10.1609/AAAI.V35I9.16975},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/JiangB0STS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: AAAI 2021, pp. 11290--11298.
@inproceedings{DBLP:conf/aaai/MackeMS21,
  author       = {Macke, William and
                  Mirsky, Reuth and
                  Stone, Peter},
  title        = {Expected Value of Communication for Planning in Ad Hoc Teamwork},
  booktitle    = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2021, Thirty-Third Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9,
                  2021},
  pages        = {11290--11298},
  publisher    = {{AAAI} Press},
  year         = {2021},
  url          = {https://doi.org/10.1609/aaai.v35i13.17346},
  doi          = {10.1609/AAAI.V35I13.17346},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/MackeMS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: AAAI 2021, pp. 16017--16019.
@inproceedings{DBLP:conf/aaai/CuiZJASNK21,
  author       = {Cui, Yuchen and
                  Zhang, Qiping and
                  Jain, Sahil and
                  Allievi, Alessandro and
                  Stone, Peter and
                  Niekum, Scott and
                  Knox, W. Bradley},
  title        = {Demonstration of the {EMPATHIC} Framework for Task Learning from Implicit
                  Human Feedback},
  booktitle    = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2021, Thirty-Third Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9,
                  2021},
  pages        = {16017--16019},
  publisher    = {{AAAI} Press},
  year         = {2021},
  url          = {https://doi.org/10.1609/aaai.v35i18.17998},
  doi          = {10.1609/AAAI.V35I18.17998},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/CuiZJASNK21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: AAMAS 2021, pp. 28--33.
@inproceedings{DBLP:conf/atal/MirskyS21,
  author       = {Mirsky, Reuth and
                  Stone, Peter},
  editor       = {Dignum, Frank and
                  Lomuscio, Alessio and
                  Endriss, Ulle and
                  Now{\'{e}}, Ann},
  title        = {The Seeing-Eye Robot Grand Challenge: Rethinking Automated Care},
  booktitle    = {{AAMAS} '21: 20th International Conference on Autonomous Agents and
                  Multiagent Systems, Virtual Event, United Kingdom, May 3-7, 2021},
  pages        = {28--33},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://www.ifaamas.org/Proceedings/aamas2021/pdfs/p28.pdf},
  doi          = {10.5555/3463952.3463959},
  timestamp    = {Wed, 20 Jul 2022 17:03:47 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/MirskyS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: AAMAS 2021, pp. 386--394.
@inproceedings{DBLP:conf/atal/CuiMYGUS21,
  author       = {Cui, Jiaxun and
                  Macke, William and
                  Yedidsion, Harel and
                  Goyal, Aastha and
                  Urieli, Daniel and
                  Stone, Peter},
  editor       = {Dignum, Frank and
                  Lomuscio, Alessio and
                  Endriss, Ulle and
                  Now{\'{e}}, Ann},
  title        = {Scalable Multiagent Driving Policies for Reducing Traffic Congestion},
  booktitle    = {{AAMAS} '21: 20th International Conference on Autonomous Agents and
                  Multiagent Systems, Virtual Event, United Kingdom, May 3-7, 2021},
  pages        = {386--394},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://www.ifaamas.org/Proceedings/aamas2021/pdfs/p386.pdf},
  doi          = {10.5555/3463952.3464002},
  timestamp    = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/CuiMYGUS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: AAMAS 2021, pp. 1182--1190.
@inproceedings{DBLP:conf/atal/SharonASKC21,
  author       = {Sharon, Guni and
                  Ault, James and
                  Stone, Peter and
                  Kompella, Varun and
                  Capobianco, Roberto},
  editor       = {Dignum, Frank and
                  Lomuscio, Alessio and
                  Endriss, Ulle and
                  Now{\'{e}}, Ann},
  title        = {Multiagent Epidemiologic Inference through Realtime Contact Tracing},
  booktitle    = {{AAMAS} '21: 20th International Conference on Autonomous Agents and
                  Multiagent Systems, Virtual Event, United Kingdom, May 3-7, 2021},
  pages        = {1182--1190},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://www.ifaamas.org/Proceedings/aamas2021/pdfs/p1182.pdf},
  doi          = {10.5555/3463952.3464089},
  timestamp    = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/SharonASKC21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ICARSC 2021, p. 3.
@inproceedings{DBLP:conf/icarsc/Stone21,
  author       = {Stone, Peter},
  editor       = {Santos, V{\'{\i}}tor and
                  Lau, Nuno and
                  Neto, Pedro and
                  Lopes, Ana Cristina},
  title        = {Efficient Robot Skill Learning: Grounded Simulation Learning and Imitation
                  Learning from Observation},
  booktitle    = {{IEEE} International Conference on Autonomous Robot Systems and Competitions,
                  {ICARSC} 2021, Santa Maria da Feira, Portugal, April 28-29, 2021},
  pages        = {3},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICARSC52212.2021.9429812},
  doi          = {10.1109/ICARSC52212.2021.9429812},
  timestamp    = {Thu, 20 May 2021 15:25:12 +0200},
  biburl       = {https://dblp.org/rec/conf/icarsc/Stone21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ICML 2021 (PMLR vol. 139), pp. 6860--6870. No doi field in this record.
@inproceedings{DBLP:conf/icml/LiuLSGZA21,
  author       = {Liu, Bo and
                  Liu, Qiang and
                  Stone, Peter and
                  Garg, Animesh and
                  Zhu, Yuke and
                  Anandkumar, Anima},
  editor       = {Meila, Marina and
                  Zhang, Tong},
  title        = {Coach-Player Multi-agent Reinforcement Learning for Dynamic Team Composition},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {6860--6870},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {http://proceedings.mlr.press/v139/liu21m.html},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/LiuLSGZA21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ICRA 2021, pp. 3553--3559.
@inproceedings{DBLP:conf/icra/HolmanASTHS21,
  author       = {Holman, Blake and
                  Anwar, Abrar and
                  Singh, Akash and
                  Tec, Mauricio and
                  Hart, Justin W. and
                  Stone, Peter},
  title        = {Watch Where You're Going! Gaze and Head Orientation as Predictors
                  for Social Robot Navigation},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2021, Xi'an, China, May 30 - June 5, 2021},
  pages        = {3553--3559},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICRA48506.2021.9561286},
  doi          = {10.1109/ICRA48506.2021.9561286},
  timestamp    = {Fri, 22 Oct 2021 19:54:31 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/HolmanASTHS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ICRA 2021, pp. 6079--6085.
@inproceedings{DBLP:conf/icra/WangXLWS21,
  author       = {Wang, Zizhao and
                  Xiao, Xuesu and
                  Liu, Bo and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {{APPLI:} Adaptive Planner Parameter Learning From Interventions},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2021, Xi'an, China, May 30 - June 5, 2021},
  pages        = {6079--6085},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICRA48506.2021.9561311},
  doi          = {10.1109/ICRA48506.2021.9561311},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icra/WangXLWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/XuDNXWLWS21,
  author       = {Zifan Xu and
                  Gauraang Dhamankar and
                  Anirudh Nair and
                  Xuesu Xiao and
                  Garrett Warnell and
                  Bo Liu and
                  Zizhao Wang and
                  Peter Stone},
  title        = {{APPLR:} Adaptive Planner Parameter Learning from Reinforcement},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2021, Xi'an, China, May 30 - June 5, 2021},
  pages        = {6086--6092},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICRA48506.2021.9561647},
  doi          = {10.1109/ICRA48506.2021.9561647},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icra/XuDNXWLWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/XiaoLS21,
  author       = {Xuesu Xiao and
                  Bo Liu and
                  Peter Stone},
  title        = {Agile Robot Navigation through Hallucinated Learning and Sober Deployment},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2021, Xi'an, China, May 30 - June 5, 2021},
  pages        = {7316--7322},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICRA48506.2021.9562117},
  doi          = {10.1109/ICRA48506.2021.9562117},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icra/XiaoLS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/YedidsionSXDS21,
  author       = {Harel Yedidsion and
                  Jennifer Suriadinata and
                  Zifan Xu and
                  Stefan Debruyn and
                  Peter Stone},
  title        = {A Scavenger Hunt for Service Robots},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2021, Xi'an, China, May 30 - June 5, 2021},
  pages        = {7774--7780},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICRA48506.2021.9561722},
  doi          = {10.1109/ICRA48506.2021.9561722},
  timestamp    = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/YedidsionSXDS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/LoFST21,
  author       = {Shih{-}Yun Lo and
                  Benito Fernandez and
                  Peter Stone and
                  Andrea Lockerd Thomaz},
  title        = {Towards Safe Motion Planning in Human Workspaces: {A} Robust Multi-agent
                  Approach},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2021, Xi'an, China, May 30 - June 5, 2021},
  pages        = {7929--7935},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICRA48506.2021.9561622},
  doi          = {10.1109/ICRA48506.2021.9561622},
  timestamp    = {Fri, 01 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/LoFST21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/KhandelwalMWS21,
  author       = {Piyush Khandelwal and
                  James MacGlashan and
                  Peter R. Wurman and
                  Peter Stone},
  title        = {Efficient Real-Time Inference in Temporal Convolution Networks},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2021, Xi'an, China, May 30 - June 5, 2021},
  pages        = {13489--13495},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICRA48506.2021.9560784},
  doi          = {10.1109/ICRA48506.2021.9560784},
  timestamp    = {Mon, 25 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/KhandelwalMWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/WangXNUSBTS21,
  author       = {Zizhao Wang and
                  Xuesu Xiao and
                  Alexander J. Nettekoven and
                  Kadhiravan Umasankar and
                  Anika Singh and
                  Sriram Bommakanti and
                  Ufuk Topcu and
                  Peter Stone},
  title        = {From Agile Ground to Aerial Navigation: Learning from Learned Hallucination},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2021, Prague, Czech Republic, September 27 - October 1, 2021},
  pages        = {148--153},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/IROS51168.2021.9636402},
  doi          = {10.1109/IROS51168.2021.9636402},
  timestamp    = {Wed, 22 Dec 2021 12:36:19 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/WangXNUSBTS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/GhonasgiMNMHSD21,
  author       = {Keya Ghonasgi and
                  Reuth Mirsky and
                  Sanmit Narvekar and
                  Bharath Masetty and
                  Adrian M. Haith and
                  Peter Stone and
                  Ashish D. Deshpande},
  title        = {Capturing Skill State in Curriculum Learning for Human Skill Acquisition},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2021, Prague, Czech Republic, September 27 - October 1, 2021},
  pages        = {771--776},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/IROS51168.2021.9636850},
  doi          = {10.1109/IROS51168.2021.9636850},
  timestamp    = {Wed, 22 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/GhonasgiMNMHSD21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/TorabiWS21,
  author       = {Faraz Torabi and
                  Garrett Warnell and
                  Peter Stone},
  title        = {{DEALIO:} Data-Efficient Adversarial Learning for Imitation from Observation},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2021, Prague, Czech Republic, September 27 - October 1, 2021},
  pages        = {2391--2397},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/IROS51168.2021.9636169},
  doi          = {10.1109/IROS51168.2021.9636169},
  timestamp    = {Wed, 22 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/TorabiWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/LiuXS21,
  author       = {Bo Liu and
                  Xuesu Xiao and
                  Peter Stone},
  title        = {Team Orienteering Coverage Planning with Uncertain Reward},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2021, Prague, Czech Republic, September 27 - October 1, 2021},
  pages        = {9728--9733},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/IROS51168.2021.9636288},
  doi          = {10.1109/IROS51168.2021.9636288},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/LiuXS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DurugkarTNS21,
  author       = {Ishan Durugkar and
                  Mauricio Tec and
                  Scott Niekum and
                  Peter Stone},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Adversarial Intrinsic Motivation for Reinforcement Learning},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  pages        = {8622--8636},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/486c0401c56bf7ec2daa9eba58907da9-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/DurugkarTNS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LiuLJSL21,
  author       = {Bo Liu and
                  Xingchao Liu and
                  Xiaojie Jin and
                  Peter Stone and
                  Qiang Liu},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Conflict-Averse Gradient Descent for Multi-task Learning},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  pages        = {18878--18890},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/9d27fdf2477ffbff837d73ef7ae23db9-Abstract.html},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/LiuLJSL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GuoZLZBHS21,
  author       = {Sihang Guo and
                  Ruohan Zhang and
                  Bo Liu and
                  Yifeng Zhu and
                  Dana H. Ballard and
                  Mary M. Hayhoe and
                  Peter Stone},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Machine versus Human Attention in Deep Reinforcement Learning Tasks},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  pages        = {25370--25385},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/d58e2f077670f4de9cd7963c857f2534-Abstract.html},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/GuoZLZBHS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineLMWS21,
  author       = {Patrick MacAlpine and
                  Bo Liu and
                  William Macke and
                  Caroline Wang and
                  Peter Stone},
  editor       = {Rachid Alami and
                  Joydeep Biswas and
                  Maya Cakmak and
                  Oliver Obst},
  title        = {{UT} {Austin} {Villa}: {RoboCup} 2021 {3D} Simulation League Competition Champions},
  booktitle    = {RoboCup 2021: Robot World Cup {XXIV}},
  series       = {Lecture Notes in Computer Science},
  volume       = {13132},
  pages        = {314--326},
  publisher    = {Springer},
  year         = {2021},
  url          = {https://doi.org/10.1007/978-3-030-98682-7\_26},
  doi          = {10.1007/978-3-030-98682-7\_26},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineLMWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssrr/XuXWNS21,
  author       = {Zifan Xu and
                  Xuesu Xiao and
                  Garrett Warnell and
                  Anirudh Nair and
                  Peter Stone},
  title        = {Machine Learning Methods for Local Motion Planning: {A} Study of End-to-End
                  vs. Parameter Learning},
  booktitle    = {{IEEE} International Symposium on Safety, Security, and Rescue Robotics,
                  {SSRR} 2021, New York City, NY, USA, October 25-27, 2021},
  pages        = {217--222},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/SSRR53300.2021.9597689},
  doi          = {10.1109/SSRR53300.2021.9597689},
  timestamp    = {Tue, 23 Nov 2021 16:16:49 +0100},
  biburl       = {https://dblp.org/rec/conf/ssrr/XuXWNS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-08574,
  author       = {Lemeng Wu and
                  Bo Liu and
                  Peter Stone and
                  Qiang Liu},
  title        = {Firefly Neural Architecture Descent: a General Approach for Growing
                  Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2102.08574},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.08574},
  eprinttype    = {arXiv},
  eprint       = {2102.08574},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-08574.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-12667,
  author       = {Xuesu Xiao and
                  Joydeep Biswas and
                  Peter Stone},
  title        = {Learning Inverse Kinodynamics for Accurate High-Speed Off-Road Navigation
                  on Unstructured Terrain},
  journal      = {CoRR},
  volume       = {abs/2102.12667},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.12667},
  eprinttype    = {arXiv},
  eprint       = {2102.12667},
  timestamp    = {Tue, 02 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-12667.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2103-00058,
  author       = {Jiaxun Cui and
                  William Macke and
                  Harel Yedidsion and
                  Aastha Goyal and
                  Daniel Urieli and
                  Peter Stone},
  title        = {Scalable Multiagent Driving Policies For Reducing Traffic Congestion},
  journal      = {CoRR},
  volume       = {abs/2103.00058},
  year         = {2021},
  url          = {https://arxiv.org/abs/2103.00058},
  eprinttype    = {arXiv},
  eprint       = {2103.00058},
  timestamp    = {Thu, 04 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2103-00058.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2103-01171,
  author       = {William Macke and
                  Reuth Mirsky and
                  Peter Stone},
  title        = {Expected Value of Communication for Planning in Ad Hoc Teamwork},
  journal      = {CoRR},
  volume       = {abs/2103.01171},
  year         = {2021},
  url          = {https://arxiv.org/abs/2103.01171},
  eprinttype    = {arXiv},
  eprint       = {2103.01171},
  timestamp    = {Thu, 04 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2103-01171.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2103-05225,
  author       = {Harel Yedidsion and
                  Jennifer Suriadinata and
                  Zifan Xu and
                  Stefan Debruyn and
                  Peter Stone},
  title        = {A Scavenger Hunt for Service Robots},
  journal      = {CoRR},
  volume       = {abs/2103.05225},
  year         = {2021},
  url          = {https://arxiv.org/abs/2103.05225},
  eprinttype    = {arXiv},
  eprint       = {2103.05225},
  timestamp    = {Mon, 15 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2103-05225.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-00163,
  author       = {Faraz Torabi and
                  Garrett Warnell and
                  Peter Stone},
  title        = {{DEALIO:} Data-Efficient Adversarial Learning for Imitation from Observation},
  journal      = {CoRR},
  volume       = {abs/2104.00163},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.00163},
  eprinttype    = {arXiv},
  eprint       = {2104.00163},
  timestamp    = {Mon, 12 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-00163.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-04159,
  author       = {Harel Yedidsion and
                  Shani Alkoby and
                  Peter Stone},
  title        = {Sequential Online Chore Division for Autonomous Vehicle Convoy Formation},
  journal      = {CoRR},
  volume       = {abs/2104.04159},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.04159},
  eprinttype    = {arXiv},
  eprint       = {2104.04159},
  timestamp    = {Tue, 13 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-04159.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-07810,
  author       = {Eddy Hudson and
                  Garrett Warnell and
                  Faraz Torabi and
                  Peter Stone},
  title        = {Skeletal Feature Compensation for Imitation Learning with Embodiment
                  Mismatch},
  journal      = {CoRR},
  volume       = {abs/2104.07810},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.07810},
  eprinttype    = {arXiv},
  eprint       = {2104.07810},
  timestamp    = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-07810.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-13906,
  author       = {W. Bradley Knox and
                  Alessandro Allievi and
                  Holger Banzhaf and
                  Felix Schmitt and
                  Peter Stone},
  title        = {Reward (Mis)design for Autonomous Driving},
  journal      = {CoRR},
  volume       = {abs/2104.13906},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.13906},
  eprinttype    = {arXiv},
  eprint       = {2104.13906},
  timestamp    = {Tue, 04 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-13906.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-03721,
  author       = {Bo Liu and
                  Xuesu Xiao and
                  Peter Stone},
  title        = {Team Orienteering Coverage Planning with Uncertain Reward},
  journal      = {CoRR},
  volume       = {abs/2105.03721},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.03721},
  eprinttype    = {arXiv},
  eprint       = {2105.03721},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-03721.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-03756,
  author       = {Eddy Hudson and
                  Garrett Warnell and
                  Peter Stone},
  title        = {{RAIL:} {A} modular framework for Reinforcement-learning-based Adversarial
                  Imitation Learning},
  journal      = {CoRR},
  volume       = {abs/2105.03756},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.03756},
  eprinttype    = {arXiv},
  eprint       = {2105.03756},
  timestamp    = {Fri, 14 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-03756.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-07620,
  author       = {Xuesu Xiao and
                  Zizhao Wang and
                  Zifan Xu and
                  Bo Liu and
                  Garrett Warnell and
                  Gauraang Dhamankar and
                  Anirudh Nair and
                  Peter Stone},
  title        = {{APPL:} Adaptive Planner Parameter Learning},
  journal      = {CoRR},
  volume       = {abs/2105.07620},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.07620},
  eprinttype    = {arXiv},
  eprint       = {2105.07620},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-07620.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-08692,
  author       = {Bo Liu and
                  Qiang Liu and
                  Peter Stone and
                  Animesh Garg and
                  Yuke Zhu and
                  Animashree Anandkumar},
  title        = {Coach-Player Multi-Agent Reinforcement Learning for Dynamic Team Composition},
  journal      = {CoRR},
  volume       = {abs/2105.08692},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.08692},
  eprinttype    = {arXiv},
  eprint       = {2105.08692},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-08692.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-09371,
  author       = {Haresh Karnan and
                  Garrett Warnell and
                  Xuesu Xiao and
                  Peter Stone},
  title        = {{VOILA:} Visual-Observation-Only Imitation Learning for Autonomous
                  Navigation},
  journal      = {CoRR},
  volume       = {abs/2105.09371},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.09371},
  eprinttype    = {arXiv},
  eprint       = {2105.09371},
  timestamp    = {Mon, 31 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-09371.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-13345,
  author       = {Ishan Durugkar and
                  Mauricio Tec and
                  Scott Niekum and
                  Peter Stone},
  title        = {Adversarial Intrinsic Motivation for Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2105.13345},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.13345},
  eprinttype    = {arXiv},
  eprint       = {2105.13345},
  timestamp    = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-13345.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-04217,
  author       = {Ghada Sokar and
                  Elena Mocanu and
                  Decebal Constantin Mocanu and
                  Mykola Pechenizkiy and
                  Peter Stone},
  title        = {Dynamic Sparse Training for Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2106.04217},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.04217},
  eprinttype    = {arXiv},
  eprint       = {2106.04217},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-04217.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-12113,
  author       = {Reuth Mirsky and
                  Xuesu Xiao and
                  Justin W. Hart and
                  Peter Stone},
  title        = {Prevention and Resolution of Conflicts in Social Navigation -- a Survey},
  journal      = {CoRR},
  volume       = {abs/2106.12113},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.12113},
  eprinttype    = {arXiv},
  eprint       = {2106.12113},
  timestamp    = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-12113.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2107-04001,
  author       = {Justin W. Hart and
                  Reuth Mirsky and
                  Xuesu Xiao and
                  Peter Stone},
  title        = {Incorporating Gaze into Social Navigation},
  journal      = {CoRR},
  volume       = {abs/2107.04001},
  year         = {2021},
  url          = {https://arxiv.org/abs/2107.04001},
  eprinttype    = {arXiv},
  eprint       = {2107.04001},
  timestamp    = {Tue, 20 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2107-04001.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2107-05825,
  author       = {Ruohan Zhang and
                  Faraz Torabi and
                  Garrett Warnell and
                  Peter Stone},
  title        = {Recent Advances in Leveraging Human Guidance for Sequential Decision-Making
                  Tasks},
  journal      = {CoRR},
  volume       = {abs/2107.05825},
  year         = {2021},
  url          = {https://arxiv.org/abs/2107.05825},
  eprinttype    = {arXiv},
  eprint       = {2107.05825},
  timestamp    = {Wed, 21 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2107-05825.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2108-09793,
  author       = {Zizhao Wang and
                  Xuesu Xiao and
                  Alexander J. Nettekoven and
                  Kadhiravan Umasankar and
                  Anika Singh and
                  Sriram Bommakanti and
                  Ufuk Topcu and
                  Peter Stone},
  title        = {From Agile Ground to Aerial Navigation: Learning from Learned Hallucination},
  journal      = {CoRR},
  volume       = {abs/2108.09793},
  year         = {2021},
  url          = {https://arxiv.org/abs/2108.09793},
  eprinttype    = {arXiv},
  eprint       = {2108.09793},
  timestamp    = {Fri, 27 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2108-09793.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2108-09801,
  author       = {Zizhao Wang and
                  Xuesu Xiao and
                  Garrett Warnell and
                  Peter Stone},
  title        = {{APPLE:} Adaptive Planner Parameter Learning from Evaluative Feedback},
  journal      = {CoRR},
  volume       = {abs/2108.09801},
  year         = {2021},
  url          = {https://arxiv.org/abs/2108.09801},
  eprinttype    = {arXiv},
  eprint       = {2108.09801},
  timestamp    = {Fri, 27 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2108-09801.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-13841,
  author       = {Yifeng Zhu and
                  Peter Stone and
                  Yuke Zhu},
  title        = {Bottom-Up Skill Discovery from Unsegmented Demonstrations for Long-Horizon
                  Robot Manipulation},
  journal      = {CoRR},
  volume       = {abs/2109.13841},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.13841},
  eprinttype    = {arXiv},
  eprint       = {2109.13841},
  timestamp    = {Mon, 04 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-13841.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2110-14048,
  author       = {Bo Liu and
                  Xingchao Liu and
                  Xiaojie Jin and
                  Peter Stone and
                  Qiang Liu},
  title        = {Conflict-Averse Gradient Descent for Multi-task Learning},
  journal      = {CoRR},
  volume       = {abs/2110.14048},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.14048},
  eprinttype    = {arXiv},
  eprint       = {2110.14048},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-14048.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-03759,
  author       = {Yulin Zhang and
                  William Macke and
                  Jiaxun Cui and
                  Daniel Urieli and
                  Peter Stone},
  title        = {Learning a Robust Multiagent Driving Policy for Traffic Congestion
                  Reduction},
  journal      = {CoRR},
  volume       = {abs/2112.03759},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.03759},
  eprinttype    = {arXiv},
  eprint       = {2112.03759},
  timestamp    = {Mon, 13 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-03759.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aamas/SilvaWCS20,
  author       = {Felipe Leno da Silva and
                  Garrett Warnell and
                  Anna Helena Reali Costa and
                  Peter Stone},
  title        = {Agents teaching agents: a survey on inter-agent transfer learning},
  journal      = {Auton. Agents Multi Agent Syst.},
  volume       = {34},
  number       = {1},
  pages        = {9},
  year         = {2020},
  url          = {https://doi.org/10.1007/s10458-019-09430-0},
  doi          = {10.1007/S10458-019-09430-0},
  timestamp    = {Mon, 15 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aamas/SilvaWCS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/AlbrechtSW20,
  author       = {Stefano V. Albrecht and
                  Peter Stone and
                  Michael P. Wellman},
  title        = {Special issue on autonomous agents modelling other agents: Guest editorial},
  journal      = {Artif. Intell.},
  volume       = {285},
  pages        = {103292},
  year         = {2020},
  url          = {https://doi.org/10.1016/j.artint.2020.103292},
  doi          = {10.1016/J.ARTINT.2020.103292},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ai/AlbrechtSW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jagi/MonettLTBBGBCCS20,
  author       = {Dagmar Monett and
                  Colin W. P. Lewis and
                  Kristinn R. Th{\'{o}}risson and
                  Joscha Bach and
                  Gianluca Baldassarre and
                  Giovanni Granato and
                  Istvan S. N. Berkeley and
                  Fran{\c{c}}ois Chollet and
                  Matthew Crosby and
                  Henry Shevlin and
                  John F. Sowa and
                  John E. Laird and
                  Shane Legg and
                  Peter Lindes and
                  Tom{\'{a}}s Mikolov and
                  William J. Rapaport and
                  Ra{\'{u}}l Rojas and
                  Marek Rosa and
                  Peter Stone and
                  Richard S. Sutton and
                  Roman V. Yampolskiy and
                  Pei Wang and
                  Roger C. Schank and
                  Aaron Sloman and
                  Alan F. T. Winfield},
  title        = {Special Issue {``On Defining Artificial Intelligence''} -- Commentaries
                  and Author's Response},
  journal      = {J. Artif. Gen. Intell.},
  volume       = {11},
  number       = {2},
  pages        = {1--100},
  year         = {2020},
  url          = {https://doi.org/10.2478/jagi-2020-0003},
  doi          = {10.2478/JAGI-2020-0003},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jagi/MonettLTBBGBCCS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/ThomasonPSWJYHS20,
  author       = {Thomason, Jesse and
                  Padmakumar, Aishwarya and
                  Sinapov, Jivko and
                  Walker, Nick and
                  Jiang, Yuqian and
                  Yedidsion, Harel and
                  Hart, Justin W. and
                  Stone, Peter and
                  Mooney, Raymond J.},
  title        = {Jointly Improving Parsing and Perception for Natural Language Commands
                  through Human-Robot Dialog},
  journal      = {J. Artif. Intell. Res.},
  volume       = {67},
  pages        = {327--374},
  year         = {2020},
  url          = {https://doi.org/10.1613/jair.1.11485},
  doi          = {10.1613/JAIR.1.11485},
  timestamp    = {Sun, 08 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jair/ThomasonPSWJYHS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/LoZS20,
  author       = {Lo, Shih{-}Yun and
                  Zhang, Shiqi and
                  Stone, Peter},
  title        = {The {PETLON} Algorithm to Plan Efficiently for Task-Level-Optimal
                  Navigation},
  journal      = {J. Artif. Intell. Res.},
  volume       = {69},
  pages        = {471--500},
  year         = {2020},
  url          = {https://doi.org/10.1613/jair.1.12181},
  doi          = {10.1613/JAIR.1.12181},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jair/LoZS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/NarvekarPLSTS20,
  author       = {Narvekar, Sanmit and
                  Peng, Bei and
                  Leonetti, Matteo and
                  Sinapov, Jivko and
                  Taylor, Matthew E. and
                  Stone, Peter},
  title        = {Curriculum Learning for Reinforcement Learning Domains: {A} Framework
                  and Survey},
  journal      = {J. Mach. Learn. Res.},
  volume       = {21},
  pages        = {181:1--181:50},
  year         = {2020},
  url          = {https://jmlr.org/papers/v21/20-212.html},
  timestamp    = {Sun, 18 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jmlr/NarvekarPLSTS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ral/XiaoLWFS20,
  author       = {Xiao, Xuesu and
                  Liu, Bo and
                  Warnell, Garrett and
                  Fink, Jonathan and
                  Stone, Peter},
  title        = {{APPLD:} Adaptive Planner Parameter Learning From Demonstration},
  journal      = {{IEEE} Robotics Autom. Lett.},
  volume       = {5},
  number       = {3},
  pages        = {4541--4547},
  year         = {2020},
  url          = {https://doi.org/10.1109/LRA.2020.3002217},
  doi          = {10.1109/LRA.2020.3002217},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ral/XiaoLWFS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ral/PavseTHWS20,
  author       = {Pavse, Brahma S. and
                  Torabi, Faraz and
                  Hanna, Josiah and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {{RIDM:} Reinforced Inverse Dynamics Modeling for Learning from a Single
                  Observed Demonstration},
  journal      = {{IEEE} Robotics Autom. Lett.},
  volume       = {5},
  number       = {4},
  pages        = {6262--6269},
  year         = {2020},
  url          = {https://doi.org/10.1109/LRA.2020.3010750},
  doi          = {10.1109/LRA.2020.3010750},
  timestamp    = {Sat, 14 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ral/PavseTHWS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/YedidsionAS20,
  author       = {Yedidsion, Harel and
                  Alkoby, Shani and
                  Stone, Peter},
  editor       = {El Fallah Seghrouchni, Amal and
                  Sukthankar, Gita and
                  An, Bo and
                  Yorke{-}Smith, Neil},
  title        = {The Sequential Online Chore Division Problem - Definition and Application},
  booktitle    = {Proceedings of the 19th International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} '20, Auckland, New Zealand, May 9-13,
                  2020},
  pages        = {2059--2061},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2020},
  url          = {https://dl.acm.org/doi/10.5555/3398761.3399074},
  doi          = {10.5555/3398761.3399074},
  timestamp    = {Tue, 26 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/YedidsionAS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/SilvaWCS20,
  author       = {da Silva, Felipe Leno and
                  Warnell, Garrett and
                  Costa, Anna Helena Reali and
                  Stone, Peter},
  editor       = {El Fallah Seghrouchni, Amal and
                  Sukthankar, Gita and
                  An, Bo and
                  Yorke{-}Smith, Neil},
  title        = {Agents Teaching Agents: {A} Survey on Inter-agent Transfer Learning},
  booktitle    = {Proceedings of the 19th International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} '20, Auckland, New Zealand, May 9-13,
                  2020},
  pages        = {2165--2167},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2020},
  url          = {https://dl.acm.org/doi/10.5555/3398761.3399111},
  doi          = {10.5555/3398761.3399111},
  timestamp    = {Tue, 26 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/SilvaWCS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/CuiZKASN20,
  author       = {Cui, Yuchen and
                  Zhang, Qiping and
                  Knox, W. Bradley and
                  Allievi, Alessandro and
                  Stone, Peter and
                  Niekum, Scott},
  editor       = {Kober, Jens and
                  Ramos, Fabio and
                  Tomlin, Claire J.},
  title        = {The {EMPATHIC} Framework for Task Learning from Implicit Human Feedback},
  booktitle    = {4th Conference on Robot Learning, CoRL 2020, 16-18 November 2020,
                  Virtual Event / Cambridge, MA, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {155},
  pages        = {604--626},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v155/cui21a.html},
  timestamp    = {Tue, 18 Oct 2022 08:35:37 +0200},
  biburl       = {https://dblp.org/rec/conf/corl/CuiZKASN20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/ParkTYWKS20,
  author       = {Park, Jin Soo and
                  Tsang, Brian and
                  Yedidsion, Harel and
                  Warnell, Garrett and
                  Kyoung, Daehyun and
                  Stone, Peter},
  editor       = {Kober, Jens and
                  Ramos, Fabio and
                  Tomlin, Claire J.},
  title        = {Learning to Improve Multi-Robot Hallway Navigation},
  booktitle    = {4th Conference on Robot Learning, CoRL 2020, 16-18 November 2020,
                  Virtual Event / Cambridge, MA, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {155},
  pages        = {1883--1895},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v155/park21a.html},
  timestamp    = {Mon, 25 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/corl/ParkTYWKS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/PavseDHS20,
  author       = {Pavse, Brahma S. and
                  Durugkar, Ishan and
                  Hanna, Josiah and
                  Stone, Peter},
  title        = {Reducing Sampling Error in Batch Temporal Difference Learning},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {7543--7552},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v119/pavse20a.html},
  timestamp    = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/PavseDHS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/MirskyMWYS20,
  author       = {Mirsky, Reuth and
                  Macke, William and
                  Wang, Andy and
                  Yedidsion, Harel and
                  Stone, Peter},
  editor       = {Bessiere, Christian},
  title        = {A Penny for Your Thoughts: The Value of Communication in Ad Hoc Teamwork},
  booktitle    = {Proceedings of the Twenty-Ninth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2020},
  pages        = {254--260},
  publisher    = {ijcai.org},
  year         = {2020},
  url          = {https://doi.org/10.24963/ijcai.2020/36},
  doi          = {10.24963/IJCAI.2020/36},
  timestamp    = {Mon, 20 Jul 2020 12:38:52 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/MirskyMWYS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/DurugkarLS20,
  author       = {Durugkar, Ishan and
                  Liebman, Elad and
                  Stone, Peter},
  editor       = {Bessiere, Christian},
  title        = {Balancing Individual Preferences and Shared Objectives in Multiagent
                  Reinforcement Learning},
  booktitle    = {Proceedings of the Twenty-Ninth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2020},
  pages        = {2505--2511},
  publisher    = {ijcai.org},
  year         = {2020},
  url          = {https://doi.org/10.24963/ijcai.2020/347},
  doi          = {10.24963/IJCAI.2020/347},
  timestamp    = {Mon, 13 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/DurugkarLS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/KarnanDHWS20,
  author       = {Karnan, Haresh and
                  Desai, Siddharth and
                  Hanna, Josiah P. and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Reinforced Grounded Action Transformation for Sim-to-Real Transfer},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2020, Las Vegas, NV, USA, October 24, 2020 - January 24, 2021},
  pages        = {4397--4402},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/IROS45743.2020.9341149},
  doi          = {10.1109/IROS45743.2020.9341149},
  timestamp    = {Tue, 16 Feb 2021 19:07:08 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/KarnanDHWS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/ShahJHS20,
  author       = {Shah, Rishi and
                  Jiang, Yuqian and
                  Hart, Justin W. and
                  Stone, Peter},
  title        = {Deep {R}-Learning for Continual Area Sweeping},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2020, Las Vegas, NV, USA, October 24, 2020 - January 24, 2021},
  pages        = {5542--5547},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/IROS45743.2020.9341626},
  doi          = {10.1109/IROS45743.2020.9341626},
  timestamp    = {Tue, 16 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/ShahJHS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/DesaiKHWS20,
  author       = {Desai, Siddharth and
                  Karnan, Haresh and
                  Hanna, Josiah P. and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Stochastic Grounded Action Transformation for Robot Learning in Simulation},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2020, Las Vegas, NV, USA, October 24, 2020 - January 24, 2021},
  pages        = {6106--6111},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/IROS45743.2020.9340780},
  doi          = {10.1109/IROS45743.2020.9340780},
  timestamp    = {Tue, 16 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/DesaiKHWS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DesaiDKWHS20,
  author       = {Desai, Siddharth and
                  Durugkar, Ishan and
                  Karnan, Haresh and
                  Warnell, Garrett and
                  Hanna, Josiah and
                  Stone, Peter},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {An Imitation from Observation Approach to Transfer Learning with Dynamics
                  Mismatch},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, NeurIPS 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/28f248e9279ac845995c4e9f8af35c2b-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DesaiDKWHS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/WuLS020,
  author       = {Wu, Lemeng and
                  Liu, Bo and
                  Stone, Peter and
                  Liu, Qiang},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Firefly Neural Architecture Descent: a General Approach for Growing
                  Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, NeurIPS 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/fdbe012e2e11314b96402b32c0df26b7-Abstract.html},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/WuLS020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigdial/LuZSC20,
  author       = {Lu, Keting and
                  Zhang, Shiqi and
                  Stone, Peter and
                  Chen, Xiaoping},
  editor       = {Pietquin, Olivier and
                  Muresan, Smaranda and
                  Chen, Vivian and
                  Kennington, Casey and
                  Vandyke, David and
                  Dethlefs, Nina and
                  Inoue, Koji and
                  Ekstedt, Erik and
                  Ultes, Stefan},
  title        = {Learning and Reasoning for Robot Dialog and Navigation Tasks},
  booktitle    = {Proceedings of the 21st Annual Meeting of the Special Interest Group
                  on Discourse and Dialogue, SIGdial 2020, 1st virtual meeting, July
                  1-3, 2020},
  pages        = {107--117},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.sigdial-1.14},
  doi          = {10.18653/V1/2020.SIGDIAL-1.14},
  timestamp    = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigdial/LuZSC20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/socrob/HartMXTMGBOS20,
  author       = {Hart, Justin W. and
                  Mirsky, Reuth and
                  Xiao, Xuesu and
                  Tejeda, Stone and
                  Mahajan, Bonny and
                  Goo, Jamin and
                  Baldauf, Kathryn and
                  Owen, Sydney and
                  Stone, Peter},
  editor       = {Wagner, Alan R. and
                  Feil{-}Seifer, David and
                  Haring, Kerstin Sophie and
                  Rossi, Silvia and
                  Williams, Thomas Emrys and
                  He, Hongsheng and
                  Ge, Shuzhi Sam},
  title        = {Using Human-Inspired Signals to Disambiguate Navigational Intentions},
  booktitle    = {Social Robotics - 12th International Conference, {ICSR} 2020, Golden,
                  CO, USA, November 14-18, 2020, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {12483},
  pages        = {320--331},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-62056-1_27},
  doi          = {10.1007/978-3-030-62056-1_27},
  timestamp    = {Wed, 21 Dec 2022 13:24:29 +0100},
  biburl       = {https://dblp.org/rec/conf/socrob/HartMXTMGBOS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssrr/PerilleTXS20,
  author       = {Perille, Daniel and
                  Truong, Abigail and
                  Xiao, Xuesu and
                  Stone, Peter},
  title        = {Benchmarking Metric Ground Navigation},
  booktitle    = {{IEEE} International Symposium on Safety, Security, and Rescue Robotics,
                  {SSRR} 2020, Abu Dhabi, United Arab Emirates, November 4-6, 2020},
  pages        = {116--121},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/SSRR50563.2020.9292572},
  doi          = {10.1109/SSRR50563.2020.9292572},
  timestamp    = {Fri, 30 Apr 2021 12:35:39 +0200},
  biburl       = {https://dblp.org/rec/conf/ssrr/PerilleTXS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-04960,
  author       = {Narvekar, Sanmit and
                  Peng, Bei and
                  Leonetti, Matteo and
                  Sinapov, Jivko and
                  Taylor, Matthew E. and
                  Stone, Peter},
  title        = {Curriculum Learning for Reinforcement Learning Domains: {A} Framework
                  and Survey},
  journal      = {CoRR},
  volume       = {abs/2003.04960},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.04960},
  eprinttype   = {arXiv},
  eprint       = {2003.04960},
  timestamp    = {Sun, 18 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-04960.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-00116,
  author       = {Xiao, Xuesu and
                  Liu, Bo and
                  Warnell, Garrett and
                  Fink, Jonathan and
                  Stone, Peter},
  title        = {{APPLD:} Adaptive Planner Parameter Learning from Demonstration},
  journal      = {CoRR},
  volume       = {abs/2004.00116},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.00116},
  eprinttype   = {arXiv},
  eprint       = {2004.00116},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-00116.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-08672,
  author       = {Zhang, Shiqi and
                  Stone, Peter},
  title        = {{iCORPP}: Interleaved Commonsense Reasoning and Probabilistic Planning
                  on Robots},
  journal      = {CoRR},
  volume       = {abs/2004.08672},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.08672},
  eprinttype   = {arXiv},
  eprint       = {2004.08672},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-08672.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-09833,
  author       = {Lu, Keting and
                  Zhang, Shiqi and
                  Stone, Peter and
                  Chen, Xiaoping},
  title        = {Learning and Reasoning for Robot Dialog and Navigation Tasks},
  journal      = {CoRR},
  volume       = {abs/2005.09833},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.09833},
  eprinttype   = {arXiv},
  eprint       = {2005.09833},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-09833.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-00589,
  author       = {Shah, Rishi and
                  Jiang, Yuqian and
                  Hart, Justin W. and
                  Stone, Peter},
  title        = {Deep {R}-Learning for Continual Area Sweeping},
  journal      = {CoRR},
  volume       = {abs/2006.00589},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.00589},
  eprinttype   = {arXiv},
  eprint       = {2006.00589},
  timestamp    = {Mon, 08 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-00589.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-10553,
  author       = {Liebman, Elad and
                  Stone, Peter},
  title        = {Artificial Musical Intelligence: {A} Survey},
  journal      = {CoRR},
  volume       = {abs/2006.10553},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.10553},
  eprinttype   = {arXiv},
  eprint       = {2006.10553},
  timestamp    = {Tue, 23 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-10553.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-01498,
  author       = {Jiang, Yuqian and
                  Bharadwaj, Sudarshanan and
                  Wu, Bo and
                  Shah, Rishi and
                  Topcu, Ufuk and
                  Stone, Peter},
  title        = {Temporal-Logic-Based Reward Shaping for Continuing Learning Tasks},
  journal      = {CoRR},
  volume       = {abs/2007.01498},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.01498},
  eprinttype   = {arXiv},
  eprint       = {2007.01498},
  timestamp    = {Mon, 06 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-01498.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-14479,
  author       = {Xiao, Xuesu and
                  Liu, Bo and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Toward Agile Maneuvers in Highly Constrained Spaces: Learning from
                  Hallucination},
  journal      = {CoRR},
  volume       = {abs/2007.14479},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.14479},
  eprinttype   = {arXiv},
  eprint       = {2007.14479},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-14479.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-14486,
  author       = {Liu, Bo and
                  Xiao, Xuesu and
                  Stone, Peter},
  title        = {Lifelong Navigation},
  journal      = {CoRR},
  volume       = {abs/2007.14486},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.14486},
  eprinttype   = {arXiv},
  eprint       = {2007.14486},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-14486.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-01279,
  author       = {Karnan, Haresh and
                  Desai, Siddharth and
                  Hanna, Josiah P. and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Reinforced Grounded Action Transformation for Sim-to-Real Transfer},
  journal      = {CoRR},
  volume       = {abs/2008.01279},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.01279},
  eprinttype   = {arXiv},
  eprint       = {2008.01279},
  timestamp    = {Fri, 07 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-01279.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-01281,
  author       = {Desai, Siddharth and
                  Karnan, Haresh and
                  Hanna, Josiah P. and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Stochastic Grounded Action Transformation for Robot Learning in Simulation},
  journal      = {CoRR},
  volume       = {abs/2008.01281},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.01281},
  eprinttype   = {arXiv},
  eprint       = {2008.01281},
  timestamp    = {Fri, 07 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-01281.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-01594,
  author       = {Desai, Siddharth and
                  Durugkar, Ishan and
                  Karnan, Haresh and
                  Warnell, Garrett and
                  Hanna, Josiah and
                  Stone, Peter},
  title        = {An Imitation from Observation Approach to Sim-to-Real Transfer},
  journal      = {CoRR},
  volume       = {abs/2008.01594},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.01594},
  eprinttype   = {arXiv},
  eprint       = {2008.01594},
  timestamp    = {Wed, 14 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-01594.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-06738,
  author       = {Pavse, Brahma S. and
                  Durugkar, Ishan and
                  Hanna, Josiah and
                  Stone, Peter},
  title        = {Reducing Sampling Error in Batch Temporal Difference Learning},
  journal      = {CoRR},
  volume       = {abs/2008.06738},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.06738},
  eprinttype   = {arXiv},
  eprint       = {2008.06738},
  timestamp    = {Fri, 21 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-06738.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-13315,
  author       = {Perille, Daniel and
                  Truong, Abigail and
                  Xiao, Xuesu and
                  Stone, Peter},
  title        = {Benchmarking Metric Ground Navigation},
  journal      = {CoRR},
  volume       = {abs/2008.13315},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.13315},
  eprinttype   = {arXiv},
  eprint       = {2008.13315},
  timestamp    = {Wed, 16 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-13315.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-13649,
  author       = {Cui, Yuchen and
                  Zhang, Qiping and
                  Allievi, Alessandro and
                  Stone, Peter and
                  Niekum, Scott and
                  Knox, W. Bradley},
  title        = {The {EMPATHIC} Framework for Task Learning from Implicit Human Feedback},
  journal      = {CoRR},
  volume       = {abs/2009.13649},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.13649},
  eprinttype   = {arXiv},
  eprint       = {2009.13649},
  timestamp    = {Wed, 30 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-13649.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-13736,
  author       = {Du, Yunshu and
                  Warnell, Garrett and
                  Gebremedhin, Assefaw Hadish and
                  Stone, Peter and
                  Taylor, Matthew E.},
  title        = {Lucid Dreaming for Experience Replay: Refreshing Past States with
                  the Current Policy},
  journal      = {CoRR},
  volume       = {abs/2009.13736},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.13736},
  eprinttype   = {arXiv},
  eprint       = {2009.13736},
  timestamp    = {Wed, 30 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-13736.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-08098,
  author       = {Xiao, Xuesu and
                  Liu, Bo and
                  Stone, Peter},
  title        = {Agile Robot Navigation through Hallucinated Learning and Sober Deployment},
  journal      = {CoRR},
  volume       = {abs/2010.08098},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.08098},
  eprinttype   = {arXiv},
  eprint       = {2010.08098},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-08098.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-09158,
  author       = {Xiao, Xuesu and
                  Liu, Bo and
                  Stone, Peter},
  title        = {Extended Abstract: Motion Planners Learned from Geometric Hallucination},
  journal      = {CoRR},
  volume       = {abs/2010.09158},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.09158},
  eprinttype   = {arXiv},
  eprint       = {2010.09158},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-09158.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-10560,
  author       = {Kompella, Varun and
                  Capobianco, Roberto and
                  Jong, Stacy and
                  Browne, Jonathan and
                  Fox, Spencer J. and
                  Meyers, Lauren Ancel and
                  Wurman, Peter R. and
                  Stone, Peter},
  title        = {Reinforcement Learning for Optimization of {COVID-19} Mitigation Policies},
  journal      = {CoRR},
  volume       = {abs/2010.10560},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.10560},
  eprinttype   = {arXiv},
  eprint       = {2010.10560},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-10560.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-15942,
  author       = {Ruohan Zhang and
                  Bo Liu and
                  Yifeng Zhu and
                  Sihang Guo and
                  Mary M. Hayhoe and
                  Dana H. Ballard and
                  Peter Stone},
  title        = {Human versus Machine Attention in Deep Reinforcement Learning Tasks},
  journal      = {CoRR},
  volume       = {abs/2010.15942},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.15942},
  eprinttype    = {arXiv},
  eprint       = {2010.15942},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-15942.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2011-00397,
  author       = {Zifan Xu and
                  Gauraang Dhamankar and
                  Anirudh Nair and
                  Xuesu Xiao and
                  Garrett Warnell and
                  Bo Liu and
                  Zizhao Wang and
                  Peter Stone},
  title        = {{APPLR:} Adaptive Planner Parameter Learning from Reinforcement},
  journal      = {CoRR},
  volume       = {abs/2011.00397},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.00397},
  eprinttype    = {arXiv},
  eprint       = {2011.00397},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-00397.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2011-00400,
  author       = {Zizhao Wang and
                  Xuesu Xiao and
                  Bo Liu and
                  Garrett Warnell and
                  Peter Stone},
  title        = {{APPLI:} Adaptive Planner Parameter Learning From Interventions},
  journal      = {CoRR},
  volume       = {abs/2011.00400},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.00400},
  eprinttype    = {arXiv},
  eprint       = {2011.00400},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-00400.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2011-13112,
  author       = {Xuesu Xiao and
                  Bo Liu and
                  Garrett Warnell and
                  Peter Stone},
  title        = {Motion Control for Mobile Robot Navigation Using Machine Learning:
                  a Survey},
  journal      = {CoRR},
  volume       = {abs/2011.13112},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.13112},
  eprinttype    = {arXiv},
  eprint       = {2011.13112},
  timestamp    = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-13112.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/arobots/JiangYZSS19,
  author       = {Yuqian Jiang and
                  Harel Yedidsion and
                  Shiqi Zhang and
                  Guni Sharon and
                  Peter Stone},
  title        = {Multi-robot planning with conflicts and synergies},
  journal      = {Auton. Robots},
  volume       = {43},
  number       = {8},
  pages        = {2011--2032},
  year         = {2019},
  url          = {https://doi.org/10.1007/s10514-019-09848-1},
  doi          = {10.1007/S10514-019-09848-1},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/arobots/JiangYZSS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jzusc/JiangZKS19,
  author       = {Yuqian Jiang and
                  Shiqi Zhang and
                  Piyush Khandelwal and
                  Peter Stone},
  title        = {Task planning in robotics: an empirical comparison of {PDDL-} and
                  {ASP}-based systems},
  journal      = {Frontiers Inf. Technol. Electron. Eng.},
  volume       = {20},
  number       = {3},
  pages        = {363--373},
  year         = {2019},
  url          = {https://doi.org/10.1631/FITEE.1800514},
  doi          = {10.1631/FITEE.1800514},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jzusc/JiangZKS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/misq/LiebmanSS19,
  author       = {Elad Liebman and
                  Maytal Saar{-}Tsechansky and
                  Peter Stone},
  title        = {The Right Music at the Right Time: Adaptive Personalized Playlists
                  Based on Sequence Modeling},
  journal      = {{MIS} Q.},
  volume       = {43},
  number       = {3},
  year         = {2019},
  url          = {https://doi.org/10.25300/misq/2019/14750},
  doi          = {10.25300/MISQ/2019/14750},
  timestamp    = {Thu, 30 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/misq/LiebmanSS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ram/AsadaSVLN19,
  author       = {Minoru Asada and
                  Peter Stone and
                  Manuela Veloso and
                  Daniel D. Lee and
                  Daniele Nardi},
  title        = {{RoboCup}: {A} Treasure Trove of Rich Diversity for Research Issues
                  and Interdisciplinary Connections {[TC} Spotlight]},
  journal      = {{IEEE} Robotics Autom. Mag.},
  volume       = {26},
  number       = {3},
  pages        = {99--102},
  year         = {2019},
  url          = {https://doi.org/10.1109/MRA.2019.2928959},
  doi          = {10.1109/MRA.2019.2928959},
  timestamp    = {Mon, 18 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ram/AsadaSVLN19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/HannaSBS19,
  author       = {Josiah P. Hanna and
                  Guni Sharon and
                  Stephen D. Boyles and
                  Peter Stone},
  title        = {Selecting Compliant Agents for Opt-in Micro-Tolling},
  booktitle    = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2019, The Thirty-First Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                  USA, January 27 - February 1, 2019},
  pages        = {565--572},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://doi.org/10.1609/aaai.v33i01.3301565},
  doi          = {10.1609/AAAI.V33I01.3301565},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/HannaSBS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/LoAS19,
  author       = {Shih{-}Yun Lo and
                  Shani Alkoby and
                  Peter Stone},
  editor       = {Hu{\'{a}}scar Espinoza and
                  Se{\'{a}}n {\'{O}} h{\'{E}}igeartaigh and
                  Xiaowei Huang and
                  Jos{\'{e}} Hern{\'{a}}ndez{-}Orallo and
                  Mauricio Castillo{-}Effen},
  title        = {Robust Motion Planning and Safety Benchmarking in Human Workspaces},
  booktitle    = {Workshop on Artificial Intelligence Safety 2019 co-located with the
                  Thirty-Third {AAAI} Conference on Artificial Intelligence 2019 ({AAAI}-19),
                  Honolulu, Hawaii, January 27, 2019},
  series       = {{CEUR} Workshop Proceedings},
  volume       = {2301},
  publisher    = {CEUR-WS.org},
  year         = {2019},
  url          = {https://ceur-ws.org/Vol-2301/paper\_28.pdf},
  timestamp    = {Fri, 10 Mar 2023 16:22:15 +0100},
  biburl       = {https://dblp.org/rec/conf/aaai/LoAS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aips/Jiang0HS19,
  author       = {Yuqian Jiang and
                  Nick Walker and
                  Justin W. Hart and
                  Peter Stone},
  editor       = {J. Benton and
                  Nir Lipovetzky and
                  Eva Onaindia and
                  David E. Smith and
                  Siddharth Srivastava},
  title        = {Open-World Reasoning for Service Robots},
  booktitle    = {Proceedings of the Twenty-Ninth International Conference on Automated
                  Planning and Scheduling, {ICAPS} 2019, Berkeley, CA, USA, July 11-15,
                  2019},
  pages        = {725--733},
  publisher    = {{AAAI} Press},
  year         = {2019},
  url          = {https://ojs.aaai.org/index.php/ICAPS/article/view/3541},
  timestamp    = {Thu, 10 Aug 2023 15:31:45 +0200},
  biburl       = {https://dblp.org/rec/conf/aips/Jiang0HS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/NarvekarS19,
  author       = {Sanmit Narvekar and
                  Peter Stone},
  editor       = {Edith Elkind and
                  Manuela Veloso and
                  Noa Agmon and
                  Matthew E. Taylor},
  title        = {Learning Curriculum Policies for Reinforcement Learning},
  booktitle    = {Proceedings of the 18th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17,
                  2019},
  pages        = {25--33},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2019},
  url          = {http://dl.acm.org/citation.cfm?id=3331670},
  timestamp    = {Wed, 29 May 2019 16:36:58 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/NarvekarS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/HannaS19,
  author       = {Josiah P. Hanna and
                  Peter Stone},
  editor       = {Edith Elkind and
                  Manuela Veloso and
                  Noa Agmon and
                  Matthew E. Taylor},
  title        = {Reducing Sampling Error in Policy Gradient Learning},
  booktitle    = {Proceedings of the 18th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17,
                  2019},
  pages        = {1016--1024},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2019},
  url          = {http://dl.acm.org/citation.cfm?id=3331798},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/HannaS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/SharonBAS19,
  author       = {Guni Sharon and
                  Stephen D. Boyles and
                  Shani Alkoby and
                  Peter Stone},
  editor       = {Edith Elkind and
                  Manuela Veloso and
                  Noa Agmon and
                  Matthew E. Taylor},
  title        = {Marginal Cost Pricing with a Fixed Error Factor in Traffic Networks},
  booktitle    = {Proceedings of the 18th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17,
                  2019},
  pages        = {1539--1546},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2019},
  url          = {http://dl.acm.org/citation.cfm?id=3331871},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/SharonBAS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/AlkobyRS19,
  author       = {Shani Alkoby and
                  Avilash Rath and
                  Peter Stone},
  editor       = {Edith Elkind and
                  Manuela Veloso and
                  Noa Agmon and
                  Matthew E. Taylor},
  title        = {Teaching Social Behavior through Human Reinforcement for Ad hoc Teamwork
                  - The {STAR} Framework: Extended Abstract},
  booktitle    = {Proceedings of the 18th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17,
                  2019},
  pages        = {1773--1775},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2019},
  url          = {http://dl.acm.org/citation.cfm?id=3331914},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/AlkobyRS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MenasheS19,
  author       = {Jacob Menashe and
                  Peter Stone},
  editor       = {Edith Elkind and
                  Manuela Veloso and
                  Noa Agmon and
                  Matthew E. Taylor},
  title        = {Escape Room: {A} Configurable Testbed for Hierarchical Reinforcement
                  Learning},
  booktitle    = {Proceedings of the 18th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17,
                  2019},
  pages        = {2123--2125},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2019},
  url          = {http://dl.acm.org/citation.cfm?id=3332031},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/MenasheS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/TorabiWS19,
  author       = {Faraz Torabi and
                  Garrett Warnell and
                  Peter Stone},
  editor       = {Edith Elkind and
                  Manuela Veloso and
                  Noa Agmon and
                  Matthew E. Taylor},
  title        = {Adversarial Imitation Learning from State-only Demonstrations},
  booktitle    = {Proceedings of the 18th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17,
                  2019},
  pages        = {2229--2231},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2019},
  url          = {http://dl.acm.org/citation.cfm?id=3332067},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/TorabiWS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/bracis/SilvaCS19,
  author       = {Felipe Leno da Silva and
                  Anna Helena Reali Costa and
                  Peter Stone},
  title        = {Building Self-Play Curricula Online by Playing with Expert Agents
                  in Adversarial Games},
  booktitle    = {8th Brazilian Conference on Intelligent Systems, {BRACIS} 2019, Salvador,
                  Brazil, October 15-18, 2019},
  pages        = {479--484},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/BRACIS.2019.00090},
  doi          = {10.1109/BRACIS.2019.00090},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/bracis/SilvaCS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/HannaNS19,
  author       = {Josiah P. Hanna and
                  Scott Niekum and
                  Peter Stone},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {Importance Sampling Policy Evaluation with an Estimated Behavior Policy},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {2605--2613},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/hanna19a.html},
  timestamp    = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/HannaNS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/ThomasonPS0JYHS19,
  author       = {Jesse Thomason and
                  Aishwarya Padmakumar and
                  Jivko Sinapov and
                  Nick Walker and
                  Yuqian Jiang and
                  Harel Yedidsion and
                  Justin W. Hart and
                  Peter Stone and
                  Raymond J. Mooney},
  title        = {Improving Grounded Natural Language Understanding through Human-Robot
                  Dialog},
  booktitle    = {International Conference on Robotics and Automation, {ICRA} 2019,
                  Montreal, QC, Canada, May 20-24, 2019},
  pages        = {6934--6941},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICRA.2019.8794287},
  doi          = {10.1109/ICRA.2019.8794287},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/ThomasonPS0JYHS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/RavulaAS19,
  author       = {Manish Ravula and
                  Shani Alkoby and
                  Peter Stone},
  editor       = {Sarit Kraus},
  title        = {Ad Hoc Teamwork With Behavior Switching Agents},
  booktitle    = {Proceedings of the Twenty-Eighth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16,
                  2019},
  pages        = {550--556},
  publisher    = {ijcai.org},
  year         = {2019},
  url          = {https://doi.org/10.24963/ijcai.2019/78},
  doi          = {10.24963/IJCAI.2019/78},
  timestamp    = {Tue, 20 Aug 2019 16:18:18 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/RavulaAS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/TorabiWS19,
  author       = {Faraz Torabi and
                  Garrett Warnell and
                  Peter Stone},
  editor       = {Sarit Kraus},
  title        = {Imitation Learning from Video by Leveraging Proprioception},
  booktitle    = {Proceedings of the Twenty-Eighth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16,
                  2019},
  pages        = {3585--3591},
  publisher    = {ijcai.org},
  year         = {2019},
  url          = {https://doi.org/10.24963/ijcai.2019/497},
  doi          = {10.24963/IJCAI.2019/497},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/TorabiWS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/TorabiWS19a,
  author       = {Faraz Torabi and
                  Garrett Warnell and
                  Peter Stone},
  editor       = {Sarit Kraus},
  title        = {Recent Advances in Imitation Learning from Observation},
  booktitle    = {Proceedings of the Twenty-Eighth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16,
                  2019},
  pages        = {6325--6331},
  publisher    = {ijcai.org},
  year         = {2019},
  url          = {https://doi.org/10.24963/ijcai.2019/882},
  doi          = {10.24963/IJCAI.2019/882},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/TorabiWS19a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/ZhangTGBS19,
  author       = {Ruohan Zhang and
                  Faraz Torabi and
                  Lin Guan and
                  Dana H. Ballard and
                  Peter Stone},
  editor       = {Sarit Kraus},
  title        = {Leveraging Human Guidance for Deep Reinforcement Learning Tasks},
  booktitle    = {Proceedings of the Twenty-Eighth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16,
                  2019},
  pages        = {6339--6346},
  publisher    = {ijcai.org},
  year         = {2019},
  url          = {https://doi.org/10.24963/ijcai.2019/884},
  doi          = {10.24963/IJCAI.2019/884},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/ZhangTGBS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/JiangYZS19,
  author       = {Yuqian Jiang and
                  Fangkai Yang and
                  Shiqi Zhang and
                  Peter Stone},
  title        = {Task-Motion Planning with Reinforcement Learning for Adaptable Mobile
                  Service Robots},
  booktitle    = {2019 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2019, Macau, SAR, China, November 3-8, 2019},
  pages        = {7529--7534},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/IROS40897.2019.8967680},
  doi          = {10.1109/IROS40897.2019.8967680},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/JiangYZS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineTPS19,
  author       = {Patrick MacAlpine and
                  Faraz Torabi and
                  Brahma S. Pavse and
                  Peter Stone},
  editor       = {Stephan K. Chalup and
                  Tim Niem{\"{u}}ller and
                  Jackrit Suthakorn and
                  Mary{-}Anne Williams},
  title        = {{UT} {Austin} {Villa}: {RoboCup} 2019 {3D} Simulation League Competition and
                  Technical Challenge Champions},
  booktitle    = {RoboCup 2019: Robot World Cup {XXIII} [Sydney, NSW, Australia, July
                  8, 2019]},
  series       = {Lecture Notes in Computer Science},
  volume       = {11531},
  pages        = {540--552},
  publisher    = {Springer},
  year         = {2019},
  url          = {https://doi.org/10.1007/978-3-030-35699-6\_44},
  doi          = {10.1007/978-3-030-35699-6\_44},
  timestamp    = {Thu, 12 Dec 2019 08:32:25 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineTPS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/socrob/YedidsionDSCHSM19,
  author       = {Harel Yedidsion and
                  Jacqueline Deans and
                  Connor Sheehan and
                  Mahathi Chillara and
                  Justin W. Hart and
                  Peter Stone and
                  Raymond J. Mooney},
  editor       = {Miguel A. Salichs and
                  Shuzhi Sam Ge and
                  Emilia Ivanova Barakova and
                  John{-}John Cabibihan and
                  Alan R. Wagner and
                  {\'{A}}lvaro Castro Gonz{\'{a}}lez and
                  Hongsheng He},
  title        = {Optimal Use of Verbal Instructions for Multi-robot Human Navigation
                  Guidance},
  booktitle    = {Social Robotics - 11th International Conference, {ICSR} 2019, Madrid,
                  Spain, November 26-29, 2019, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {11876},
  pages        = {133--143},
  publisher    = {Springer},
  year         = {2019},
  url          = {https://doi.org/10.1007/978-3-030-35888-4\_13},
  doi          = {10.1007/978-3-030-35888-4\_13},
  timestamp    = {Mon, 25 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/socrob/YedidsionDSCHSM19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1903-00122,
  author       = {Jesse Thomason and
                  Aishwarya Padmakumar and
                  Jivko Sinapov and
                  Nick Walker and
                  Yuqian Jiang and
                  Harel Yedidsion and
                  Justin W. Hart and
                  Peter Stone and
                  Raymond J. Mooney},
  title        = {Improving Grounded Natural Language Understanding through Human-Robot
                  Dialog},
  journal      = {CoRR},
  volume       = {abs/1903.00122},
  year         = {2019},
  url          = {https://arxiv.org/abs/1903.00122},
  eprinttype    = {arXiv},
  eprint       = {1903.00122},
  timestamp    = {Sat, 30 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-00122.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-09335,
  author       = {Faraz Torabi and
                  Garrett Warnell and
                  Peter Stone},
  title        = {Imitation Learning from Video by Leveraging Proprioception},
  journal      = {CoRR},
  volume       = {abs/1905.09335},
  year         = {2019},
  url          = {https://arxiv.org/abs/1905.09335},
  eprinttype    = {arXiv},
  eprint       = {1905.09335},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-09335.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-13566,
  author       = {Faraz Torabi and
                  Garrett Warnell and
                  Peter Stone},
  title        = {Recent Advances in Imitation Learning from Observation},
  journal      = {CoRR},
  volume       = {abs/1905.13566},
  year         = {2019},
  url          = {https://arxiv.org/abs/1905.13566},
  eprinttype    = {arXiv},
  eprint       = {1905.13566},
  timestamp    = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-13566.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-07372,
  author       = {Brahma S. Pavse and
                  Faraz Torabi and
                  Josiah P. Hanna and
                  Garrett Warnell and
                  Peter Stone},
  title        = {{RIDM:} Reinforced Inverse Dynamics Modeling for Learning from a Single
                  Observed Demonstration},
  journal      = {CoRR},
  volume       = {abs/1906.07372},
  year         = {2019},
  url          = {https://arxiv.org/abs/1906.07372},
  eprinttype    = {arXiv},
  eprint       = {1906.07372},
  timestamp    = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-07372.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-07374,
  author       = {Faraz Torabi and
                  Sean Geiger and
                  Garrett Warnell and
                  Peter Stone},
  title        = {Sample-efficient Adversarial Imitation Learning from Observation},
  journal      = {CoRR},
  volume       = {abs/1906.07374},
  year         = {2019},
  url          = {https://arxiv.org/abs/1906.07374},
  eprinttype    = {arXiv},
  eprint       = {1906.07374},
  timestamp    = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-07374.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-11064,
  author       = {Stefano V. Albrecht and
                  Peter Stone},
  title        = {Reasoning about Hypothetical Agent Behaviours and their Parameters},
  journal      = {CoRR},
  volume       = {abs/1906.11064},
  year         = {2019},
  url          = {https://arxiv.org/abs/1906.11064},
  eprinttype    = {arXiv},
  eprint       = {1906.11064},
  timestamp    = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-11064.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1907-02300,
  author       = {Nick Walker and
                  Yuqian Jiang and
                  Maya Cakmak and
                  Peter Stone},
  title        = {Desiderata for Planning Systems in General-Purpose Service Robots},
  journal      = {CoRR},
  volume       = {abs/1907.02300},
  year         = {2019},
  url          = {https://arxiv.org/abs/1907.02300},
  eprinttype    = {arXiv},
  eprint       = {1907.02300},
  timestamp    = {Mon, 08 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-02300.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-06529,
  author       = {Rishi Shah and
                  Yuqian Jiang and
                  Haresh Karnan and
                  Gilberto Briscoe{-}Martinez and
                  Dominick Mulder and
                  Ryan Gupta and
                  Rachel Schlossman and
                  Marika Murphy and
                  Justin W. Hart and
                  Luis Sentis and
                  Peter Stone},
  title        = {Solving Service Robot Tasks: {UT} {Austin} {Villa@Home} 2019 Team Report},
  journal      = {CoRR},
  volume       = {abs/1909.06529},
  year         = {2019},
  url          = {https://arxiv.org/abs/1909.06529},
  eprinttype    = {arXiv},
  eprint       = {1909.06529},
  timestamp    = {Mon, 23 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-06529.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-06560,
  author       = {Justin W. Hart and
                  Reuth Mirsky and
                  Stone Tejeda and
                  Bonny Mahajan and
                  Jamin Goo and
                  Kathryn Baldauf and
                  Sydney Owen and
                  Peter Stone},
  title        = {Unclogging Our Arteries: Using Human-Inspired Signals to Disambiguate
                  Navigational Intentions},
  journal      = {CoRR},
  volume       = {abs/1909.06560},
  year         = {2019},
  url          = {https://arxiv.org/abs/1909.06560},
  eprinttype    = {arXiv},
  eprint       = {1909.06560},
  timestamp    = {Tue, 24 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-06560.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-09906,
  author       = {Ruohan Zhang and
                  Faraz Torabi and
                  Lin Guan and
                  Dana H. Ballard and
                  Peter Stone},
  title        = {Leveraging Human Guidance for Deep Reinforcement Learning Tasks},
  journal      = {CoRR},
  volume       = {abs/1909.09906},
  year         = {2019},
  url          = {https://arxiv.org/abs/1909.09906},
  eprinttype    = {arXiv},
  eprint       = {1909.09906},
  timestamp    = {Fri, 27 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-09906.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/MacAlpineS18,
  author       = {Patrick MacAlpine and
                  Peter Stone},
  title        = {Overlapping layered learning},
  journal      = {Artif. Intell.},
  volume       = {254},
  pages        = {21--43},
  year         = {2018},
  url          = {https://doi.org/10.1016/j.artint.2017.09.001},
  doi          = {10.1016/J.ARTINT.2017.09.001},
  timestamp    = {Mon, 27 Nov 2017 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ai/MacAlpineS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/AlbrechtS18,
  author       = {Albrecht, Stefano V. and
                  Stone, Peter},
  title        = {Autonomous agents modelling other agents: {A} comprehensive survey
                  and open problems},
  journal      = {Artif. Intell.},
  volume       = {258},
  pages        = {66--95},
  year         = {2018},
  url          = {https://doi.org/10.1016/j.artint.2018.01.002},
  doi          = {10.1016/J.ARTINT.2018.01.002},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ai/AlbrechtS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cacm/GroszS18,
  author       = {Grosz, Barbara J. and
                  Stone, Peter},
  title        = {A century-long commitment to assessing artificial intelligence and
                  its impact on society},
  journal      = {Commun. {ACM}},
  volume       = {61},
  number       = {12},
  pages        = {68--73},
  year         = {2018},
  url          = {https://doi.org/10.1145/3198470},
  doi          = {10.1145/3198470},
  timestamp    = {Mon, 26 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/cacm/GroszS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/finr/OssmyHMHSA18,
  author       = {Ossmy, Ori and
                  Hoch, Justine E. and
                  MacAlpine, Patrick and
                  Hasan, Shohan and
                  Stone, Peter and
                  Adolph, Karen E.},
  title        = {Variety Wins: Soccer-Playing Robots and Infant Walking},
  journal      = {Frontiers Neurorobotics},
  volume       = {12},
  pages        = {19},
  year         = {2018},
  url          = {https://doi.org/10.3389/fnbot.2018.00019},
  doi          = {10.3389/FNBOT.2018.00019},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/finr/OssmyHMHSA18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/LiebmanZS18,
  author       = {Liebman, Elad and
                  Zavesky, Eric and
                  Stone, Peter},
  title        = {Autonomous Model Management via Reinforcement Learning},
  booktitle    = {The Workshops of the Thirty-Second {AAAI} Conference on Artificial
                  Intelligence, New Orleans, Louisiana, USA, February 2-7, 2018},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-18}},
  pages        = {348--355},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://aaai.org/ocs/index.php/WS/AAAIW18/paper/view/17099},
  timestamp    = {Mon, 04 Sep 2023 16:46:41 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LiebmanZS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/JiangWS18,
  author       = {Jiang, Yu{-}Sian and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {{DIPD:} Gaze-Based Intention Inference in Dynamic Environments},
  booktitle    = {The Workshops of the Thirty-Second {AAAI} Conference on Artificial
                  Intelligence, New Orleans, Louisiana, USA, February 2-7, 2018},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-18}},
  pages        = {614--621},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://aaai.org/ocs/index.php/WS/AAAIW18/paper/view/17353},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/JiangWS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/ChenASHSMS18,
  author       = {Chen, Haipeng and
                  An, Bo and
                  Sharon, Guni and
                  Hanna, Josiah P. and
                  Stone, Peter and
                  Miao, Chunyan and
                  Soh, Yeng Chai},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {{DyETC}: Dynamic Electronic Toll Collection for Traffic Congestion Alleviation},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  ({AAAI-18}), the 30th Innovative Applications of Artificial Intelligence
                  ({IAAI-18}), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence ({EAAI-18}), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {757--765},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11337},
  doi          = {10.1609/AAAI.V32I1.11337},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/ChenASHSMS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SharonARBS18,
  author       = {Sharon, Guni and
                  Albert, Michael and
                  Rambha, Tarun and
                  Boyles, Stephen D. and
                  Stone, Peter},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {Traffic Optimization for a Mixture of Self-Interested and Compliant
                  Agents},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  ({AAAI-18}), the 30th Innovative Applications of Artificial Intelligence
                  ({IAAI-18}), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence ({EAAI-18}), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {1202--1209},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11444},
  doi          = {10.1609/AAAI.V32I1.11444},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/SharonARBS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/WarnellWLS18,
  author       = {Warnell, Garrett and
                  Waytowich, Nicholas R. and
                  Lawhern, Vernon and
                  Stone, Peter},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {Deep {TAMER:} Interactive Agent Shaping in High-Dimensional State
                  Spaces},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  ({AAAI-18}), the 30th Innovative Applications of Artificial Intelligence
                  ({IAAI-18}), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence ({EAAI-18}), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {1545--1554},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11485},
  doi          = {10.1609/AAAI.V32I1.11485},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/WarnellWLS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/ThomasonSMS18,
  author       = {Thomason, Jesse and
                  Sinapov, Jivko and
                  Mooney, Raymond J. and
                  Stone, Peter},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {Guiding Exploratory Behaviors for Multi-Modal Grounding of Linguistic
                  Descriptions},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  ({AAAI-18}), the 30th Innovative Applications of Artificial Intelligence
                  ({IAAI-18}), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence ({EAAI-18}), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {5520--5527},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11966},
  doi          = {10.1609/AAAI.V32I1.11966},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/ThomasonSMS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/DurugkarS18,
  author       = {Durugkar, Ishan and
                  Stone, Peter},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {Adversarial Goal Generation for Intrinsic Motivation},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  ({AAAI-18}), the 30th Innovative Applications of Artificial Intelligence
                  ({IAAI-18}), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence ({EAAI-18}), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {8073--8074},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.12195},
  doi          = {10.1609/AAAI.V32I1.12195},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DurugkarS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/AmiriWZSTS18,
  author       = {Amiri, Saeid and
                  Wei, Suhua and
                  Zhang, Shiqi and
                  Sinapov, Jivko and
                  Thomason, Jesse and
                  Stone, Peter},
  title        = {Robot Behavioral Exploration and Multi-modal Perception using Dynamically
                  Constructed Controllers},
  booktitle    = {2018 {AAAI} Spring Symposia, Stanford University, Palo Alto, California,
                  USA, March 26-28, 2018},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://aaai.org/ocs/index.php/SSS/SSS18/paper/view/17581},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaiss/AmiriWZSTS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/HannaS18,
  author       = {Hanna, Josiah P. and
                  Stone, Peter},
  title        = {Towards a Data Efficient Off-Policy Policy Gradient},
  booktitle    = {2018 {AAAI} Spring Symposia, Stanford University, Palo Alto, California,
                  USA, March 26-28, 2018},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://aaai.org/ocs/index.php/SSS/SSS18/paper/view/17578},
  timestamp    = {Tue, 08 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaiss/HannaS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/MenasheS18,
  author       = {Menashe, Jacob and
                  Stone, Peter},
  title        = {State Abstraction Synthesis for Discrete Models of Continuous Domains},
  booktitle    = {2018 {AAAI} Spring Symposia, Stanford University, Palo Alto, California,
                  USA, March 26-28, 2018},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://aaai.org/ocs/index.php/SSS/SSS18/paper/view/17576},
  timestamp    = {Tue, 08 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaiss/MenasheS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/LoZS18,
  author       = {Lo, Shih{-}Yun and
                  Zhang, Shiqi and
                  Stone, Peter},
  editor       = {Andr{\'{e}}, Elisabeth and
                  Koenig, Sven and
                  Dastani, Mehdi and
                  Sukthankar, Gita},
  title        = {{PETLON:} Planning Efficiently for Task-Level-Optimal Navigation},
  booktitle    = {Proceedings of the 17th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} 2018, Stockholm, Sweden, July 10-15,
                  2018},
  pages        = {220--228},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems
                  / {ACM}},
  address      = {Richland, SC, {USA}},
  year         = {2018},
  url          = {http://dl.acm.org/citation.cfm?id=3237422},
  timestamp    = {Sat, 30 Sep 2023 09:34:53 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/LoZS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/LiebmanZS18,
  author       = {Liebman, Elad and
                  Zavesky, Eric and
                  Stone, Peter},
  editor       = {Andr{\'{e}}, Elisabeth and
                  Koenig, Sven and
                  Dastani, Mehdi and
                  Sukthankar, Gita},
  title        = {A Stitch in Time - Autonomous Model Management via Reinforcement Learning},
  booktitle    = {Proceedings of the 17th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} 2018, Stockholm, Sweden, July 10-15,
                  2018},
  pages        = {990--998},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems
                  / {ACM}},
  address      = {Richland, SC, {USA}},
  year         = {2018},
  url          = {http://dl.acm.org/citation.cfm?id=3237846},
  timestamp    = {Mon, 16 Jul 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/LiebmanZS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MirzaeiSBGS18,
  author       = {Mirzaei, Hamid and
                  Sharon, Guni and
                  Boyles, Stephen D. and
                  Givargis, Tony and
                  Stone, Peter},
  editor       = {Andr{\'{e}}, Elisabeth and
                  Koenig, Sven and
                  Dastani, Mehdi and
                  Sukthankar, Gita},
  title        = {Link-based Parameterized Micro-tolling Scheme for Optimal Traffic
                  Management},
  booktitle    = {Proceedings of the 17th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} 2018, Stockholm, Sweden, July 10-15,
                  2018},
  pages        = {2013--2015},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems
                  / {ACM}},
  address      = {Richland, SC, {USA}},
  year         = {2018},
  url          = {http://dl.acm.org/citation.cfm?id=3238055},
  timestamp    = {Mon, 16 Jul 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/MirzaeiSBGS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/PadmakumarSM18,
  author       = {Padmakumar, Aishwarya and
                  Stone, Peter and
                  Mooney, Raymond J.},
  editor       = {Riloff, Ellen and
                  Chiang, David and
                  Hockenmaier, Julia and
                  Tsujii, Jun'ichi},
  title        = {Learning a Policy for Opportunistic Active Learning},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                  Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages        = {1347--1357},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1165},
  doi          = {10.18653/V1/D18-1165},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/PadmakumarSM18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icmi/JiangWS18,
  author       = {Jiang, Yu{-}Sian and
                  Warnell, Garrett and
                  Stone, Peter},
  editor       = {D'Mello, Sidney K. and
                  Georgiou, Panayiotis G. and
                  Scherer, Stefan and
                  Mower Provost, Emily and
                  Soleymani, Mohammad and
                  Worsley, Marcelo},
  title        = {Inferring User Intention using Gaze in Vehicles},
  booktitle    = {Proceedings of the 2018 International Conference on Multimodal
                  Interaction, {ICMI} 2018, Boulder, CO, USA, October 16-20, 2018},
  pages        = {298--306},
  publisher    = {{ACM}},
  year         = {2018},
  url          = {https://doi.org/10.1145/3242969.3243018},
  doi          = {10.1145/3242969.3243018},
  timestamp    = {Tue, 15 Oct 2019 08:40:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icmi/JiangWS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/AmiriWZSTS18,
  author       = {Amiri, Saeid and
                  Wei, Suhua and
                  Zhang, Shiqi and
                  Sinapov, Jivko and
                  Thomason, Jesse and
                  Stone, Peter},
  editor       = {Lang, J{\'{e}}r{\^{o}}me},
  title        = {Multi-modal Predicate Identification using Dynamically Learned Robot
                  Controllers},
  booktitle    = {Proceedings of the Twenty-Seventh International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2018, July 13-19, 2018, Stockholm,
                  Sweden},
  pages        = {4638--4645},
  publisher    = {ijcai.org},
  year         = {2018},
  url          = {https://doi.org/10.24963/ijcai.2018/645},
  doi          = {10.24963/IJCAI.2018/645},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/AmiriWZSTS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/TorabiWS18,
  author       = {Torabi, Faraz and
                  Warnell, Garrett and
                  Stone, Peter},
  editor       = {Lang, J{\'{e}}r{\^{o}}me},
  title        = {Behavioral Cloning from Observation},
  booktitle    = {Proceedings of the Twenty-Seventh International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2018, July 13-19, 2018, Stockholm,
                  Sweden},
  pages        = {4950--4957},
  publisher    = {ijcai.org},
  year         = {2018},
  url          = {https://doi.org/10.24963/ijcai.2018/687},
  doi          = {10.24963/IJCAI.2018/687},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/TorabiWS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/HartSKWBJS18,
  author       = {Hart, Justin W. and
                  Shah, Rishi and
                  Kirmani, Sean and
                  Walker, Nick and
                  Baldauf, Kathryn and
                  John, Nathan and
                  Stone, Peter},
  title        = {{PRISM:} Pose Registration for Integrated Semantic Mapping},
  booktitle    = {2018 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2018, Madrid, Spain, October 1-5, 2018},
  pages        = {896--902},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/IROS.2018.8593681},
  doi          = {10.1109/IROS.2018.8593681},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/HartSKWBJS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isaim/BuiniSBGS18,
  author       = {Buini, Hamid Mirzaei and
                  Sharon, Guni and
                  Boyles, Stephen D. and
                  Givargis, Tony and
                  Stone, Peter},
  title        = {Enhanced Delta-tolling: Traffic Optimization via Policy Gradient Reinforcement
                  Learning},
  booktitle    = {International Symposium on Artificial Intelligence and Mathematics,
                  {ISAIM} 2018, Fort Lauderdale, Florida, USA, January 3-5, 2018},
  year         = {2018},
  url          = {https://isaim2018.cs.ou.edu/papers/ISAIM2018\_Traffic\_Buini\_etal.pdf},
  timestamp    = {Wed, 20 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isaim/BuiniSBGS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isaim/SharonARBS18,
  author       = {Sharon, Guni and
                  Albert, Michael and
                  Rambha, Tarun and
                  Boyles, Stephen D. and
                  Stone, Peter},
  title        = {Traffic Optimization For a Mixture of Self-interested and Compliant
                  Agents},
  booktitle    = {International Symposium on Artificial Intelligence and Mathematics,
                  {ISAIM} 2018, Fort Lauderdale, Florida, USA, January 3-5, 2018},
  year         = {2018},
  url          = {https://isaim2018.cs.ou.edu/papers/ISAIM2018\_Traffic\_Sharon\_etal.pdf},
  timestamp    = {Wed, 20 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isaim/SharonARBS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/LiebmanWS18,
  author       = {Liebman, Elad and
                  White, Corey N. and
                  Stone, Peter},
  editor       = {G{\'{o}}mez, Emilia and
                  Hu, Xiao and
                  Humphrey, Eric and
                  Benetos, Emmanouil},
  title        = {On the Impact of Music on Decision Making in Cooperative Tasks},
  booktitle    = {Proceedings of the 19th International Society for Music Information
                  Retrieval Conference, {ISMIR} 2018, Paris, France, September 23-27,
                  2018},
  pages        = {695--701},
  year         = {2018},
  url          = {http://ismir2018.ircam.fr/doc/pdfs/298\_Paper.pdf},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ismir/LiebmanWS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/itsc/MirzaeiSBGS18,
  author       = {Mirzaei, Hamid and
                  Sharon, Guni and
                  Boyles, Stephen D. and
                  Givargis, Tony and
                  Stone, Peter},
  editor       = {Zhang, Wei{-}Bin and
                  Bayen, Alexandre M. and
                  S{\'{a}}nchez Medina, Javier J. and
                  Barth, Matthew J.},
  title        = {Enhanced Delta-tolling: Traffic Optimization via Policy Gradient Reinforcement
                  Learning},
  booktitle    = {21st International Conference on Intelligent Transportation Systems,
                  {ITSC} 2018, Maui, HI, USA, November 4-7, 2018},
  pages        = {47--52},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ITSC.2018.8569737},
  doi          = {10.1109/ITSC.2018.8569737},
  timestamp    = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl       = {https://dblp.org/rec/conf/itsc/MirzaeiSBGS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ro-man/FernandezJKHSS18,
  author       = {Fernandez, Rolando and
                  John, Nathan and
                  Kirmani, Sean and
                  Hart, Justin W. and
                  Sinapov, Jivko and
                  Stone, Peter},
  title        = {Passive Demonstrations of Light-Based Robot Signals for Improved Human
                  Interpretability},
  booktitle    = {27th {IEEE} International Symposium on Robot and Human Interactive
                  Communication, {RO-MAN} 2018, Nanjing, China, August 27-31, 2018},
  pages        = {234--239},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ROMAN.2018.8525728},
  doi          = {10.1109/ROMAN.2018.8525728},
  timestamp    = {Wed, 16 Oct 2019 14:14:50 +0200},
  biburl       = {https://dblp.org/rec/conf/ro-man/FernandezJKHSS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ro-man/JiangWMS18,
  author       = {Jiang, Yu{-}Sian and
                  Warnell, Garrett and
                  Munera, Eduardo and
                  Stone, Peter},
  title        = {A Study of Human-Robot Copilot Systems for En-route Destination Changing},
  booktitle    = {27th {IEEE} International Symposium on Robot and Human Interactive
                  Communication, {RO-MAN} 2018, Nanjing, China, August 27-31, 2018},
  pages        = {997--1004},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ROMAN.2018.8525701},
  doi          = {10.1109/ROMAN.2018.8525701},
  timestamp    = {Tue, 13 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ro-man/JiangWMS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineTPSS18,
  author       = {MacAlpine, Patrick and
                  Torabi, Faraz and
                  Pavse, Brahma S. and
                  Sigmon, John and
                  Stone, Peter},
  editor       = {Holz, Dirk and
                  Genter, Katie and
                  Saad, Maarouf and
                  von Stryk, Oskar},
  title        = {{UT Austin Villa}: {RoboCup} 2018 {3D} Simulation League Champions},
  booktitle    = {RoboCup 2018: Robot World Cup {XXII} [Montreal, QC, Canada, June 18-22,
                  2018]},
  series       = {Lecture Notes in Computer Science},
  volume       = {11374},
  pages        = {462--475},
  publisher    = {Springer},
  year         = {2018},
  url          = {https://doi.org/10.1007/978-3-030-27544-0\_38},
  doi          = {10.1007/978-3-030-27544-0\_38},
  timestamp    = {Tue, 06 Aug 2019 14:04:46 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineTPSS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-08229,
  author       = {Jiang, Yuqian and
                  Zhang, Shiqi and
                  Khandelwal, Piyush and
                  Stone, Peter},
  title        = {An Empirical Comparison of {PDDL}-based and {ASP}-based Task Planners},
  journal      = {CoRR},
  volume       = {abs/1804.08229},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.08229},
  eprinttype   = {arXiv},
  eprint       = {1804.08229},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-08229.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1805-01954,
  author       = {Torabi, Faraz and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Behavioral Cloning from Observation},
  journal      = {CoRR},
  volume       = {abs/1805.01954},
  year         = {2018},
  url          = {http://arxiv.org/abs/1805.01954},
  eprinttype   = {arXiv},
  eprint       = {1805.01954},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-01954.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-01347,
  author       = {Hanna, Josiah and
                  Niekum, Scott and
                  Stone, Peter},
  title        = {Importance Sampling Policy Evaluation with an Estimated Behavior Policy},
  journal      = {CoRR},
  volume       = {abs/1806.01347},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.01347},
  eprinttype   = {arXiv},
  eprint       = {1806.01347},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-01347.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-06158,
  author       = {Torabi, Faraz and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Generative Adversarial Imitation from Observation},
  journal      = {CoRR},
  volume       = {abs/1807.06158},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.06158},
  eprinttype   = {arXiv},
  eprint       = {1807.06158},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-06158.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-07899,
  author       = {Grosz, Barbara J. and
                  Stone, Peter},
  title        = {A Century Long Commitment to Assessing Artificial Intelligence and
                  its Impact on Society},
  journal      = {CoRR},
  volume       = {abs/1808.07899},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.07899},
  eprinttype   = {arXiv},
  eprint       = {1808.07899},
  timestamp    = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-07899.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-10009,
  author       = {Padmakumar, Aishwarya and
                  Stone, Peter and
                  Mooney, Raymond J.},
  title        = {Learning a Policy for Opportunistic Active Learning},
  journal      = {CoRR},
  volume       = {abs/1808.10009},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.10009},
  eprinttype   = {arXiv},
  eprint       = {1808.10009},
  timestamp    = {Mon, 03 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-10009.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-05676,
  author       = {Nagarajan, Prabhat and
                  Warnell, Garrett and
                  Stone, Peter},
  title        = {Deterministic Implementations for Reproducibility in Deep Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/1809.05676},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.05676},
  eprinttype   = {arXiv},
  eprint       = {1809.05676},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-05676.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-07880,
  author       = {Alkoby, Shani and
                  Rath, Avilash and
                  Stone, Peter},
  title        = {Ad hoc Teamwork and Moral Feedback as a Framework for Safe Agent Behavior},
  journal      = {CoRR},
  volume       = {abs/1809.07880},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.07880},
  eprinttype   = {arXiv},
  eprint       = {1809.07880},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-07880.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-08793,
  author       = {Kim, Minkyu and
                  Arduengo, Miguel and
                  Walker, Nick and
                  Jiang, Yuqian and
                  Hart, Justin W. and
                  Stone, Peter and
                  Sentis, Luis},
  title        = {An Architecture for Person-Following using Active Target Search},
  journal      = {CoRR},
  volume       = {abs/1809.08793},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.08793},
  eprinttype   = {arXiv},
  eprint       = {1809.08793},
  timestamp    = {Mon, 25 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-08793.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-11074,
  author     = {Keting Lu and Shiqi Zhang and Peter Stone and Xiaoping Chen},
  title      = {Robot Representing and Reasoning with Knowledge from Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1809.11074},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.11074},
  eprinttype = {arXiv},
  eprint     = {1809.11074},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-11074.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The mixed-case league name in the title is brace-protected so that
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-1810-02919,
  author       = {Justin W. Hart and
                  Harel Yedidsion and
                  Yuqian Jiang and
                  Nick Walker and
                  Rishi Shah and
                  Jesse Thomason and
                  Aishwarya Padmakumar and
                  Rolando Fernandez and
                  Jivko Sinapov and
                  Raymond J. Mooney and
                  Peter Stone},
  title        = {Interaction and Autonomy in {RoboCup@Home} and Building-Wide Intelligence},
  journal      = {CoRR},
  volume       = {abs/1810.02919},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.02919},
  eprinttype   = {arXiv},
  eprint       = {1810.02919},
  timestamp    = {Mon, 25 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-02919.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-03563,
  author     = {Yuqian Jiang and Nick Walker and Minkyu Kim and Nicolas Brissonneau and
                Daniel S. Brown and Justin W. Hart and Scott Niekum and Luis Sentis and
                Peter Stone},
  title      = {{LAAIR:} {A} Layered Architecture for Autonomous Interactive Robots},
  journal    = {CoRR},
  volume     = {abs/1811.03563},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.03563},
  eprinttype = {arXiv},
  eprint     = {1811.03563},
  timestamp  = {Mon, 25 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-03563.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-08955,
  author     = {Yuqian Jiang and Fangkai Yang and Shiqi Zhang and Peter Stone},
  title      = {Integrating Task-Motion Planning with Reinforcement Learning
                for Robust Decision Making in Mobile Robots},
  journal    = {CoRR},
  volume     = {abs/1811.08955},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.08955},
  eprinttype = {arXiv},
  eprint     = {1811.08955},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-08955.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1812-00285,
  author     = {Sanmit Narvekar and Peter Stone},
  title      = {Learning Curriculum Policies for Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1812.00285},
  year       = {2018},
  url        = {http://arxiv.org/abs/1812.00285},
  eprinttype = {arXiv},
  eprint     = {1812.00285},
  timestamp  = {Tue, 01 Jan 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1812-00285.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1812-09521,
  author     = {Jacob Menashe and Peter Stone},
  title      = {Escape Room: {A} Configurable Testbed for Hierarchical Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1812.09521},
  year       = {2018},
  url        = {http://arxiv.org/abs/1812.09521},
  eprinttype = {arXiv},
  eprint     = {1812.09521},
  timestamp  = {Wed, 02 Jan 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1812-09521.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aamas/AlbrechtLS17,
  author    = {Stefano V. Albrecht and Somchaya Liemhetcharat and Peter Stone},
  title     = {Special issue on multiagent interaction without prior coordination: guest editorial},
  journal   = {Auton. Agents Multi Agent Syst.},
  volume    = {31},
  number    = {4},
  pages     = {765--766},
  year      = {2017},
  url       = {https://doi.org/10.1007/s10458-016-9358-0},
  doi       = {10.1007/S10458-016-9358-0},
  timestamp = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/aamas/AlbrechtLS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "RoboCup" is brace-protected in the title so that sentence-casing
% bibliography styles keep its internal capital.
@article{DBLP:journals/aamas/GenterLS17,
  author       = {Katie Genter and
                  Tim Laue and
                  Peter Stone},
  title        = {Three years of the {RoboCup} standard platform league drop-in player
                  competition - Creating and maintaining a large scale ad hoc teamwork
                  robotics competition},
  journal      = {Auton. Agents Multi Agent Syst.},
  volume       = {31},
  number       = {4},
  pages        = {790--820},
  year         = {2017},
  url          = {https://doi.org/10.1007/s10458-016-9353-5},
  doi          = {10.1007/S10458-016-9353-5},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/aamas/GenterLS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/BarrettRKS17,
  author    = {Samuel Barrett and Avi Rosenfeld and Sarit Kraus and Peter Stone},
  title     = {Making friends on the fly: Cooperating with new teammates},
  journal   = {Artif. Intell.},
  volume    = {242},
  pages     = {132--171},
  year      = {2017},
  url       = {https://doi.org/10.1016/j.artint.2016.10.005},
  doi       = {10.1016/J.ARTINT.2016.10.005},
  timestamp = {Thu, 28 Dec 2017 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ai/BarrettRKS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/HesterS17,
  author    = {Todd Hester and Peter Stone},
  title     = {Intrinsically motivated model learning for developing curious robots},
  journal   = {Artif. Intell.},
  volume    = {247},
  pages     = {170--186},
  year      = {2017},
  url       = {https://doi.org/10.1016/j.artint.2015.05.002},
  doi       = {10.1016/J.ARTINT.2015.05.002},
  timestamp = {Fri, 28 Apr 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ai/HesterS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/expert/AuBDS17,
  author    = {Tsz{-}Chiu Au and Bikramjit Banerjee and Prithviraj Dasgupta and Peter Stone},
  title     = {Multirobot Systems},
  journal   = {{IEEE} Intell. Syst.},
  volume    = {32},
  number    = {6},
  pages     = {3--5},
  year      = {2017},
  url       = {https://doi.org/10.1109/MIS.2017.4531221},
  doi       = {10.1109/MIS.2017.4531221},
  timestamp = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/expert/AuBDS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The platform name "BWIBots" is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/ijrr/KhandelwalZSLTY17,
  author       = {Piyush Khandelwal and
                  Shiqi Zhang and
                  Jivko Sinapov and
                  Matteo Leonetti and
                  Jesse Thomason and
                  Fangkai Yang and
                  Ilaria Gori and
                  Maxwell Svetlik and
                  Priyanka Khante and
                  Vladimir Lifschitz and
                  J. K. Aggarwal and
                  Raymond J. Mooney and
                  Peter Stone},
  title        = {{BWIBots}: {A} platform for bridging the gap between {AI} and human-robot
                  interaction research},
  journal      = {Int. J. Robotics Res.},
  volume       = {36},
  number       = {5-7},
  pages        = {635--659},
  year         = {2017},
  url          = {https://doi.org/10.1177/0278364916688949},
  doi          = {10.1177/0278364916688949},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijrr/KhandelwalZSLTY17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnn/HausknechtLMS17,
  author    = {Matthew J. Hausknecht and Wen{-}Ke Li and Michael D. Mauk and Peter Stone},
  title     = {Machine Learning Capabilities of a Simulated Cerebellum},
  journal   = {{IEEE} Trans. Neural Networks Learn. Syst.},
  volume    = {28},
  number    = {3},
  pages     = {510--522},
  year      = {2017},
  url       = {https://doi.org/10.1109/TNNLS.2015.2512838},
  doi       = {10.1109/TNNLS.2015.2512838},
  timestamp = {Mon, 09 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/tnn/HausknechtLMS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/AlbertCS17,
  author    = {Michael Albert and Vincent Conitzer and Peter Stone},
  editor    = {Satinder Singh and Shaul Markovitch},
  title     = {Automated Design of Robust Mechanisms},
  booktitle = {Proceedings of the Thirty-First {AAAI} Conference on Artificial
               Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages     = {298--304},
  publisher = {{AAAI} Press},
  year      = {2017},
  url       = {https://doi.org/10.1609/aaai.v31i1.10574},
  doi       = {10.1609/AAAI.V31I1.10574},
  timestamp = {Mon, 04 Sep 2023 14:40:32 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/AlbertCS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SvetlikLSSWS17,
  author    = {Maxwell Svetlik and Matteo Leonetti and Jivko Sinapov and
               Rishi Shah and Nick Walker and Peter Stone},
  editor    = {Satinder Singh and Shaul Markovitch},
  title     = {Automatic Curriculum Graph Generation for Reinforcement Learning Agents},
  booktitle = {Proceedings of the Thirty-First {AAAI} Conference on Artificial
               Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages     = {2590--2596},
  publisher = {{AAAI} Press},
  year      = {2017},
  url       = {https://doi.org/10.1609/aaai.v31i1.10933},
  doi       = {10.1609/AAAI.V31I1.10933},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/SvetlikLSSWS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/HannaS17,
  author    = {Josiah P. Hanna and Peter Stone},
  editor    = {Satinder Singh and Shaul Markovitch},
  title     = {Grounded Action Transformation for Robot Learning in Simulation},
  booktitle = {Proceedings of the Thirty-First {AAAI} Conference on Artificial
               Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages     = {3834--3840},
  publisher = {{AAAI} Press},
  year      = {2017},
  url       = {https://doi.org/10.1609/aaai.v31i1.11044},
  doi       = {10.1609/AAAI.V31I1.11044},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/HannaS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The acronym "(PO)MDPs" is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/aaai/ZhangKS17,
  author       = {Shiqi Zhang and
                  Piyush Khandelwal and
                  Peter Stone},
  editor       = {Satinder Singh and
                  Shaul Markovitch},
  title        = {Dynamically Constructed {(PO)MDPs} for Adaptive Robot Planning},
  booktitle    = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
                  February 4-9, 2017, San Francisco, California, {USA}},
  pages        = {3855--3863},
  publisher    = {{AAAI} Press},
  year         = {2017},
  url          = {https://doi.org/10.1609/aaai.v31i1.11042},
  doi          = {10.1609/AAAI.V31I1.11042},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/ZhangKS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Monte Carlo" is brace-protected in the title so that sentence-casing
% bibliography styles keep the proper noun capitalized.
% NOTE(review): the DOI suffix 19100 is far outside the 10xxx-11xxx range of the
% sibling v31i1 entries in this file; verify the issue number with the publisher.
@inproceedings{DBLP:conf/aaai/LiebmanKSS17,
  author       = {Elad Liebman and
                  Piyush Khandelwal and
                  Maytal Saar{-}Tsechansky and
                  Peter Stone},
  editor       = {Satinder Singh and
                  Shaul Markovitch},
  title        = {Designing Better Playlists with {Monte Carlo} Tree Search},
  booktitle    = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
                  February 4-9, 2017, San Francisco, California, {USA}},
  pages        = {4715--4720},
  publisher    = {{AAAI} Press},
  year         = {2017},
  url          = {https://doi.org/10.1609/aaai.v31i1.19100},
  doi          = {10.1609/AAAI.V31I1.19100},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LiebmanKSS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/HannaS17a,
  author    = {Josiah P. Hanna and Peter Stone},
  editor    = {Satinder Singh and Shaul Markovitch},
  title     = {Grounded Action Transformation for Robot Learning in Simulation},
  booktitle = {Proceedings of the Thirty-First {AAAI} Conference on Artificial
               Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages     = {4931--4932},
  publisher = {{AAAI} Press},
  year      = {2017},
  url       = {https://doi.org/10.1609/aaai.v31i1.11124},
  doi       = {10.1609/AAAI.V31I1.11124},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/HannaS17a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/HannaSN17,
  author    = {Josiah P. Hanna and Peter Stone and Scott Niekum},
  editor    = {Satinder Singh and Shaul Markovitch},
  title     = {Bootstrapping with Models: Confidence Intervals for Off-Policy Evaluation},
  booktitle = {Proceedings of the Thirty-First {AAAI} Conference on Artificial
               Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages     = {4933--4934},
  publisher = {{AAAI} Press},
  year      = {2017},
  url       = {https://doi.org/10.1609/aaai.v31i1.11123},
  doi       = {10.1609/AAAI.V31I1.11123},
  timestamp = {Sat, 21 Oct 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/HannaSN17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/AlbertCS17,
  author    = {Michael Albert and Vincent Conitzer and Peter Stone},
  editor    = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title     = {Mechanism Design with Unknown Correlated Distributions:
               Can We Learn Optimal Mechanisms?},
  booktitle = {Proceedings of the 16th Conference on Autonomous Agents and
               MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages     = {69--77},
  publisher = {{ACM}},
  year      = {2017},
  url       = {http://dl.acm.org/citation.cfm?id=3091141},
  timestamp = {Wed, 27 Sep 2017 07:24:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/AlbertCS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/SharonS17,
  author    = {Guni Sharon and Peter Stone},
  editor    = {Gita Sukthankar and Juan A. Rodr{\'{\i}}guez{-}Aguilar},
  title     = {A Protocol for Mixed Autonomous and Human-Operated Vehicles at Intersections},
  booktitle = {Autonomous Agents and Multiagent Systems - {AAMAS} 2017 Workshops, Best Papers,
               S{\~{a}}o Paulo, Brazil, May 8-12, 2017, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {10642},
  pages     = {151--167},
  publisher = {Springer},
  year      = {2017},
  url       = {https://doi.org/10.1007/978-3-319-71682-4\_10},
  doi       = {10.1007/978-3-319-71682-4\_10},
  timestamp = {Mon, 05 Feb 2024 20:34:11 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/SharonS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MacAlpineS17,
  author    = {Patrick MacAlpine and Peter Stone},
  editor    = {Gita Sukthankar and Juan A. Rodr{\'{\i}}guez{-}Aguilar},
  title     = {Evaluating Ad Hoc Teamwork Performance in Drop-In Player Challenges},
  booktitle = {Autonomous Agents and Multiagent Systems - {AAMAS} 2017 Workshops, Best Papers,
               S{\~{a}}o Paulo, Brazil, May 8-12, 2017, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {10642},
  pages     = {168--186},
  publisher = {Springer},
  year      = {2017},
  url       = {https://doi.org/10.1007/978-3-319-71682-4\_11},
  doi       = {10.1007/978-3-319-71682-4\_11},
  timestamp = {Thu, 30 Nov 2017 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/MacAlpineS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/ZhangJSS17,
  author    = {Shiqi Zhang and Yuqian Jiang and Guni Sharon and Peter Stone},
  editor    = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title     = {Multirobot Symbolic Planning under Temporal Uncertainty},
  booktitle = {Proceedings of the 16th Conference on Autonomous Agents and
               MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages     = {501--510},
  publisher = {{ACM}},
  year      = {2017},
  url       = {http://dl.acm.org/citation.cfm?id=3091199},
  timestamp = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/ZhangJSS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "RoboCup" is brace-protected in the title so that sentence-casing
% bibliography styles keep its internal capital.
@inproceedings{DBLP:conf/atal/GenterLS17,
  author       = {Katie Genter and
                  Tim Laue and
                  Peter Stone},
  editor       = {Kate Larson and
                  Michael Winikoff and
                  Sanmay Das and
                  Edmund H. Durfee},
  title        = {Three Years of the {RoboCup} Standard Platform League Drop-In Player
                  Competition: Creating and Maintaining a Large Scale Ad Hoc Teamwork
                  Robotics Competition},
  booktitle    = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent
                  Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages        = {520--521},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {http://dl.acm.org/citation.cfm?id=3091201},
  timestamp    = {Thu, 14 Dec 2017 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/GenterLS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/HannaSN17,
  author    = {Josiah P. Hanna and Peter Stone and Scott Niekum},
  editor    = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title     = {Bootstrapping with Models: Confidence Intervals for Off-Policy Evaluation},
  booktitle = {Proceedings of the 16th Conference on Autonomous Agents and
               MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages     = {538--546},
  publisher = {{ACM}},
  year      = {2017},
  url       = {http://dl.acm.org/citation.cfm?id=3091205},
  timestamp = {Thu, 11 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/HannaSN17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/AlbrechtS17,
  author    = {Stefano V. Albrecht and Peter Stone},
  editor    = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title     = {Reasoning about Hypothetical Agent Behaviours and their Parameters},
  booktitle = {Proceedings of the 16th Conference on Autonomous Agents and
               MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages     = {547--555},
  publisher = {{ACM}},
  year      = {2017},
  url       = {http://dl.acm.org/citation.cfm?id=3091206},
  timestamp = {Thu, 11 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/AlbrechtS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/KhandelwalS17,
  author    = {Piyush Khandelwal and Peter Stone},
  editor    = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title     = {Multi-Robot Human Guidance: Human Experiments and Multiple Concurrent Requests},
  booktitle = {Proceedings of the 16th Conference on Autonomous Agents and
               MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages     = {1369--1377},
  publisher = {{ACM}},
  year      = {2017},
  url       = {http://dl.acm.org/citation.cfm?id=3091314},
  timestamp = {Thu, 11 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/KhandelwalS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterS17,
  author    = {Katie Genter and Peter Stone},
  editor    = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title     = {Agent Behaviors for Joining and Leaving a Flock},
  booktitle = {Proceedings of the 16th Conference on Autonomous Agents and
               MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages     = {1553--1555},
  publisher = {{ACM}},
  year      = {2017},
  url       = {http://dl.acm.org/citation.cfm?id=3091359},
  timestamp = {Thu, 11 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/GenterS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/LiebmanZS17,
  author    = {Elad Liebman and Eric Zavesky and Peter Stone},
  editor    = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title     = {Autonomous Model Management via Reinforcement Learning: Extended Abstract},
  booktitle = {Proceedings of the 16th Conference on Autonomous Agents and
               MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages     = {1601--1603},
  publisher = {{ACM}},
  year      = {2017},
  url       = {http://dl.acm.org/citation.cfm?id=3091376},
  timestamp = {Thu, 11 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/LiebmanZS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The acronyms "CoRL" and "USA" in the booktitle are brace-protected, matching
% how the other booktitles in this file protect {AAAI}, {AAMAS} and {USA}.
@inproceedings{DBLP:conf/corl/ThomasonPSHSM17,
  author       = {Jesse Thomason and
                  Aishwarya Padmakumar and
                  Jivko Sinapov and
                  Justin W. Hart and
                  Peter Stone and
                  Raymond J. Mooney},
  title        = {Opportunistic Active Learning for Grounding Natural Language Descriptions},
  booktitle    = {1st Annual Conference on Robot Learning, {CoRL} 2017, Mountain View,
                  California, {USA}, November 13-15, 2017, Proceedings},
  series       = {Proceedings of Machine Learning Research},
  volume       = {78},
  pages        = {67--76},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {http://proceedings.mlr.press/v78/thomason17a.html},
  timestamp    = {Wed, 03 Apr 2019 18:17:24 +0200},
  biburl       = {https://dblp.org/rec/conf/corl/ThomasonPSHSM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eumas/TuylsS17,
  author    = {Karl Tuyls and Peter Stone},
  editor    = {Francesco Belardinelli and Estefania Argente},
  title     = {Multiagent Learning Paradigms},
  booktitle = {Multi-Agent Systems and Agreement Technologies - 15th European
               Conference, {EUMAS} 2017, and 5th International Conference, {AT} 2017,
               {\'{E}}vry, France, December 14-15, 2017, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {10767},
  pages     = {3--21},
  publisher = {Springer},
  year      = {2017},
  url       = {https://doi.org/10.1007/978-3-030-01713-2\_1},
  doi       = {10.1007/978-3-030-01713-2\_1},
  timestamp = {Tue, 21 Mar 2023 20:59:05 +0100},
  biburl    = {https://dblp.org/rec/conf/eumas/TuylsS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The system name "CC-Log" in the title is brace-protected so that sentence-casing
% bibliography styles do not lowercase it. The booktitle acronyms "HotStorage",
% "CA" and "USA" are braced the same way {USENIX} already is.
@inproceedings{DBLP:conf/hotstorage/GonzalezCSS17,
  author       = {Santiago Gonzalez and
                  Vijay Chidambaram and
                  Jivko Sinapov and
                  Peter Stone},
  title        = {{CC-Log}: Drastically Reducing Storage Requirements for Robots Using
                  Classification and Compression},
  booktitle    = {9th {USENIX} Workshop on Hot Topics in Storage and File Systems, {HotStorage}
                  2017, Santa Clara, {CA}, {USA}, July 10-11, 2017},
  publisher    = {{USENIX} Association},
  year         = {2017},
  url          = {https://www.usenix.org/conference/hotstorage17/program/presentation/gonzalez},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/hotstorage/GonzalezCSS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/HannaTSN17,
  author    = {Josiah P. Hanna and Philip S. Thomas and Peter Stone and Scott Niekum},
  editor    = {Doina Precup and Yee Whye Teh},
  title     = {Data-Efficient Policy Evaluation Through Behavior Policy Search},
  booktitle = {Proceedings of the 34th International Conference on Machine
               Learning, {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series    = {Proceedings of Machine Learning Research},
  volume    = {70},
  pages     = {1394--1403},
  publisher = {{PMLR}},
  year      = {2017},
  url       = {http://proceedings.mlr.press/v70/hanna17a.html},
  timestamp = {Wed, 29 May 2019 08:41:45 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/HannaTSN17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/NarvekarSS17,
  author    = {Sanmit Narvekar and Jivko Sinapov and Peter Stone},
  editor    = {Carles Sierra},
  title     = {Autonomous Task Sequencing for Customized Curriculum Design
               in Reinforcement Learning},
  booktitle = {Proceedings of the Twenty-Sixth International Joint Conference on Artificial
               Intelligence, {IJCAI} 2017, Melbourne, Australia, August 19-25, 2017},
  pages     = {2536--2542},
  publisher = {ijcai.org},
  year      = {2017},
  url       = {https://doi.org/10.24963/ijcai.2017/353},
  doi       = {10.24963/IJCAI.2017/353},
  timestamp = {Tue, 20 Aug 2019 16:16:54 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/NarvekarSS17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/LuZSC17,
  author    = {Dongcai Lu and Shiqi Zhang and Peter Stone and Xiaoping Chen},
  title     = {Leveraging commonsense reasoning and multimodal perception
               for robot spoken dialog systems},
  booktitle = {2017 {IEEE/RSJ} International Conference on Intelligent Robots
               and Systems, {IROS} 2017, Vancouver, BC, Canada, September 24-28, 2017},
  pages     = {6582--6588},
  publisher = {{IEEE}},
  year      = {2017},
  url       = {https://doi.org/10.1109/IROS.2017.8206570},
  doi       = {10.1109/IROS.2017.8206570},
  timestamp = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iros/LuZSC17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "RoboCup" is brace-protected in the title so that sentence-casing
% bibliography styles keep its internal capital.
@inproceedings{DBLP:conf/robocup/MenasheKGHLNZS17,
  author       = {Jacob Menashe and
                  Josh Kelle and
                  Katie Genter and
                  Josiah Hanna and
                  Elad Liebman and
                  Sanmit Narvekar and
                  Ruohan Zhang and
                  Peter Stone},
  editor       = {Hidehisa Akiyama and
                  Oliver Obst and
                  Claude Sammut and
                  Flavio Tonidandel},
  title        = {Fast and Precise Black and White Ball Detection for {RoboCup} Soccer},
  booktitle    = {RoboCup 2017: Robot World Cup {XXI} [Nagoya, Japan, July 27-31, 2017]},
  series       = {Lecture Notes in Computer Science},
  volume       = {11175},
  pages        = {45--58},
  publisher    = {Springer},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-3-030-00308-1\_4},
  doi          = {10.1007/978-3-030-00308-1\_4},
  timestamp    = {Wed, 25 Sep 2019 18:10:19 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/MenasheKGHLNZS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineS17,
  author       = {Patrick MacAlpine and
                  Peter Stone},
  editor       = {Hidehisa Akiyama and
                  Oliver Obst and
                  Claude Sammut and
                  Flavio Tonidandel},
  title        = {{UT} {Austin} {Villa}: {RoboCup} 2017 {3D} Simulation League Competition and
                  Technical Challenges Champions},
  booktitle    = {RoboCup 2017: Robot World Cup {XXI} [Nagoya, Japan, July 27-31, 2017]},
  series       = {Lecture Notes in Computer Science},
  volume       = {11175},
  pages        = {473--485},
  publisher    = {Springer},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-3-030-00308-1\_39},
  doi          = {10.1007/978-3-030-00308-1\_39},
  timestamp    = {Wed, 12 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:reference/ml/Stone17,
  author = {Peter Stone},
  editor = {Claude Sammut and Geoffrey I. Webb},
  title = {Q-Learning},
  booktitle = {Encyclopedia of Machine Learning and Data Mining},
  pages = {1033},
  publisher = {Springer},
  year = {2017},
  url = {https://doi.org/10.1007/978-1-4899-7687-1\_689},
  doi = {10.1007/978-1-4899-7687-1\_689},
  timestamp = {Wed, 12 Jul 2017 01:00:00 +0200},
  biburl = {https://dblp.org/rec/reference/ml/Stone17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:reference/ml/Stone17a,
  author = {Peter Stone},
  editor = {Claude Sammut and Geoffrey I. Webb},
  title = {Reinforcement Learning},
  booktitle = {Encyclopedia of Machine Learning and Data Mining},
  pages = {1088--1090},
  publisher = {Springer},
  year = {2017},
  url = {https://doi.org/10.1007/978-1-4899-7687-1\_720},
  doi = {10.1007/978-1-4899-7687-1\_720},
  timestamp = {Wed, 12 Jul 2017 01:00:00 +0200},
  biburl = {https://dblp.org/rec/reference/ml/Stone17a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HannaTSN17,
  author = {Josiah P. Hanna and Philip S. Thomas and Peter Stone and Scott Niekum},
  title = {Data-Efficient Policy Evaluation Through Behavior Policy Search},
  journal = {CoRR},
  volume = {abs/1706.03469},
  year = {2017},
  url = {http://arxiv.org/abs/1706.03469},
  eprinttype = {arXiv},
  eprint = {1706.03469},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/HannaTSN17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MocanuMSNGL17,
  author = {Decebal Constantin Mocanu and Elena Mocanu and Peter Stone and Phuong H. Nguyen and Madeleine Gibescu and Antonio Liotta},
  title = {Evolutionary Training of Sparse Artificial Neural Networks: {A} Network Science Perspective},
  journal = {CoRR},
  volume = {abs/1707.04780},
  year = {2017},
  url = {http://arxiv.org/abs/1707.04780},
  eprinttype = {arXiv},
  eprint = {1707.04780},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/MocanuMSNGL17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1709-08071,
  author = {Stefano V. Albrecht and Peter Stone},
  title = {Autonomous Agents Modelling Other Agents: {A} Comprehensive Survey and Open Problems},
  journal = {CoRR},
  volume = {abs/1709.08071},
  year = {2017},
  url = {http://arxiv.org/abs/1709.08071},
  eprinttype = {arXiv},
  eprint = {1709.08071},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1709-08071.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1709-09569,
  author = {Guni Sharon and Michael Albert and Tarun Rambha and Stephen D. Boyles and Peter Stone},
  title = {Traffic Optimization For a Mixture of Self-interested and Compliant Agents},
  journal = {CoRR},
  volume = {abs/1709.09569},
  year = {2017},
  url = {http://arxiv.org/abs/1709.09569},
  eprinttype = {arXiv},
  eprint = {1709.09569},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1709-09569.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1709-10163,
  author       = {Garrett Warnell and
                  Nicholas R. Waytowich and
                  Vernon Lawhern and
                  Peter Stone},
  title        = {Deep {TAMER}: Interactive Agent Shaping in High-Dimensional State
                  Spaces},
  journal      = {CoRR},
  volume       = {abs/1709.10163},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.10163},
  eprinttype   = {arXiv},
  eprint       = {1709.10163},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-10163.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/LeonettiIS16,
  author = {Matteo Leonetti and Luca Iocchi and Peter Stone},
  title = {A synthesis of automated planning and reinforcement learning for efficient, robust decision-making},
  journal = {Artif. Intell.},
  volume = {241},
  pages = {103--130},
  year = {2016},
  url = {https://doi.org/10.1016/j.artint.2016.07.004},
  doi = {10.1016/J.ARTINT.2016.07.004},
  timestamp = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/ai/LeonettiIS16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/expert/GenterMMHLNZS16,
  author       = {Katie Genter and
                  Patrick MacAlpine and
                  Jacob Menashe and
                  Josiah Hanna and
                  Elad Liebman and
                  Sanmit Narvekar and
                  Ruohan Zhang and
                  Peter Stone},
  title        = {{UT} {Austin} {Villa}: Project-Driven Research in {AI} and Robotics},
  journal      = {{IEEE} Intell. Syst.},
  volume       = {31},
  number       = {2},
  pages        = {94--101},
  year         = {2016},
  url          = {https://doi.org/10.1109/MIS.2016.35},
  doi          = {10.1109/MIS.2016.35},
  timestamp    = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/expert/GenterMMHLNZS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/UrieliS16,
  author = {Daniel Urieli and Peter Stone},
  editor = {Dale Schuurmans and Michael P. Wellman},
  title = {Autonomous Electricity Trading Using Time-of-Use Tariffs in a Competitive Market},
  booktitle = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence, February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages = {345--352},
  publisher = {{AAAI} Press},
  year = {2016},
  url = {https://doi.org/10.1609/aaai.v30i1.10012},
  doi = {10.1609/AAAI.V30I1.10012},
  timestamp = {Mon, 04 Sep 2023 15:08:28 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/UrieliS16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/Stone16,
  author       = {Peter Stone},
  editor       = {Dale Schuurmans and
                  Michael P. Wellman},
  title        = {What's Hot at {RoboCup}},
  booktitle    = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence,
                  February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages        = {4346--4348},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {https://doi.org/10.1609/aaai.v30i1.9871},
  doi          = {10.1609/AAAI.V30I1.9871},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/Stone16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/UrieliS16a,
  author       = {Daniel Urieli and
                  Peter Stone},
  editor       = {Enrico Pontelli and
                  Alex Rogers and
                  Sylvie Thi{\'{e}}baux and
                  Tran Cao Son},
  title        = {An {MDP}-Based Winning Approach to Autonomous Power Trading: Formalization
                  and Empirical Analysis},
  booktitle    = {{AI} for Smart Grids and Smart Buildings, Papers from the 2016 {AAAI}
                  Workshop, Phoenix, Arizona, USA, February 12, 2016},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-16-04}},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {http://www.aaai.org/ocs/index.php/WS/AAAIW16/paper/view/12641},
  timestamp    = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/UrieliS16a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/Stone16,
  author = {Peter Stone},
  editor = {Catholijn M. Jonker and Stacy Marsella and John Thangarajah and Karl Tuyls},
  title = {Autonomous Learning Agents: Layered Learning and Ad Hoc Teamwork},
  booktitle = {Proceedings of the 2016 International Conference on Autonomous Agents {\&} Multiagent Systems, Singapore, May 9-13, 2016},
  pages = {2},
  publisher = {{ACM}},
  year = {2016},
  url = {http://dl.acm.org/citation.cfm?id=2936927},
  timestamp = {Fri, 20 May 2016 20:33:29 +0200},
  biburl = {https://dblp.org/rec/conf/atal/Stone16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/NarvekarSLS16,
  author = {Sanmit Narvekar and Jivko Sinapov and Matteo Leonetti and Peter Stone},
  editor = {Catholijn M. Jonker and Stacy Marsella and John Thangarajah and Karl Tuyls},
  title = {Source Task Creation for Curriculum Learning},
  booktitle = {Proceedings of the 2016 International Conference on Autonomous Agents {\&} Multiagent Systems, Singapore, May 9-13, 2016},
  pages = {566--574},
  publisher = {{ACM}},
  year = {2016},
  url = {http://dl.acm.org/citation.cfm?id=2937007},
  timestamp = {Fri, 20 May 2016 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/atal/NarvekarSLS16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterS16,
  author = {Katie Genter and Peter Stone},
  editor = {Catholijn M. Jonker and Stacy Marsella and John Thangarajah and Karl Tuyls},
  title = {Adding Influencing Agents to a Flock},
  booktitle = {Proceedings of the 2016 International Conference on Autonomous Agents {\&} Multiagent Systems, Singapore, May 9-13, 2016},
  pages = {615--623},
  publisher = {{ACM}},
  year = {2016},
  url = {http://dl.acm.org/citation.cfm?id=2937015},
  timestamp = {Fri, 20 May 2016 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/atal/GenterS16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/UrieliS16,
  author       = {Daniel Urieli and
                  Peter Stone},
  editor       = {Catholijn M. Jonker and
                  Stacy Marsella and
                  John Thangarajah and
                  Karl Tuyls},
  title        = {An {MDP}-Based Winning Approach to Autonomous Power Trading: Formalization
                  and Empirical Analysis},
  booktitle    = {Proceedings of the 2016 International Conference on Autonomous Agents
                  {\&} Multiagent Systems, Singapore, May 9-13, 2016},
  pages        = {827--835},
  publisher    = {{ACM}},
  year         = {2016},
  url          = {http://dl.acm.org/citation.cfm?id=2937045},
  timestamp    = {Fri, 20 May 2016 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/UrieliS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/MacAlpineLS16,
  author = {Patrick MacAlpine and Elad Liebman and Peter Stone},
  editor = {Tobias Friedrich and Frank Neumann and Andrew M. Sutton},
  title = {Adaptation of Surrogate Tasks for Bipedal Walk Optimization},
  booktitle = {Genetic and Evolutionary Computation Conference, {GECCO} 2016, Denver, CO, USA, July 20-24, 2016, Companion Material Proceedings},
  pages = {1275--1276},
  publisher = {{ACM}},
  year = {2016},
  url = {https://doi.org/10.1145/2908961.2931712},
  doi = {10.1145/2908961.2931712},
  timestamp = {Tue, 06 Nov 2018 11:06:40 +0100},
  biburl = {https://dblp.org/rec/conf/gecco/MacAlpineLS16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/humanoids/KimJSS16,
  author = {Donghyun Kim and Steven Jens Jorgensen and Peter Stone and Luis Sentis},
  title = {Dynamic behaviors on the {NAO} robot with closed-loop whole body operational space control},
  booktitle = {16th {IEEE-RAS} International Conference on Humanoid Robots, Humanoids 2016, Cancun, Mexico, November 15-17, 2016},
  pages = {1121--1128},
  publisher = {{IEEE}},
  year = {2016},
  url = {https://doi.org/10.1109/HUMANOIDS.2016.7803411},
  doi = {10.1109/HUMANOIDS.2016.7803411},
  timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
  biburl = {https://dblp.org/rec/conf/humanoids/KimJSS16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/KhandelwalLNS16,
  author       = {Piyush Khandelwal and
                  Elad Liebman and
                  Scott Niekum and
                  Peter Stone},
  editor       = {Maria{-}Florina Balcan and
                  Kilian Q. Weinberger},
  title        = {On the Analysis of Complex Backup Strategies in {Monte} {Carlo} Tree Search},
  booktitle    = {Proceedings of the 33rd International Conference on Machine Learning,
                  {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {48},
  pages        = {1319--1328},
  publisher    = {JMLR.org},
  year         = {2016},
  url          = {http://proceedings.mlr.press/v48/khandelwal16.html},
  timestamp    = {Wed, 29 May 2019 08:41:46 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KhandelwalLNS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/SharonHRASB16,
  author = {Guni Sharon and Josiah Hanna and Tarun Rambha and Michael Albert and Peter Stone and Stephen D. Boyles},
  editor = {Ana L{\'{u}}cia C. Bazzan and Franziska Kl{\"{u}}gl and Sascha Ossowski and Giuseppe Vizzari},
  title = {Delta-Tolling: Adaptive Tolling for Optimizing Traffic Throughput},
  booktitle = {Proceedings of the Ninth International Workshop on Agents in Traffic and Transportation {(ATT} 2016) co-located with the 25th International Joint Conference On Artificial Intelligence {(IJCAI} 2016), New York, USA, July 10, 2016},
  series = {{CEUR} Workshop Proceedings},
  volume = {1678},
  publisher = {CEUR-WS.org},
  year = {2016},
  url = {https://ceur-ws.org/Vol-1678/paper1.pdf},
  timestamp = {Fri, 10 Mar 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/ijcai/SharonHRASB16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/SinapovKSS16,
  author = {Jivko Sinapov and Priyanka Khante and Maxwell Svetlik and Peter Stone},
  editor = {Subbarao Kambhampati},
  title = {Learning to Order Objects Using Haptic and Proprioceptive Exploratory Behaviors},
  booktitle = {Proceedings of the Twenty-Fifth International Joint Conference on Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July 2016},
  pages = {3462--3468},
  publisher = {{IJCAI/AAAI} Press},
  year = {2016},
  url = {http://www.ijcai.org/Abstract/16/489},
  timestamp = {Tue, 20 Aug 2019 16:19:00 +0200},
  biburl = {https://dblp.org/rec/conf/ijcai/SinapovKSS16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/ThomasonSSSM16,
  author       = {Jesse Thomason and
                  Jivko Sinapov and
                  Maxwell Svetlik and
                  Peter Stone and
                  Raymond J. Mooney},
  editor       = {Subbarao Kambhampati},
  title        = {Learning Multi-Modal Grounded Linguistic Semantics by Playing
                  {``I Spy''}},
  booktitle    = {Proceedings of the Twenty-Fifth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July
                  2016},
  pages        = {3477--3483},
  publisher    = {{IJCAI/AAAI} Press},
  year         = {2016},
  url          = {http://www.ijcai.org/Abstract/16/491},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/ThomasonSSSM16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/ZhangLCS16,
  author = {Shiqi Zhang and Dongcai Lu and Xiaoping Chen and Peter Stone},
  editor = {Subbarao Kambhampati},
  title = {Robot Scavenger Hunt: {A} Standardized Framework for Evaluating Intelligent Mobile Robots},
  booktitle = {Proceedings of the Twenty-Fifth International Joint Conference on Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July 2016},
  pages = {4276--4277},
  publisher = {{IJCAI/AAAI} Press},
  year = {2016},
  url = {http://www.ijcai.org/Abstract/16/658},
  timestamp = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/ijcai/ZhangLCS16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/LiebmanSW16,
  author = {Elad Liebman and Peter Stone and Corey N. White},
  editor = {Michael I. Mandel and Johanna Devaney and Douglas Turnbull and George Tzanetakis},
  title = {Impact of Music on Decision Making in Quantitative Tasks},
  booktitle = {Proceedings of the 17th International Society for Music Information Retrieval Conference, {ISMIR} 2016, New York City, United States, August 7-11, 2016},
  pages = {661--667},
  year = {2016},
  url = {https://wp.nyu.edu/ismir2016/wp-content/uploads/sites/2294/2016/07/272\_Paper.pdf},
  timestamp = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/ismir/LiebmanSW16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineS16,
  author       = {Patrick MacAlpine and
                  Peter Stone},
  editor       = {Sven Behnke and
                  Raymond Sheh and
                  Sanem Sariel and
                  Daniel D. Lee},
  title        = {{UT} {Austin} {Villa} {RoboCup} {3D} Simulation Base Code Release},
  booktitle    = {RoboCup 2016: Robot World Cup {XX} [Leipzig, Germany, June 30 - July
                  4, 2016]},
  series       = {Lecture Notes in Computer Science},
  volume       = {9776},
  pages        = {135--143},
  publisher    = {Springer},
  year         = {2016},
  url          = {https://doi.org/10.1007/978-3-319-68792-6\_11},
  doi          = {10.1007/978-3-319-68792-6\_11},
  timestamp    = {Tue, 14 May 2019 10:00:53 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineS16a,
  author = {Patrick MacAlpine and Peter Stone},
  editor = {Sven Behnke and Raymond Sheh and Sanem Sariel and Daniel D. Lee},
  title = {Prioritized Role Assignment for Marking},
  booktitle = {RoboCup 2016: Robot World Cup {XX} [Leipzig, Germany, June 30 - July 4, 2016]},
  series = {Lecture Notes in Computer Science},
  volume = {9776},
  pages = {306--318},
  publisher = {Springer},
  year = {2016},
  url = {https://doi.org/10.1007/978-3-319-68792-6\_25},
  doi = {10.1007/978-3-319-68792-6\_25},
  timestamp = {Thu, 02 Nov 2017 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/robocup/MacAlpineS16a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineS16b,
  author       = {Patrick MacAlpine and
                  Peter Stone},
  editor       = {Sven Behnke and
                  Raymond Sheh and
                  Sanem Sariel and
                  Daniel D. Lee},
  title        = {{UT} {Austin} {Villa}: {RoboCup} 2016 {3D} Simulation League Competition and
                  Technical Challenges Champions},
  booktitle    = {RoboCup 2016: Robot World Cup {XX} [Leipzig, Germany, June 30 - July
                  4, 2016]},
  series       = {Lecture Notes in Computer Science},
  volume       = {9776},
  pages        = {515--528},
  publisher    = {Springer},
  year         = {2016},
  url          = {https://doi.org/10.1007/978-3-319-68792-6\_43},
  doi          = {10.1007/978-3-319-68792-6\_43},
  timestamp    = {Thu, 02 Nov 2017 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineS16b.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/HausknechtS15a,
  author = {Matthew J. Hausknecht and Peter Stone},
  editor = {Yoshua Bengio and Yann LeCun},
  title = {Deep Reinforcement Learning in Parameterized Action Space},
  booktitle = {4th International Conference on Learning Representations, {ICLR} 2016, San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year = {2016},
  url = {http://arxiv.org/abs/1511.04143},
  timestamp = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/HausknechtS15a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HannaSN16,
  author = {Josiah P. Hanna and Peter Stone and Scott Niekum},
  title = {High Confidence Off-Policy Evaluation with Models},
  journal = {CoRR},
  volume = {abs/1606.06126},
  year = {2016},
  url = {http://arxiv.org/abs/1606.06126},
  eprinttype = {arXiv},
  eprint = {1606.06126},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/HannaSN16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MocanuVESL16,
  author = {Decebal Constantin Mocanu and Maria Torres Vega and Eric Eaton and Peter Stone and Antonio Liotta},
  title = {Online Contrastive Divergence with Generative Replay: Experience Replay without Storing Data},
  journal = {CoRR},
  volume = {abs/1610.05555},
  year = {2016},
  url = {http://arxiv.org/abs/1610.05555},
  eprinttype = {arXiv},
  eprint = {1610.05555},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/MocanuVESL16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aai/LiebmanCS15,
  author = {Elad Liebman and Benny Chor and Peter Stone},
  title = {Representative Selection in Nonmetric Datasets},
  journal = {Appl. Artif. Intell.},
  volume = {29},
  number = {8},
  pages = {807--838},
  year = {2015},
  url = {https://doi.org/10.1080/08839514.2015.1071092},
  doi = {10.1080/08839514.2015.1071092},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/aai/LiebmanCS15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/KnoxS15,
  author = {W. Bradley Knox and Peter Stone},
  title = {Framing reinforcement learning from human reward: Reward positivity, temporal discounting, episodicity, and performance},
  journal = {Artif. Intell.},
  volume = {225},
  pages = {24--50},
  year = {2015},
  url = {https://doi.org/10.1016/j.artint.2015.03.009},
  doi = {10.1016/J.ARTINT.2015.03.009},
  timestamp = {Sat, 27 May 2017 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/ai/KnoxS15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aimatters/EatonDGGIKLRRSW15,
  author       = {Eric Eaton and
                  Tom Dietterich and
                  Maria L. Gini and
                  Barbara J. Grosz and
                  Isbell, Jr., Charles L. and
                  Subbarao Kambhampati and
                  Michael L. Littman and
                  Francesca Rossi and
                  Stuart Russell and
                  Peter Stone and
                  Toby Walsh and
                  Michael J. Wooldridge},
  title        = {Who speaks for {AI}?},
  journal      = {{AI} Matters},
  volume       = {2},
  number       = {2},
  pages        = {4--14},
  year         = {2015},
  url          = {https://doi.org/10.1145/2847557.2847559},
  doi          = {10.1145/2847557.2847559},
  timestamp    = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/aimatters/EatonDGGIKLRRSW15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cea/HigginsMLPS15,
  author       = {Andrew J. Higgins and
                  Stephen McFallan and
                  Luis Laredo and
                  Di Prestwidge and
                  Peter Stone},
  title        = {{TRANSIT} - {A} model for simulating infrastructure and policy interventions
                  in agriculture logistics: Application to the northern {Australia} beef
                  industry},
  journal      = {Comput. Electron. Agric.},
  volume       = {114},
  pages        = {32--42},
  year         = {2015},
  url          = {https://doi.org/10.1016/j.compag.2015.03.018},
  doi          = {10.1016/J.COMPAG.2015.03.018},
  timestamp    = {Mon, 03 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/cea/HigginsMLPS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/ZhangS15,
  author       = {Shiqi Zhang and
                  Peter Stone},
  editor       = {Blai Bonet and
                  Sven Koenig},
  title        = {{CORPP}: Commonsense Reasoning and Probabilistic Planning, as Applied
                  to Dialog with a Mobile Robot},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {1394--1400},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9385},
  doi          = {10.1609/AAAI.V29I1.9385},
  timestamp    = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/ZhangS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/BarrettS15,
  author = {Samuel Barrett and Peter Stone},
  editor = {Blai Bonet and Sven Koenig},
  title = {Cooperating with Unknown Teammates in Complex Domains: {A} Robot Soccer Case Study of Ad Hoc Teamwork},
  booktitle = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence, January 25-30, 2015, Austin, Texas, {USA}},
  pages = {2010--2016},
  publisher = {{AAAI} Press},
  year = {2015},
  url = {https://doi.org/10.1609/aaai.v29i1.9428},
  doi = {10.1609/AAAI.V29I1.9428},
  timestamp = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/BarrettS15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/MacAlpinePS15,
  author       = {Patrick MacAlpine and
                  Eric Price and
                  Peter Stone},
  editor       = {Blai Bonet and
                  Sven Koenig},
  title        = {{SCRAM}: Scalable Collision-avoiding Role Assignment with Minimal-Makespan
                  for Formational Positioning},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {2096--2102},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9424},
  doi          = {10.1609/AAAI.V29I1.9424},
  timestamp    = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/MacAlpinePS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/MacAlpineDS15,
  author       = {Patrick MacAlpine and
                  Mike Depinet and
                  Peter Stone},
  editor       = {Blai Bonet and
                  Sven Koenig},
  title        = {{UT} {Austin} {Villa} 2014: {RoboCup} {3D} Simulation League Champion via
                  Overlapping Layered Learning},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {2842--2848},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9540},
  doi          = {10.1609/AAAI.V29I1.9540},
  timestamp    = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/MacAlpineDS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/GenterS15,
  author       = {Genter, Katie and
                  Stone, Peter},
  editor       = {Bonet, Blai and
                  Koenig, Sven},
  title        = {Placing Influencing Agents in a Flock},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {4160--4161},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9743},
  doi          = {10.1609/AAAI.V29I1.9743},
  timestamp    = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/GenterS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/HausknechtS15,
  author       = {Matthew J. Hausknecht and
                  Peter Stone},
  editor       = {Michael Bowling and
                  Marc G. Bellemare and
                  Erik Talvitie and
                  Joel Veness and
                  Marlos C. Machado},
  title        = {The Impact of Determinism on Learning {Atari} 2600 Games},
  booktitle    = {Learning for General Competency in Video Games, Papers from the 2015
                  {AAAI} Workshop, Austin, Texas, USA, January 26, 2015},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-15-10}},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://aaai.org/ocs/index.php/WS/AAAIW15/paper/view/9564},
  timestamp    = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/HausknechtS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaifs/HausknechtS15,
  author       = {Matthew J. Hausknecht and
                  Peter Stone},
  title        = {Deep Recurrent {Q}-Learning for Partially Observable {MDPs}},
  booktitle    = {2015 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 12-14,
                  2015},
  pages        = {29--37},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://www.aaai.org/ocs/index.php/FSS/FSS15/paper/view/11673},
  timestamp    = {Wed, 14 Nov 2018 16:20:12 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaifs/HausknechtS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaifs/UrieliS15,
  author       = {Urieli, Daniel and
                  Stone, Peter},
  title        = {Autonomous Electricity Trading Using Time-Of-Use Tariffs in a Competitive
                  Market},
  booktitle    = {2015 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 12-14,
                  2015},
  pages        = {91--92},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://www.aaai.org/ocs/index.php/FSS/FSS15/paper/view/11715},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaifs/UrieliS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/ZhangS15,
  author       = {Zhang, Shiqi and
                  Stone, Peter},
  title        = {{CORPP:} Commonsense Reasoning and Probabilistic Planning, as Applied
                  to Dialog with a Mobile Robot},
  booktitle    = {2015 {AAAI} Spring Symposia, Stanford University, Palo Alto, California,
                  USA, March 22-25, 2015},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://www.aaai.org/ocs/index.php/SSS/SSS15/paper/view/10260},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaiss/ZhangS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterZS15,
  author       = {Genter, Katie and
                  Zhang, Shun and
                  Stone, Peter},
  editor       = {Weiss, Gerhard and
                  Yolum, Pinar and
                  Bordini, Rafael H. and
                  Elkind, Edith},
  title        = {Determining Placements of Influencing Agents in a Flock},
  booktitle    = {Proceedings of the 2015 International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages        = {247--255},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {http://dl.acm.org/citation.cfm?id=2772914},
  timestamp    = {Tue, 08 Mar 2022 10:12:47 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/GenterZS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/LiebmanSS15,
  author       = {Liebman, Elad and
                  Saar{-}Tsechansky, Maytal and
                  Stone, Peter},
  editor       = {Weiss, Gerhard and
                  Yolum, Pinar and
                  Bordini, Rafael H. and
                  Elkind, Edith},
  title        = {{DJ-MC:} {A} Reinforcement-Learning Agent for Music Playlist Recommendation},
  booktitle    = {Proceedings of the 2015 International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages        = {591--599},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {http://dl.acm.org/citation.cfm?id=2772954},
  timestamp    = {Fri, 15 May 2015 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/LiebmanSS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/SinapovNLS15,
  author       = {Sinapov, Jivko and
                  Narvekar, Sanmit and
                  Leonetti, Matteo and
                  Stone, Peter},
  editor       = {Weiss, Gerhard and
                  Yolum, Pinar and
                  Bordini, Rafael H. and
                  Elkind, Edith},
  title        = {Learning Inter-Task Transferability in the Absence of Target Task
                  Samples},
  booktitle    = {Proceedings of the 2015 International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages        = {725--733},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {http://dl.acm.org/citation.cfm?id=2773247},
  timestamp    = {Fri, 15 May 2015 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/SinapovNLS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MenasheS15,
  author       = {Jacob Menashe and
                  Peter Stone},
  editor       = {Gerhard Weiss and
                  Pinar Yolum and
                  Rafael H. Bordini and
                  Edith Elkind},
  title        = {{Monte Carlo} Hierarchical Model Learning},
  booktitle    = {Proceedings of the 2015 International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages        = {771--779},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {http://dl.acm.org/citation.cfm?id=2773252},
  timestamp    = {Fri, 15 May 2015 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/MenasheS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/KhandelwalBS15,
  author       = {Khandelwal, Piyush and
                  Barrett, Samuel and
                  Stone, Peter},
  editor       = {Weiss, Gerhard and
                  Yolum, Pinar and
                  Bordini, Rafael H. and
                  Elkind, Edith},
  title        = {Leading the Way: An Efficient Multi-robot Guidance System},
  booktitle    = {Proceedings of the 2015 International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages        = {1625--1633},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {http://dl.acm.org/citation.cfm?id=2773358},
  timestamp    = {Fri, 15 May 2015 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/KhandelwalBS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/FangST15,
  author       = {Fang, Fei and
                  Stone, Peter and
                  Tambe, Milind},
  editor       = {Weiss, Gerhard and
                  Yolum, Pinar and
                  Bordini, Rafael H. and
                  Elkind, Edith},
  title        = {Defender Strategies In Domains Involving Frequent Adversary Interaction},
  booktitle    = {Proceedings of the 2015 International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages        = {1663--1664},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {http://dl.acm.org/citation.cfm?id=2773374},
  timestamp    = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/FangST15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterLS15,
  author       = {Katie Genter and
                  Tim Laue and
                  Peter Stone},
  editor       = {Gerhard Weiss and
                  Pinar Yolum and
                  Rafael H. Bordini and
                  Edith Elkind},
  title        = {The {RoboCup} 2014 {SPL} Drop-in Player Competition: Encouraging Teamwork
                  without Pre-coordination},
  booktitle    = {Proceedings of the 2015 International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages        = {1745--1746},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {http://dl.acm.org/citation.cfm?id=2773415},
  timestamp    = {Thu, 14 Dec 2017 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/GenterLS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MenasheS15a,
  author       = {Jacob Menashe and
                  Peter Stone},
  editor       = {Gerhard Weiss and
                  Pinar Yolum and
                  Rafael H. Bordini and
                  Edith Elkind},
  title        = {{Monte Carlo} Hierarchical Model Learning: (Doctoral Consortium)},
  booktitle    = {Proceedings of the 2015 International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages        = {1985--1986},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {http://dl.acm.org/citation.cfm?id=2773538},
  timestamp    = {Fri, 15 May 2015 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/MenasheS15a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/ThomasonZMS15,
  author       = {Thomason, Jesse and
                  Zhang, Shiqi and
                  Mooney, Raymond J. and
                  Stone, Peter},
  editor       = {Yang, Qiang and
                  Wooldridge, Michael J.},
  title        = {Learning to Interpret Natural Language Commands through Human-Robot
                  Dialog},
  booktitle    = {Proceedings of the Twenty-Fourth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2015, Buenos Aires, Argentina, July
                  25-31, 2015},
  pages        = {1923--1929},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://ijcai.org/Abstract/15/273},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/ThomasonZMS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/FangST15,
  author       = {Fang, Fei and
                  Stone, Peter and
                  Tambe, Milind},
  editor       = {Yang, Qiang and
                  Wooldridge, Michael J.},
  title        = {When Security Games Go Green: Designing Defender Strategies to Prevent
                  Poaching and Illegal Fishing},
  booktitle    = {Proceedings of the Twenty-Fourth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2015, Buenos Aires, Argentina, July
                  25-31, 2015},
  pages        = {2589--2595},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {http://ijcai.org/Abstract/15/367},
  timestamp    = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcai/FangST15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/GenterLS15,
  author       = {Katie Genter and
                  Tim Laue and
                  Peter Stone},
  title        = {Benchmarking robot cooperation without pre-coordination in the {RoboCup}
                  {Standard Platform League} drop-in player competition},
  booktitle    = {2015 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2015, Hamburg, Germany, September 28 - October 2,
                  2015},
  pages        = {3415--3420},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/IROS.2015.7353853},
  doi          = {10.1109/IROS.2015.7353853},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/GenterLS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/LiebmanSW15,
  author       = {Liebman, Elad and
                  Stone, Peter and
                  White, Corey N.},
  editor       = {M{\"{u}}ller, Meinard and
                  Wiering, Frans},
  title        = {How Music Alters Decision Making - Impact of Music Stimuli on Emotional
                  Classification},
  booktitle    = {Proceedings of the 16th International Society for Music Information
                  Retrieval Conference, {ISMIR} 2015, M{\'{a}}laga, Spain, October
                  26-30, 2015},
  pages        = {793--799},
  year         = {2015},
  url          = {http://ismir2015.uma.es/articles/293\_Paper.pdf},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ismir/LiebmanSW15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lpnmr/ZhangYKS15,
  author       = {Shiqi Zhang and
                  Fangkai Yang and
                  Piyush Khandelwal and
                  Peter Stone},
  editor       = {Francesco Calimeri and
                  Giovambattista Ianni and
                  Miroslaw Truszczynski},
  title        = {Mobile Robot Planning Using Action Language {BC} with an Abstraction
                  Hierarchy},
  booktitle    = {Logic Programming and Nonmonotonic Reasoning - 13th International
                  Conference, {LPNMR} 2015, Lexington, KY, USA, September 27-30, 2015.
                  Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {9345},
  pages        = {502--516},
  publisher    = {Springer},
  year         = {2015},
  url          = {https://doi.org/10.1007/978-3-319-23264-5\_42},
  doi          = {10.1007/978-3-319-23264-5\_42},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/lpnmr/ZhangYKS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineHLS15,
  author       = {Patrick MacAlpine and
                  Josiah Hanna and
                  Jason Liang and
                  Peter Stone},
  editor       = {Lu{\'{\i}}s Almeida and
                  Jianmin Ji and
                  Gerald Steinbauer and
                  Sean Luke},
  title        = {{UT Austin Villa}: {RoboCup} 2015 {3D} Simulation League Competition and
                  Technical Challenges Champions},
  booktitle    = {RoboCup 2015: Robot World Cup {XIX} [papers from the 19th Annual RoboCup
                  International Symposium, Hefei, China, July 23, 2015]},
  series       = {Lecture Notes in Computer Science},
  volume       = {9513},
  pages        = {118--131},
  publisher    = {Springer},
  year         = {2015},
  url          = {https://doi.org/10.1007/978-3-319-29339-4\_10},
  doi          = {10.1007/978-3-319-29339-4\_10},
  timestamp    = {Thu, 14 Jan 2021 15:08:30 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineHLS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/LeottauRMS15,
  author       = {Leottau, David Leonardo and
                  Ruiz{-}del{-}Solar, Javier and
                  MacAlpine, Patrick and
                  Stone, Peter},
  editor       = {Almeida, Lu{\'{\i}}s and
                  Ji, Jianmin and
                  Steinbauer, Gerald and
                  Luke, Sean},
  title        = {A Study of Layered Learning Strategies Applied to Individual Behaviors
                  in Robot Soccer},
  booktitle    = {RoboCup 2015: Robot World Cup {XIX} [papers from the 19th Annual RoboCup
                  International Symposium, Hefei, China, July 23, 2015]},
  series       = {Lecture Notes in Computer Science},
  volume       = {9513},
  pages        = {290--302},
  publisher    = {Springer},
  year         = {2015},
  url          = {https://doi.org/10.1007/978-3-319-29339-4\_24},
  doi          = {10.1007/978-3-319-29339-4\_24},
  timestamp    = {Tue, 04 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/LeottauRMS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/socrob/GoriSKSA15,
  author       = {Gori, Ilaria and
                  Sinapov, Jivko and
                  Khante, Priyanka and
                  Stone, Peter and
                  Aggarwal, J. K.},
  editor       = {Tapus, Adriana and
                  Andr{\'{e}}, Elisabeth and
                  Martin, Jean{-}Claude and
                  Ferland, Fran{\c{c}}ois and
                  Ammi, Mehdi},
  title        = {Robot-Centric Activity Recognition 'in the Wild'},
  booktitle    = {Social Robotics - 7th International Conference, {ICSR} 2015, Paris,
                  France, October 26-30, 2015, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {9388},
  pages        = {224--234},
  publisher    = {Springer},
  year         = {2015},
  url          = {https://doi.org/10.1007/978-3-319-25554-5\_23},
  doi          = {10.1007/978-3-319-25554-5\_23},
  timestamp    = {Sat, 30 Sep 2023 09:57:07 +0200},
  biburl       = {https://dblp.org/rec/conf/socrob/GoriSKSA15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LiebmanCS15,
  author       = {Elad Liebman and
                  Benny Chor and
                  Peter Stone},
  title        = {Representative Selection in Non Metric Datasets},
  journal      = {CoRR},
  volume       = {abs/1502.07428},
  year         = {2015},
  url          = {http://arxiv.org/abs/1502.07428},
  eprinttype   = {arXiv},
  eprint       = {1502.07428},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LiebmanCS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HausknechtS15,
  author       = {Matthew J. Hausknecht and
                  Peter Stone},
  title        = {Deep Recurrent {Q}-Learning for Partially Observable {MDPs}},
  journal      = {CoRR},
  volume       = {abs/1507.06527},
  year         = {2015},
  url          = {http://arxiv.org/abs/1507.06527},
  eprinttype   = {arXiv},
  eprint       = {1507.06527},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HausknechtS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aamas/ChakrabortyS14,
  author       = {Chakraborty, Doran and
                  Stone, Peter},
  title        = {Multiagent learning in the presence of memory-bounded agents},
  journal      = {Auton. Agents Multi Agent Syst.},
  volume       = {28},
  number       = {2},
  pages        = {182--213},
  year         = {2014},
  url          = {https://doi.org/10.1007/s10458-013-9222-4},
  doi          = {10.1007/S10458-013-9222-4},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/aamas/ChakrabortyS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/NardiNRSSV14,
  author       = {Daniele Nardi and
                  Itsuki Noda and
                  A. Fernando Ribeiro and
                  Peter Stone and
                  Oskar von Stryk and
                  Manuela M. Veloso},
  title        = {{RoboCup} Soccer Leagues},
  journal      = {{AI} Mag.},
  volume       = {35},
  number       = {3},
  pages        = {77--85},
  year         = {2014},
  url          = {https://doi.org/10.1609/aimag.v35i3.2549},
  doi          = {10.1609/AIMAG.V35I3.2549},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/aim/NardiNRSSV14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aimatters/StoneMGB14,
  author       = {Peter Stone and
                  Patrick MacAlpine and
                  Katie Genter and
                  Samuel Barrett},
  title        = {Drop-in games at {RoboCup}},
  journal      = {{AI} Matters},
  volume       = {1},
  number       = {1},
  pages        = {20--22},
  year         = {2014},
  url          = {https://doi.org/10.1145/2639475.2655756},
  doi          = {10.1145/2639475.2655756},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/aimatters/StoneMGB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tciaig/HausknechtLMS14,
  author       = {Matthew J. Hausknecht and
                  Joel Lehman and
                  Risto Miikkulainen and
                  Peter Stone},
  title        = {A Neuroevolution Approach to General {Atari} Game Playing},
  journal      = {{IEEE} Trans. Comput. Intell. {AI} Games},
  volume       = {6},
  number       = {4},
  pages        = {355--366},
  year         = {2014},
  url          = {https://doi.org/10.1109/TCIAIG.2013.2294713},
  doi          = {10.1109/TCIAIG.2013.2294713},
  timestamp    = {Wed, 13 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tciaig/HausknechtLMS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/UrieliS14,
  author       = {Daniel Urieli and
                  Peter Stone},
  editor       = {Carla E. Brodley and
                  Peter Stone},
  title        = {{TacTex'13:} {A} Champion Adaptive Power Trading Agent},
  booktitle    = {Proceedings of the Twenty-Eighth {AAAI} Conference on Artificial Intelligence,
                  July 27-31, 2014, Qu{\'{e}}bec City, Qu{\'{e}}bec, Canada},
  pages        = {465--471},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {https://doi.org/10.1609/aaai.v28i1.8767},
  doi          = {10.1609/AAAI.V28I1.8767},
  timestamp    = {Mon, 04 Sep 2023 15:06:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/UrieliS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaifs/KhandelwalS14,
  author       = {Khandelwal, Piyush and
                  Stone, Peter},
  title        = {Leading the Way: An Efficient Multi-Robot Guidance System},
  booktitle    = {2014 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 13-15,
                  2014},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {http://www.aaai.org/ocs/index.php/FSS/FSS14/paper/view/9181},
  timestamp    = {Wed, 14 Nov 2018 17:08:03 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaifs/KhandelwalS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/KhandelwalS14,
  author       = {Khandelwal, Piyush and
                  Stone, Peter},
  title        = {Multi-Robot Human Guidance Using Topological Graphs},
  booktitle    = {2014 {AAAI} Spring Symposia, Stanford University, Palo Alto, California,
                  USA, March 24-26, 2014},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {http://www.aaai.org/ocs/index.php/SSS/SSS14/paper/view/7726},
  timestamp    = {Wed, 14 Nov 2018 14:23:12 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaiss/KhandelwalS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/YangKLS14,
  author       = {Yang, Fangkai and
                  Khandelwal, Piyush and
                  Leonetti, Matteo and
                  Stone, Peter},
  title        = {Planning in Answer Set Programming while Learning Action Costs for
                  Mobile Robots},
  booktitle    = {2014 {AAAI} Spring Symposia, Stanford University, Palo Alto, California,
                  USA, March 24-26, 2014},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {http://www.aaai.org/ocs/index.php/SSS/SSS14/paper/view/7727},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaiss/YangKLS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aips/KhandelwalYLLS14,
  author       = {Piyush Khandelwal and
                  Fangkai Yang and
                  Matteo Leonetti and
                  Vladimir Lifschitz and
                  Peter Stone},
  editor       = {Steve A. Chien and
                  Minh Binh Do and
                  Alan Fern and
                  Wheeler Ruml},
  title        = {Planning in Action Language {BC} while Learning Action Costs for Mobile
                  Robots},
  booktitle    = {Proceedings of the Twenty-Fourth International Conference on Automated
                  Planning and Scheduling, {ICAPS} 2014, Portsmouth, New Hampshire,
                  USA, June 21-26, 2014},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {http://www.aaai.org/ocs/index.php/ICAPS/ICAPS14/paper/view/7940},
  timestamp    = {Thu, 19 Nov 2015 08:52:28 +0100},
  biburl       = {https://dblp.org/rec/conf/aips/KhandelwalYLLS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/antsw/GenterS14,
  author       = {Katie Long Genter and
                  Peter Stone},
  editor       = {Marco Dorigo and
                  Mauro Birattari and
                  Simon Garnier and
                  Heiko Hamann and
                  {Montes de Oca}, Marco Antonio and
                  Christine Solnon and
                  Thomas St{\"{u}}tzle},
  title        = {Influencing a Flock via Ad Hoc Teamwork},
  booktitle    = {Swarm Intelligence - 9th International Conference, {ANTS} 2014, Brussels,
                  Belgium, September 10-12, 2014. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {8667},
  pages        = {110--121},
  publisher    = {Springer},
  year         = {2014},
  url          = {https://doi.org/10.1007/978-3-319-09952-1\_10},
  doi          = {10.1007/978-3-319-09952-1\_10},
  timestamp    = {Tue, 21 Mar 2023 20:56:33 +0100},
  biburl       = {https://dblp.org/rec/conf/antsw/GenterS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/AgmonBS14,
  author       = {Noa Agmon and
                  Samuel Barrett and
                  Peter Stone},
  editor       = {Ana L. C. Bazzan and
                  Michael N. Huhns and
                  Alessio Lomuscio and
                  Paul Scerri},
  title        = {Modeling uncertainty in leading ad hoc teams},
  booktitle    = {International Conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages        = {397--404},
  publisher    = {{IFAAMAS/ACM}},
  year         = {2014},
  url          = {http://dl.acm.org/citation.cfm?id=2615797},
  timestamp    = {Thu, 25 Sep 2014 07:46:15 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/AgmonBS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/BarrettAHKS14,
  author       = {Samuel Barrett and
                  Noa Agmon and
                  Noam Hazon and
                  Sarit Kraus and
                  Peter Stone},
  editor       = {Ana L. C. Bazzan and
                  Michael N. Huhns and
                  Alessio Lomuscio and
                  Paul Scerri},
  title        = {Communicating with unknown teammates},
  booktitle    = {International Conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages        = {1433--1434},
  publisher    = {{IFAAMAS/ACM}},
  year         = {2014},
  url          = {http://dl.acm.org/citation.cfm?id=2617509},
  timestamp    = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/BarrettAHKS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/UrieliS14,
  author       = {Daniel Urieli and
                  Peter Stone},
  editor       = {Ana L. C. Bazzan and
                  Michael N. Huhns and
                  Alessio Lomuscio and
                  Paul Scerri},
  title        = {{TacTex'13:} a champion adaptive power trading agent},
  booktitle    = {International Conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages        = {1447--1448},
  publisher    = {{IFAAMAS/ACM}},
  year         = {2014},
  url          = {http://dl.acm.org/citation.cfm?id=2617516},
  timestamp    = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/UrieliS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/AuZS14,
  author       = {Tsz{-}Chiu Au and
                  Shun Zhang and
                  Peter Stone},
  editor       = {Ana L. C. Bazzan and
                  Michael N. Huhns and
                  Alessio Lomuscio and
                  Paul Scerri},
  title        = {Semi-autonomous intersection management},
  booktitle    = {International Conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages        = {1451--1452},
  publisher    = {{IFAAMAS/ACM}},
  year         = {2014},
  url          = {http://dl.acm.org/citation.cfm?id=2617518},
  timestamp    = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/AuZS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MacAlpineGBS14,
  author       = {Patrick MacAlpine and
                  Katie Long Genter and
                  Samuel Barrett and
                  Peter Stone},
  editor       = {Ana L. C. Bazzan and
                  Michael N. Huhns and
                  Alessio Lomuscio and
                  Paul Scerri},
  title        = {The {RoboCup} 2013 drop-in player challenges: a testbed for ad hoc teamwork},
  booktitle    = {International Conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages        = {1461--1462},
  publisher    = {{IFAAMAS/ACM}},
  year         = {2014},
  url          = {http://dl.acm.org/citation.cfm?id=2617523},
  timestamp    = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/MacAlpineGBS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MacAlpinePS14,
  author       = {Patrick MacAlpine and
                  Eric Price and
                  Peter Stone},
  editor       = {Ana L. C. Bazzan and
                  Michael N. Huhns and
                  Alessio Lomuscio and
                  Paul Scerri},
  title        = {{SCRAM:} scalable collision-avoiding role assignment with minimal-makespan
                  for formational positioning},
  booktitle    = {International conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages        = {1463--1464},
  publisher    = {{IFAAMAS/ACM}},
  year         = {2014},
  url          = {http://dl.acm.org/citation.cfm?id=2617524},
  timestamp    = {Tue, 26 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/MacAlpinePS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterS14,
  author       = {Katie Genter and
                  Peter Stone},
  editor       = {Ana L. C. Bazzan and
                  Michael N. Huhns and
                  Alessio Lomuscio and
                  Paul Scerri},
  title        = {Orienting a flock via ad hoc teamwork},
  booktitle    = {International conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages        = {1543--1544},
  publisher    = {{IFAAMAS/ACM}},
  year         = {2014},
  url          = {http://dl.acm.org/citation.cfm?id=2616053},
  timestamp    = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/GenterS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ecai/BarrettAHKS14,
  author       = {Samuel Barrett and
                  Noa Agmon and
                  Noam Hazon and
                  Sarit Kraus and
                  Peter Stone},
  editor       = {Torsten Schaub and
                  Gerhard Friedrich and
                  Barry O'Sullivan},
  title        = {Communicating with Unknown Teammates},
  booktitle    = {{ECAI} 2014 - 21st European Conference on Artificial Intelligence,
                  18-22 August 2014, Prague, Czech Republic - Including Prestigious
                  Applications of Intelligent Systems {(PAIS} 2014)},
  series       = {Frontiers in Artificial Intelligence and Applications},
  volume       = {263},
  pages        = {45--50},
  publisher    = {{IOS} Press},
  year         = {2014},
  url          = {https://doi.org/10.3233/978-1-61499-419-0-45},
  doi          = {10.3233/978-1-61499-419-0-45},
  timestamp    = {Mon, 19 Jun 2023 16:36:09 +0200},
  biburl       = {https://dblp.org/rec/conf/ecai/BarrettAHKS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/MacAlpineGBS14,
  author       = {Patrick MacAlpine and
                  Katie Genter and
                  Samuel Barrett and
                  Peter Stone},
  title        = {The {RoboCup} 2013 drop-in player challenges: Experiments in ad hoc
                  teamwork},
  booktitle    = {2014 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2014, Chicago, IL, USA, September 14-18, 2014},
  pages        = {382--387},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/IROS.2014.6942588},
  doi          = {10.1109/IROS.2014.6942588},
  timestamp    = {Tue, 05 Sep 2023 15:07:47 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/MacAlpineGBS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineDLS14,
  author       = {Patrick MacAlpine and
                  Mike Depinet and
                  Jason Liang and
                  Peter Stone},
  editor       = {Reinaldo A. C. Bianchi and
                  H. Levent Akin and
                  Subramanian Ramamoorthy and
                  Komei Sugiura},
  title        = {{UT} {Austin} {Villa}: {RoboCup} 2014 {3D} Simulation League Competition and
                  Technical Challenge Champions},
  booktitle    = {RoboCup 2014: Robot World Cup {XVIII} [papers from the 18th Annual
                  RoboCup International Symposium, Jo{\~{a}}o Pessoa, Brazil, July 15, 2014]},
  series       = {Lecture Notes in Computer Science},
  volume       = {8992},
  pages        = {33--46},
  publisher    = {Springer},
  year         = {2014},
  url          = {https://doi.org/10.1007/978-3-319-18615-3\_3},
  doi          = {10.1007/978-3-319-18615-3\_3},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineDLS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/DepinetMS14,
  author       = {Mike Depinet and
                  Patrick MacAlpine and
                  Peter Stone},
  editor       = {Reinaldo A. C. Bianchi and
                  H. Levent Akin and
                  Subramanian Ramamoorthy and
                  Komei Sugiura},
  title        = {Keyframe Sampling, Optimization, and Behavior Integration: Towards
                  Long-Distance Kicking in the {RoboCup} {3D} Simulation League},
  booktitle    = {RoboCup 2014: Robot World Cup {XVIII} [papers from the 18th Annual
                  RoboCup International Symposium, Jo{\~{a}}o Pessoa, Brazil, July 15, 2014]},
  series       = {Lecture Notes in Computer Science},
  volume       = {8992},
  pages        = {571--582},
  publisher    = {Springer},
  year         = {2014},
  url          = {https://doi.org/10.1007/978-3-319-18615-3\_47},
  doi          = {10.1007/978-3-319-18615-3\_47},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/DepinetMS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/aaai/2014,
  editor       = {Carla E. Brodley and
                  Peter Stone},
  title        = {Proceedings of the Twenty-Eighth {AAAI} Conference on Artificial Intelligence,
                  July 27-31, 2014, Qu{\'{e}}bec City, Qu{\'{e}}bec, Canada},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {https://ojs.aaai.org/index.php/AAAI/issue/view/305},
  isbn         = {978-1-57735-661-5},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/2014.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LiebmanS14,
  author       = {Elad Liebman and
                  Peter Stone},
  title        = {{DJ-MC:} {A} Reinforcement-Learning Agent for Music Playlist Recommendation},
  journal      = {CoRR},
  volume       = {abs/1401.1880},
  year         = {2014},
  url          = {http://arxiv.org/abs/1401.1880},
  eprinttype    = {arXiv},
  eprint       = {1401.1880},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LiebmanS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/StoneKKRA13,
  author       = {Peter Stone and
                  Gal A. Kaminka and
                  Sarit Kraus and
                  Jeffrey S. Rosenschein and
                  Noa Agmon},
  title        = {Teaching and leading an ad hoc teammate: Collaboration without pre-coordination},
  journal      = {Artif. Intell.},
  volume       = {203},
  pages        = {35--65},
  year         = {2013},
  url          = {https://doi.org/10.1016/j.artint.2013.07.003},
  doi          = {10.1016/J.ARTINT.2013.07.003},
  timestamp    = {Sat, 27 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ai/StoneKKRA13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/HesterS13,
  author       = {Todd Hester and
                  Peter Stone},
  title        = {{TEXPLORE:} real-time sample-efficient reinforcement learning for
                  robots},
  journal      = {Mach. Learn.},
  volume       = {90},
  number       = {3},
  pages        = {385--429},
  year         = {2013},
  url          = {https://doi.org/10.1007/s10994-012-5322-7},
  doi          = {10.1007/S10994-012-5322-7},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ml/HesterS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/LiHSM13,
  author       = {Wen{-}Ke Li and
                  Matthew J. Hausknecht and
                  Peter Stone and
                  Michael D. Mauk},
  title        = {Using a million cell simulation of the cerebellum: Network scaling
                  and task generality},
  journal      = {Neural Networks},
  volume       = {47},
  pages        = {95--102},
  year         = {2013},
  url          = {https://doi.org/10.1016/j.neunet.2012.11.005},
  doi          = {10.1016/J.NEUNET.2012.11.005},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nn/LiHSM13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/BarrettSKR13,
  author       = {Samuel Barrett and
                  Peter Stone and
                  Sarit Kraus and
                  Avi Rosenfeld},
  editor       = {Marie desJardins and
                  Michael L. Littman},
  title        = {Teamwork with Limited Knowledge of Teammates},
  booktitle    = {Proceedings of the Twenty-Seventh {AAAI} Conference on Artificial
                  Intelligence, July 14-18, 2013, Bellevue, Washington, {USA}},
  pages        = {102--108},
  publisher    = {{AAAI} Press},
  year         = {2013},
  url          = {https://doi.org/10.1609/aaai.v27i1.8659},
  doi          = {10.1609/AAAI.V27I1.8659},
  timestamp    = {Mon, 04 Sep 2023 15:56:33 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/BarrettSKR13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/FarchyBMS13,
  author       = {Alon Farchy and
                  Samuel Barrett and
                  Patrick MacAlpine and
                  Peter Stone},
  editor       = {Maria L. Gini and
                  Onn Shehory and
                  Takayuki Ito and
                  Catholijn M. Jonker},
  title        = {Humanoid robots learning to walk faster: from the real world to simulation
                  and back},
  booktitle    = {International conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages        = {39--46},
  publisher    = {{IFAAMAS}},
  year         = {2013},
  url          = {http://dl.acm.org/citation.cfm?id=2484930},
  timestamp    = {Thu, 09 Sep 2021 16:09:54 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/FarchyBMS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterAS13,
  author       = {Katie Long Genter and
                  Noa Agmon and
                  Peter Stone},
  editor       = {Maria L. Gini and
                  Onn Shehory and
                  Takayuki Ito and
                  Catholijn M. Jonker},
  title        = {Ad hoc teamwork for leading a flock},
  booktitle    = {International conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages        = {531--538},
  publisher    = {{IFAAMAS}},
  year         = {2013},
  url          = {http://dl.acm.org/citation.cfm?id=2485005},
  timestamp    = {Fri, 28 Jun 2013 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/GenterAS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/HesterLS13,
  author       = {Todd Hester and
                  Manuel Lopes and
                  Peter Stone},
  editor       = {Maria L. Gini and
                  Onn Shehory and
                  Takayuki Ito and
                  Catholijn M. Jonker},
  title        = {Learning exploration strategies in model-based reinforcement learning},
  booktitle    = {International conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages        = {1069--1076},
  publisher    = {{IFAAMAS}},
  year         = {2013},
  url          = {http://dl.acm.org/citation.cfm?id=2485088},
  timestamp    = {Thu, 18 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/HesterLS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/ChakrabortyS13,
  author       = {Doran Chakraborty and
                  Peter Stone},
  editor       = {Maria L. Gini and
                  Onn Shehory and
                  Takayuki Ito and
                  Catholijn M. Jonker},
  title        = {Cooperating with a markovian ad hoc teammate},
  booktitle    = {International conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages        = {1085--1092},
  publisher    = {{IFAAMAS}},
  year         = {2013},
  url          = {http://dl.acm.org/citation.cfm?id=2485091},
  timestamp    = {Fri, 28 Jun 2013 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/ChakrabortyS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/UrieliS13,
  author       = {Daniel Urieli and
                  Peter Stone},
  editor       = {Maria L. Gini and
                  Onn Shehory and
                  Takayuki Ito and
                  Catholijn M. Jonker},
  title        = {A learning agent for heat-pump thermostat control},
  booktitle    = {International conference on Autonomous Agents and Multi-Agent Systems,
                  {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages        = {1093--1100},
  publisher    = {{IFAAMAS}},
  year         = {2013},
  url          = {http://dl.acm.org/citation.cfm?id=2485092},
  timestamp    = {Fri, 28 Jun 2013 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/UrieliS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/itsc/CarlinoBS13,
  author       = {Dustin Carlino and
                  Stephen D. Boyles and
                  Peter Stone},
  title        = {Auction-based autonomous intersection management},
  booktitle    = {16th International {IEEE} Conference on Intelligent Transportation
                  Systems, {ITSC} 2013, The Hague, The Netherlands, October 6-9, 2013},
  pages        = {529--534},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ITSC.2013.6728285},
  doi          = {10.1109/ITSC.2013.6728285},
  timestamp    = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl       = {https://dblp.org/rec/conf/itsc/CarlinoBS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iui/KnoxSB13,
  author       = {W. Bradley Knox and
                  Peter Stone and
                  Cynthia Breazeal},
  editor       = {Jihie Kim and
                  Jeffrey Nichols and
                  Pedro A. Szekely},
  title        = {Teaching agents with human feedback: a demonstration of the {TAMER}
                  framework},
  booktitle    = {18th International Conference on Intelligent User Interfaces, {IUI}
                  '13, Santa Monica, CA, USA, March 19-22, 2013, Companion Volume},
  pages        = {65--66},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://doi.org/10.1145/2451176.2451201},
  doi          = {10.1145/2451176.2451201},
  timestamp    = {Sun, 26 Nov 2023 00:57:51 +0100},
  biburl       = {https://dblp.org/rec/conf/iui/KnoxSB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iui/KnoxS13,
  author       = {W. Bradley Knox and
                  Peter Stone},
  editor       = {Jihie Kim and
                  Jeffrey Nichols and
                  Pedro A. Szekely},
  title        = {Learning non-myopically from human-generated reward},
  booktitle    = {18th International Conference on Intelligent User Interfaces, {IUI}
                  2013, Santa Monica, CA, USA, March 19-22, 2013},
  pages        = {191--202},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://doi.org/10.1145/2449396.2449422},
  doi          = {10.1145/2449396.2449422},
  timestamp    = {Sun, 26 Nov 2023 00:57:51 +0100},
  biburl       = {https://dblp.org/rec/conf/iui/KnoxS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/UrieliS13,
  author       = {Daniel Urieli and
                  Peter Stone},
  editor       = {Hendrik Blockeel and
                  Kristian Kersting and
                  Siegfried Nijssen and
                  Filip Zelezn{\'{y}}},
  title        = {Model-Selection for Non-parametric Function Approximation in Continuous
                  Control Problems: {A} Case Study in a Smart Energy System},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases - European Conference,
                  {ECML} {PKDD} 2013, Prague, Czech Republic, September 23-27, 2013,
                  Proceedings, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {8188},
  pages        = {65--80},
  publisher    = {Springer},
  year         = {2013},
  url          = {https://doi.org/10.1007/978-3-642-40988-2\_5},
  doi          = {10.1007/978-3-642-40988-2\_5},
  timestamp    = {Tue, 21 Mar 2023 21:00:11 +0100},
  biburl       = {https://dblp.org/rec/conf/pkdd/UrieliS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/HesterS13,
  author       = {Todd Hester and
                  Peter Stone},
  editor       = {Sven Behnke and
                  Manuela M. Veloso and
                  Arnoud Visser and
                  Rong Xiong},
  title        = {The Open-Source {TEXPLORE} Code Release for Reinforcement Learning
                  on Robots},
  booktitle    = {RoboCup 2013: Robot World Cup {XVII} [papers from the 17th Annual
                  RoboCup International Symposium, Eindhoven, The Netherlands, July
                  1, 2013]},
  series       = {Lecture Notes in Computer Science},
  volume       = {8371},
  pages        = {536--543},
  publisher    = {Springer},
  year         = {2013},
  url          = {https://doi.org/10.1007/978-3-662-44468-9\_47},
  doi          = {10.1007/978-3-662-44468-9\_47},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/HesterS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/BarrettGHHKMS13,
  author       = {Samuel Barrett and
                  Katie Long Genter and
                  Yuchen He and
                  Todd Hester and
                  Piyush Khandelwal and
                  Jacob Menashe and
                  Peter Stone},
  editor       = {Sven Behnke and
                  Manuela M. Veloso and
                  Arnoud Visser and
                  Rong Xiong},
  title        = {The 2012 {UT} {Austin} {Villa} Code Release},
  booktitle    = {RoboCup 2013: Robot World Cup {XVII} [papers from the 17th Annual
                  RoboCup International Symposium, Eindhoven, The Netherlands, July
                  1, 2013]},
  series       = {Lecture Notes in Computer Science},
  volume       = {8371},
  pages        = {552--559},
  publisher    = {Springer},
  year         = {2013},
  url          = {https://doi.org/10.1007/978-3-662-44468-9\_49},
  doi          = {10.1007/978-3-662-44468-9\_49},
  timestamp    = {Wed, 28 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/BarrettGHHKMS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/socrob/KnoxSB13,
  author       = {W. Bradley Knox and
                  Peter Stone and
                  Cynthia Breazeal},
  editor       = {Guido Herrmann and
                  Martin J. Pearson and
                  Alexander Lenz and
                  Paul Bremner and
                  Adam Spiers and
                  Ute Leonards},
  title        = {Training a Robot via Human Feedback: {A} Case Study},
  booktitle    = {Social Robotics - 5th International Conference, {ICSR} 2013, Bristol,
                  UK, October 27-29, 2013, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {8239},
  pages        = {460--470},
  publisher    = {Springer},
  year         = {2013},
  url          = {https://doi.org/10.1007/978-3-319-02675-6\_46},
  doi          = {10.1007/978-3-319-02675-6\_46},
  timestamp    = {Thu, 14 Oct 2021 10:29:56 +0200},
  biburl       = {https://dblp.org/rec/conf/socrob/KnoxSB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/robocup/2012,
  editor       = {Xiaoping Chen and
                  Peter Stone and
                  Luis Enrique Sucar and
                  Tijn van der Zant},
  title        = {RoboCup 2012: Robot Soccer World Cup {XVI} [papers from the 16th Annual
                  RoboCup International Symposium, Mexico City, Mexico, June 18-24,
                  2012]},
  series       = {Lecture Notes in Computer Science},
  volume       = {7500},
  publisher    = {Springer},
  year         = {2013},
  url          = {https://doi.org/10.1007/978-3-642-39250-4},
  doi          = {10.1007/978-3-642-39250-4},
  isbn         = {978-3-642-39249-8},
  timestamp    = {Tue, 14 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/2012.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/SonenbergSTY12,
  author       = {Liz Sonenberg and
                  Peter Stone and
                  Kagan Tumer and
                  Pinar Yolum},
  title        = {Ten Years of {AAMAS:} Introduction to the Special Issue},
  journal      = {{AI} Mag.},
  volume       = {33},
  number       = {3},
  pages        = {11--13},
  year         = {2012},
  url          = {https://doi.org/10.1609/aimag.v33i3.2423},
  doi          = {10.1609/AIMAG.V33I3.2423},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/SonenbergSTY12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijsr/KnoxGLMS12,
  author       = {W. Bradley Knox and
                  Brian D. Glass and
                  Bradley C. Love and
                  W. Todd Maddox and
                  Peter Stone},
  title        = {How Humans Teach Agents - {A} New Experimental Perspective},
  journal      = {Int. J. Soc. Robotics},
  volume       = {4},
  number       = {4},
  pages        = {409--421},
  year         = {2012},
  url          = {https://doi.org/10.1007/s12369-012-0163-x},
  doi          = {10.1007/S12369-012-0163-X},
  timestamp    = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijsr/KnoxGLMS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/MacAlpineBS12,
  author       = {Patrick MacAlpine and
                  Francisco Barrera and
                  Peter Stone},
  editor       = {Ariel Felner and
                  Nathan R. Sturtevant and
                  Kostas E. Bekris and
                  Roni Stern},
  title        = {Positioning to Win: {A} Dynamic Role Assignment and Formation Positioning
                  System},
  booktitle    = {Multiagent Pathfinding, Papers from the 2012 {AAAI} Workshop, MAPF@AAAI
                  2012, Toronto, Ontario, Canada, July 22, 2012},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-12-10}},
  publisher    = {{AAAI} Press},
  year         = {2012},
  url          = {http://www.aaai.org/ocs/index.php/WS/AAAIW12/paper/view/5220},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/MacAlpineBS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/MacAlpineBUVS12,
  author       = {Patrick MacAlpine and
                  Samuel Barrett and
                  Daniel Urieli and
                  Victor Vu and
                  Peter Stone},
  editor       = {J{\"{o}}rg Hoffmann and
                  Bart Selman},
  title        = {Design and Optimization of an Omnidirectional Humanoid Walk: {A} Winning
                  Approach at the {RoboCup} 2011 {3D} Simulation Competition},
  booktitle    = {Proceedings of the Twenty-Sixth {AAAI} Conference on Artificial Intelligence,
                  July 22-26, 2012, Toronto, Ontario, Canada},
  pages        = {1047--1053},
  publisher    = {{AAAI} Press},
  year         = {2012},
  url          = {https://doi.org/10.1609/aaai.v26i1.8317},
  doi          = {10.1609/AAAI.V26I1.8317},
  timestamp    = {Mon, 04 Sep 2023 15:56:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/MacAlpineBUVS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/HesterS12,
  author       = {Todd Hester and
                  Peter Stone},
  title        = {{TEXPLORE:} Real-Time Sample-Efficient Reinforcement Learning for
                  Robots},
  booktitle    = {Designing Intelligent Robots, Papers from the 2012 {AAAI} Spring Symposium,
                  Palo Alto, California, USA, March 26-28, 2012},
  series       = {{AAAI} Technical Report},
  volume       = {{SS-12-02}},
  publisher    = {{AAAI}},
  year         = {2012},
  url          = {http://www.aaai.org/ocs/index.php/SSS/SSS12/paper/view/4271},
  timestamp    = {Wed, 25 Sep 2013 15:48:48 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaiss/HesterS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aamas/MacAlpineUBKBLSVS12,
  author       = {Patrick MacAlpine and
                  Daniel Urieli and
                  Samuel Barrett and
                  Shivaram Kalyanakrishnan and
                  Francisco Barrera and
                  Adrian Lopez{-}Mobilia and
                  Nicolae Stiurca and
                  Victor Vu and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Lin Padgham and
                  Vincent Conitzer and
                  Michael Winikoff},
  title        = {{UT} {Austin} {Villa} 2011: a champion agent in the {RoboCup} {3D} soccer
                  simulation competition},
  booktitle    = {International Conference on Autonomous Agents and Multiagent Systems,
                  {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages        = {129--136},
  publisher    = {{IFAAMAS}},
  year         = {2012},
  url          = {http://dl.acm.org/citation.cfm?id=2343594},
  timestamp    = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aamas/MacAlpineUBKBLSVS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aamas/AgmonS12,
  author       = {Noa Agmon and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Lin Padgham and
                  Vincent Conitzer and
                  Michael Winikoff},
  title        = {Leading ad hoc agents in joint action settings with multiple teammates},
  booktitle    = {International Conference on Autonomous Agents and Multiagent Systems,
                  {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages        = {341--348},
  publisher    = {{IFAAMAS}},
  year         = {2012},
  url          = {http://dl.acm.org/citation.cfm?id=2343625},
  timestamp    = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aamas/AgmonS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aamas/BarrettS12,
  author       = {Samuel Barrett and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Lin Padgham and
                  Vincent Conitzer and
                  Michael Winikoff},
  title        = {An analysis framework for ad hoc teamwork tasks},
  booktitle    = {International Conference on Autonomous Agents and Multiagent Systems,
                  {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages        = {357--364},
  publisher    = {{IFAAMAS}},
  year         = {2012},
  url          = {http://dl.acm.org/citation.cfm?id=2343627},
  timestamp    = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aamas/BarrettS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aamas/KnoxS12,
  author       = {W. Bradley Knox and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Lin Padgham and
                  Vincent Conitzer and
                  Michael Winikoff},
  title        = {Reinforcement learning from simultaneous human and {MDP} reward},
  booktitle    = {International Conference on Autonomous Agents and Multiagent Systems,
                  {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages        = {475--482},
  publisher    = {{IFAAMAS}},
  year         = {2012},
  url          = {http://dl.acm.org/citation.cfm?id=2343644},
  timestamp    = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aamas/KnoxS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aamas/GenterAS12,
  author       = {Katie Long Genter and
                  Noa Agmon and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Lin Padgham and
                  Vincent Conitzer and
                  Michael Winikoff},
  title        = {Role selection in ad hoc teamwork},
  booktitle    = {International Conference on Autonomous Agents and Multiagent Systems,
                  {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages        = {1251--1252},
  publisher    = {{IFAAMAS}},
  year         = {2012},
  url          = {http://dl.acm.org/citation.cfm?id=2343948},
  timestamp    = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aamas/GenterAS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/HausknechtKMS12,
  author       = {Matthew J. Hausknecht and
                  Piyush Khandelwal and
                  Risto Miikkulainen and
                  Peter Stone},
  editor       = {Terence Soule and
                  Jason H. Moore},
  title        = {{HyperNEAT-GGP:} a {hyperNEAT-based} atari general game player},
  booktitle    = {Genetic and Evolutionary Computation Conference, {GECCO} '12, Philadelphia,
                  PA, USA, July 7-11, 2012},
  pages        = {217--224},
  publisher    = {{ACM}},
  year         = {2012},
  url          = {https://doi.org/10.1145/2330163.2330195},
  doi          = {10.1145/2330163.2330195},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/gecco/HausknechtKMS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccps/FokHGASJV12,
  author       = {Fok, Chien{-}Liang and
                  Hanna, Maykel and
                  Gee, Seth and
                  Au, Tsz{-}Chiu and
                  Stone, Peter and
                  Julien, Christine and
                  Vishwanath, Sriram},
  title        = {A Platform for Evaluating Autonomous Intersection Management Policies},
  booktitle    = {2012 {IEEE/ACM} Third International Conference on Cyber-Physical Systems,
                  {ICCPS} 2012, Beijing, China, April 17-19, 2012},
  pages        = {87--96},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICCPS.2012.17},
  doi          = {10.1109/ICCPS.2012.17},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccps/FokHGASJV12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icdl-epirob/HesterS12,
  author       = {Hester, Todd and
                  Stone, Peter},
  title        = {Intrinsically motivated model learning for a developing curious agent},
  booktitle    = {2012 {IEEE} International Conference on Development and Learning and
                  Epigenetic Robotics, {ICDL-EPIROB} 2012, San Diego, CA, USA, November
                  7-9, 2012},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/DevLrn.2012.6400802},
  doi          = {10.1109/DEVLRN.2012.6400802},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icdl-epirob/HesterS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/KalyanakrishnanTAS12,
  author       = {Kalyanakrishnan, Shivaram and
                  Tewari, Ambuj and
                  Auer, Peter and
                  Stone, Peter},
  title        = {{PAC} Subset Selection in Stochastic Multi-armed Bandits},
  booktitle    = {Proceedings of the 29th International Conference on Machine Learning,
                  {ICML} 2012, Edinburgh, Scotland, UK, June 26 - July 1, 2012},
  publisher    = {icml.cc / Omnipress},
  year         = {2012},
  url          = {http://icml.cc/2012/papers/359.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KalyanakrishnanTAS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/HesterQS12,
  author       = {Hester, Todd and
                  Quinlan, Michael J. and
                  Stone, Peter},
  title        = {{RTMBA:} {A} Real-Time Model-Based Reinforcement Learning Architecture
                  for robot control},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2012, 14-18 May, 2012, St. Paul, Minnesota, {USA}},
  pages        = {85--90},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICRA.2012.6225072},
  doi          = {10.1109/ICRA.2012.6225072},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/HesterQS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/AgmonFESJV12,
  author       = {Agmon, Noa and
                  Fok, Chien{-}Liang and
                  Emaliah, Yehuda and
                  Stone, Peter and
                  Julien, Christine and
                  Vishwanath, Sriram},
  title        = {On coordination in practical multi-robot patrol},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2012, 14-18 May, 2012, St. Paul, Minnesota, {USA}},
  pages        = {650--656},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICRA.2012.6224708},
  doi          = {10.1109/ICRA.2012.6224708},
  timestamp    = {Sun, 03 Dec 2017 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icra/AgmonFESJV12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/AuQS12,
  author       = {Au, Tsz{-}Chiu and
                  Quinlan, Michael J. and
                  Stone, Peter},
  title        = {Setpoint scheduling for autonomous vehicle controllers},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2012, 14-18 May, 2012, St. Paul, Minnesota, {USA}},
  pages        = {2055--2060},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICRA.2012.6225232},
  doi          = {10.1109/ICRA.2012.6225232},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/AuQS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iros/AuFVJS12,
  author       = {Au, Tsz{-}Chiu and
                  Fok, Chien{-}Liang and
                  Vishwanath, Sriram and
                  Julien, Christine and
                  Stone, Peter},
  title        = {Evasion planning for autonomous vehicles at intersections},
  booktitle    = {2012 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2012, Vilamoura, Algarve, Portugal, October 7-12,
                  2012},
  pages        = {1541--1546},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/IROS.2012.6385936},
  doi          = {10.1109/IROS.2012.6385936},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/AuFVJS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iros/VelosoS12,
  author       = {Manuela M. Veloso and
                  Peter Stone},
  title        = {Video: {RoboCup} robot soccer history 1997--2011},
  booktitle    = {2012 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2012, Vilamoura, Algarve, Portugal, October 7-12,
                  2012},
  pages        = {5452--5453},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/IROS.2012.6386302},
  doi          = {10.1109/IROS.2012.6386302},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/VelosoS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/itsc/CarlinoDKS12,
  author       = {Carlino, Dustin and
                  Depinet, Mike and
                  Khandelwal, Piyush and
                  Stone, Peter},
  title        = {Approximately Orchestrated Routing and Transportation Analyzer: Large-scale
                  traffic simulation for autonomous vehicles},
  booktitle    = {15th International {IEEE} Conference on Intelligent Transportation
                  Systems, {ITSC} 2012, Anchorage, AK, USA, September 16-19, 2012},
  pages        = {334--339},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ITSC.2012.6338701},
  doi          = {10.1109/ITSC.2012.6338701},
  timestamp    = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl       = {https://dblp.org/rec/conf/itsc/CarlinoDKS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ro-man/KnoxS12,
  author       = {Knox, W. Bradley and
                  Stone, Peter},
  title        = {Reinforcement learning from human reward: Discounting in episodic
                  tasks},
  booktitle    = {The 21st {IEEE} International Symposium on Robot and Human Interactive
                  Communication, {IEEE} {RO-MAN} 2012, Paris, France, September 9-13,
                  2012},
  pages        = {878--885},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ROMAN.2012.6343862},
  doi          = {10.1109/ROMAN.2012.6343862},
  timestamp    = {Wed, 16 Oct 2019 14:14:50 +0200},
  biburl       = {https://dblp.org/rec/conf/ro-man/KnoxS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/robocup/BarrettGHHKMS12,
  author       = {Samuel Barrett and
                  Katie Long Genter and
                  Yuchen He and
                  Todd Hester and
                  Piyush Khandelwal and
                  Jacob Menashe and
                  Peter Stone},
  editor       = {Xiaoping Chen and
                  Peter Stone and
                  Luis Enrique Sucar and
                  Tijn van der Zant},
  title        = {{UT} {Austin} {Villa} 2012: Standard Platform League World Champions},
  booktitle    = {RoboCup 2012: Robot Soccer World Cup {XVI} [papers from the 16th Annual
                  RoboCup International Symposium, Mexico City, Mexico, June 18-24,
                  2012]},
  series       = {Lecture Notes in Computer Science},
  volume       = {7500},
  pages        = {36--47},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-39250-4\_4},
  doi          = {10.1007/978-3-642-39250-4\_4},
  timestamp    = {Wed, 28 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/BarrettGHHKMS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineCLS12,
  author       = {Patrick MacAlpine and
                  Nick Collins and
                  Adrian Lopez{-}Mobilia and
                  Peter Stone},
  editor       = {Xiaoping Chen and
                  Peter Stone and
                  Luis Enrique Sucar and
                  Tijn van der Zant},
  title        = {{UT} {Austin} {Villa}: {RoboCup} 2012 {3D} Simulation League Champion},
  booktitle    = {RoboCup 2012: Robot Soccer World Cup {XVI} [papers from the 16th Annual
                  RoboCup International Symposium, Mexico City, Mexico, June 18-24,
                  2012]},
  series       = {Lecture Notes in Computer Science},
  volume       = {7500},
  pages        = {77--88},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-39250-4\_8},
  doi          = {10.1007/978-3-642-39250-4\_8},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineCLS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineBS12,
  author       = {MacAlpine, Patrick and
                  Barrera, Francisco and
                  Stone, Peter},
  editor       = {Chen, Xiaoping and
                  Stone, Peter and
                  Sucar, Luis Enrique and
                  van der Zant, Tijn},
  title        = {Positioning to Win: {A} Dynamic Role Assignment and Formation Positioning
                  System},
  booktitle    = {RoboCup 2012: Robot Soccer World Cup {XVI} [papers from the 16th Annual
                  RoboCup International Symposium, Mexico City, Mexico, June 18-24,
                  2012]},
  series       = {Lecture Notes in Computer Science},
  volume       = {7500},
  pages        = {190--201},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-39250-4\_18},
  doi          = {10.1007/978-3-642-39250-4\_18},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/MacAlpineBS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@incollection{DBLP:books/sp/12/HesterS12,
  author       = {Hester, Todd and
                  Stone, Peter},
  editor       = {Wiering, Marco A. and
                  van Otterlo, Martijn},
  title        = {Learning and Using Models},
  booktitle    = {Reinforcement Learning},
  series       = {Adaptation, Learning, and Optimization},
  volume       = {12},
  pages        = {111--141},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-27645-3\_4},
  doi          = {10.1007/978-3-642-27645-3\_4},
  timestamp    = {Tue, 29 Dec 2020 18:14:51 +0100},
  biburl       = {https://dblp.org/rec/books/sp/12/HesterS12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1201-6583,
  author       = {Jung, Tobias and
                  Polani, Daniel and
                  Stone, Peter},
  title        = {Empowerment for Continuous Agent-Environment Systems},
  journal      = {CoRR},
  volume       = {abs/1201.6583},
  year         = {2012},
  url          = {http://arxiv.org/abs/1201.6583},
  eprinttype   = {arXiv},
  eprint       = {1201.6583},
  timestamp    = {Fri, 19 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1201-6583.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1201-6604,
  author       = {Tobias Jung and
                  Peter Stone},
  title        = {{Gaussian} Processes for Sample Efficient Reinforcement Learning with
                  {RMAX}-like Exploration},
  journal      = {CoRR},
  volume       = {abs/1201.6604},
  year         = {2012},
  url          = {http://arxiv.org/abs/1201.6604},
  eprinttype   = {arXiv},
  eprint       = {1201.6604},
  timestamp    = {Fri, 19 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1201-6604.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1201-6615,
  author       = {Tobias Jung and
                  Peter Stone},
  title        = {Feature Selection for Value Function Approximation Using {Bayesian}
                  Model Selection},
  journal      = {CoRR},
  volume       = {abs/1201.6615},
  year         = {2012},
  url          = {http://arxiv.org/abs/1201.6615},
  eprinttype   = {arXiv},
  eprint       = {1201.6615},
  timestamp    = {Fri, 19 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1201-6615.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/adb/JungPS11,
  author       = {Tobias Jung and
                  Daniel Polani and
                  Peter Stone},
  title        = {Empowerment for continuous agent--environment systems},
  journal      = {Adapt. Behav.},
  volume       = {19},
  number       = {1},
  pages        = {16--39},
  year         = {2011},
  url          = {https://doi.org/10.1177/1059712310392389},
  doi          = {10.1177/1059712310392389},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/adb/JungPS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/TaylorS11,
  author       = {Taylor, Matthew E. and
                  Stone, Peter},
  title        = {An Introduction to Intertask Transfer for Reinforcement Learning},
  journal      = {{AI} Mag.},
  volume       = {32},
  number       = {1},
  pages        = {15--34},
  year         = {2011},
  url          = {https://doi.org/10.1609/aimag.v32i1.2329},
  doi          = {10.1609/AIMAG.V32I1.2329},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/TaylorS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ml/KalyanakrishnanS11,
  author       = {Shivaram Kalyanakrishnan and
                  Peter Stone},
  title        = {Characterizing reinforcement learning methods through parameterized
                  learning problems},
  journal      = {Mach. Learn.},
  volume       = {84},
  number       = {1--2},
  pages        = {205--247},
  year         = {2011},
  url          = {https://doi.org/10.1007/s10994-011-5251-x},
  doi          = {10.1007/S10994-011-5251-X},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ml/KalyanakrishnanS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigecom/PardoeS11,
  author       = {Pardoe, David and
                  Stone, Peter},
  title        = {Designing adaptive trading agents},
  journal      = {SIGecom Exch.},
  volume       = {10},
  number       = {2},
  pages        = {37--39},
  year         = {2011},
  url          = {https://doi.org/10.1145/1998549.1998557},
  doi          = {10.1145/1998549.1998557},
  timestamp    = {Thu, 04 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/sigecom/PardoeS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/AgmonS11,
  author       = {Agmon, Noa and
                  Stone, Peter},
  title        = {Leading Multiple Ad Hoc Teammates in Joint Action Settings},
  booktitle    = {Interactive Decision Theory and Game Theory, Papers from the 2011
                  {AAAI} Workshop, San Francisco, California, USA, August 8, 2011},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-11-13}},
  publisher    = {{AAAI}},
  year         = {2011},
  url          = {http://www.aaai.org/ocs/index.php/WS/AAAIW11/paper/view/3805},
  timestamp    = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/AgmonS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/LinKABS11,
  author       = {Lin, Raz and
                  Kraus, Sarit and
                  Agmon, Noa and
                  Barrett, Samuel and
                  Stone, Peter},
  editor       = {Burgard, Wolfram and
                  Roth, Dan},
  title        = {Comparing Agents' Success against People in Security Domains},
  booktitle    = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages        = {809--814},
  publisher    = {{AAAI} Press},
  year         = {2011},
  url          = {https://doi.org/10.1609/aaai.v25i1.7940},
  doi          = {10.1609/AAAI.V25I1.7940},
  timestamp    = {Mon, 04 Sep 2023 16:05:54 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LinKABS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/AgmonUS11,
  author       = {Agmon, Noa and
                  Urieli, Daniel and
                  Stone, Peter},
  editor       = {Burgard, Wolfram and
                  Roth, Dan},
  title        = {Multiagent Patrol Generalized to Complex Environmental Conditions},
  booktitle    = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages        = {1090--1095},
  publisher    = {{AAAI} Press},
  year         = {2011},
  url          = {https://doi.org/10.1609/aaai.v25i1.7988},
  doi          = {10.1609/AAAI.V25I1.7988},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/AgmonUS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/AuSS11,
  author       = {Au, Tsz{-}Chiu and
                  Shahidi, Neda and
                  Stone, Peter},
  editor       = {Burgard, Wolfram and
                  Roth, Dan},
  title        = {Enforcing Liveness in Autonomous Traffic Management},
  booktitle    = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages        = {1317--1322},
  publisher    = {{AAAI} Press},
  year         = {2011},
  url          = {https://doi.org/10.1609/aaai.v25i1.7807},
  doi          = {10.1609/AAAI.V25I1.7807},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/AuSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/BarrettS11,
  author       = {Barrett, Samuel and
                  Stone, Peter},
  editor       = {Burgard, Wolfram and
                  Roth, Dan},
  title        = {Ad Hoc Teamwork in Variations of the Pursuit Domain},
  booktitle    = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages        = {1758--1759},
  publisher    = {{AAAI} Press},
  year         = {2011},
  url          = {https://doi.org/10.1609/aaai.v25i1.8054},
  doi          = {10.1609/AAAI.V25I1.8054},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/BarrettS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/GenterAS11,
  author       = {Genter, Katie Long and
                  Agmon, Noa and
                  Stone, Peter},
  editor       = {Burgard, Wolfram and
                  Roth, Dan},
  title        = {Role-Based Ad Hoc Teamwork},
  booktitle    = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages        = {1782--1783},
  publisher    = {{AAAI} Press},
  year         = {2011},
  url          = {https://doi.org/10.1609/aaai.v25i1.8057},
  doi          = {10.1609/AAAI.V25I1.8057},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/GenterAS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/GenterAS11a,
  author       = {Genter, Katie Long and
                  Agmon, Noa and
                  Stone, Peter},
  title        = {Role-Based Ad Hoc Teamwork},
  booktitle    = {Plan, Activity, and Intent Recognition, Papers from the 2011 {AAAI}
                  Workshop, San Francisco, California, USA, August 07, 2011},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-11-16}},
  publisher    = {{AAAI}},
  year         = {2011},
  url          = {http://www.aaai.org/ocs/index.php/WS/AAAIW11/paper/view/3967},
  timestamp    = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/GenterAS11a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaaiss/KnoxSS11,
  author       = {Knox, W. Bradley and
                  Setapen, Adam Bradley and
                  Stone, Peter},
  title        = {Reinforcement Learning with Human Feedback in Mountain Car},
  booktitle    = {Help Me Help You: Bridging the Gaps in Human-Agent Collaboration,
                  Papers from the 2011 {AAAI} Spring Symposium, Technical Report SS-11-05,
                  Stanford, California, USA, March 21-23, 2011},
  publisher    = {{AAAI}},
  year         = {2011},
  url          = {http://www.aaai.org/ocs/index.php/SSS/SSS11/paper/view/2487},
  timestamp    = {Tue, 14 Feb 2012 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaaiss/KnoxSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/admi/Stone11,
  author       = {Peter Stone},
  editor       = {Longbing Cao and
                  Ana L. C. Bazzan and
                  Andreas L. Symeonidis and
                  Vladimir Gorodetsky and
                  Gerhard Weiss and
                  Philip S. Yu},
  title        = {Intersections of the Future: Using Fully Autonomous Vehicles},
  booktitle    = {Agents and Data Mining Interaction - 7th International Workshop on
                  Agents and Data Mining Interaction, {ADMI} 2011, Taipei, Taiwan, May
                  2-6, 2011, Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {7103},
  pages        = {3},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-27609-5\_1},
  doi          = {10.1007/978-3-642-27609-5\_1},
  timestamp    = {Tue, 08 Mar 2022 10:12:50 +0100},
  biburl       = {https://dblp.org/rec/conf/admi/Stone11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/adprl/KalyanakrishnanS11,
  author       = {Kalyanakrishnan, Shivaram and
                  Stone, Peter},
  title        = {On learning with imperfect representations},
  booktitle    = {2011 {IEEE} Symposium on Adaptive Dynamic Programming And Reinforcement
                  Learning, {ADPRL} 2011, Paris, France, April 12-14, 2011},
  pages        = {17--24},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ADPRL.2011.5967379},
  doi          = {10.1109/ADPRL.2011.5967379},
  timestamp    = {Wed, 16 Oct 2019 14:14:48 +0200},
  biburl       = {https://dblp.org/rec/conf/adprl/KalyanakrishnanS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/adprl/WhitesonTTS11,
  author       = {Whiteson, Shimon and
                  Tanner, Brian and
                  Taylor, Matthew E. and
                  Stone, Peter},
  title        = {Protecting against evaluation overfitting in empirical reinforcement
                  learning},
  booktitle    = {2011 {IEEE} Symposium on Adaptive Dynamic Programming And Reinforcement
                  Learning, {ADPRL} 2011, Paris, France, April 12-14, 2011},
  pages        = {120--127},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ADPRL.2011.5967363},
  doi          = {10.1109/ADPRL.2011.5967363},
  timestamp    = {Thu, 15 Jun 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/adprl/WhitesonTTS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/ScerriKVMSTDFCDK11,
  author       = {Scerri, Paul and
                  Kannan, Balajee and
                  Velagapudi, Prasanna and
                  Macarthur, Kate and
                  Stone, Peter and
                  Taylor, Matthew E. and
                  Dolan, John and
                  Farinelli, Alessandro and
                  Chapman, Archie C. and
                  Dias, Bernadine and
                  Kantor, George},
  editor       = {Dechesne, Francien and
                  Hattori, Hiromitsu and
                  ter Mors, Adriaan and
                  Such, Jose M. and
                  Weyns, Danny and
                  Dignum, Frank},
  title        = {Flood Disaster Mitigation: {A} Real-World Challenge Problem for Multi-agent
                  Unmanned Surface Vehicles},
  booktitle    = {Advanced Agent Technology - {AAMAS} 2011 Workshops, AMPLE, AOSE, ARMS,
                  DOCM3AS, ITMAS, Taipei, Taiwan, May 2-6, 2011. Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {7068},
  pages        = {252--269},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-27216-5\_16},
  doi          = {10.1007/978-3-642-27216-5\_16},
  timestamp    = {Mon, 15 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/ScerriKVMSTDFCDK11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/BarrettSK11,
  author       = {Samuel Barrett and
                  Peter Stone and
                  Sarit Kraus},
  editor       = {Liz Sonenberg and
                  Peter Stone and
                  Kagan Tumer and
                  Pinar Yolum},
  title        = {Empirical evaluation of ad hoc teamwork in the pursuit domain},
  booktitle    = {10th International Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages        = {567--574},
  publisher    = {{IFAAMAS}},
  year         = {2011},
  url          = {http://dl.acm.org/citation.cfm?id=2031698},
  timestamp    = {Fri, 18 Nov 2011 09:09:28 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/BarrettSK11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/UrieliMKBS11,
  author       = {Daniel Urieli and
                  Patrick MacAlpine and
                  Shivaram Kalyanakrishnan and
                  Yinon Bentor and
                  Peter Stone},
  editor       = {Liz Sonenberg and
                  Peter Stone and
                  Kagan Tumer and
                  Pinar Yolum},
  title        = {On optimizing interdependent skills: a case study in simulated {3D}
                  humanoid robot soccer},
  booktitle    = {10th International Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages        = {769--776},
  publisher    = {{IFAAMAS}},
  year         = {2011},
  url          = {http://dl.acm.org/citation.cfm?id=2031727},
  timestamp    = {Fri, 18 Nov 2011 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/UrieliMKBS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/PardoeS11,
  author       = {David Pardoe and
                  Peter Stone},
  editor       = {Liz Sonenberg and
                  Peter Stone and
                  Kagan Tumer and
                  Pinar Yolum},
  title        = {A particle filter for bid estimation in ad auctions with periodic
                  ranking observations},
  booktitle    = {10th International Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages        = {887--894},
  publisher    = {{IFAAMAS}},
  year         = {2011},
  url          = {http://dl.acm.org/citation.cfm?id=2031744},
  timestamp    = {Fri, 18 Nov 2011 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/PardoeS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/AgmonUS11,
  author       = {Noa Agmon and
                  Daniel Urieli and
                  Peter Stone},
  editor       = {Liz Sonenberg and
                  Peter Stone and
                  Kagan Tumer and
                  Pinar Yolum},
  title        = {Ship patrol: multiagent patrol under complex environmental conditions},
  booktitle    = {10th International Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages        = {1103--1104},
  publisher    = {{IFAAMAS}},
  year         = {2011},
  url          = {http://dl.acm.org/citation.cfm?id=2034439},
  timestamp    = {Fri, 18 Nov 2011 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/AgmonUS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/ShahidiAS11,
  author       = {Neda Shahidi and
                  Tsz{-}Chiu Au and
                  Peter Stone},
  editor       = {Liz Sonenberg and
                  Peter Stone and
                  Kagan Tumer and
                  Pinar Yolum},
  title        = {Batch reservations in autonomous intersection management},
  booktitle    = {10th International Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages        = {1225--1226},
  publisher    = {{IFAAMAS}},
  year         = {2011},
  url          = {http://dl.acm.org/citation.cfm?id=2034498},
  timestamp    = {Fri, 18 Nov 2011 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/ShahidiAS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ewrl/Stone11,
  author       = {Peter Stone},
  editor       = {Scott Sanner and
                  Marcus Hutter},
  title        = {Invited Talk: {PRISM} - Practical {RL}: Representation, Interaction,
                  Synthesis, and Mortality},
  booktitle    = {Recent Advances in Reinforcement Learning - 9th European Workshop,
                  {EWRL} 2011, Athens, Greece, September 9-11, 2011, Revised Selected
                  Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {7188},
  pages        = {3},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-29946-9\_3},
  doi          = {10.1007/978-3-642-29946-9\_3},
  timestamp    = {Tue, 14 May 2019 10:00:48 +0200},
  biburl       = {https://dblp.org/rec/conf/ewrl/Stone11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ChakrabortyS11,
  author       = {Doran Chakraborty and
                  Peter Stone},
  editor       = {Lise Getoor and
                  Tobias Scheffer},
  title        = {Structure Learning in Ergodic Factored {MDPs} without Knowledge of the
                  Transition Function's In-Degree},
  booktitle    = {Proceedings of the 28th International Conference on Machine Learning,
                  {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011},
  pages        = {737--744},
  publisher    = {Omnipress},
  year         = {2011},
  url          = {https://icml.cc/2011/papers/418\_icmlpaper.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ChakrabortyS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/HausknechtAS11,
  author       = {Matthew J. Hausknecht and
                  Tsz{-}Chiu Au and
                  Peter Stone},
  title        = {Autonomous Intersection Management: Multi-intersection optimization},
  booktitle    = {2011 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2011, San Francisco, CA, USA, September 25-30, 2011},
  pages        = {4581--4586},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/IROS.2011.6094668},
  doi          = {10.1109/IROS.2011.6094668},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/HausknechtAS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/itsc/HausknechtASFW11,
  author       = {Matthew J. Hausknecht and
                  Tsz{-}Chiu Au and
                  Peter Stone and
                  David Fajardo and
                  S. Travis Waller},
  title        = {Dynamic lane reversal in traffic management},
  booktitle    = {14th International {IEEE} Conference on Intelligent Transportation
                  Systems, {ITSC} 2011, Washington, DC, USA, October 5-7, 2011},
  pages        = {1929--1934},
  publisher    = {{IEEE}},
  year         = {2011},
  url          = {https://doi.org/10.1109/ITSC.2011.6082932},
  doi          = {10.1109/ITSC.2011.6082932},
  timestamp    = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl       = {https://dblp.org/rec/conf/itsc/HausknechtASFW11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/BaiCMUBS11,
  author       = {Aijun Bai and
                  Xiaoping Chen and
                  Patrick MacAlpine and
                  Daniel Urieli and
                  Samuel Barrett and
                  Peter Stone},
  editor       = {Thomas R{\"{o}}fer and
                  Norbert Michael Mayer and
                  Jesus Savage and
                  Uluc Saranli},
  title        = {{WrightEagle} and {UT Austin Villa}: {RoboCup} 2011 Simulation League
                  Champions},
  booktitle    = {RoboCup 2011: Robot Soccer World Cup {XV} [papers from the 15th Annual
                  RoboCup International Symposium, Istanbul, Turkey, July 2011]},
  series       = {Lecture Notes in Computer Science},
  volume       = {7416},
  pages        = {1--12},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-32060-6\_1},
  doi          = {10.1007/978-3-642-32060-6\_1},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/BaiCMUBS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/KhandelwalS11,
  author       = {Piyush Khandelwal and
                  Peter Stone},
  editor       = {Thomas R{\"{o}}fer and
                  Norbert Michael Mayer and
                  Jesus Savage and
                  Uluc Saranli},
  title        = {A Low Cost Ground Truth Detection System for {RoboCup} Using the {Kinect}},
  booktitle    = {RoboCup 2011: Robot Soccer World Cup {XV} [papers from the 15th Annual
                  RoboCup International Symposium, Istanbul, Turkey, July 2011]},
  series       = {Lecture Notes in Computer Science},
  volume       = {7416},
  pages        = {515--527},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-32060-6\_44},
  doi          = {10.1007/978-3-642-32060-6\_44},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/KhandelwalS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/atal/2011,
  editor       = {Liz Sonenberg and
                  Peter Stone and
                  Kagan Tumer and
                  Pinar Yolum},
  title        = {10th International Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  publisher    = {{IFAAMAS}},
  year         = {2011},
  isbn         = {978-0-9826571-5-7},
  timestamp    = {Fri, 18 Nov 2011 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/2011.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1105-1749,
  author       = {Todd Hester and
                  Michael J. Quinlan and
                  Peter Stone},
  title        = {A Real-Time Model-Based Reinforcement Learning Architecture for Robot
                  Control},
  journal      = {CoRR},
  volume       = {abs/1105.1749},
  year         = {2011},
  url          = {http://arxiv.org/abs/1105.1749},
  eprinttype   = {arXiv},
  eprint       = {1105.1749},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1105-1749.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1106-0678,
  author       = {Michael J. Kearns and
                  Michael L. Littman and
                  Satinder Singh and
                  Peter Stone},
  title        = {{ATTac-2000}: An Adaptive Autonomous Bidding Agent},
  journal      = {CoRR},
  volume       = {abs/1106.0678},
  year         = {2011},
  url          = {http://arxiv.org/abs/1106.0678},
  eprinttype   = {arXiv},
  eprint       = {1106.0678},
  timestamp    = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1106-0678.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1106-5270,
  author       = {J{\'{a}}nos A. Csirik and
                  Michael L. Littman and
                  David A. McAllester and
                  Robert E. Schapire and
                  Peter Stone},
  title        = {Decision-Theoretic Bidding Based on Learned Density Models in Simultaneous,
                  Interacting Auctions},
  journal      = {CoRR},
  volume       = {abs/1106.5270},
  year         = {2011},
  url          = {http://arxiv.org/abs/1106.5270},
  eprinttype   = {arXiv},
  eprint       = {1106.5270},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1106-5270.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aamas/WhitesonTS10,
  author       = {Shimon Whiteson and
                  Matthew E. Taylor and
                  Peter Stone},
  title        = {Critical factors in the empirical performance of temporal difference
                  and evolutionary methods for reinforcement learning},
  journal      = {Auton. Agents Multi Agent Syst.},
  volume       = {21},
  number       = {1},
  pages        = {1--35},
  year         = {2010},
  url          = {https://doi.org/10.1007/s10458-009-9100-2},
  doi          = {10.1007/S10458-009-9100-2},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/aamas/WhitesonTS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijauc/WildstromSW10,
  author       = {Jonathan Wildstrom and
                  Peter Stone and
                  Emmett Witchel},
  title        = {Autonomous return on investment analysis of additional processing
                  resources},
  journal      = {Int. J. Auton. Comput.},
  volume       = {1},
  number       = {3},
  pages        = {280--296},
  year         = {2010},
  url          = {https://doi.org/10.1504/IJAC.2010.033010},
  doi          = {10.1504/IJAC.2010.033010},
  timestamp    = {Thu, 18 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijauc/WildstromSW10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/informs/PardoeSSKT10,
  author       = {David Pardoe and
                  Peter Stone and
                  Maytal Saar{-}Tsechansky and
                  Tayfun Keskin and
                  Kerem Tomak},
  title        = {Adaptive Auction Mechanism Design and the Incorporation of Prior Knowledge},
  journal      = {{INFORMS} J. Comput.},
  volume       = {22},
  number       = {3},
  pages        = {353--370},
  year         = {2010},
  url          = {https://doi.org/10.1287/ijoc.1090.0353},
  doi          = {10.1287/IJOC.1090.0353},
  timestamp    = {Sun, 15 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/informs/PardoeSSKT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/AuS10,
  author       = {Tsz{-}Chiu Au and
                  Peter Stone},
  title        = {Motion Planning Algorithms for Autonomous Intersection Management},
  booktitle    = {Bridging the Gap Between Task and Motion Planning, Papers from the
                  2010 {AAAI} Workshop, Atlanta, Georgia, USA, July 11, 2010},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-10-01}},
  publisher    = {{AAAI}},
  year         = {2010},
  url          = {http://aaai.org/ocs/index.php/WS/AAAIW10/paper/view/2053},
  timestamp    = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/AuS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/StoneKKR10,
  author       = {Peter Stone and
                  Gal A. Kaminka and
                  Sarit Kraus and
                  Jeffrey S. Rosenschein},
  editor       = {Maria Fox and
                  David Poole},
  title        = {Ad Hoc Autonomous Agent Teams: Collaboration without Pre-Coordination},
  booktitle    = {Proceedings of the Twenty-Fourth {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2010, Atlanta, Georgia, USA, July 11-15, 2010},
  pages        = {1504--1509},
  publisher    = {{AAAI} Press},
  year         = {2010},
  url          = {https://doi.org/10.1609/aaai.v24i1.7529},
  doi          = {10.1609/AAAI.V24I1.7529},
  timestamp    = {Mon, 04 Sep 2023 16:23:45 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/StoneKKR10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/KnoxS10,
  author       = {W. Bradley Knox and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Gal A. Kaminka and
                  Yves Lesp{\'{e}}rance and
                  Michael Luck and
                  Sandip Sen},
  title        = {Combining manual feedback with subsequent {MDP} reward signals for
                  reinforcement learning},
  booktitle    = {9th International Conference on Autonomous Agents and Multiagent Systems
                  {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3},
  pages        = {5--12},
  publisher    = {{IFAAMAS}},
  year         = {2010},
  url          = {https://dl.acm.org/citation.cfm?id=1838208},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/KnoxS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/StoneK10,
  author       = {Peter Stone and
                  Sarit Kraus},
  editor       = {Wiebe van der Hoek and
                  Gal A. Kaminka and
                  Yves Lesp{\'{e}}rance and
                  Michael Luck and
                  Sandip Sen},
  title        = {To teach or not to teach?: decision making under uncertainty in ad
                  hoc teams},
  booktitle    = {9th International Conference on Autonomous Agents and Multiagent Systems
                  {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3},
  pages        = {117--124},
  publisher    = {{IFAAMAS}},
  year         = {2010},
  url          = {https://dl.acm.org/citation.cfm?id=1838223},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/StoneK10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/PardoeCS10,
  author       = {David Pardoe and
                  Doran Chakraborty and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Gal A. Kaminka and
                  Yves Lesp{\'{e}}rance and
                  Michael Luck and
                  Sandip Sen},
  title        = {{TacTex09}: a champion bidding agent for ad auctions},
  booktitle    = {9th International Conference on Autonomous Agents and Multiagent Systems
                  {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3},
  pages        = {1273--1280},
  publisher    = {{IFAAMAS}},
  year         = {2010},
  url          = {https://dl.acm.org/citation.cfm?id=1838372},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/PardoeCS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/SetapenQS10,
  author       = {Adam Setapen and
                  Michael J. Quinlan and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Gal A. Kaminka and
                  Yves Lesp{\'{e}}rance and
                  Michael Luck and
                  Sandip Sen},
  title        = {{MARIOnET}: motion acquisition for robots through iterative online evaluative
                  training},
  booktitle    = {9th International Conference on Autonomous Agents and Multiagent Systems
                  {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3},
  pages        = {1435--1436},
  publisher    = {{IFAAMAS}},
  year         = {2010},
  url          = {https://dl.acm.org/citation.cfm?id=1838419},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/SetapenQS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/ChakrabortyS10,
  author       = {Doran Chakraborty and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Gal A. Kaminka and
                  Yves Lesp{\'{e}}rance and
                  Michael Luck and
                  Sandip Sen},
  title        = {Online model learning in adversarial {Markov} decision processes},
  booktitle    = {9th International Conference on Autonomous Agents and Multiagent Systems
                  {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3},
  pages        = {1583--1584},
  publisher    = {{IFAAMAS}},
  year         = {2010},
  url          = {https://dl.acm.org/citation.cfm?id=1838492},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/ChakrabortyS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/KnoxS10a,
  author       = {W. Bradley Knox and
                  Peter Stone},
  editor       = {Wiebe van der Hoek and
                  Gal A. Kaminka and
                  Yves Lesp{\'{e}}rance and
                  Michael Luck and
                  Sandip Sen},
  title        = {Training a {Tetris} agent via interactive shaping: a demonstration of
                  the {TAMER} framework},
  booktitle    = {9th International Conference on Autonomous Agents and Multiagent Systems
                  {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3},
  pages        = {1767--1768},
  publisher    = {{IFAAMAS}},
  year         = {2010},
  url          = {https://dl.acm.org/citation.cfm?id=1838541},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/KnoxS10a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdl/HesterS10,
  author       = {Todd Hester and
                  Peter Stone},
  editor       = {Benjamin Kuipers and
                  Thomas R. Shultz and
                  Alexander Stoytchev and
                  Chen Yu},
  title        = {Real time targeted exploration in large domains},
  booktitle    = {2010 {IEEE} 9th International Conference on Development and Learning,
                  {ICDL} 2010, Ann Arbor, MI, USA, August 18-21, 2010},
  pages        = {191--196},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/DEVLRN.2010.5578845},
  doi          = {10.1109/DEVLRN.2010.5578845},
  timestamp    = {Thu, 29 Jul 2021 12:02:58 +0200},
  biburl       = {https://dblp.org/rec/conf/icdl/HesterS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ChakrabortyS10,
  author       = {Doran Chakraborty and
                  Peter Stone},
  editor       = {Johannes F{\"{u}}rnkranz and
                  Thorsten Joachims},
  title        = {Convergence, Targeted Optimality, and Safety in Multiagent Learning},
  booktitle    = {Proceedings of the 27th International Conference on Machine Learning
                  (ICML-10), June 21-24, 2010, Haifa, Israel},
  pages        = {191--198},
  publisher    = {Omnipress},
  year         = {2010},
  url          = {https://icml.cc/Conferences/2010/papers/453.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ChakrabortyS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/KalyanakrishnanS10,
  author       = {Shivaram Kalyanakrishnan and
                  Peter Stone},
  editor       = {Johannes F{\"{u}}rnkranz and
                  Thorsten Joachims},
  title        = {Efficient Selection of Multiple Bandit Arms: Theory and Practice},
  booktitle    = {Proceedings of the 27th International Conference on Machine Learning
                  (ICML-10), June 21-24, 2010, Haifa, Israel},
  pages        = {511--518},
  publisher    = {Omnipress},
  year         = {2010},
  url          = {https://icml.cc/Conferences/2010/papers/410.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KalyanakrishnanS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/PardoeS10,
  author       = {David Pardoe and
                  Peter Stone},
  editor       = {Johannes F{\"{u}}rnkranz and
                  Thorsten Joachims},
  title        = {Boosting for Regression Transfer},
  booktitle    = {Proceedings of the 27th International Conference on Machine Learning
                  (ICML-10), June 21-24, 2010, Haifa, Israel},
  pages        = {863--870},
  publisher    = {Omnipress},
  year         = {2010},
  url          = {https://icml.cc/Conferences/2010/papers/330.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/PardoeS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/HesterQS10,
  author       = {Todd Hester and
                  Michael J. Quinlan and
                  Peter Stone},
  title        = {Generalized model learning for Reinforcement Learning on a humanoid
                  robot},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2010, Anchorage, Alaska, USA, 3-7 May 2010},
  pages        = {2369--2374},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ROBOT.2010.5509181},
  doi          = {10.1109/ROBOT.2010.5509181},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/HesterQS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/QuinlanAZSS10,
  author       = {Michael J. Quinlan and
                  Tsz{-}Chiu Au and
                  Jesse Zhu and
                  Nicolae Stiurca and
                  Peter Stone},
  title        = {Bringing simulation to life: {A} mixed reality autonomous intersection},
  booktitle    = {2010 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, October 18-22, 2010, Taipei, Taiwan},
  pages        = {6083--6088},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/IROS.2010.5651993},
  doi          = {10.1109/IROS.2010.5651993},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/QuinlanAZSS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/JungS10,
  author       = {Tobias Jung and
                  Peter Stone},
  editor       = {Jos{\'{e}} L. Balc{\'{a}}zar and
                  Francesco Bonchi and
                  Aristides Gionis and
                  Mich{\`{e}}le Sebag},
  title        = {Gaussian Processes for Sample Efficient Reinforcement Learning with
                  {RMAX}-Like Exploration},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases, European Conference,
                  {ECML} {PKDD} 2010, Barcelona, Spain, September 20-24, 2010, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {6321},
  pages        = {601--616},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-3-642-15880-3\_44},
  doi          = {10.1007/978-3-642-15880-3\_44},
  timestamp    = {Fri, 19 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pkdd/JungS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/HausknechtS10,
  author       = {Matthew J. Hausknecht and
                  Peter Stone},
  editor       = {Javier Ruiz{-}del{-}Solar and
                  Eric Chown and
                  Paul{-}Gerhard Pl{\"{o}}ger},
  title        = {Learning Powerful Kicks on the {Aibo} {ERS-7}: The Quest for a Striker},
  booktitle    = {RoboCup 2010: Robot Soccer World Cup {XIV} [papers from the 14th annual
                  RoboCup International Symposium, Singapore, June 25, 2010]},
  series       = {Lecture Notes in Computer Science},
  volume       = {6556},
  pages        = {254--265},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-3-642-20217-9\_22},
  doi          = {10.1007/978-3-642-20217-9\_22},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/HausknechtS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:books/daglib/p/NodaSYK10,
  author       = {Itsuki Noda and
                  Peter Stone and
                  Tomohisa Yamashita and
                  Koichi Kurumatani},
  editor       = {Hideyuki Nakashima and
                  Hamid K. Aghajan and
                  Juan Carlos Augusto},
  title        = {Multi-Agent Social Simulation},
  booktitle    = {Handbook of Ambient Intelligence and Smart Environments},
  pages        = {703--729},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-0-387-93808-0\_26},
  doi          = {10.1007/978-0-387-93808-0\_26},
  timestamp    = {Tue, 16 May 2017 14:01:34 +0200},
  biburl       = {https://dblp.org/rec/books/daglib/p/NodaSYK10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:reference/ml/Stone10,
  author       = {Peter Stone},
  editor       = {Claude Sammut and
                  Geoffrey I. Webb},
  title        = {Q-Learning},
  booktitle    = {Encyclopedia of Machine Learning},
  pages        = {819},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-0-387-30164-8\_683},
  doi          = {10.1007/978-0-387-30164-8\_683},
  timestamp    = {Wed, 14 Nov 2018 10:51:34 +0100},
  biburl       = {https://dblp.org/rec/reference/ml/Stone10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:reference/ml/Stone10a,
  author       = {Peter Stone},
  editor       = {Claude Sammut and
                  Geoffrey I. Webb},
  title        = {Reinforcement Learning},
  booktitle    = {Encyclopedia of Machine Learning},
  pages        = {849--851},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-0-387-30164-8\_714},
  doi          = {10.1007/978-0-387-30164-8\_714},
  timestamp    = {Wed, 12 Jul 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/reference/ml/Stone10a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/TaylorS09,
  author       = {Matthew E. Taylor and
                  Peter Stone},
  title        = {Transfer Learning for Reinforcement Learning Domains: {A} Survey},
  journal      = {J. Mach. Learn. Res.},
  volume       = {10},
  pages        = {1633--1685},
  year         = {2009},
  url          = {https://dl.acm.org/doi/10.5555/1577069.1755839},
  doi          = {10.5555/1577069.1755839},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/TaylorS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ras/SridharanS09,
  author       = {Mohan Sridharan and
                  Peter Stone},
  title        = {Color learning and illumination invariance on mobile robots: {A} survey},
  journal      = {Robotics Auton. Syst.},
  volume       = {57},
  number       = {6-7},
  pages        = {629--644},
  year         = {2009},
  url          = {https://doi.org/10.1016/j.robot.2009.01.004},
  doi          = {10.1016/J.ROBOT.2009.01.004},
  timestamp    = {Mon, 24 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ras/SridharanS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/FaselQS09,
  author       = {Ian R. Fasel and
                  Michael J. Quinlan and
                  Peter Stone},
  title        = {A Task Specification Language for Bootstrap Learning},
  booktitle    = {Agents that Learn from Human Teachers, Papers from the 2009 {AAAI}
                  Spring Symposium, Technical Report SS-09-01, Stanford, California,
                  USA, March 23-25, 2009},
  pages        = {48--55},
  publisher    = {{AAAI}},
  year         = {2009},
  url          = {http://www.aaai.org/Library/Symposia/Spring/2009/ss09-01-008.php},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaiss/FaselQS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/KnoxFS09,
  author       = {W. Bradley Knox and
                  Ian R. Fasel and
                  Peter Stone},
  title        = {Design Principles for Creating Human-Shapable Agents},
  booktitle    = {Agents that Learn from Human Teachers, Papers from the 2009 {AAAI}
                  Spring Symposium, Technical Report SS-09-01, Stanford, California,
                  USA, March 23-25, 2009},
  pages        = {79--86},
  publisher    = {{AAAI}},
  year         = {2009},
  url          = {http://www.aaai.org/Library/Symposia/Spring/2009/ss09-01-012.php},
  timestamp    = {Thu, 14 Apr 2016 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaiss/KnoxFS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/amec/StoneKR09,
  author       = {Peter Stone and
                  Gal A. Kaminka and
                  Jeffrey S. Rosenschein},
  editor       = {Esther David and
                  Enrico H. Gerding and
                  David Sarne and
                  Onn Shehory},
  title        = {Leading a Best-Response Teammate in an Ad Hoc Team},
  booktitle    = {Agent-Mediated Electronic Commerce. Designing Trading Strategies and
                  Mechanisms for Electronic Markets - {AAMAS} Workshop, {AMEC} 2009,
                  Budapest, Hungary, May 12, 2009, and {IJCAI} Workshop, {TADA} 2009,
                  Pasadena, CA, USA, July 13, 2009, Selected and Revised Papers},
  series       = {Lecture Notes in Business Information Processing},
  volume       = {59},
  pages        = {132--146},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-15117-0\_10},
  doi          = {10.1007/978-3-642-15117-0\_10},
  timestamp    = {Thu, 07 Jul 2022 17:31:33 +0200},
  biburl       = {https://dblp.org/rec/conf/amec/StoneKR09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/HesterS09,
  author       = {Todd Hester and
                  Peter Stone},
  editor       = {Carles Sierra and
                  Cristiano Castelfranchi and
                  Keith S. Decker and
                  Jaime Sim{\~{a}}o Sichman},
  title        = {Generalized model learning for reinforcement learning in factored
                  domains},
  booktitle    = {8th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2009), Budapest, Hungary, May 10-15, 2009, Volume
                  2},
  pages        = {717--724},
  publisher    = {{IFAAMAS}},
  year         = {2009},
  url          = {https://dl.acm.org/citation.cfm?id=1558111},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/HesterS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/KalyanakrishnanS09,
  author       = {Shivaram Kalyanakrishnan and
                  Peter Stone},
  editor       = {Carles Sierra and
                  Cristiano Castelfranchi and
                  Keith S. Decker and
                  Jaime Sim{\~{a}}o Sichman},
  title        = {An empirical analysis of value function-based and policy search reinforcement
                  learning},
  booktitle    = {8th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2009), Budapest, Hungary, May 10-15, 2009, Volume
                  2},
  pages        = {749--756},
  publisher    = {{IFAAMAS}},
  year         = {2009},
  url          = {https://dl.acm.org/citation.cfm?id=1558115},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/KalyanakrishnanS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/FaselQS09,
  author       = {Ian R. Fasel and
                  Michael J. Quinlan and
                  Peter Stone},
  editor       = {Carles Sierra and
                  Cristiano Castelfranchi and
                  Keith S. Decker and
                  Jaime Sim{\~{a}}o Sichman},
  title        = {A task specification language for bootstrap learning},
  booktitle    = {8th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2009), Budapest, Hungary, May 10-15, 2009, Volume
                  2},
  pages        = {1169--1170},
  publisher    = {{IFAAMAS}},
  year         = {2009},
  url          = {https://dl.acm.org/citation.cfm?id=1558195},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/FaselQS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/KalyanakrishnanS09a,
  author       = {Shivaram Kalyanakrishnan and
                  Peter Stone},
  editor       = {Carles Sierra and
                  Cristiano Castelfranchi and
                  Keith S. Decker and
                  Jaime Sim{\~{a}}o Sichman},
  title        = {Learning complementary multiagent behaviors: a case study},
  booktitle    = {8th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2009), Budapest, Hungary, May 10-15, 2009, Volume
                  2},
  pages        = {1359--1360},
  publisher    = {{IFAAMAS}},
  year         = {2009},
  url          = {https://dl.acm.org/citation.cfm?id=1558293},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/KalyanakrishnanS09a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/DjeuQS09,
  author       = {Peter Djeu and
                  Michael J. Quinlan and
                  Peter Stone},
  title        = {Improving particle filter performance using {SSE} instructions},
  booktitle    = {2009 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, October 11-15, 2009, St. Louis, MO, {USA}},
  pages        = {3480--3485},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/IROS.2009.5354190},
  doi          = {10.1109/IROS.2009.5354190},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/DjeuQS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/kcap/KnoxS09,
  author       = {W. Bradley Knox and
                  Peter Stone},
  editor       = {Yolanda Gil and
                  Natasha Fridman Noy},
  title        = {Interactively shaping agents via human reinforcement: the {TAMER}
                  framework},
  booktitle    = {Proceedings of the 5th International Conference on Knowledge Capture
                  {(K-CAP} 2009), September 1-4, 2009, Redondo Beach, California, {USA}},
  pages        = {9--16},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1597735.1597738},
  doi          = {10.1145/1597735.1597738},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/kcap/KnoxS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/JongS09,
  author       = {Nicholas K. Jong and
                  Peter Stone},
  editor       = {Wray L. Buntine and
                  Marko Grobelnik and
                  Dunja Mladenic and
                  John Shawe{-}Taylor},
  title        = {Compositional Models for Reinforcement Learning},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases, European Conference,
                  {ECML} {PKDD} 2009, Bled, Slovenia, September 7-11, 2009, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5781},
  pages        = {644--659},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-04180-8\_59},
  doi          = {10.1007/978-3-642-04180-8\_59},
  timestamp    = {Tue, 14 May 2019 10:00:47 +0200},
  biburl       = {https://dblp.org/rec/conf/pkdd/JongS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/JungS09,
  author       = {Tobias Jung and
                  Peter Stone},
  editor       = {Wray L. Buntine and
                  Marko Grobelnik and
                  Dunja Mladenic and
                  John Shawe{-}Taylor},
  title        = {Feature Selection for Value Function Approximation Using {Bayesian}
                  Model Selection},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases, European Conference,
                  {ECML} {PKDD} 2009, Bled, Slovenia, September 7-11, 2009, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5781},
  pages        = {660--675},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-04180-8\_60},
  doi          = {10.1007/978-3-642-04180-8\_60},
  timestamp    = {Fri, 19 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pkdd/JungS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/KalyanakrishnanHQBS09,
  author       = {Shivaram Kalyanakrishnan and
                  Todd Hester and
                  Michael J. Quinlan and
                  Yinon Bentor and
                  Peter Stone},
  editor       = {Jacky Baltes and
                  Michail G. Lagoudakis and
                  Tadashi Naruse and
                  Saeed Shiry Ghidary},
  title        = {Three Humanoid Soccer Platforms: Comparison and Synthesis},
  booktitle    = {RoboCup 2009: Robot Soccer World Cup {XIII} [papers from the 13th
                  annual RoboCup International Symposium, Graz, Austria, June 29 - July
                  5, 2009]},
  series       = {Lecture Notes in Computer Science},
  volume       = {5949},
  pages        = {140--152},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-11876-0\_13},
  doi          = {10.1007/978-3-642-11876-0\_13},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/KalyanakrishnanHQBS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/KalyanakrishnanS09,
  author       = {Shivaram Kalyanakrishnan and
                  Peter Stone},
  editor       = {Jacky Baltes and
                  Michail G. Lagoudakis and
                  Tadashi Naruse and
                  Saeed Shiry Ghidary},
  title        = {Learning Complementary Multiagent Behaviors: {A} Case Study},
  booktitle    = {RoboCup 2009: Robot Soccer World Cup {XIII} [papers from the 13th
                  annual RoboCup International Symposium, Graz, Austria, June 29 - July
                  5, 2009]},
  series       = {Lecture Notes in Computer Science},
  volume       = {5949},
  pages        = {153--165},
  publisher    = {Springer},
  year         = {2009},
  url          = {https://doi.org/10.1007/978-3-642-11876-0\_14},
  doi          = {10.1007/978-3-642-11876-0\_14},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/KalyanakrishnanS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:books/igi/09/DresnerSM09,
  author       = {Kurt M. Dresner and
                  Peter Stone and
                  Van Middlesworth, Mark},
  editor       = {Ana L. C. Bazzan and
                  Franziska Kl{\"{u}}gl},
  title        = {An Unmanaged Intersection Protocol and Improved Intersection Safety
                  for Autonomous Vehicles},
  booktitle    = {Multi-Agent Systems for Traffic and Transportation Engineering},
  pages        = {193--217},
  publisher    = {{IGI} Global},
  year         = {2009},
  url          = {https://doi.org/10.4018/978-1-60566-226-8.ch009},
  doi          = {10.4018/978-1-60566-226-8.CH009},
  timestamp    = {Mon, 16 Sep 2019 14:43:09 +0200},
  biburl       = {https://dblp.org/rec/books/igi/09/DresnerSM09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijait/StrongerS08,
  author       = {Daniel Stronger and
                  Peter Stone},
  title        = {Polynomial Regression with Automated Degree: {A} Function Approximator
                  for Autonomous Agents},
  journal      = {Int. J. Artif. Intell. Tools},
  volume       = {17},
  number       = {1},
  pages        = {159--174},
  year         = {2008},
  url          = {https://doi.org/10.1142/S0218213008003820},
  doi          = {10.1142/S0218213008003820},
  timestamp    = {Tue, 12 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijait/StrongerS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijhisi/ParryPDS08,
  author       = {David Parry and
                  Emma Parry and
                  Phurb Dorji and
                  Peter Stone},
  title        = {Open Source Software: {A} Key Component of E-Health in Developing
                  Nations},
  journal      = {Int. J. Heal. Inf. Syst. Informatics},
  volume       = {3},
  number       = {3},
  pages        = {1--15},
  year         = {2008},
  url          = {https://doi.org/10.4018/jhisi.2008070101},
  doi          = {10.4018/JHISI.2008070101},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijhisi/ParryPDS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/DresnerS08,
  author       = {Kurt M. Dresner and
                  Peter Stone},
  title        = {A Multiagent Approach to Autonomous Intersection Management},
  journal      = {J. Artif. Intell. Res.},
  volume       = {31},
  pages        = {591--656},
  year         = {2008},
  url          = {https://doi.org/10.1613/jair.2502},
  doi          = {10.1613/JAIR.2502},
  timestamp    = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jair/DresnerS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigecom/WellmanGS08,
  author       = {Michael P. Wellman and
                  Amy Greenwald and
                  Peter Stone},
  title        = {Book announcement: autonomous bidding agents},
  journal      = {SIGecom Exch.},
  volume       = {7},
  number       = {2},
  year         = {2008},
  url          = {https://doi.org/10.1145/1399589.1399591},
  doi          = {10.1145/1399589.1399591},
  timestamp    = {Thu, 04 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/sigecom/WellmanGS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agi/TaylorKS08,
  author       = {Matthew E. Taylor and
                  Gregory Kuhlmann and
                  Peter Stone},
  editor       = {Pei Wang and
                  Ben Goertzel and
                  Stan Franklin},
  title        = {Transfer Learning and Intelligence: {An} Argument and Approach},
  booktitle    = {Artificial General Intelligence 2008, Proceedings of the First {AGI}
                  Conference, {AGI} 2008, March 1-3, 2008, University of Memphis, Memphis,
                  TN, {USA}},
  series       = {Frontiers in Artificial Intelligence and Applications},
  volume       = {171},
  pages        = {326--337},
  publisher    = {{IOS} Press},
  year         = {2008},
  url          = {http://www.booksonline.iospress.nl/Content/View.aspx?piid=8319},
  timestamp    = {Thu, 24 Aug 2017 11:33:04 +0200},
  biburl       = {https://dblp.org/rec/conf/agi/TaylorKS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/amec/PardoeS08,
  author       = {David Pardoe and
                  Peter Stone},
  editor       = {Wolfgang Ketter and
                  La Poutr{\'{e}}, Han and
                  Norman M. Sadeh and
                  Onn Shehory and
                  William E. Walsh},
  title        = {The 2007 {TAC} {SCM} Prediction Challenge},
  booktitle    = {Agent-Mediated Electronic Commerce and Trading Agent Design and Analysis
                  - {AAMAS} Workshop, {AMEC} 2008, Estoril, Portugal, May 12-16, 2008,
                  and {AAAI} Workshop, {TADA} 2008, Chicago, IL, USA, July 14, 2008,
                  Revised Selected Papers},
  series       = {Lecture Notes in Business Information Processing},
  volume       = {44},
  pages        = {175--189},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-642-15237-5\_13},
  doi          = {10.1007/978-3-642-15237-5\_13},
  timestamp    = {Tue, 22 Jan 2019 08:41:34 +0100},
  biburl       = {https://dblp.org/rec/conf/amec/PardoeS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/TaylorKS08,
  author       = {Matthew E. Taylor and
                  Gregory Kuhlmann and
                  Peter Stone},
  editor       = {Lin Padgham and
                  David C. Parkes and
                  J{\"{o}}rg P. M{\"{u}}ller and
                  Simon Parsons},
  title        = {Autonomous transfer for reinforcement learning},
  booktitle    = {7th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2008), Estoril, Portugal, May 12-16, 2008, Volume
                  1},
  pages        = {283--290},
  publisher    = {{IFAAMAS}},
  year         = {2008},
  url          = {https://dl.acm.org/citation.cfm?id=1402427},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/TaylorKS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/JongHS08,
  author       = {Nicholas K. Jong and
                  Todd Hester and
                  Peter Stone},
  editor       = {Lin Padgham and
                  David C. Parkes and
                  J{\"{o}}rg P. M{\"{u}}ller and
                  Simon Parsons},
  title        = {The utility of temporal abstraction in reinforcement learning},
  booktitle    = {7th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2008), Estoril, Portugal, May 12-16, 2008, Volume
                  1},
  pages        = {299--306},
  publisher    = {{IFAAMAS}},
  year         = {2008},
  url          = {https://dl.acm.org/citation.cfm?id=1402429},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/JongHS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/DresnerS08,
  author       = {Kurt M. Dresner and
                  Peter Stone},
  editor       = {Lin Padgham and
                  David C. Parkes and
                  J{\"{o}}rg P. M{\"{u}}ller and
                  Simon Parsons},
  title        = {Mitigating catastrophic failure at intersections of autonomous vehicles},
  booktitle    = {7th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2008), Estoril, Portugal, May 12-16, 2008, Volume
                  3},
  pages        = {1393--1396},
  publisher    = {{IFAAMAS}},
  year         = {2008},
  url          = {https://dl.acm.org/citation.cfm?id=1402881},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/DresnerS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MiddlesworthDS08,
  author       = {Van Middlesworth, Mark and
                  Kurt M. Dresner and
                  Peter Stone},
  editor       = {Lin Padgham and
                  David C. Parkes and
                  J{\"{o}}rg P. M{\"{u}}ller and
                  Simon Parsons},
  title        = {Replacing the stop sign: unmanaged intersection control for autonomous
                  vehicles},
  booktitle    = {7th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2008), Estoril, Portugal, May 12-16, 2008, Volume
                  3},
  pages        = {1413--1416},
  publisher    = {{IFAAMAS}},
  year         = {2008},
  url          = {https://dl.acm.org/citation.cfm?id=1402886},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/MiddlesworthDS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icac/WildstromSW08,
  author       = {Jonathan Wildstrom and
                  Peter Stone and
                  Emmett Witchel},
  editor       = {John Strassner and
                  Simon A. Dobson and
                  Jos{\'{e}} A. B. Fortes and
                  Kumar K. Goswami},
  title        = {{CARVE:} {A} Cognitive Agent for Resource Value Estimation},
  booktitle    = {2008 International Conference on Autonomic Computing, {ICAC} 2008,
                  June 2-6, 2008, Chicago, Illinois, {USA}},
  pages        = {182--191},
  publisher    = {{IEEE} Computer Society},
  year         = {2008},
  url          = {https://doi.org/10.1109/ICAC.2008.27},
  doi          = {10.1109/ICAC.2008.27},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icac/WildstromSW08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ReisingerSM08,
  author       = {Joseph Reisinger and
                  Peter Stone and
                  Risto Miikkulainen},
  editor       = {William W. Cohen and
                  Andrew McCallum and
                  Sam T. Roweis},
  title        = {Online kernel selection for {Bayesian} reinforcement learning},
  booktitle    = {Machine Learning, Proceedings of the Twenty-Fifth International Conference
                  {(ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {307},
  pages        = {816--823},
  publisher    = {{ACM}},
  year         = {2008},
  url          = {https://doi.org/10.1145/1390156.1390259},
  doi          = {10.1145/1390156.1390259},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/ReisingerSM08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/KnoxLS08,
  author       = {W. Bradley Knox and
                  Juhyun Lee and
                  Peter Stone},
  title        = {Person recognition on a {Segway} Robot: {A} video of {UT} {Austin} {Villa}
                  {Robocup@Home} 2007 finals demonstration},
  booktitle    = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages        = {1785--1786},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ROBOT.2008.4543466},
  doi          = {10.1109/ROBOT.2008.4543466},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/KnoxLS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/StrongerS08,
  author       = {Daniel Stronger and
                  Peter Stone},
  title        = {Maximum likelihood estimation of sensor and action model functions
                  on a mobile robot},
  booktitle    = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages        = {2104--2109},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ROBOT.2008.4543517},
  doi          = {10.1109/ROBOT.2008.4543517},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/StrongerS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/LeeS08,
  author       = {Juhyun Lee and
                  Peter Stone},
  title        = {Person tracking on a mobile robot with heterogeneous inter-characteristic
                  feedback},
  booktitle    = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages        = {2577--2582},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ROBOT.2008.4543601},
  doi          = {10.1109/ROBOT.2008.4543601},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/LeeS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/HesterS08,
  author       = {Todd Hester and
                  Peter Stone},
  title        = {Negative information and line observations for {Monte} {Carlo} localization},
  booktitle    = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages        = {2764--2769},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ROBOT.2008.4543629},
  doi          = {10.1109/ROBOT.2008.4543629},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/HesterS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/ChakrabortyS08,
  author       = {Doran Chakraborty and
                  Peter Stone},
  editor       = {Walter Daelemans and
                  Bart Goethals and
                  Katharina Morik},
  title        = {Online Multiagent Learning against Memory Bounded Adversaries},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases, European Conference,
                  {ECML/PKDD} 2008, Antwerp, Belgium, September 15-19, 2008, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5211},
  pages        = {211--226},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-540-87479-9\_32},
  doi          = {10.1007/978-3-540-87479-9\_32},
  timestamp    = {Mon, 28 Aug 2023 21:17:29 +0200},
  biburl       = {https://dblp.org/rec/conf/pkdd/ChakrabortyS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/TaylorJS08,
  author       = {Matthew E. Taylor and
                  Nicholas K. Jong and
                  Peter Stone},
  editor       = {Walter Daelemans and
                  Bart Goethals and
                  Katharina Morik},
  title        = {Transferring Instances for Model-Based Reinforcement Learning},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases, European Conference,
                  {ECML/PKDD} 2008, Antwerp, Belgium, September 15-19, 2008, Proceedings,
                  Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5212},
  pages        = {488--505},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-540-87481-2\_32},
  doi          = {10.1007/978-3-540-87481-2\_32},
  timestamp    = {Tue, 14 May 2019 10:00:47 +0200},
  biburl       = {https://dblp.org/rec/conf/pkdd/TaylorJS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/KnoxLS08,
  author       = {W. Bradley Knox and
                  Juhyun Lee and
                  Peter Stone},
  editor       = {Luca Iocchi and
                  Hitoshi Matsubara and
                  Alfredo Weitzenfeld and
                  Changjiu Zhou},
  title        = {Domestic Interaction on a {Segway} Base},
  booktitle    = {RoboCup 2008: Robot Soccer World Cup {XII} [papers from the 12th annual
                  RoboCup International Symposium, Suzhou, China, July 15-18, 2008]},
  series       = {Lecture Notes in Computer Science},
  volume       = {5399},
  pages        = {519--531},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-642-02921-9\_45},
  doi          = {10.1007/978-3-642-02921-9\_45},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/KnoxLS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/visapp/SridharanS08a,
  author       = {Mohan Sridharan and
                  Peter Stone},
  editor       = {Luca Iocchi and
                  Domenico G. Sorrenti},
  title        = {Comparing Two Action Planning Approaches for Color Learning on a Mobile
                  Robot},
  booktitle    = {Proceedings of the {VISAPP} International Workshop on Robotic Perception,
                  in conjunction with {VISIGRAPP} 2008, Funchal, Madeira, Portugal,
                  January 2008},
  pages        = {43--52},
  publisher    = {{INSTICC} - Institute for Systems and Technologies of Information,
                  Control and Communication},
  year         = {2008},
  timestamp    = {Sun, 07 Sep 2008 13:06:48 +0200},
  biburl       = {https://dblp.org/rec/conf/visapp/SridharanS08a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/visapp/SridharanS08,
  author       = {Mohan Sridharan and
                  Peter Stone},
  editor       = {Alpesh Ranchordas and
                  Helder Ara{\'{u}}jo},
  title        = {Long-Term vs. Greedy Action Planning for Color Learning on a Mobile
                  Robot},
  booktitle    = {{VISAPP} 2008: Proceedings of the Third International Conference on
                  Computer Vision Theory and Applications, Funchal, Madeira, Portugal,
                  January 22-25, 2008 - Volume 2},
  pages        = {682--685},
  publisher    = {{INSTICC} - Institute for Systems and Technologies of Information,
                  Control and Communication},
  year         = {2008},
  timestamp    = {Mon, 15 Jun 2015 19:00:07 +0200},
  biburl       = {https://dblp.org/rec/conf/visapp/SridharanS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@book{DBLP:books/daglib/0018264,
  author       = {Michael P. Wellman and
                  Amy Greenwald and
                  Peter Stone},
  title        = {Autonomous bidding agents - strategies and lessons from the trading
                  agent competition},
  publisher    = {{MIT} Press},
  year         = {2007},
  isbn         = {978-0-262-23260-9},
  timestamp    = {Thu, 09 Feb 2012 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/books/daglib/0018264.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@book{DBLP:series/synthesis/2007Stone,
  author       = {Peter Stone},
  title        = {Intelligent Autonomous Robotics: {A} Robot Soccer Case Study},
  series       = {Synthesis Lectures on Artificial Intelligence and Machine Learning},
  publisher    = {Morgan {\&} Claypool Publishers},
  year         = {2007},
  url          = {https://doi.org/10.2200/S00090ED1V01Y200705AIM001},
  doi          = {10.2200/S00090ED1V01Y200705AIM001},
  isbn         = {978-3-031-00416-2},
  timestamp    = {Tue, 17 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/series/synthesis/2007Stone.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/adb/WhitesonTS07,
  author       = {Shimon Whiteson and
                  Matthew E. Taylor and
                  Peter Stone},
  title        = {Empirical Studies in Action Selection with Reinforcement Learning},
  journal      = {Adapt. Behav.},
  volume       = {15},
  number       = {1},
  pages        = {33--50},
  year         = {2007},
  url          = {https://doi.org/10.1177/1059712306076253},
  doi          = {10.1177/1059712306076253},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/adb/WhitesonTS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/Stone07,
  author       = {Peter Stone},
  title        = {Multiagent learning is not the answer. It is the question},
  journal      = {Artif. Intell.},
  volume       = {171},
  number       = {7},
  pages        = {402--405},
  year         = {2007},
  url          = {https://doi.org/10.1016/j.artint.2006.12.005},
  doi          = {10.1016/J.ARTINT.2006.12.005},
  timestamp    = {Sat, 27 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ai/Stone07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/arobots/SridharanS07,
  author       = {Mohan Sridharan and
                  Peter Stone},
  title        = {Structure-based color learning on a mobile robot under changing illumination},
  journal      = {Auton. Robots},
  volume       = {23},
  number       = {3},
  pages        = {161--182},
  year         = {2007},
  url          = {https://doi.org/10.1007/s10514-007-9038-7},
  doi          = {10.1007/S10514-007-9038-7},
  timestamp    = {Thu, 18 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/arobots/SridharanS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/TaylorSL07,
  author       = {Matthew E. Taylor and
                  Peter Stone and
                  Yaxin Liu},
  title        = {Transfer Learning via Inter-Task Mappings for Temporal Difference
                  Learning},
  journal      = {J. Mach. Learn. Res.},
  volume       = {8},
  pages        = {2125--2167},
  year         = {2007},
  url          = {https://dl.acm.org/doi/10.5555/1314498.1314569},
  doi          = {10.5555/1314498.1314569},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/TaylorSL07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/TaylorWS07,
  author       = {Matthew E. Taylor and
                  Shimon Whiteson and
                  Peter Stone},
  title        = {Temporal Difference and Policy Search Methods for Reinforcement Learning:
                  An Empirical Comparison},
  booktitle    = {Proceedings of the Twenty-Second {AAAI} Conference on Artificial Intelligence,
                  July 22-26, 2007, Vancouver, British Columbia, Canada},
  pages        = {1675--1678},
  publisher    = {{AAAI} Press},
  year         = {2007},
  url          = {http://www.aaai.org/Library/AAAI/2007/aaai07-271.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/TaylorWS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/TaylorS07,
  author       = {Matthew E. Taylor and
                  Peter Stone},
  title        = {Representation Transfer via Elaboration},
  booktitle    = {Proceedings of the Twenty-Second {AAAI} Conference on Artificial Intelligence,
                  July 22-26, 2007, Vancouver, British Columbia, Canada},
  pages        = {1906--1907},
  publisher    = {{AAAI} Press},
  year         = {2007},
  url          = {http://www.aaai.org/Library/AAAI/2007/aaai07-328.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/TaylorS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaifs/TaylorS07,
  author       = {Matthew E. Taylor and
                  Peter Stone},
  editor       = {Clayton T. Morrison and
                  Tim Oates},
  title        = {Representation Transfer for Reinforcement Learning},
  booktitle    = {Computational Approaches to Representation Change during Learning
                  and Development, Papers from the 2007 {AAAI} Fall Symposium, Arlington,
                  Virginia, USA, November 9-11, 2007},
  series       = {{AAAI} Technical Report},
  volume       = {{FS-07-03}},
  pages        = {78--85},
  publisher    = {{AAAI} Press},
  year         = {2007},
  url          = {https://www.aaai.org/Library/Symposia/Fall/2007/fs07-03-015.php},
  timestamp    = {Sun, 16 Oct 2022 14:19:55 +0200},
  biburl       = {https://dblp.org/rec/conf/aaaifs/TaylorS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/PardoeS07a,
  author       = {David Pardoe and
                  Peter Stone},
  editor       = {John Collins and
                  Peyman Faratin and
                  Simon Parsons and
                  Juan A. Rodr{\'{\i}}guez{-}Aguilar and
                  Norman M. Sadeh and
                  Onn Shehory and
                  Elizabeth Sklar},
  title        = {Adapting Price Predictions in {TAC} {SCM}},
  booktitle    = {Agent-Mediated Electronic Commerce and Trading Agent Design and Analysis,
                  {AAMAS} 2007 Workshop, {AMEC} 2007, Honolulu, Hawaii, May 14, 2007,
                  and {AAAI} 2007 Workshop, {TADA} 2007, Vancouver, Canada, July 23,
                  2007, Selected and Revised Papers},
  series       = {Lecture Notes in Business Information Processing},
  volume       = {13},
  pages        = {30--45},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-88713-3\_3},
  doi          = {10.1007/978-3-540-88713-3\_3},
  timestamp    = {Tue, 23 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/PardoeS07a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/TaylorWS07,
  author       = {Matthew E. Taylor and
                  Shimon Whiteson and
                  Peter Stone},
  editor       = {Edmund H. Durfee and
                  Makoto Yokoo and
                  Michael N. Huhns and
                  Onn Shehory},
  title        = {Transfer via inter-task mappings in policy search reinforcement learning},
  booktitle    = {6th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2007), Honolulu, Hawaii, USA, May 14-18, 2007},
  pages        = {37},
  publisher    = {{IFAAMAS}},
  year         = {2007},
  url          = {https://doi.org/10.1145/1329125.1329170},
  doi          = {10.1145/1329125.1329170},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/TaylorWS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/KalyanakrishnanS07,
  author       = {Shivaram Kalyanakrishnan and
                  Peter Stone},
  editor       = {Edmund H. Durfee and
                  Makoto Yokoo and
                  Michael N. Huhns and
                  Onn Shehory},
  title        = {Batch reinforcement learning in a complex domain},
  booktitle    = {6th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2007), Honolulu, Hawaii, USA, May 14-18, 2007},
  pages        = {94},
  publisher    = {{IFAAMAS}},
  year         = {2007},
  url          = {https://doi.org/10.1145/1329125.1329241},
  doi          = {10.1145/1329125.1329241},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/KalyanakrishnanS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/JongS07,
  author       = {Nicholas K. Jong and
                  Peter Stone},
  editor       = {Edmund H. Durfee and
                  Makoto Yokoo and
                  Michael N. Huhns and
                  Onn Shehory},
  title        = {Model-based function approximation in reinforcement learning},
  booktitle    = {6th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2007), Honolulu, Hawaii, USA, May 14-18, 2007},
  pages        = {95},
  publisher    = {{IFAAMAS}},
  year         = {2007},
  url          = {https://doi.org/10.1145/1329125.1329242},
  doi          = {10.1145/1329125.1329242},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/JongS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/PardoeS07,
  author       = {David Pardoe and
                  Peter Stone},
  editor       = {Edmund H. Durfee and
                  Makoto Yokoo and
                  Michael N. Huhns and
                  Onn Shehory},
  title        = {Adapting in agent-based markets: a study from {TAC} {SCM}},
  booktitle    = {6th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2007), Honolulu, Hawaii, USA, May 14-18, 2007},
  pages        = {98},
  publisher    = {{IFAAMAS}},
  year         = {2007},
  url          = {https://doi.org/10.1145/1329125.1329246},
  doi          = {10.1145/1329125.1329246},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/PardoeS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/TaylorS07,
  author       = {Matthew E. Taylor and
                  Peter Stone},
  editor       = {Edmund H. Durfee and
                  Makoto Yokoo and
                  Michael N. Huhns and
                  Onn Shehory},
  title        = {Towards reinforcement learning representation transfer},
  booktitle    = {6th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2007), Honolulu, Hawaii, USA, May 14-18, 2007},
  pages        = {100},
  publisher    = {{IFAAMAS}},
  year         = {2007},
  url          = {https://doi.org/10.1145/1329125.1329248},
  doi          = {10.1145/1329125.1329248},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/TaylorS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/AhmadiTS07,
  author       = {Mazda Ahmadi and
                  Matthew E. Taylor and
                  Peter Stone},
  editor       = {Edmund H. Durfee and
                  Makoto Yokoo and
                  Michael N. Huhns and
                  Onn Shehory},
  title        = {{IFSA:} incremental feature-set augmentation for reinforcement learning
                  tasks},
  booktitle    = {6th International Joint Conference on Autonomous Agents and Multiagent
                  Systems {(AAMAS} 2007), Honolulu, Hawaii, USA, May 14-18, 2007},
  pages        = {186},
  publisher    = {{IFAAMAS}},
  year         = {2007},
  url          = {https://doi.org/10.1145/1329125.1329351},
  doi          = {10.1145/1329125.1329351},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/AhmadiTS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ecml/KuhlmannS07,
  author       = {Gregory Kuhlmann and
                  Peter Stone},
  editor       = {Joost N. Kok and
                  Jacek Koronacki and
                  {L{\'{o}}pez de M{\'{a}}ntaras}, Ram{\'{o}}n and
                  Stan Matwin and
                  Dunja Mladenic and
                  Andrzej Skowron},
  title        = {Graph-Based Domain Mapping for Transfer Learning in General Games},
  booktitle    = {Machine Learning: {ECML} 2007, 18th European Conference on Machine
                  Learning, Warsaw, Poland, September 17-21, 2007, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4701},
  pages        = {188--200},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-74958-5\_20},
  doi          = {10.1007/978-3-540-74958-5\_20},
  timestamp    = {Tue, 14 May 2019 10:00:54 +0200},
  biburl       = {https://dblp.org/rec/conf/ecml/KuhlmannS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icac/WildstromSW07,
  author       = {Jonathan Wildstrom and
                  Peter Stone and
                  Emmett Witchel},
  title        = {Autonomous Return on Investment Analysis of Additional Processing
                  Resources},
  booktitle    = {Fourth International Conference on Autonomic Computing ({ICAC}'07),
                  Jacksonville, Florida, USA, June 11-15, 2007},
  pages        = {15},
  publisher    = {{IEEE} Computer Society},
  year         = {2007},
  url          = {https://doi.org/10.1109/ICAC.2007.11},
  doi          = {10.1109/ICAC.2007.11},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icac/WildstromSW07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/TaylorS07,
  author       = {Matthew E. Taylor and
                  Peter Stone},
  editor       = {Zoubin Ghahramani},
  title        = {Cross-domain transfer for reinforcement learning},
  booktitle    = {Machine Learning, Proceedings of the Twenty-Fourth International Conference
                  {(ICML} 2007), Corvallis, Oregon, USA, June 20-24, 2007},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {227},
  pages        = {879--886},
  publisher    = {{ACM}},
  year         = {2007},
  url          = {https://doi.org/10.1145/1273496.1273607},
  doi          = {10.1145/1273496.1273607},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/TaylorS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/StrongerS07,
  author       = {Daniel Stronger and
                  Peter Stone},
  title        = {A Comparison of Two Approaches for Vision and Self-Localization on
                  a Mobile Robot},
  booktitle    = {2007 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2007, 10-14 April 2007, Roma, Italy},
  pages        = {3915--3920},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ROBOT.2007.364079},
  doi          = {10.1109/ROBOT.2007.364079},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/StrongerS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/Stone07,
  author       = {Peter Stone},
  editor       = {Manuela M. Veloso},
  title        = {Learning and Multiagent Reasoning for Autonomous Agents},
  booktitle    = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference
                  on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages        = {12--30},
  year         = {2007},
  url          = {http://ijcai.org/Proceedings/07/Papers/002.pdf},
  timestamp    = {Tue, 20 Aug 2019 16:17:11 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/Stone07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/BanerjeeS07,
  author       = {Bikramjit Banerjee and
                  Peter Stone},
  editor       = {Manuela M. Veloso},
  title        = {General Game Learning Using Knowledge Transfer},
  booktitle    = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference
                  on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages        = {672--677},
  year         = {2007},
  url          = {http://ijcai.org/Proceedings/07/Papers/107.pdf},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/BanerjeeS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/WildstromSWD07,
  author       = {Jonathan Wildstrom and
                  Peter Stone and
                  Emmett Witchel and
                  Michael Dahlin},
  editor       = {Manuela M. Veloso},
  title        = {Machine Learning for On-Line Hardware Reconfiguration},
  booktitle    = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference
                  on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages        = {1113--1118},
  year         = {2007},
  url          = {http://ijcai.org/Proceedings/07/Papers/180.pdf},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/WildstromSWD07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/DresnerS07,
  author       = {Kurt M. Dresner and
                  Peter Stone},
  editor       = {Manuela M. Veloso},
  title        = {Sharing the Road: Autonomous Vehicles Meet Human Drivers},
  booktitle    = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference
                  on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages        = {1263--1268},
  year         = {2007},
  url          = {http://ijcai.org/Proceedings/07/Papers/204.pdf},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/DresnerS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/SridharanS07,
  author       = {Mohan Sridharan and
                  Peter Stone},
  editor       = {Manuela M. Veloso},
  title        = {Color Learning on a Mobile Robot: Towards Full Autonomy under Changing
                  Illumination},
  booktitle    = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference
                  on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages        = {2212--2217},
  year         = {2007},
  url          = {http://ijcai.org/Proceedings/07/Papers/356.pdf},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/SridharanS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/SridharanS07,
  author       = {Mohan Sridharan and
                  Peter Stone},
  title        = {Global action selection for illumination invariant color modeling},
  booktitle    = {2007 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, October 29 - November 2, 2007, Sheraton Hotel and Marina,
                  San Diego, California, {USA}},
  pages        = {1671--1676},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/IROS.2007.4399203},
  doi          = {10.1109/IROS.2007.4399203},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/SridharanS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/AhmadiS07,
  author       = {Mazda Ahmadi and
                  Peter Stone},
  editor       = {Ubbo Visser and
                  Fernando Ribeiro and
                  Takeshi Ohashi and
                  Frank Dellaert},
  title        = {Instance-Based Action Models for Fast Action Planning},
  booktitle    = {RoboCup 2007: Robot Soccer World Cup XI, July 9-10, 2007, Atlanta,
                  GA, {USA}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5001},
  pages        = {1--16},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-68847-1\_1},
  doi          = {10.1007/978-3-540-68847-1\_1},
  timestamp    = {Sat, 30 Sep 2023 09:55:24 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/AhmadiS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/KalyanakrishnanSL07,
  author       = {Shivaram Kalyanakrishnan and
                  Peter Stone and
                  Yaxin Liu},
  editor       = {Ubbo Visser and
                  Fernando Ribeiro and
                  Takeshi Ohashi and
                  Frank Dellaert},
  title        = {Model-Based Reinforcement Learning in a Complex Domain},
  booktitle    = {RoboCup 2007: Robot Soccer World Cup XI, July 9-10, 2007, Atlanta,
                  GA, {USA}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5001},
  pages        = {171--183},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-68847-1\_15},
  doi          = {10.1007/978-3-540-68847-1\_15},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/KalyanakrishnanSL07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/GrasemannSS07,
  author       = {Uli Grasemann and
                  Daniel Stronger and
                  Peter Stone},
  editor       = {Ubbo Visser and
                  Fernando Ribeiro and
                  Takeshi Ohashi and
                  Frank Dellaert},
  title        = {A Neural Network-Based Approach to Robot Motion Control},
  booktitle    = {RoboCup 2007: Robot Soccer World Cup XI, July 9-10, 2007, Atlanta,
                  GA, {USA}},
  series       = {Lecture Notes in Computer Science},
  volume       = {5001},
  pages        = {480--487},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-68847-1\_51},
  doi          = {10.1007/978-3-540-68847-1\_51},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/GrasemannSS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sara/JongS07,
  author       = {Nicholas K. Jong and
                  Peter Stone},
  editor       = {Ian Miguel and
                  Wheeler Ruml},
  title        = {Model-Based Exploration in Continuous State Spaces},
  booktitle    = {Abstraction, Reformulation, and Approximation, 7th International Symposium,
                  {SARA} 2007, Whistler, Canada, July 18-21, 2007, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4612},
  pages        = {258--272},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-73580-9\_21},
  doi          = {10.1007/978-3-540-73580-9\_21},
  timestamp    = {Tue, 14 May 2019 10:00:38 +0200},
  biburl       = {https://dblp.org/rec/conf/sara/JongS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aamas/IsbellKSSSK06,
  author       = {Isbell, Jr., Charles Lee and
                  Michael J. Kearns and
                  Satinder Singh and
                  Christian R. Shelton and
                  Peter Stone and
                  David P. Kormann},
  title        = {Cobot in {LambdaMOO}: An Adaptive Social Statistics Agent},
  journal      = {Auton. Agents Multi Agent Syst.},
  volume       = {13},
  number       = {3},
  pages        = {327--354},
  year         = {2006},
  url          = {https://doi.org/10.1007/s10458-006-0005-z},
  doi          = {10.1007/S10458-006-0005-Z},
  timestamp    = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aamas/IsbellKSSSK06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/connection/StrongerS06,
  author       = {Daniel Stronger and
                  Peter Stone},
  title        = {Towards autonomous sensor and actuator model induction on a mobile
                  robot},
  journal      = {Connect. Sci.},
  volume       = {18},
  number       = {2},
  pages        = {97--119},
  year         = {2006},
  url          = {https://doi.org/10.1080/09540090600768690},
  doi          = {10.1080/09540090600768690},
  timestamp    = {Fri, 26 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/connection/StrongerS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/WhitesonS06,
  author       = {Shimon Whiteson and
                  Peter Stone},
  title        = {Evolutionary Function Approximation for Reinforcement Learning},
  journal      = {J. Mach. Learn. Res.},
  volume       = {7},
  pages        = {877--917},
  year         = {2006},
  url          = {http://jmlr.org/papers/v7/whiteson06a.html},
  timestamp    = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/WhitesonS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ras/StoneSSKKFJ06,
  author       = {Peter Stone and
                  Mohan Sridharan and
                  Daniel Stronger and
                  Gregory Kuhlmann and
                  Nate Kohl and
                  Peggy Fidelman and
                  Nicholas K. Jong},
  title        = {From pixels to multi-robot decision-making: {A} study in uncertainty},
  journal      = {Robotics Auton. Syst.},
  volume       = {54},
  number       = {11},
  pages        = {933--943},
  year         = {2006},
  url          = {https://doi.org/10.1016/j.robot.2006.05.010},
  doi          = {10.1016/J.ROBOT.2006.05.010},
  timestamp    = {Mon, 24 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ras/StoneSSKKFJ06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ACMicec/PardoeSST06,
  author       = {David Pardoe and
                  Peter Stone and
                  Maytal Saar{-}Tsechansky and
                  Kerem Tomak},
  editor       = {Mark S. Fox and
                  Bruce Spencer},
  title        = {Adaptive mechanism design: a metalearning approach},
  booktitle    = {Proceedings of the 8th International Conference on Electronic Commerce:
                  The new e-commerce - Innovations for Conquering Current Barriers,
                  Obstacles and Limitations to Conducting Successful Business on the
                  Internet, 2006, Fredericton, New Brunswick, Canada, August 13-16,
                  2006},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {156},
  pages        = {92--102},
  publisher    = {{ACM}},
  year         = {2006},
  url          = {https://doi.org/10.1145/1151454.1151480},
  doi          = {10.1145/1151454.1151480},
  timestamp    = {Tue, 06 Apr 2021 12:12:56 +0200},
  biburl       = {https://dblp.org/rec/conf/ACMicec/PardoeSST06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/LiuS06,
  author       = {Yaxin Liu and
                  Peter Stone},
  title        = {Value-Function-Based Transfer for Reinforcement Learning Using Structure
                  Mapping},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {415--420},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-066.php},
  timestamp    = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LiuS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/WhitesonS06,
  author       = {Shimon Whiteson and
                  Peter Stone},
  title        = {Sample-Efficient Evolutionary Function Approximation for Reinforcement
                  Learning},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {518--523},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-083.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/WhitesonS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/AhmadiS06,
  author       = {Mazda Ahmadi and
                  Peter Stone},
  title        = {Keeping in Touch: Maintaining Biconnected Structure by Homogeneous
                  Robots},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {580--585},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-093.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/AhmadiS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/KuhlmannS06,
  author       = {Gregory Kuhlmann and
                  Peter Stone},
  title        = {Automatic Heuristic Construction in a Complete General Game Player},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {1457--1462},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-229.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/KuhlmannS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/KuhlmannKS06,
  author       = {Gregory Kuhlmann and
                  William B. Knox and
                  Peter Stone},
  title        = {Know Thine Enemy: {A} Champion {RoboCup} Coach Agent},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {1463--1468},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-230.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/KuhlmannKS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/PardoeS06,
  author       = {David Pardoe and
                  Peter Stone},
  title        = {{TacTex-05}: {A} Champion Supply Chain Management Agent},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {1489--1494},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-234.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/PardoeS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/DresnerS06,
  author       = {Kurt M. Dresner and
                  Peter Stone},
  title        = {Traffic Intersections of the Future},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {1593--1596},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-258.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DresnerS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/AhmadiS06a,
  author       = {Mazda Ahmadi and
                  Peter Stone},
  title        = {Biconnected Structure for Multi-Robot Systems},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {1853},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-305.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/AhmadiS06a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/DresnerS06a,
  author       = {Kurt M. Dresner and
                  Peter Stone},
  title        = {Making Autonomous Intersection Management Backwards-Compatible},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {1865--1866},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-311.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DresnerS06a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/KuhlmannS06a,
  author       = {Kuhlmann, Gregory and
                  Stone, Peter},
  title        = {Automatic Heuristic Construction for General Game Playing},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {1883--1884},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-320.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/KuhlmannS06a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/StrongerS06,
  author       = {Stronger, Daniel and
                  Stone, Peter},
  title        = {Expectation-Based Vision for Self-Localization on a Legged Robot},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {1899--1900},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-328.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/StrongerS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/TaylorS06,
  author       = {Taylor, Matthew E. and
                  Stone, Peter},
  title        = {Inter-Task Action Correlation for Reinforcement Learning Tasks},
  booktitle    = {Proceedings, The Twenty-First National Conference on Artificial Intelligence
                  and the Eighteenth Innovative Applications of Artificial Intelligence
                  Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages        = {1901--1903},
  publisher    = {{AAAI} Press},
  year         = {2006},
  url          = {http://www.aaai.org/Library/AAAI/2006/aaai06-329.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/TaylorS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aips/PardoeS06,
  author       = {Pardoe, David and
                  Stone, Peter},
  editor       = {Long, Derek and
                  Smith, Stephen F. and
                  Borrajo, Daniel and
                  McCluskey, Lee},
  title        = {Predictive Planning for Supply Chain Management},
  booktitle    = {Proceedings of the Sixteenth International Conference on Automated
                  Planning and Scheduling, {ICAPS} 2006, Cumbria, UK, June 6-10, 2006},
  pages        = {21--30},
  publisher    = {{AAAI}},
  year         = {2006},
  url          = {http://www.aaai.org/Library/ICAPS/2006/icaps06-003.php},
  timestamp    = {Fri, 05 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aips/PardoeS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/PardoeSM06,
  author       = {Pardoe, David and
                  Stone, Peter and
                  Van Middlesworth, Mark},
  editor       = {Fasli, Maria and
                  Shehory, Onn},
  title        = {{TacTex-05}: An Adaptive Agent for {TAC} {SCM}},
  booktitle    = {Agent-Mediated Electronic Commerce. Automated Negotiation and Strategy
                  Design for Electronic Markets, {AAMAS} 2006 Workshop, {TADA/AMEC}
                  2006, Hakodate, Japan, May 9, 2006, Selected and Revised Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {4452},
  pages        = {46--61},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/978-3-540-72502-2\_4},
  doi          = {10.1007/978-3-540-72502-2\_4},
  timestamp    = {Tue, 14 May 2019 10:00:54 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/PardoeSM06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dars/AhmadiS06,
  author       = {Ahmadi, Mazda and
                  Stone, Peter},
  editor       = {Gini, Maria L. and
                  Voyles, Richard M.},
  title        = {A Distributed Biconnectivity Check},
  booktitle    = {Distributed Autonomous Robotic Systems 7, Proceedings of the 8th International
                  Symposium on Distributed Autonomous Robotic Systems, {DARS} 2006,
                  Minneapolis, Minnesota, USA, 2006},
  pages        = {1--10},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/4-431-35881-1\_1},
  doi          = {10.1007/4-431-35881-1\_1},
  timestamp    = {Fri, 26 Jul 2019 10:09:14 +0200},
  biburl       = {https://dblp.org/rec/conf/dars/AhmadiS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/TaylorWS06,
  author       = {Taylor, Matthew E. and
                  Whiteson, Shimon and
                  Stone, Peter},
  editor       = {Cattolico, Mike},
  title        = {Comparing evolutionary and temporal difference methods in a reinforcement
                  learning domain},
  booktitle    = {Genetic and Evolutionary Computation Conference, {GECCO} 2006, Proceedings,
                  Seattle, Washington, USA, July 8-12, 2006},
  pages        = {1321--1328},
  publisher    = {{ACM}},
  year         = {2006},
  url          = {https://doi.org/10.1145/1143997.1144202},
  doi          = {10.1145/1143997.1144202},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/gecco/TaylorWS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/WhitesonS06,
  author       = {Whiteson, Shimon and
                  Stone, Peter},
  editor       = {Cattolico, Mike},
  title        = {On-line evolutionary computation for reinforcement learning in stochastic
                  domains},
  booktitle    = {Genetic and Evolutionary Computation Conference, {GECCO} 2006, Proceedings,
                  Seattle, Washington, USA, July 8-12, 2006},
  pages        = {1577--1584},
  publisher    = {{ACM}},
  year         = {2006},
  url          = {https://doi.org/10.1145/1143997.1144252},
  doi          = {10.1145/1143997.1144252},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/gecco/WhitesonS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/SubramanianRSK06,
  author       = {Subramanian, Harish and
                  Ramamoorthy, Subramanian and
                  Stone, Peter and
                  Kuipers, Benjamin},
  editor       = {Cattolico, Mike},
  title        = {Designing safe, profitable automated stock trading agents using evolutionary
                  algorithms},
  booktitle    = {Genetic and Evolutionary Computation Conference, {GECCO} 2006, Proceedings,
                  Seattle, Washington, USA, July 8-12, 2006},
  pages        = {1777--1784},
  publisher    = {{ACM}},
  year         = {2006},
  url          = {https://doi.org/10.1145/1143997.1144285},
  doi          = {10.1145/1143997.1144285},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/gecco/SubramanianRSK06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icarcv/SridharanS06,
  author       = {Sridharan, Mohan and
                  Stone, Peter},
  title        = {Autonomous Planned Color Learning on a Mobile Robot Without Labeled
                  Data},
  booktitle    = {Ninth International Conference on Control, Automation, Robotics and
                  Vision, {ICARCV} 2006, Singapore, 5-8 December 2006, Proceedings},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICARCV.2006.345403},
  doi          = {10.1109/ICARCV.2006.345403},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icarcv/SridharanS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/AhmadiS06,
  author       = {Ahmadi, Mazda and
                  Stone, Peter},
  title        = {A Multi-robot System for Continuous Area Sweeping Tasks},
  booktitle    = {Proceedings of the 2006 {IEEE} International Conference on Robotics
                  and Automation, {ICRA} 2006, May 15-19, 2006, Orlando, Florida, {USA}},
  pages        = {1724--1729},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/ROBOT.2006.1641955},
  doi          = {10.1109/ROBOT.2006.1641955},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/AhmadiS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ictai/StrongerS06,
  author       = {Stronger, Daniel and
                  Stone, Peter},
  title        = {Polynomial Regression with Automated Degree: {A} Function Approximator
                  for Autonomous Agents},
  booktitle    = {18th {IEEE} International Conference on Tools with Artificial Intelligence
                  ({ICTAI} 2006), 13-15 November 2006, Arlington, VA, {USA}},
  pages        = {474--480},
  publisher    = {{IEEE} Computer Society},
  year         = {2006},
  url          = {https://doi.org/10.1109/ICTAI.2006.96},
  doi          = {10.1109/ICTAI.2006.96},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ictai/StrongerS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/FidelmanS06,
  author       = {Fidelman, Peggy and
                  Stone, Peter},
  editor       = {Lakemeyer, Gerhard and
                  Sklar, Elizabeth and
                  Sorrenti, Domenico G. and
                  Takahashi, Tomoichi},
  title        = {The Chin Pinch: {A} Case Study in Skill Learning on a Legged Robot},
  booktitle    = {RoboCup 2006: Robot Soccer World Cup {X}},
  series       = {Lecture Notes in Computer Science},
  volume       = {4434},
  pages        = {59--71},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/978-3-540-74024-7\_6},
  doi          = {10.1007/978-3-540-74024-7\_6},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/FidelmanS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/KalyanakrishnanLS06,
  author       = {Kalyanakrishnan, Shivaram and
                  Liu, Yaxin and
                  Stone, Peter},
  editor       = {Lakemeyer, Gerhard and
                  Sklar, Elizabeth and
                  Sorrenti, Domenico G. and
                  Takahashi, Tomoichi},
  title        = {Half Field Offense in {RoboCup} Soccer: {A} Multiagent Reinforcement
                  Learning Case Study},
  booktitle    = {RoboCup 2006: Robot Soccer World Cup {X}},
  series       = {Lecture Notes in Computer Science},
  volume       = {4434},
  pages        = {72--85},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/978-3-540-74024-7\_7},
  doi          = {10.1007/978-3-540-74024-7\_7},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/KalyanakrishnanLS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/SaggarDKS06,
  author       = {Saggar, Manish and
                  D'Silva, Thomas and
                  Kohl, Nate and
                  Stone, Peter},
  editor       = {Lakemeyer, Gerhard and
                  Sklar, Elizabeth and
                  Sorrenti, Domenico G. and
                  Takahashi, Tomoichi},
  title        = {Autonomous Learning of Stable Quadruped Locomotion},
  booktitle    = {RoboCup 2006: Robot Soccer World Cup {X}},
  series       = {Lecture Notes in Computer Science},
  volume       = {4434},
  pages        = {98--109},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/978-3-540-74024-7\_9},
  doi          = {10.1007/978-3-540-74024-7\_9},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/SaggarDKS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StrongerS06,
  author       = {Stronger, Daniel and
                  Stone, Peter},
  editor       = {Lakemeyer, Gerhard and
                  Sklar, Elizabeth and
                  Sorrenti, Domenico G. and
                  Takahashi, Tomoichi},
  title        = {Selective Visual Attention for Object Detection on a Legged Robot},
  booktitle    = {RoboCup 2006: Robot Soccer World Cup {X}},
  series       = {Lecture Notes in Computer Science},
  volume       = {4434},
  pages        = {158--170},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/978-3-540-74024-7\_14},
  doi          = {10.1007/978-3-540-74024-7\_14},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/StrongerS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/SridharanS06,
  author       = {Sridharan, Mohan and
                  Stone, Peter},
  editor       = {Lakemeyer, Gerhard and
                  Sklar, Elizabeth and
                  Sorrenti, Domenico G. and
                  Takahashi, Tomoichi},
  title        = {Autonomous Planned Color Learning on a Legged Robot},
  booktitle    = {RoboCup 2006: Robot Soccer World Cup {X}},
  series       = {Lecture Notes in Computer Science},
  volume       = {4434},
  pages        = {270--278},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/978-3-540-74024-7\_23},
  doi          = {10.1007/978-3-540-74024-7\_23},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/SridharanS06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/atal/2006,
  editor       = {Nakashima, Hideyuki and
                  Wellman, Michael P. and
                  Weiss, Gerhard and
                  Stone, Peter},
  title        = {5th International Joint Conference on Autonomous Agents and Multiagent
                  Systems ({AAMAS} 2006), Hakodate, Japan, May 8-12, 2006},
  publisher    = {{ACM}},
  year         = {2006},
  isbn         = {1-59593-303-4},
  timestamp    = {Tue, 08 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/2006.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/adb/StoneSK05,
  author       = {Stone, Peter and
                  Sutton, Richard S. and
                  Kuhlmann, Gregory},
  title        = {Reinforcement Learning for {RoboCup} Soccer Keepaway},
  journal      = {Adapt. Behav.},
  volume       = {13},
  number       = {3},
  pages        = {165--188},
  year         = {2005},
  url          = {https://doi.org/10.1177/105971230501300301},
  doi          = {10.1177/105971230501300301},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/adb/StoneSK05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/dss/LittmanS05,
  author       = {Littman, Michael L. and
                  Stone, Peter},
  title        = {A polynomial-time {Nash} equilibrium algorithm for repeated games},
  journal      = {Decis. Support Syst.},
  volume       = {39},
  number       = {1},
  pages        = {55--66},
  year         = {2005},
  url          = {https://doi.org/10.1016/j.dss.2004.08.007},
  doi          = {10.1016/J.DSS.2004.08.007},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/dss/LittmanS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ecr/StoneG05,
  author       = {Stone, Peter and
                  Greenwald, Amy},
  title        = {The First International Trading Agent Competition: Autonomous Bidding
                  Agents},
  journal      = {Electron. Commer. Res.},
  volume       = {5},
  number       = {2},
  pages        = {229--265},
  year         = {2005},
  url          = {https://doi.org/10.1007/s10660-005-6158-z},
  doi          = {10.1007/S10660-005-6158-Z},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ecr/StoneG05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/WhitesonKMS05,
  author       = {Whiteson, Shimon and
                  Kohl, Nate and
                  Miikkulainen, Risto and
                  Stone, Peter},
  title        = {Evolving Soccer Keepaway Players Through Task Decomposition},
  journal      = {Mach. Learn.},
  volume       = {59},
  number       = {1-2},
  pages        = {5--30},
  year         = {2005},
  url          = {https://doi.org/10.1007/s10994-005-0460-9},
  doi          = {10.1007/S10994-005-0460-9},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ml/WhitesonKMS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigecom/PardoeS05,
  author       = {Pardoe, David and
                  Stone, Peter},
  title        = {Developing adaptive auction mechanisms},
  journal      = {SIGecom Exch.},
  volume       = {5},
  number       = {3},
  pages        = {1--10},
  year         = {2005},
  url          = {https://doi.org/10.1145/1120680.1120682},
  doi          = {10.1145/1120680.1120682},
  timestamp    = {Thu, 04 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/sigecom/PardoeS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/TaylorSL05,
  author       = {Taylor, Matthew E. and
                  Stone, Peter and
                  Liu, Yaxin},
  editor       = {Veloso, Manuela M. and
                  Kambhampati, Subbarao},
  title        = {Value Functions for {RL}-Based Behavior Transfer: {A} Comparative Study},
  booktitle    = {Proceedings, The Twentieth National Conference on Artificial Intelligence
                  and the Seventeenth Innovative Applications of Artificial Intelligence
                  Conference, July 9-13, 2005, Pittsburgh, Pennsylvania, {USA}},
  pages        = {880--885},
  publisher    = {{AAAI} Press / The {MIT} Press},
  year         = {2005},
  url          = {http://www.aaai.org/Library/AAAI/2005/aaai05-139.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/TaylorSL05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SherstovS05,
  author       = {Sherstov, Alexander A. and
                  Stone, Peter},
  editor       = {Veloso, Manuela M. and
                  Kambhampati, Subbarao},
  title        = {Improving Action Selection in {MDP}'s via Knowledge Transfer},
  booktitle    = {Proceedings, The Twentieth National Conference on Artificial Intelligence
                  and the Seventeenth Innovative Applications of Artificial Intelligence
                  Conference, July 9-13, 2005, Pittsburgh, Pennsylvania, {USA}},
  pages        = {1024--1029},
  publisher    = {{AAAI} Press / The {MIT} Press},
  year         = {2005},
  url          = {http://www.aaai.org/Library/AAAI/2005/aaai05-162.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/SherstovS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SridharanS05,
  author       = {Sridharan, Mohan and
                  Stone, Peter},
  editor       = {Veloso, Manuela M. and
                  Kambhampati, Subbarao},
  title        = {Autonomous Color Learning on a Mobile Robot},
  booktitle    = {Proceedings, The Twentieth National Conference on Artificial Intelligence
                  and the Seventeenth Innovative Applications of Artificial Intelligence
                  Conference, July 9-13, 2005, Pittsburgh, Pennsylvania, {USA}},
  pages        = {1318--1323},
  publisher    = {{AAAI} Press / The {MIT} Press},
  year         = {2005},
  url          = {http://www.aaai.org/Library/AAAI/2005/aaai05-209.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/SridharanS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/TaylorS05,
  author       = {Taylor, Matthew E. and
                  Stone, Peter},
  editor       = {Dignum, Frank and
                  Dignum, Virginia and
                  Koenig, Sven and
                  Kraus, Sarit and
                  Singh, Munindar P. and
                  Wooldridge, Michael J.},
  title        = {Behavior transfer for value-function-based reinforcement learning},
  booktitle    = {4th International Joint Conference on Autonomous Agents and Multiagent
                  Systems ({AAMAS} 2005), July 25-29, 2005, Utrecht, The Netherlands},
  pages        = {53--59},
  publisher    = {{ACM}},
  year         = {2005},
  url          = {https://doi.org/10.1145/1082473.1082482},
  doi          = {10.1145/1082473.1082482},
  timestamp    = {Fri, 26 Apr 2019 14:26:42 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/TaylorS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/DresnerS05,
  author       = {Dresner, Kurt M. and
                  Stone, Peter},
  editor       = {Dignum, Frank and
                  Dignum, Virginia and
                  Koenig, Sven and
                  Kraus, Sarit and
                  Singh, Munindar P. and
                  Wooldridge, Michael J.},
  title        = {Multiagent traffic management: an improved intersection control mechanism},
  booktitle    = {4th International Joint Conference on Autonomous Agents and Multiagent
                  Systems ({AAMAS} 2005), July 25-29, 2005, Utrecht, The Netherlands},
  pages        = {471--477},
  publisher    = {{ACM}},
  year         = {2005},
  url          = {https://doi.org/10.1145/1082473.1082545},
  doi          = {10.1145/1082473.1082545},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/DresnerS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/WhitesonSSMK05,
  author       = {Whiteson, Shimon and
                  Stone, Peter and
                  Stanley, Kenneth O. and
                  Miikkulainen, Risto and
                  Kohl, Nate},
  editor       = {Beyer, Hans{-}Georg and
                  O'Reilly, Una{-}May},
  title        = {Automatic feature selection in neuroevolution},
  booktitle    = {Genetic and Evolutionary Computation Conference, {GECCO} 2005, Proceedings,
                  Washington DC, USA, June 25-29, 2005},
  pages        = {1225--1232},
  publisher    = {{ACM}},
  year         = {2005},
  url          = {https://doi.org/10.1145/1068009.1068210},
  doi          = {10.1145/1068009.1068210},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/gecco/WhitesonSSMK05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icac/WildstromSWMD05,
  author       = {Wildstrom, Jonathan and
                  Stone, Peter and
                  Witchel, Emmett and
                  Mooney, Raymond J. and
                  Dahlin, Michael},
  title        = {Towards Self-Configuring Hardware for Distributed Computer Systems},
  booktitle    = {Second International Conference on Autonomic Computing ({ICAC} 2005),
                  13-16 June 2005, Seattle, WA, {USA}},
  pages        = {241--249},
  publisher    = {{IEEE} Computer Society},
  year         = {2005},
  url          = {https://doi.org/10.1109/ICAC.2005.63},
  doi          = {10.1109/ICAC.2005.63},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icac/WildstromSWMD05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/SridharanKS05,
  author       = {Sridharan, Mohan and
                  Kuhlmann, Gregory and
                  Stone, Peter},
  title        = {Practical Vision-Based {Monte Carlo} Localization on a Legged Robot},
  booktitle    = {Proceedings of the 2005 {IEEE} International Conference on Robotics
                  and Automation, {ICRA} 2005, April 18-22, 2005, Barcelona, Spain},
  pages        = {3366--3371},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/ROBOT.2005.1570630},
  doi          = {10.1109/ROBOT.2005.1570630},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/SridharanKS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/StrongerS05,
  author       = {Stronger, Daniel and
                  Stone, Peter},
  title        = {Simultaneous Calibration of Action and Sensor Models on a Mobile Robot},
  booktitle    = {Proceedings of the 2005 {IEEE} International Conference on Robotics
                  and Automation, {ICRA} 2005, April 18-22, 2005, Barcelona, Spain},
  pages        = {4563--4568},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/ROBOT.2005.1570823},
  doi          = {10.1109/ROBOT.2005.1570823},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/StrongerS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/JongS05,
  author       = {Jong, Nicholas K. and
                  Stone, Peter},
  editor       = {Kaelbling, Leslie Pack and
                  Saffiotti, Alessandro},
  title        = {State Abstraction Discovery from Irrelevant State Variables},
  booktitle    = {IJCAI-05, Proceedings of the Nineteenth International Joint Conference
                  on Artificial Intelligence, Edinburgh, Scotland, UK, July 30 - August
                  5, 2005},
  pages        = {752--757},
  publisher    = {Professional Book Center},
  year         = {2005},
  url          = {http://ijcai.org/Proceedings/05/Papers/1655.pdf},
  timestamp    = {Tue, 20 Aug 2019 16:16:29 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/JongS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/SridharanS05,
  author       = {Sridharan, Mohan and
                  Stone, Peter},
  title        = {Real-time vision on a mobile robot platform},
  booktitle    = {2005 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, Edmonton, Alberta, Canada, August 2-6, 2005},
  pages        = {2148--2153},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/IROS.2005.1545540},
  doi          = {10.1109/IROS.2005.1545540},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/SridharanS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lamas/AhmadiS05,
  author       = {Ahmadi, Mazda and
                  Stone, Peter},
  editor       = {Tuyls, Karl and
                  't Hoen, Pieter Jan and
                  Verbeeck, Katja and
                  Sen, Sandip},
  title        = {Multi-robot Learning for Continuous Area Sweeping},
  booktitle    = {Learning and Adaption in Multi-Agent Systems, First International
                  Workshop, {LAMAS} 2005, Utrecht, The Netherlands, July 25, 2005, Revised
                  Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {3898},
  pages        = {47--70},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11691839\_2},
  doi          = {10.1007/11691839\_2},
  timestamp    = {Tue, 14 May 2019 10:00:47 +0200},
  biburl       = {https://dblp.org/rec/conf/lamas/AhmadiS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lamas/DresnerS05,
  author       = {Dresner, Kurt M. and
                  Stone, Peter},
  editor       = {Tuyls, Karl and
                  't Hoen, Pieter Jan and
                  Verbeeck, Katja and
                  Sen, Sandip},
  title        = {Multiagent Traffic Management: Opportunities for Multiagent Learning},
  booktitle    = {Learning and Adaption in Multi-Agent Systems, First International
                  Workshop, {LAMAS} 2005, Utrecht, The Netherlands, July 25, 2005, Revised
                  Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {3898},
  pages        = {129--138},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11691839\_7},
  doi          = {10.1007/11691839\_7},
  timestamp    = {Wed, 24 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/lamas/DresnerS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneKTL05,
  author       = {Stone, Peter and
                  Kuhlmann, Gregory and
                  Taylor, Matthew E. and
                  Liu, Yaxin},
  editor       = {Bredenfeld, Ansgar and
                  Jacoff, Adam and
                  Noda, Itsuki and
                  Takahashi, Yasutake},
  title        = {Keepaway Soccer: From Machine Learning Testbed to Benchmark},
  booktitle    = {RoboCup 2005: Robot Soccer World Cup {IX}},
  series       = {Lecture Notes in Computer Science},
  volume       = {4020},
  pages        = {93--105},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11780519\_9},
  doi          = {10.1007/11780519\_9},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneKTL05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/SridharanS05,
  author       = {Sridharan, Mohan and
                  Stone, Peter},
  editor       = {Bredenfeld, Ansgar and
                  Jacoff, Adam and
                  Noda, Itsuki and
                  Takahashi, Yasutake},
  title        = {Towards Eliminating Manual Color Calibration at {RoboCup}},
  booktitle    = {RoboCup 2005: Robot Soccer World Cup {IX}},
  series       = {Lecture Notes in Computer Science},
  volume       = {4020},
  pages        = {673--681},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/11780519\_68},
  doi          = {10.1007/11780519\_68},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/SridharanS05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sara/SherstovS05,
  author    = {Sherstov, Alexander A. and Stone, Peter},
  editor    = {Zucker, Jean{-}Daniel and Saitta, Lorenza},
  title     = {Function Approximation via Tile Coding: Automating Parameter Choice},
  booktitle = {Abstraction, Reformulation and Approximation, 6th International Symposium, {SARA} 2005,
               Airth Castle, Scotland, UK, July 26-29, 2005, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {3607},
  pages     = {194--205},
  publisher = {Springer},
  year      = {2005},
  doi       = {10.1007/11527862\_14},
  url       = {https://doi.org/10.1007/11527862\_14},
  timestamp = {Tue, 14 May 2019 10:00:38 +0200},
  biburl    = {https://dblp.org/rec/conf/sara/SherstovS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/eaai/WhitesonS04,
  author    = {Whiteson, Shimon and Stone, Peter},
  title     = {Adaptive job routing and scheduling},
  journal   = {Eng. Appl. Artif. Intell.},
  volume    = {17},
  number    = {7},
  pages     = {855--869},
  year      = {2004},
  doi       = {10.1016/J.ENGAPPAI.2004.08.027},
  url       = {https://doi.org/10.1016/j.engappai.2004.08.027},
  timestamp = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/eaai/WhitesonS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: {RoboCup} is brace-protected so sentence-casing styles keep its capitalization.
@article{DBLP:journals/jeric/SklarPS04,
  author    = {Sklar, Elizabeth and
               Parsons, Simon and
               Stone, Peter},
  title     = {Using {RoboCup} in university-level computer science education},
  journal   = {{ACM} J. Educ. Resour. Comput.},
  volume    = {4},
  number    = {2},
  pages     = {4},
  year      = {2004},
  doi       = {10.1145/1071620.1071624},
  url       = {https://doi.org/10.1145/1071620.1071624},
  timestamp = {Sun, 17 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jeric/SklarPS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: {TacTex-03} is brace-protected; otherwise sentence-casing styles print "Tactex-03".
@article{DBLP:journals/sigecom/PardoeS04,
  author    = {Pardoe, David and Stone, Peter},
  title     = {{TacTex-03}: a supply chain management agent},
  journal   = {SIGecom Exch.},
  volume    = {4},
  number    = {3},
  pages     = {19--28},
  year      = {2004},
  doi       = {10.1145/1120701.1120705},
  url       = {https://doi.org/10.1145/1120701.1120705},
  timestamp = {Thu, 04 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/sigecom/PardoeS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/KohlS04,
  author    = {Kohl, Nate and Stone, Peter},
  editor    = {McGuinness, Deborah L. and Ferguson, George},
  title     = {Machine Learning for Fast Quadrupedal Locomotion},
  booktitle = {Proceedings of the Nineteenth National Conference on Artificial Intelligence, Sixteenth
               Conference on Innovative Applications of Artificial Intelligence, July 25-29, 2004,
               San Jose, California, {USA}},
  pages     = {611--616},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2004},
  url       = {http://www.aaai.org/Library/AAAI/2004/aaai04-097.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/KohlS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/WhitesonS04,
  author    = {Whiteson, Shimon and Stone, Peter},
  editor    = {McGuinness, Deborah L. and Ferguson, George},
  title     = {Towards Autonomic Computing: Adaptive Job Routing and Scheduling},
  booktitle = {Proceedings of the Nineteenth National Conference on Artificial Intelligence, Sixteenth
               Conference on Innovative Applications of Artificial Intelligence, July 25-29, 2004,
               San Jose, California, {USA}},
  pages     = {916--922},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2004},
  timestamp = {Wed, 21 Jul 2004 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/WhitesonS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/amec/PardoeS04,
  author    = {Pardoe, David and Stone, Peter},
  editor    = {Faratin, Peyman and Rodr{\'{\i}}guez{-}Aguilar, Juan A.},
  title     = {Bidding for Customer Orders in {TAC} {SCM}},
  booktitle = {Agent-Mediated Electronic Commerce VI, Theories for and Engineering of Distributed
               Mechanisms and Systems, {AAMAS} 2004 Workshop, {AMEC} 2004, New York, NY, USA,
               July 19, 2004, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3435},
  pages     = {143--157},
  publisher = {Springer},
  year      = {2004},
  doi       = {10.1007/11575726\_11},
  url       = {https://doi.org/10.1007/11575726\_11},
  timestamp = {Tue, 14 May 2019 10:00:39 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/PardoeS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/amec/SherstovS04,
  author    = {Sherstov, Alexander A. and Stone, Peter},
  editor    = {Faratin, Peyman and Rodr{\'{\i}}guez{-}Aguilar, Juan A.},
  title     = {Three Automated Stock-Trading Agents: {A} Comparative Study},
  booktitle = {Agent-Mediated Electronic Commerce VI, Theories for and Engineering of Distributed
               Mechanisms and Systems, {AAMAS} 2004 Workshop, {AMEC} 2004, New York, NY, USA,
               July 19, 2004, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3435},
  pages     = {173--187},
  publisher = {Springer},
  year      = {2004},
  doi       = {10.1007/11575726\_13},
  url       = {https://doi.org/10.1007/11575726\_13},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/SherstovS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/DresnerS04,
  author    = {Dresner, Kurt M. and Stone, Peter},
  title     = {Multiagent Traffic Management: {A} Reservation-Based Intersection Control Mechanism},
  booktitle = {3rd International Joint Conference on Autonomous Agents and Multiagent Systems
               {(AAMAS} 2004), 19-23 August 2004, New York, NY, {USA}},
  pages     = {530--537},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  doi       = {10.1109/AAMAS.2004.10121},
  url       = {https://doi.ieeecomputersociety.org/10.1109/AAMAS.2004.10121},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/DresnerS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/PardoeS04,
  author    = {Pardoe, David and Stone, Peter},
  title     = {Agent-Based Supply Chain Management: Bidding for Customer Orders},
  booktitle = {3rd International Joint Conference on Autonomous Agents and Multiagent Systems
               {(AAMAS} 2004), 19-23 August 2004, New York, NY, {USA}},
  pages     = {1442--1443},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  doi       = {10.1109/AAMAS.2004.10276},
  url       = {https://doi.ieeecomputersociety.org/10.1109/AAMAS.2004.10276},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/PardoeS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/crv/SridharanS04,
  author    = {Sridharan, Mohan and Stone, Peter},
  title     = {Towards On-Board Color Constancy on Mobile Robots},
  booktitle = {1st Canadian Conference on Computer and Robot Vision {(CRV} 2004) 17-19 May 2004,
               London, Ontario, Canada},
  pages     = {130--137},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  doi       = {10.1109/CCCRV.2004.1301436},
  url       = {https://doi.org/10.1109/CCCRV.2004.1301436},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/crv/SridharanS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icac/WhitesonS04,
  author    = {Whiteson, Shimon and Stone, Peter},
  title     = {Towards Autonomic Computing: Adaptive Network Routing and Scheduling},
  booktitle = {1st International Conference on Autonomic Computing {(ICAC} 2004), 17-19 May 2004,
               New York, NY, {USA}},
  pages     = {286--287},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  doi       = {10.1109/ICAC.2004.62},
  url       = {https://doi.ieeecomputersociety.org/10.1109/ICAC.2004.62},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icac/WhitesonS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/KohlS04,
  author    = {Kohl, Nate and Stone, Peter},
  title     = {Policy Gradient Reinforcement Learning for Fast Quadrupedal Locomotion},
  booktitle = {Proceedings of the 2004 {IEEE} International Conference on Robotics and Automation,
               {ICRA} 2004, April 26 - May 1, 2004, New Orleans, LA, {USA}},
  pages     = {2619--2624},
  publisher = {{IEEE}},
  year      = {2004},
  doi       = {10.1109/ROBOT.2004.1307456},
  url       = {https://doi.org/10.1109/ROBOT.2004.1307456},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/KohlS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/isbi/WahleOVBBRCSMCFS04,
  author    = {Wahle, Andreas and
               Olszewski, Mark E. and
               Vigmostad, Sarah C. and
               Braddy, Kathleen and
               Brennan, Theresa and
               Rossen, James D. and
               Chandran, Krishnan B. and
               Sonka, Milan and
               Medina, Rub{\'{e}}n and
               Coskun, A. and
               Feldman, Charles and
               Stone, Peter},
  title     = {Quantitative Analysis of Circumferential Plaque Distribution in Human Coronary
               Arteries in Relation to Local Vessel Curvature},
  booktitle = {Proceedings of the 2004 {IEEE} International Symposium on Biomedical Imaging: From
               Nano to Macro, Arlington, VA, USA, 15-18 April 2004},
  pages     = {531--534},
  publisher = {{IEEE}},
  year      = {2004},
  doi       = {10.1109/ISBI.2004.1398592},
  url       = {https://doi.org/10.1109/ISBI.2004.1398592},
  timestamp = {Sat, 28 Oct 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/isbi/WahleOVBBRCSMCFS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/robocup/SridharanS04,
  author    = {Sridharan, Mohan and Stone, Peter},
  editor    = {Nardi, Daniele and
               Riedmiller, Martin A. and
               Sammut, Claude and
               Santos{-}Victor, Jos{\'{e}}},
  title     = {Towards Illumination Invariance in the Legged League},
  booktitle = {RoboCup 2004: Robot Soccer World Cup {VIII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3276},
  pages     = {196--208},
  publisher = {Springer},
  year      = {2004},
  doi       = {10.1007/978-3-540-32256-6\_16},
  url       = {https://doi.org/10.1007/978-3-540-32256-6\_16},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/SridharanS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/robocup/StrongerS04,
  author    = {Stronger, Daniel and Stone, Peter},
  editor    = {Nardi, Daniele and
               Riedmiller, Martin A. and
               Sammut, Claude and
               Santos{-}Victor, Jos{\'{e}}},
  title     = {A Model-Based Approach to Robot Joint Control},
  booktitle = {RoboCup 2004: Robot Soccer World Cup {VIII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3276},
  pages     = {297--309},
  publisher = {Springer},
  year      = {2004},
  doi       = {10.1007/978-3-540-32256-6\_24},
  url       = {https://doi.org/10.1007/978-3-540-32256-6\_24},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StrongerS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: the team name {UT} {Austin} {Villa} is brace-protected; previously only {UT} was,
% so sentence-casing styles printed "austin villa".
@inproceedings{DBLP:conf/robocup/KuhlmannSL04,
  author    = {Kuhlmann, Gregory and
               Stone, Peter and
               Lallinger, Justin},
  editor    = {Nardi, Daniele and
               Riedmiller, Martin A. and
               Sammut, Claude and
               Santos{-}Victor, Jos{\'{e}}},
  title     = {The {UT} {Austin} {Villa} 2003 Champion Simulator Coach: {A} Machine Learning
               Approach},
  booktitle = {RoboCup 2004: Robot Soccer World Cup {VIII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3276},
  pages     = {636--644},
  publisher = {Springer},
  year      = {2004},
  doi       = {10.1007/978-3-540-32256-6\_61},
  url       = {https://doi.org/10.1007/978-3-540-32256-6\_61},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/KuhlmannSL04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: {RoboCup} and {CMUnited} are brace-protected so sentence-casing styles keep their
% internal capitals.
@article{DBLP:journals/aamas/NodaS03,
  author    = {Noda, Itsuki and Stone, Peter},
  title     = {The {RoboCup} Soccer Server and {CMUnited} Clients: Implemented Infrastructure
               for {MAS} Research},
  journal   = {Auton. Agents Multi Agent Syst.},
  volume    = {7},
  number    = {1-2},
  pages     = {101--120},
  year      = {2003},
  doi       = {10.1023/A:1024128904944},
  url       = {https://doi.org/10.1023/A:1024128904944},
  timestamp = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/aamas/NodaS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/electronicmarkets/WellmanGSW03,
  author    = {Wellman, Michael P. and
               Greenwald, Amy and
               Stone, Peter and
               Wurman, Peter R.},
  title     = {The 2001 Trading Agent Competition},
  journal   = {Electron. Mark.},
  volume    = {13},
  number    = {1},
  pages     = {4--12},
  year      = {2003},
  doi       = {10.1080/1019678032000062212},
  url       = {https://doi.org/10.1080/1019678032000062212},
  timestamp = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/electronicmarkets/WellmanGSW03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/expert/GreenwaldJS03,
  author    = {Greenwald, Amy and
               Jennings, Nicholas R. and
               Stone, Peter},
  title     = {Guest Editors' Introduction: Agents and Markets},
  journal   = {{IEEE} Intell. Syst.},
  volume    = {18},
  number    = {6},
  pages     = {12--14},
  year      = {2003},
  doi       = {10.1109/MIS.2003.1249164},
  url       = {https://doi.org/10.1109/MIS.2003.1249164},
  timestamp = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/expert/GreenwaldJS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jair/StoneSLCM03,
  author    = {Stone, Peter and
               Schapire, Robert E. and
               Littman, Michael L. and
               Csirik, J{\'{a}}nos A. and
               McAllester, David A.},
  title     = {Decision-Theoretic Bidding Based on Learned Density Models in Simultaneous, Interacting
               Auctions},
  journal   = {J. Artif. Intell. Res.},
  volume    = {19},
  pages     = {209--242},
  year      = {2003},
  doi       = {10.1613/JAIR.1200},
  url       = {https://doi.org/10.1613/jair.1200},
  timestamp = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jair/StoneSLCM03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ACMicec/YuS03,
  author    = {Yu, Ronggang and Stone, Peter},
  editor    = {Sadeh, Norman M. and
               Dively, Mary Jo and
               Kauffman, Robert J. and
               Labrou, Yannis and
               Shehory, Onn and
               Telang, Rahul and
               Cranor, Lorrie Faith},
  title     = {Performance analysis of a counter-intuitive automated stock-trading agent},
  booktitle = {Proceedings of the 5th International Conference on Electronic Commerce, {ICEC} 2003,
               Pittsburgh, Pennsylvania, USA, September 30 - October 03, 2003},
  series    = {{ACM} International Conference Proceeding Series},
  volume    = {50},
  pages     = {40--46},
  publisher = {{ACM}},
  year      = {2003},
  doi       = {10.1145/948005.948011},
  url       = {https://doi.org/10.1145/948005.948011},
  timestamp = {Tue, 06 Apr 2021 12:12:56 +0200},
  biburl    = {https://dblp.org/rec/conf/ACMicec/YuS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/amec/FengYS03,
  author    = {Feng, Y. and
               Yu, Rong and
               Stone, Peter},
  editor    = {Faratin, Peyman and
               Parkes, David C. and
               Rodr{\'{\i}}guez{-}Aguilar, Juan A. and
               Walsh, William E.},
  title     = {Two Stock-Trading Agents: Market Making and Technical Analysis},
  booktitle = {Agent-Mediated Electronic Commerce V, Designing Mechanisms and Systems, {AAMAS} 2003
               Workshop, {AMEC} 2003, Melbourne, Australia, July 15, 2003, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3048},
  pages     = {18--36},
  publisher = {Springer},
  year      = {2003},
  doi       = {10.1007/978-3-540-25947-3\_2},
  url       = {https://doi.org/10.1007/978-3-540-25947-3\_2},
  timestamp = {Sat, 14 Sep 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/FengYS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/WhitesonS03,
  author    = {Whiteson, Shimon and Stone, Peter},
  title     = {Concurrent layered learning},
  booktitle = {The Second International Joint Conference on Autonomous Agents {\&} Multiagent Systems,
               {AAMAS} 2003, July 14-18, 2003, Melbourne, Victoria, Australia, Proceedings},
  pages     = {193--200},
  publisher = {{ACM}},
  year      = {2003},
  doi       = {10.1145/860575.860607},
  url       = {https://doi.org/10.1145/860575.860607},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/WhitesonS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/gecco/WhitesonKMS03,
  author    = {Whiteson, Shimon and
               Kohl, Nate and
               Miikkulainen, Risto and
               Stone, Peter},
  editor    = {Cant{\'{u}}{-}Paz, Erick and
               Foster, James A. and
               Deb, Kalyanmoy and
               Davis, Lawrence and
               Roy, Rajkumar and
               O'Reilly, Una{-}May and
               Beyer, Hans{-}Georg and
               Standish, Russell K. and
               Kendall, Graham and
               Wilson, Stewart W. and
               Harman, Mark and
               Wegener, Joachim and
               Dasgupta, Dipankar and
               Potter, Mitchell A. and
               Schultz, Alan C. and
               Dowsland, Kathryn A. and
               Jonoska, Natasa and
               Miller, Julian F.},
  title     = {Evolving Keepaway Soccer Players through Task Decomposition},
  booktitle = {Genetic and Evolutionary Computation - {GECCO} 2003, Genetic and Evolutionary Computation
               Conference, Chicago, IL, USA, July 12-16, 2003. Proceedings, Part {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2723},
  pages     = {356--368},
  publisher = {Springer},
  year      = {2003},
  doi       = {10.1007/3-540-45105-6\_41},
  url       = {https://doi.org/10.1007/3-540-45105-6\_41},
  timestamp = {Tue, 14 May 2019 10:00:35 +0200},
  biburl    = {https://dblp.org/rec/conf/gecco/WhitesonKMS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/SinghLJPS03,
  author    = {Singh, Satinder and
               Littman, Michael L. and
               Jong, Nicholas K. and
               Pardoe, David and
               Stone, Peter},
  editor    = {Fawcett, Tom and Mishra, Nina},
  title     = {Learning Predictive State Representations},
  booktitle = {Machine Learning, Proceedings of the Twentieth International Conference {(ICML} 2003),
               August 21-24, 2003, Washington, DC, {USA}},
  pages     = {712--719},
  publisher = {{AAAI} Press},
  year      = {2003},
  url       = {http://www.aaai.org/Library/ICML/2003/icml03-093.php},
  timestamp = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/SinghLJPS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: {RoboCup} is brace-protected; otherwise sentence-casing styles print "Robocup".
@inproceedings{DBLP:conf/robocup/Stone03,
  author    = {Stone, Peter},
  editor    = {Polani, Daniel and
               Browning, Brett and
               Bonarini, Andrea and
               Yoshida, Kazuo},
  title     = {{RoboCup} as an Introduction to {CS} Research},
  booktitle = {RoboCup 2003: Robot Soccer World Cup {VII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3020},
  pages     = {284--295},
  publisher = {Springer},
  year      = {2003},
  doi       = {10.1007/978-3-540-25940-4\_25},
  url       = {https://doi.org/10.1007/978-3-540-25940-4\_25},
  timestamp = {Tue, 14 May 2019 10:00:53 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/Stone03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: {RoboCup} is brace-protected; otherwise sentence-casing styles print "Robocup".
@inproceedings{DBLP:conf/robocup/SklarPS03,
  author    = {Sklar, Elizabeth and
               Parsons, Simon and
               Stone, Peter},
  editor    = {Polani, Daniel and
               Browning, Brett and
               Bonarini, Andrea and
               Yoshida, Kazuo},
  title     = {{RoboCup} in Higher Education: {A} Preliminary Report},
  booktitle = {RoboCup 2003: Robot Soccer World Cup {VII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3020},
  pages     = {296--307},
  publisher = {Springer},
  year      = {2003},
  doi       = {10.1007/978-3-540-25940-4\_26},
  url       = {https://doi.org/10.1007/978-3-540-25940-4\_26},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/SklarPS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/robocup/KuhlmannS03,
  author    = {Kuhlmann, Gregory and Stone, Peter},
  editor    = {Polani, Daniel and
               Browning, Brett and
               Bonarini, Andrea and
               Yoshida, Kazuo},
  title     = {Progress in Learning 3 vs. 2 Keepaway},
  booktitle = {RoboCup 2003: Robot Soccer World Cup {VII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3020},
  pages     = {694--702},
  publisher = {Springer},
  year      = {2003},
  doi       = {10.1007/978-3-540-25940-4\_68},
  url       = {https://doi.org/10.1007/978-3-540-25940-4\_68},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/KuhlmannS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: "nash" corrected to the proper noun {Nash}, brace-protected against sentence casing.
@inproceedings{DBLP:conf/sigecom/LittmanS03,
  author    = {Littman, Michael L. and Stone, Peter},
  editor    = {Menasc{\'{e}}, Daniel A. and Nisan, Noam},
  title     = {A polynomial-time {Nash} equilibrium algorithm for repeated games},
  booktitle = {Proceedings 4th {ACM} Conference on Electronic Commerce (EC-2003), San Diego,
               California, USA, June 9-12, 2003},
  pages     = {48--54},
  publisher = {{ACM}},
  year      = {2003},
  doi       = {10.1145/779928.779935},
  url       = {https://doi.org/10.1145/779928.779935},
  timestamp = {Tue, 27 Nov 2018 11:56:48 +0100},
  biburl    = {https://dblp.org/rec/conf/sigecom/LittmanS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/smc/KuhlmannS03,
  author    = {Kuhlmann, Gregory and Stone, Peter},
  title     = {Progress in learning 3 vs. 2 keepaway},
  booktitle = {Proceedings of the {IEEE} International Conference on Systems, Man {\&} Cybernetics:
               Washington, D.C., USA, 5-8 October 2003},
  pages     = {52--59},
  publisher = {{IEEE}},
  year      = {2003},
  doi       = {10.1109/ICSMC.2003.1243791},
  url       = {https://doi.org/10.1109/ICSMC.2003.1243791},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/smc/KuhlmannS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: {RoboCup-2001} is brace-protected; otherwise sentence-casing styles print "Robocup-2001".
@article{DBLP:journals/aim/VelosoBSKYEAJSMKCHHC02,
  author    = {Veloso, Manuela M. and
               Balch, Tucker R. and
               Stone, Peter and
               Kitano, Hiroaki and
               Yamasaki, Fuminori and
               Endo, Ken and
               Asada, Minoru and
               Jamzad, Mansour and
               Sadjad, Sayyed Bashir and
               Mirrokni, Vahab S. and
               Kazemi, Moslem and
               Chitsaz, Hamid Reza and
               Heydarnoori, Abbas and
               Hajiaghayi, Mohammad Taghi and
               Chiniforooshan, Ehsan},
  title     = {{RoboCup-2001}: The Fifth Robotic Soccer World Championships},
  journal   = {{AI} Mag.},
  volume    = {23},
  number    = {1},
  pages     = {55--68},
  year      = {2002},
  doi       = {10.1609/AIMAG.V23I1.1609},
  url       = {https://doi.org/10.1609/aimag.v23i1.1609},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/VelosoBSKYEAJSMKCHHC02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/aim/KarlgrenKGFTSGSBFSHCBGSDL02,
  author    = {Karlgren, Jussi and
               Kanerva, Pentti and
               Gamb{\"{a}}ck, Bj{\"{o}}rn and
               Forbus, Kenneth D. and
               Tumer, Kagan and
               Stone, Peter and
               Goebel, Kai and
               Sukhatme, Gaurav S. and
               Balch, Tucker R. and
               Fischer, Bernd and
               Smith, Doug and
               Harabagiu, Sanda M. and
               Chaudri, Vinay K. and
               Barley, Mike and
               Guesgen, Hans W. and
               Stahovich, Thomas F. and
               Davis, Randall and
               Landay, James A.},
  title     = {The 2002 {AAAI} Spring Symposium Series},
  journal   = {{AI} Mag.},
  volume    = {23},
  number    = {4},
  pages     = {101--106},
  year      = {2002},
  doi       = {10.1609/AIMAG.V23I4.1675},
  url       = {https://doi.org/10.1609/aimag.v23i4.1675},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/KarlgrenKGFTSGSBFSHCBGSDL02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/WellmanGSW02,
  author    = {Wellman, Michael P. and
               Greenwald, Amy and
               Stone, Peter and
               Wurman, Peter R.},
  editor    = {Dechter, Rina and
               Kearns, Michael J. and
               Sutton, Richard S.},
  title     = {The 2001 Trading Agent Competition},
  booktitle = {Proceedings of the Eighteenth National Conference on Artificial Intelligence and
               Fourteenth Conference on Innovative Applications of Artificial Intelligence,
               July 28 - August 1, 2002, Edmonton, Alberta, Canada},
  pages     = {935--942},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2002},
  url       = {http://www.aaai.org/Library/AAAI/2002/aaai02-138.php},
  timestamp = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/WellmanGSW02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Title: {ATTac-2001} is brace-protected; otherwise sentence-casing styles print "Attac-2001".
@inproceedings{DBLP:conf/amec/StoneSCLM02,
  author    = {Stone, Peter and
               Schapire, Robert E. and
               Csirik, J{\'{a}}nos A. and
               Littman, Michael L. and
               McAllester, David A.},
  editor    = {Padget, Julian A. and
               Shehory, Onn and
               Parkes, David C. and
               Sadeh, Norman M. and
               Walsh, William E.},
  title     = {{ATTac-2001}: {A} Learning, Autonomous Bidding Agent},
  booktitle = {Agent-Mediated Electronic Commerce IV, Designing Mechanisms and Systems, {AAMAS} 2002
               Workshop on Agent Mediated Electronic Commerce, Bologna, Italy, July 16, 2002,
               Revised Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {2531},
  pages     = {143--160},
  publisher = {Springer},
  year      = {2002},
  doi       = {10.1007/3-540-36378-5\_9},
  url       = {https://doi.org/10.1007/3-540-36378-5\_9},
  timestamp = {Tue, 14 May 2019 10:00:39 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/StoneSCLM02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/amec/ReitsmaSCL02,
  author    = {Reitsma, Paul S. A. and
               Stone, Peter and
               Csirik, J{\'{a}}nos A. and
               Littman, Michael L.},
  editor    = {Padget, Julian A. and
               Shehory, Onn and
               Parkes, David C. and
               Sadeh, Norman M. and
               Walsh, William E.},
  title     = {Self-Enforcing Strategic Demand Reduction},
  booktitle = {Agent-Mediated Electronic Commerce IV, Designing Mechanisms and Systems, {AAMAS} 2002
               Workshop on Agent Mediated Electronic Commerce, Bologna, Italy, July 16, 2002,
               Revised Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {2531},
  pages     = {289--306},
  publisher = {Springer},
  year      = {2002},
  doi       = {10.1007/3-540-36378-5\_18},
  url       = {https://doi.org/10.1007/3-540-36378-5\_18},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/ReitsmaSCL02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/ReitsmaSCL02,
  author       = {Paul S. A. Reitsma and
                  Peter Stone and
                  J{\'{a}}nos A. Csirik and
                  Michael L. Littman},
  title        = {Randomized strategic demand reduction: getting more by asking for
                  less},
  booktitle    = {The First International Joint Conference on Autonomous Agents {\&}
                  Multiagent Systems, {AAMAS} 2002, July 15-19, 2002, Bologna, Italy,
                  Proceedings},
  pages        = {162--163},
  publisher    = {{ACM}},
  year         = {2002},
  url          = {https://doi.org/10.1145/544741.544778},
  doi          = {10.1145/544741.544778},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/ReitsmaSCL02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/SchapireSMLC02,
  author       = {Robert E. Schapire and
                  Peter Stone and
                  David A. McAllester and
                  Michael L. Littman and
                  J{\'{a}}nos A. Csirik},
  editor       = {Claude Sammut and
                  Achim G. Hoffmann},
  title        = {Modeling Auction Price Uncertainty Using Boosting-based Conditional
                  Density Estimation},
  booktitle    = {Machine Learning, Proceedings of the Nineteenth International Conference
                  {(ICML} 2002), University of New South Wales, Sydney, Australia, July
                  8-12, 2002},
  pages        = {546--553},
  publisher    = {Morgan Kaufmann},
  year         = {2002},
  timestamp    = {Tue, 16 Mar 2004 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/SchapireSMLC02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/Stone02,
  author       = {Peter Stone},
  editor       = {Gal A. Kaminka and
                  Pedro U. Lima and
                  Ra{\'{u}}l Rojas},
  title        = {Multiagent Competitions and Research: Lessons from {RoboCup} and {TAC}},
  booktitle    = {RoboCup 2002: Robot Soccer World Cup {VI}},
  series       = {Lecture Notes in Computer Science},
  volume       = {2752},
  pages        = {224--237},
  publisher    = {Springer},
  year         = {2002},
  url          = {https://doi.org/10.1007/978-3-540-45135-8\_17},
  doi          = {10.1007/978-3-540-45135-8\_17},
  timestamp    = {Mon, 23 Nov 2020 14:36:01 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/Stone02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/Stone01,
  author       = {Peter Stone},
  title        = {{RoboCup-2000}: The Fourth Robotic Soccer World Championships},
  journal      = {{AI} Mag.},
  volume       = {22},
  number       = {1},
  pages        = {11--38},
  year         = {2001},
  url          = {https://doi.org/10.1609/aimag.v22i1.1541},
  doi          = {10.1609/AIMAG.V22I1.1541},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/Stone01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/internet/GreenwaldS01,
  author       = {Amy Greenwald and
                  Peter Stone},
  title        = {Autonomous Bidding Agents in the Trading Agent Competition},
  journal      = {{IEEE} Internet Comput.},
  volume       = {5},
  number       = {2},
  pages        = {52--60},
  year         = {2001},
  url          = {https://doi.org/10.1109/4236.914648},
  doi          = {10.1109/4236.914648},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/internet/GreenwaldS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/StoneLSK01,
  author       = {Peter Stone and
                  Michael L. Littman and
                  Satinder Singh and
                  Michael J. Kearns},
  title        = {{ATTac-2000}: An Adaptive Autonomous Bidding Agent},
  journal      = {J. Artif. Intell. Res.},
  volume       = {15},
  pages        = {189--206},
  year         = {2001},
  url          = {https://doi.org/10.1613/jair.865},
  doi          = {10.1613/JAIR.865},
  timestamp    = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jair/StoneLSK01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agents/StoneLSK01,
  author       = {Peter Stone and
                  Michael L. Littman and
                  Satinder Singh and
                  Michael J. Kearns},
  editor       = {Elisabeth Andr{\'{e}} and
                  Sandip Sen and
                  Claude Frasson and
                  J{\"{o}}rg P. M{\"{u}}ller},
  title        = {{ATTac-2000}: an adaptive autonomous bidding agent},
  booktitle    = {Proceedings of the Fifth International Conference on Autonomous Agents,
                  {AGENTS} 2001, Montreal, Canada, May 28 - June 1, 2001},
  pages        = {238--245},
  publisher    = {{ACM}},
  year         = {2001},
  url          = {https://doi.org/10.1145/375735.376301},
  doi          = {10.1145/375735.376301},
  timestamp    = {Sat, 30 Sep 2023 09:33:47 +0200},
  biburl       = {https://dblp.org/rec/conf/agents/StoneLSK01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agents/StoneM01,
  author       = {Peter Stone and
                  David A. McAllester},
  editor       = {Elisabeth Andr{\'{e}} and
                  Sandip Sen and
                  Claude Frasson and
                  J{\"{o}}rg P. M{\"{u}}ller},
  title        = {An architecture for action selection in robotic soccer},
  booktitle    = {Proceedings of the Fifth International Conference on Autonomous Agents,
                  {AGENTS} 2001, Montreal, Canada, May 28 - June 1, 2001},
  pages        = {316--323},
  publisher    = {{ACM}},
  year         = {2001},
  url          = {https://doi.org/10.1145/375735.376320},
  doi          = {10.1145/375735.376320},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/agents/StoneM01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agents/IsbellSKSS01,
  author       = {Isbell, Jr., Charles Lee and
                  Christian R. Shelton and
                  Michael J. Kearns and
                  Satinder Singh and
                  Peter Stone},
  editor       = {Elisabeth Andr{\'{e}} and
                  Sandip Sen and
                  Claude Frasson and
                  J{\"{o}}rg P. M{\"{u}}ller},
  title        = {A social reinforcement learning agent},
  booktitle    = {Proceedings of the Fifth International Conference on Autonomous Agents,
                  {AGENTS} 2001, Montreal, Canada, May 28 - June 1, 2001},
  pages        = {377--384},
  publisher    = {{ACM}},
  year         = {2001},
  url          = {https://doi.org/10.1145/375735.376334},
  doi          = {10.1145/375735.376334},
  timestamp    = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/agents/IsbellSKSS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/LittmanS01,
  author       = {Michael L. Littman and
                  Peter Stone},
  editor       = {John{-}Jules Ch. Meyer and
                  Milind Tambe},
  title        = {Implicit Negotiation in Repeated Games},
  booktitle    = {Intelligent Agents VIII, 8th International Workshop, {ATAL} 2001 Seattle,
                  WA, USA, August 1-3, 2001, Revised Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {2333},
  pages        = {393--404},
  publisher    = {Springer},
  year         = {2001},
  url          = {https://doi.org/10.1007/3-540-45448-9\_29},
  doi          = {10.1007/3-540-45448-9\_29},
  timestamp    = {Tue, 14 May 2019 10:00:54 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/LittmanS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/StoneS01,
  author       = {Peter Stone and
                  Richard S. Sutton},
  editor       = {Carla E. Brodley and
                  Andrea Pohoreckyj Danyluk},
  title        = {Scaling Reinforcement Learning toward {RoboCup} Soccer},
  booktitle    = {Proceedings of the Eighteenth International Conference on Machine
                  Learning {(ICML} 2001), Williams College, Williamstown, MA, USA, June
                  28 - July 1, 2001},
  pages        = {537--544},
  publisher    = {Morgan Kaufmann},
  year         = {2001},
  timestamp    = {Wed, 27 Nov 2002 10:53:35 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/StoneS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/IsbellSKSS01,
  author       = {Isbell, Jr., Charles Lee and
                  Christian R. Shelton and
                  Michael J. Kearns and
                  Satinder Singh and
                  Peter Stone},
  editor       = {Thomas G. Dietterich and
                  Suzanna Becker and
                  Zoubin Ghahramani},
  title        = {Cobot: {A} Social Reinforcement Learning Agent},
  booktitle    = {Advances in Neural Information Processing Systems 14 [Neural Information
                  Processing Systems: Natural and Synthetic, {NIPS} 2001, December 3-8,
                  2001, Vancouver, British Columbia, Canada]},
  pages        = {1393--1400},
  publisher    = {{MIT} Press},
  year         = {2001},
  url          = {https://proceedings.neurips.cc/paper/2001/hash/92bbd31f8e0e43a7da8a6295b251725f-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/IsbellSKSS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneS01,
  author       = {Peter Stone and
                  Richard S. Sutton},
  editor       = {Andreas Birk and
                  Silvia Coradeschi and
                  Satoshi Tadokoro},
  title        = {Keepaway Soccer: {A} Machine Learning Testbed},
  booktitle    = {RoboCup 2001: Robot Soccer World Cup {V}},
  series       = {Lecture Notes in Computer Science},
  volume       = {2377},
  pages        = {214--223},
  publisher    = {Springer},
  year         = {2001},
  url          = {https://doi.org/10.1007/3-540-45603-1\_22},
  doi          = {10.1007/3-540-45603-1\_22},
  timestamp    = {Tue, 14 May 2019 10:00:53 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/Stone01,
  author       = {Peter Stone},
  editor       = {Andreas Birk and
                  Silvia Coradeschi and
                  Satoshi Tadokoro},
  title        = {{ATTUnited-2001}: Using Heterogeneous Players},
  booktitle    = {RoboCup 2001: Robot Soccer World Cup {V}},
  series       = {Lecture Notes in Computer Science},
  volume       = {2377},
  pages        = {495--498},
  publisher    = {Springer},
  year         = {2001},
  url          = {https://doi.org/10.1007/3-540-45603-1\_67},
  doi          = {10.1007/3-540-45603-1\_67},
  timestamp    = {Fri, 26 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/Stone01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/welcom/CsirikLSS01,
  author       = {J{\'{a}}nos A. Csirik and
                  Michael L. Littman and
                  Satinder Singh and
                  Peter Stone},
  editor       = {Ludger Fiege and
                  Gero M{\"{u}}hl and
                  Uwe G. Wilhelm},
  title        = {{FAucS}: An {FCC} Spectrum Auction Simulator for Autonomous Bidding
                  Agents},
  booktitle    = {Electronic Commerce, Second International Workshop, {WELCOM} 2001
                  Heidelberg, Germany, November 16-17, 2001, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {2232},
  pages        = {139--151},
  publisher    = {Springer},
  year         = {2001},
  url          = {https://doi.org/10.1007/3-540-45598-1\_14},
  doi          = {10.1007/3-540-45598-1\_14},
  timestamp    = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/welcom/CsirikLSS01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/robocup/2000,
  editor       = {Peter Stone and
                  Tucker R. Balch and
                  Gerhard K. Kraetzschmar},
  title        = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series       = {Lecture Notes in Computer Science},
  volume       = {2019},
  publisher    = {Springer},
  year         = {2001},
  url          = {https://doi.org/10.1007/3-540-45324-5},
  doi          = {10.1007/3-540-45324-5},
  isbn         = {3-540-42185-8},
  timestamp    = {Tue, 14 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/2000.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@book{DBLP:books/daglib/0015985,
  author       = {Peter Stone},
  title        = {Layered learning in multiagent systems - a winning approach to robotic
                  soccer},
  series       = {Intelligent robotics and autonomous agents},
  publisher    = {{MIT} Press},
  year         = {2000},
  isbn         = {978-0-262-19438-9},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/daglib/0015985.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/StoneVR00,
  author       = {Peter Stone and
                  Manuela M. Veloso and
                  Patrick Riley},
  title        = {{CMUNITED-98} Simulator Team},
  journal      = {{AI} Mag.},
  volume       = {21},
  number       = {1},
  pages        = {20--28},
  year         = {2000},
  url          = {https://doi.org/10.1609/aimag.v21i1.1491},
  doi          = {10.1609/AIMAG.V21I1.1491},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/StoneVR00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/VelosoBAHS00,
  author       = {Manuela M. Veloso and
                  Michael H. Bowling and
                  Sorin Achim and
                  Kwun Han and
                  Peter Stone},
  title        = {{CMUNITED-98:} {RoboCup-98} Small-Robot World Champion Team},
  journal      = {{AI} Mag.},
  volume       = {21},
  number       = {1},
  pages        = {29--36},
  year         = {2000},
  url          = {https://doi.org/10.1609/aimag.v21i1.1492},
  doi          = {10.1609/AIMAG.V21I1.1492},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/VelosoBAHS00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/CoradeschiKSBKA00,
  author       = {Silvia Coradeschi and
                  Lars Karlsson and
                  Peter Stone and
                  Tucker R. Balch and
                  Gerhard K. Kraetzschmar and
                  Minoru Asada},
  title        = {Overview of {RoboCup-99}},
  journal      = {{AI} Mag.},
  volume       = {21},
  number       = {3},
  pages        = {11--18},
  year         = {2000},
  url          = {https://doi.org/10.1609/aimag.v21i3.1516},
  doi          = {10.1609/AIMAG.V21I3.1516},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/CoradeschiKSBKA00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/StoneRV00,
  author       = {Peter Stone and
                  Patrick Riley and
                  Manuela M. Veloso},
  title        = {The {CMUnited-99} Champion Simulator Team},
  journal      = {{AI} Mag.},
  volume       = {21},
  number       = {3},
  pages        = {33--40},
  year         = {2000},
  url          = {https://doi.org/10.1609/aimag.v21i3.1520},
  doi          = {10.1609/AIMAG.V21I3.1520},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/StoneRV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/arobots/StoneV00,
  author       = {Peter Stone and
                  Manuela M. Veloso},
  title        = {Multiagent Systems: {A} Survey from a Machine Learning Perspective},
  journal      = {Auton. Robots},
  volume       = {8},
  number       = {3},
  pages        = {345--383},
  year         = {2000},
  url          = {https://doi.org/10.1023/A:1008942012299},
  doi          = {10.1023/A:1008942012299},
  timestamp    = {Thu, 18 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/arobots/StoneV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/IsbellKKSS00,
  author       = {Isbell, Jr., Charles Lee and
                  Michael J. Kearns and
                  David P. Kormann and
                  Satinder Singh and
                  Peter Stone},
  editor       = {Henry A. Kautz and
                  Bruce W. Porter},
  title        = {Cobot in {LambdaMOO}: {A} Social Statistics Agent},
  booktitle    = {Proceedings of the Seventeenth National Conference on Artificial Intelligence
                  and Twelfth Conference on Innovative Applications of Artificial
                  Intelligence, July 30 - August 3, 2000, Austin, Texas, {USA}},
  pages        = {36--41},
  publisher    = {{AAAI} Press / The {MIT} Press},
  year         = {2000},
  url          = {http://www.aaai.org/Library/AAAI/2000/aaai00-006.php},
  timestamp    = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/IsbellKKSS00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/StoneRV00,
  author       = {Peter Stone and
                  Patrick Riley and
                  Manuela M. Veloso},
  editor       = {Henry A. Kautz and
                  Bruce W. Porter},
  title        = {Defining and Using Ideal Teammate and Opponent Agent Models},
  booktitle    = {Proceedings of the Seventeenth National Conference on Artificial Intelligence
                  and Twelfth Conference on Innovative Applications of Artificial
                  Intelligence, July 30 - August 3, 2000, Austin, Texas, {USA}},
  pages        = {1040--1045},
  publisher    = {{AAAI} Press / The {MIT} Press},
  year         = {2000},
  url          = {http://www.aaai.org/Library/IAAI/2000/iaai00-016.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/StoneRV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agents/NodaS00,
  author       = {Itsuki Noda and
                  Peter Stone},
  editor       = {Thomas Wagner and
                  Omer F. Rana},
  title        = {The {RoboCup} Soccer Server and {CMUnited}: Implemented Infrastructure
                  for {MAS} Research},
  booktitle    = {Infrastructure for Agents, Multi-Agent Systems, and Scalable Multi-Agent
                  Systems, International Workshop on Infrastructure for Multi-Agent
                  Systems, Barcelona, Spain, June 3-7, 2000, Revised Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {1887},
  pages        = {94--101},
  publisher    = {Springer},
  year         = {2000},
  url          = {https://doi.org/10.1007/3-540-47772-1\_10},
  doi          = {10.1007/3-540-47772-1\_10},
  timestamp    = {Tue, 14 May 2019 10:00:38 +0200},
  biburl       = {https://dblp.org/rec/conf/agents/NodaS00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agents/StoneRV00,
  author       = {Peter Stone and
                  Patrick Riley and
                  Manuela M. Veloso},
  editor       = {Carles Sierra and
                  Maria L. Gini and
                  Jeffrey S. Rosenschein},
  title        = {Layered disclosure: why is the agent doing what it's doing?},
  booktitle    = {Proceedings of the Fourth International Conference on Autonomous Agents,
                  {AGENTS} 2000, Barcelona, Catalonia, Spain, June 3-7, 2000},
  pages        = {225--226},
  publisher    = {{ACM}},
  year         = {2000},
  url          = {https://doi.org/10.1145/336595.337387},
  doi          = {10.1145/336595.337387},
  timestamp    = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/agents/StoneRV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/RileySV00,
  author       = {Patrick Riley and
                  Peter Stone and
                  Manuela M. Veloso},
  editor       = {Cristiano Castelfranchi and
                  Yves Lesp{\'{e}}rance},
  title        = {Layered Disclosure: Revealing Agents' Internals},
  booktitle    = {Intelligent Agents {VII.} Agent Theories Architectures and Languages,
                  7th International Workshop, {ATAL} 2000, Boston, MA, USA, July 7-9,
                  2000, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {1986},
  pages        = {61--72},
  publisher    = {Springer},
  year         = {2000},
  url          = {https://doi.org/10.1007/3-540-44631-1\_5},
  doi          = {10.1007/3-540-44631-1\_5},
  timestamp    = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/RileySV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ecml/StoneV00,
  author       = {Peter Stone and
                  Manuela M. Veloso},
  editor       = {{L{\'{o}}pez de M{\'{a}}ntaras}, Ram{\'{o}}n and
                  Enric Plaza},
  title        = {Layered Learning},
  booktitle    = {Machine Learning: {ECML} 2000, 11th European Conference on Machine
                  Learning, Barcelona, Catalonia, Spain, May 31 - June 2, 2000, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {1810},
  pages        = {369--381},
  publisher    = {Springer},
  year         = {2000},
  url          = {https://doi.org/10.1007/3-540-45164-1\_38},
  doi          = {10.1007/3-540-45164-1\_38},
  timestamp    = {Tue, 14 May 2019 10:00:54 +0200},
  biburl       = {https://dblp.org/rec/conf/ecml/StoneV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icmas/StoneRV00,
  author       = {Peter Stone and
                  Patrick Riley and
                  Manuela M. Veloso},
  title        = {Defining and Using Ideal Teammate and Opponent Agent Models: {A} Case
                  Study in Robotic Soccer},
  booktitle    = {4th International Conference on Multi-Agent Systems, {ICMAS} 2000,
                  Boston, MA, USA, July 10-12, 2000},
  pages        = {441--442},
  publisher    = {{IEEE} Computer Society},
  year         = {2000},
  url          = {https://doi.org/10.1109/ICMAS.2000.858515},
  doi          = {10.1109/ICMAS.2000.858515},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icmas/StoneRV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/Stone00,
  author       = {Peter Stone},
  editor       = {Pat Langley},
  title        = {{TPOT-RL} Applied to Network Routing},
  booktitle    = {Proceedings of the Seventeenth International Conference on Machine
                  Learning {(ICML} 2000), Stanford University, Stanford, CA, USA, June
                  29 - July 2, 2000},
  pages        = {935--942},
  publisher    = {Morgan Kaufmann},
  year         = {2000},
  timestamp    = {Sun, 21 Feb 2010 20:54:50 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/Stone00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iser/AsadaBPFNTDSVBKT00,
  author       = {Minoru Asada and
                  Andreas Birk and
                  Enrico Pagello and
                  Masahiro Fujita and
                  Itsuki Noda and
                  Satoshi Tadokoro and
                  Dominique Duhaut and
                  Peter Stone and
                  Manuela M. Veloso and
                  Tucker R. Balch and
                  Hiroaki Kitano and
                  Brian Thomas},
  editor       = {Daniela Rus and
                  Sanjiv Singh},
  title        = {Progress in {RoboCup} Soccer Research in 2000},
  booktitle    = {Experimental Robotics {VII} {[ISER} 2000, Waikiki, Hawaii, USA, December
                  11-13, 2000]},
  series       = {Lecture Notes in Control and Information Sciences},
  volume       = {271},
  pages        = {363--372},
  publisher    = {Springer},
  year         = {2000},
  url          = {https://doi.org/10.1007/3-540-45118-8\_37},
  doi          = {10.1007/3-540-45118-8\_37},
  timestamp    = {Fri, 02 Jun 2017 12:01:41 +0200},
  biburl       = {https://dblp.org/rec/conf/iser/AsadaBPFNTDSVBKT00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneABFKLSTW00,
  author       = {Peter Stone and
                  Minoru Asada and
                  Tucker R. Balch and
                  Masahiro Fujita and
                  Gerhard K. Kraetzschmar and
                  Henrik Hautop Lund and
                  Paul Scerri and
                  Satoshi Tadokoro and
                  Gordon F. Wyeth},
  editor       = {Peter Stone and
                  Tucker R. Balch and
                  Gerhard K. Kraetzschmar},
  title        = {Overview of {RoboCup-2000}},
  booktitle    = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series       = {Lecture Notes in Computer Science},
  volume       = {2019},
  pages        = {1--28},
  publisher    = {Springer},
  year         = {2000},
  url          = {https://doi.org/10.1007/3-540-45324-5\_1},
  doi          = {10.1007/3-540-45324-5\_1},
  timestamp    = {Mon, 23 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneABFKLSTW00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneSS00,
  author       = {Peter Stone and
                  Richard S. Sutton and
                  Satinder Singh},
  editor       = {Peter Stone and
                  Tucker R. Balch and
                  Gerhard K. Kraetzschmar},
  title        = {Reinforcement Learning for 3 vs. 2 Keepaway},
  booktitle    = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series       = {Lecture Notes in Computer Science},
  volume       = {2019},
  pages        = {249--258},
  publisher    = {Springer},
  year         = {2000},
  url          = {https://doi.org/10.1007/3-540-45324-5\_23},
  doi          = {10.1007/3-540-45324-5\_23},
  timestamp    = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneSS00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/McAllesterS00,
  author       = {David A. McAllester and
                  Peter Stone},
  editor       = {Peter Stone and
                  Tucker R. Balch and
                  Gerhard K. Kraetzschmar},
  title        = {Keeping the Ball from {CMUnited-99}},
  booktitle    = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series       = {Lecture Notes in Computer Science},
  volume       = {2019},
  pages        = {333--338},
  publisher    = {Springer},
  year         = {2000},
  url          = {https://doi.org/10.1007/3-540-45324-5\_35},
  doi          = {10.1007/3-540-45324-5\_35},
  timestamp    = {Fri, 26 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/McAllesterS00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/RileySMV00,
  author       = {Patrick Riley and
                  Peter Stone and
                  David A. McAllester and
                  Manuela M. Veloso},
  editor       = {Peter Stone and
                  Tucker R. Balch and
                  Gerhard K. Kraetzschmar},
  title        = {{ATT-CMUnited-2000}: Third Place Finisher in the {RoboCup-2000} Simulator
                  League},
  booktitle    = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series       = {Lecture Notes in Computer Science},
  volume       = {2019},
  pages        = {489--492},
  publisher    = {Springer},
  year         = {2000},
  url          = {https://doi.org/10.1007/3-540-45324-5\_68},
  doi          = {10.1007/3-540-45324-5\_68},
  timestamp    = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/RileySMV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/StoneV99,
  author       = {Peter Stone and
                  Manuela M. Veloso},
  title        = {Task Decomposition, Dynamic Role Assignment, and Low-Bandwidth Communication
                  for Real-Time Strategic Teamwork},
  journal      = {Artif. Intell.},
  volume       = {110},
  number       = {2},
  pages        = {241--273},
  year         = {1999},
  url          = {https://doi.org/10.1016/S0004-3702(99)00025-9},
  doi          = {10.1016/S0004-3702(99)00025-9},
  timestamp    = {Sat, 27 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ai/StoneV99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ras/VelosoSH99,
  author       = {Manuela M. Veloso and
                  Peter Stone and
                  Kwun Han},
  title        = {The {CMUnited-97} robotic soccer team: Perception and multi-agent control},
  journal      = {Robotics Auton. Syst.},
  volume       = {29},
  number       = {2-3},
  pages        = {133--143},
  year         = {1999},
  url          = {https://doi.org/10.1016/S0921-8890(99)00048-2},
  doi          = {10.1016/S0921-8890(99)00048-2},
  timestamp    = {Mon, 24 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ras/VelosoSH99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/VelosoBAHS99,
  author       = {Manuela M. Veloso and
                  Michael H. Bowling and
                  Sorin Achim and
                  Kwun Han and
                  Peter Stone},
  editor       = {Jim Hendler and
                  Devika Subramanian},
  title        = {{CMUnited-98}: {A} Team of Robotic Soccer Agents},
  booktitle    = {Proceedings of the Sixteenth National Conference on Artificial Intelligence
                  and Eleventh Conference on Innovative Applications of Artificial Intelligence,
                  July 18-22, 1999, Orlando, Florida, {USA}},
  pages        = {891--896},
  publisher    = {{AAAI} Press / The {MIT} Press},
  year         = {1999},
  url          = {http://www.aaai.org/Library/IAAI/1999/iaai99-126.php},
  timestamp    = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/VelosoBAHS99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agents/StoneV99,
  author       = {Stone, Peter and
                  Veloso, Manuela M.},
  editor       = {Etzioni, Oren and
                  M{\"{u}}ller, J{\"{o}}rg P. and
                  Bradshaw, Jeffrey M.},
  title        = {Team-Partitioned, Opaque-Transition Reinforcement Learning},
  booktitle    = {Proceedings of the Third Annual Conference on Autonomous Agents, {AGENTS}
                  1999, Seattle, WA, USA, May 1-5, 1999},
  pages        = {206--212},
  publisher    = {{ACM}},
  year         = {1999},
  url          = {https://doi.org/10.1145/301136.301195},
  doi          = {10.1145/301136.301195},
  timestamp    = {Tue, 06 Nov 2018 11:07:01 +0100},
  biburl       = {https://dblp.org/rec/conf/agents/StoneV99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/VelosoKPKSBACKF99,
  author       = {Manuela M. Veloso and
                  Hiroaki Kitano and
                  Enrico Pagello and
                  Gerhard K. Kraetzschmar and
                  Peter Stone and
                  Tucker R. Balch and
                  Minoru Asada and
                  Silvia Coradeschi and
                  Lars Karlsson and
                  Masahiro Fujita},
  editor       = {Manuela M. Veloso and
                  Enrico Pagello and
                  Hiroaki Kitano},
  title        = {Overview of {RoboCup-99}},
  booktitle    = {RoboCup-99: Robot Soccer World Cup {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1856},
  pages        = {1--34},
  publisher    = {Springer},
  year         = {1999},
  url          = {https://doi.org/10.1007/3-540-45327-X\_1},
  doi          = {10.1007/3-540-45327-X\_1},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/VelosoKPKSBACKF99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneRV99,
  author       = {Peter Stone and
                  Patrick Riley and
                  Manuela M. Veloso},
  editor       = {Manuela M. Veloso and
                  Enrico Pagello and
                  Hiroaki Kitano},
  title        = {The {CMUnited-99} Champion Simulator Team},
  booktitle    = {RoboCup-99: Robot Soccer World Cup {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1856},
  pages        = {35--48},
  publisher    = {Springer},
  year         = {1999},
  url          = {https://doi.org/10.1007/3-540-45327-X\_2},
  doi          = {10.1007/3-540-45327-X\_2},
  timestamp    = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneRV99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneV99,
  author       = {Peter Stone and
                  Manuela M. Veloso},
  editor       = {Manuela M. Veloso and
                  Enrico Pagello and
                  Hiroaki Kitano},
  title        = {Layered Learning and Flexible Teamwork in {RoboCup} Simulation Agents},
  booktitle    = {RoboCup-99: Robot Soccer World Cup {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1856},
  pages        = {495--508},
  publisher    = {Springer},
  year         = {1999},
  url          = {https://doi.org/10.1007/3-540-45327-X\_42},
  doi          = {10.1007/3-540-45327-X\_42},
  timestamp    = {Wed, 24 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneV99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aai/StoneV98,
  author       = {Peter Stone and
                  Manuela M. Veloso},
  title        = {Layered Approach to Learning Client Behaviors in the {RoboCup} Soccer
                  Server},
  journal      = {Appl. Artif. Intell.},
  volume       = {12},
  number       = {2-3},
  pages        = {165--188},
  year         = {1998},
  url          = {https://doi.org/10.1080/088395198117811},
  doi          = {10.1080/088395198117811},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aai/StoneV98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aai/AsadaSKWKDDVAS98,
  author       = {Minoru Asada and
                  Peter Stone and
                  Hiroaki Kitano and
                  Barry Brian Werger and
                  Yasuo Kuniyoshi and
                  Alexis Drogoul and
                  Dominique Duhaut and
                  Manuela M. Veloso and
                  Hajime Asama and
                  Sho'ji Suzuki},
  title        = {The {RoboCup} Physical Agent Challenge: Phase {I}},
  journal      = {Appl. Artif. Intell.},
  volume       = {12},
  number       = {2-3},
  pages        = {251--263},
  year         = {1998},
  url          = {https://doi.org/10.1080/088395198117857},
  doi          = {10.1080/088395198117857},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aai/AsadaSKWKDDVAS98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/VelosoSH98,
  author       = {Manuela M. Veloso and
                  Peter Stone and
                  Kwun Han},
  title        = {{CMUnited-97}: {RoboCup-97} Small-Robot World Champion Team},
  journal      = {{AI} Mag.},
  volume       = {19},
  number       = {3},
  pages        = {61--69},
  year         = {1998},
  url          = {https://doi.org/10.1609/aimag.v19i3.1394},
  doi          = {10.1609/AIMAG.V19I3.1394},
  timestamp    = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/aim/VelosoSH98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ar/VelosoBS98,
  author       = {Manuela M. Veloso and
                  Michael H. Bowling and
                  Peter Stone},
  title        = {The {CMUnited-98} champion small-robot team},
  journal      = {Adv. Robotics},
  volume       = {13},
  number       = {8},
  pages        = {753--766},
  year         = {1998},
  url          = {https://doi.org/10.1163/156855300X00089},
  doi          = {10.1163/156855300X00089},
  timestamp    = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ar/VelosoBS98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/crossroads/VelosoSHA98,
  author       = {Manuela M. Veloso and
                  Peter Stone and
                  Kwun Han and
                  Sorin Achim},
  title        = {{CMUnited}: a team of robotics soccer agents collaborating in an adversarial
                  environment},
  journal      = {{XRDS}},
  volume       = {4},
  number       = {3},
  pages        = {11--17},
  year         = {1998},
  url          = {https://doi.org/10.1145/332084.332089},
  doi          = {10.1145/332084.332089},
  timestamp    = {Wed, 04 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/crossroads/VelosoSHA98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijmms/StoneV98,
  author       = {Stone, Peter and
                  Veloso, Manuela M.},
  title        = {Towards collaborative and adversarial learning: a case study in robotic
                  soccer},
  journal      = {Int. J. Hum. Comput. Stud.},
  volume       = {48},
  number       = {1},
  pages        = {83--104},
  year         = {1998},
  url          = {https://doi.org/10.1006/ijhc.1997.0162},
  doi          = {10.1006/IJHC.1997.0162},
  timestamp    = {Fri, 21 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijmms/StoneV98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agents/VelosoSH98,
  author       = {Manuela M. Veloso and
                  Peter Stone and
                  Kwun Han},
  editor       = {Katia P. Sycara and
                  Michael J. Wooldridge},
  title        = {The {CMUnited-97} Robotic Soccer Team: Perception and Multiagent Control},
  booktitle    = {Proceedings of the Second International Conference on Autonomous Agents,
                  {AGENTS} 1998, St. Paul, Minneapolis, USA, May 9-13, 1998},
  pages        = {78--85},
  publisher    = {{ACM}},
  year         = {1998},
  url          = {https://doi.org/10.1145/280765.280778},
  doi          = {10.1145/280765.280778},
  timestamp    = {Fri, 26 Apr 2019 14:26:42 +0200},
  biburl       = {https://dblp.org/rec/conf/agents/VelosoSH98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agents/StoneV98,
  author       = {Peter Stone and
                  Manuela M. Veloso},
  editor       = {Katia P. Sycara and
                  Michael J. Wooldridge},
  title        = {Using Decision Tree Confidence Factors for Multi-Agent Control},
  booktitle    = {Proceedings of the Second International Conference on Autonomous Agents,
                  {AGENTS} 1998, St. Paul, Minneapolis, USA, May 9-13, 1998},
  pages        = {86--91},
  publisher    = {{ACM}},
  year         = {1998},
  url          = {https://doi.org/10.1145/280765.280780},
  doi          = {10.1145/280765.280780},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/agents/StoneV98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/StoneV98,
  author       = {Stone, Peter and
                  Veloso, Manuela M.},
  editor       = {M{\"{u}}ller, J{\"{o}}rg P. and
                  Singh, Munindar P. and
                  Rao, Anand S.},
  title        = {Task Decomposition and Dynamic Role Assignment for Real-Time Strategic
                  Teamwork},
  booktitle    = {Intelligent Agents V, Agent Theories, Architectures, and Languages,
                  5th International Workshop, {ATAL} '98, Paris, France, July 4-7, 1998,
                  Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {1555},
  pages        = {293--308},
  publisher    = {Springer},
  year         = {1998},
  url          = {https://doi.org/10.1007/3-540-49057-4\_19},
  doi          = {10.1007/3-540-49057-4\_19},
  timestamp    = {Tue, 29 Dec 2020 18:27:45 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/StoneV98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/crw/StoneV98,
  author       = {Stone, Peter and
                  Veloso, Manuela M.},
  editor       = {Drogoul, Alexis and
                  Tambe, Milind and
                  Fukuda, Toshio},
  title        = {Communication in Domains with Unreliable, Single-Channel, Low-Bandwidth
                  Communication},
  booktitle    = {Collective Robotics, First International Workshop, CRW'98, Paris,
                  France, July 4-5, 1998, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {1456},
  pages        = {85--97},
  publisher    = {Springer},
  year         = {1998},
  url          = {https://doi.org/10.1007/BFb0033376},
  doi          = {10.1007/BFB0033376},
  timestamp    = {Tue, 14 May 2019 10:00:55 +0200},
  biburl       = {https://dblp.org/rec/conf/crw/StoneV98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icmas/VelosoS98,
  author       = {Veloso, Manuela M. and
                  Stone, Peter},
  editor       = {Demazeau, Yves},
  title        = {Individual and Collaborative Behaviors in a Team of Robotic Soccer
                  Agents},
  booktitle    = {Proceedings of the Third International Conference on Multiagent Systems,
                  {ICMAS} 1998, Paris, France, July 3-7, 1998},
  pages        = {309--316},
  publisher    = {{IEEE} Computer Society},
  year         = {1998},
  url          = {https://doi.org/10.1109/ICMAS.1998.699074},
  doi          = {10.1109/ICMAS.1998.699074},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icmas/VelosoS98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneVR98,
  author       = {Peter Stone and
                  Manuela M. Veloso and
                  Patrick Riley},
  editor       = {Minoru Asada and
                  Hiroaki Kitano},
  title        = {The {CMUnited-98} Champion Simulator Team},
  booktitle    = {RoboCup-98: Robot Soccer World Cup {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1604},
  pages        = {61--76},
  publisher    = {Springer},
  year         = {1998},
  url          = {https://doi.org/10.1007/3-540-48422-1\_5},
  doi          = {10.1007/3-540-48422-1\_5},
  timestamp    = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneVR98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/VelosoBAHS98,
  author       = {Manuela M. Veloso and
                  Michael H. Bowling and
                  Sorin Achim and
                  Kwun Han and
                  Peter Stone},
  editor       = {Minoru Asada and
                  Hiroaki Kitano},
  title        = {The {CMUnited-98} Small-Robot Team},
  booktitle    = {RoboCup-98: Robot Soccer World Cup {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1604},
  pages        = {77--92},
  publisher    = {Springer},
  year         = {1998},
  url          = {https://doi.org/10.1007/3-540-48422-1\_6},
  doi          = {10.1007/3-540-48422-1\_6},
  timestamp    = {Wed, 24 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/VelosoBAHS98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneV98,
  author       = {Stone, Peter and
                  Veloso, Manuela M.},
  editor       = {Asada, Minoru and
                  Kitano, Hiroaki},
  title        = {Team-Partitioned, Opaque-Transition Reinforced Learning},
  booktitle    = {RoboCup-98: Robot Soccer World Cup {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1604},
  pages        = {261--272},
  publisher    = {Springer},
  year         = {1998},
  url          = {https://doi.org/10.1007/3-540-48422-1\_21},
  doi          = {10.1007/3-540-48422-1\_21},
  timestamp    = {Wed, 24 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneV98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/clsr/Stone97,
  author       = {Peter Stone},
  title        = {Lessons from {America}: Filtration of functionality from software copyright},
  journal      = {Comput. Law Secur. Rev.},
  volume       = {13},
  number       = {1},
  pages        = {15--21},
  year         = {1997},
  url          = {https://doi.org/10.1016/S0267-3649(97)81187-9},
  doi          = {10.1016/S0267-3649(97)81187-9},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/clsr/Stone97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/Stone97,
  author       = {Stone, Peter},
  editor       = {Kuipers, Benjamin and
                  Webber, Bonnie L.},
  title        = {Layered Learning in Multiagent Systems},
  booktitle    = {Proceedings of the Fourteenth National Conference on Artificial Intelligence
                  and Ninth Innovative Applications of Artificial Intelligence Conference,
                  {AAAI} 97, {IAAI} 97, July 27-31, 1997, Providence, Rhode Island,
                  {USA}},
  pages        = {819},
  publisher    = {{AAAI} Press / The {MIT} Press},
  year         = {1997},
  url          = {http://www.aaai.org/Library/AAAI/1997/aaai97-150.php},
  timestamp    = {Tue, 05 Sep 2023 08:53:09 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/Stone97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/agents/VelosoSA97,
  author       = {Veloso, Manuela M. and
                  Stone, Peter and
                  Achim, Sorin},
  editor       = {Johnson, W. Lewis},
  title        = {A Layered Approach for an Autonomous Robotic Soccer System},
  booktitle    = {Proceedings of the First International Conference on Autonomous Agents,
                  {AGENTS} 1997, Marina del Rey, California, USA, February 5-8, 1997},
  pages        = {530--531},
  publisher    = {{ACM}},
  year         = {1997},
  url          = {https://doi.org/10.1145/267658.267818},
  doi          = {10.1145/267658.267818},
  timestamp    = {Tue, 06 Nov 2018 11:07:02 +0100},
  biburl       = {https://dblp.org/rec/conf/agents/VelosoSA97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/KitanoTSVCOMNA97,
  author       = {Hiroaki Kitano and
                  Milind Tambe and
                  Peter Stone and
                  Manuela M. Veloso and
                  Silvia Coradeschi and
                  Eiichi Osawa and
                  Hitoshi Matsubara and
                  Itsuki Noda and
                  Minoru Asada},
  title        = {The {RoboCup} Synthetic Agent Challenge 97},
  booktitle    = {Proceedings of the Fifteenth International Joint Conference on Artificial
                  Intelligence, {IJCAI} 97, Nagoya, Japan, August 23-29, 1997, 2 Volumes},
  pages        = {24--30},
  publisher    = {Morgan Kaufmann},
  year         = {1997},
  url          = {http://ijcai.org/Proceedings/97-1/Papers/004.pdf},
  timestamp    = {Tue, 20 Aug 2019 16:17:27 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/KitanoTSVCOMNA97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/AsadaSKDDVAS97,
  author       = {Minoru Asada and
                  Peter Stone and
                  Hiroaki Kitano and
                  Alexis Drogoul and
                  Dominique Duhaut and
                  Manuela M. Veloso and
                  Hajime Asama and
                  Sho'ji Suzuki},
  editor       = {Hiroaki Kitano},
  title        = {The {RoboCup} Physical Agent Challenge: Goals and Protocols for Phase
                  1},
  booktitle    = {RoboCup-97: Robot Soccer World Cup {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1395},
  pages        = {42--61},
  publisher    = {Springer},
  year         = {1997},
  url          = {https://doi.org/10.1007/3-540-64473-3\_48},
  doi          = {10.1007/3-540-64473-3\_48},
  timestamp    = {Tue, 14 May 2019 10:00:53 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/AsadaSKDDVAS97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/KitanoTSVCOMNA97,
  author       = {Hiroaki Kitano and
                  Milind Tambe and
                  Peter Stone and
                  Manuela M. Veloso and
                  Silvia Coradeschi and
                  Eiichi Osawa and
                  Hitoshi Matsubara and
                  Itsuki Noda and
                  Minoru Asada},
  editor       = {Hiroaki Kitano},
  title        = {The {RoboCup} Synthetic Agent Challenge 97},
  booktitle    = {RoboCup-97: Robot Soccer World Cup {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1395},
  pages        = {62--73},
  publisher    = {Springer},
  year         = {1997},
  url          = {https://doi.org/10.1007/3-540-64473-3\_49},
  doi          = {10.1007/3-540-64473-3\_49},
  timestamp    = {Tue, 23 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/KitanoTSVCOMNA97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneV97,
  author       = {Stone, Peter and
                  Veloso, Manuela M.},
  editor       = {Kitano, Hiroaki},
  title        = {Using Decision Tree Confidence Factors for Multiagent Control},
  booktitle    = {RoboCup-97: Robot Soccer World Cup {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1395},
  pages        = {99--111},
  publisher    = {Springer},
  year         = {1997},
  url          = {https://doi.org/10.1007/3-540-64473-3\_52},
  doi          = {10.1007/3-540-64473-3\_52},
  timestamp    = {Tue, 23 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneV97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/VelosoSHA97,
  author       = {Manuela M. Veloso and
                  Peter Stone and
                  Kwun Han and
                  Sorin Achim},
  editor       = {Hiroaki Kitano},
  title        = {The {CMUnited-97} Small Robot Team},
  booktitle    = {RoboCup-97: Robot Soccer World Cup {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1395},
  pages        = {242--256},
  publisher    = {Springer},
  year         = {1997},
  url          = {https://doi.org/10.1007/3-540-64473-3\_64},
  doi          = {10.1007/3-540-64473-3\_64},
  timestamp    = {Tue, 23 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/VelosoSHA97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StoneV97a,
  author       = {Peter Stone and
                  Manuela M. Veloso},
  editor       = {Hiroaki Kitano},
  title        = {The {CMUnited-97} Simulator Team},
  booktitle    = {RoboCup-97: Robot Soccer World Cup {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {1395},
  pages        = {389--397},
  publisher    = {Springer},
  year         = {1997},
  url          = {https://doi.org/10.1007/3-540-64473-3\_75},
  doi          = {10.1007/3-540-64473-3\_75},
  timestamp    = {Tue, 23 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/robocup/StoneV97a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/VelosoS95,
  author       = {Manuela M. Veloso and
                  Peter Stone},
  title        = {{FLECS}: Planning with a Flexible Commitment Strategy},
  journal      = {J. Artif. Intell. Res.},
  volume       = {3},
  pages        = {25--52},
  year         = {1995},
  url          = {https://doi.org/10.1613/jair.131},
  doi          = {10.1613/JAIR.131},
  timestamp    = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jair/VelosoS95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/StoneV95,
  author       = {Stone, Peter and
                  Veloso, Manuela M.},
  editor       = {Touretzky, David S. and
                  Mozer, Michael and
                  Hasselmo, Michael E.},
  title        = {Beating a Defender in Robotic Soccer: Memory-Based Learning of a Continuous
                  Function},
  booktitle    = {Advances in Neural Information Processing Systems 8, NIPS, Denver,
                  CO, USA, November 27-30, 1995},
  pages        = {896--902},
  publisher    = {{MIT} Press},
  year         = {1995},
  url          = {http://papers.nips.cc/paper/1089-beating-a-defender-in-robotic-soccer-memory-based-learning-of-a-continuous-function},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/StoneV95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-cs-9506101,
  author       = {Manuela M. Veloso and
                  Peter Stone},
  title        = {{FLECS}: Planning with a Flexible Commitment Strategy},
  journal      = {CoRR},
  volume       = {abs/cs/9506101},
  year         = {1995},
  url          = {http://arxiv.org/abs/cs/9506101},
  eprinttype   = {arXiv},
  eprint       = {cs/9506101},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-cs-9506101.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aips/StoneVB94,
  author       = {Stone, Peter and
                  Veloso, Manuela M. and
                  Blythe, Jim},
  editor       = {Hammond, Kristian J.},
  title        = {The Need for Different Domain-independent Heuristics},
  booktitle    = {Proceedings of the Second International Conference on Artificial Intelligence
                  Planning Systems, University of Chicago, Chicago, Illinois, USA, June
                  13-15, 1994},
  pages        = {164--169},
  publisher    = {{AAAI}},
  year         = {1994},
  url          = {http://www.aaai.org/Library/AIPS/1994/aips94-028.php},
  timestamp    = {Fri, 05 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aips/StoneVB94.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cn/Stone90,
  author       = {Peter Stone},
  title        = {Developing Networked Services for Libraries: The {U. K.} Experience},
  journal      = {Comput. Networks {ISDN} Syst.},
  volume       = {19},
  number       = {3-5},
  pages        = {343--349},
  year         = {1990},
  url          = {https://doi.org/10.1016/0169-7552(90)90098-D},
  doi          = {10.1016/0169-7552(90)90098-D},
  timestamp    = {Thu, 14 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/cn/Stone90.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics