Stop the war!
Остановите войну!
for scientists:
default search action
BibTeX records: Peter Stone
% Venue string corrected locally: the co-located symposium is EAAI 2024 (the upstream export reads "EAAI 2014").
@inproceedings{DBLP:conf/aaai/KnoxHABDSN24,
  author    = {W. Bradley Knox and Stephane Hatgis{-}Kessell and Sigurdur O. Adalgeirsson and Serena Booth and Anca D. Dragan and Peter Stone and Scott Niekum},
  editor    = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title     = {Learning Optimal Advantage from Preferences and Mistaking It for Reward},
  booktitle = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  pages     = {10066--10073},
  publisher = {{AAAI} Press},
  year      = {2024},
  url       = {https://doi.org/10.1609/aaai.v38i9.28870},
  doi       = {10.1609/AAAI.V38I9.28870},
  timestamp = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/KnoxHABDSN24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Venue string corrected locally: the co-located symposium is EAAI 2024 (the upstream export reads "EAAI 2014").
@inproceedings{DBLP:conf/aaai/WangWXZS24,
  author    = {Zizhao Wang and Caroline Wang and Xuesu Xiao and Yuke Zhu and Peter Stone},
  editor    = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title     = {Building Minimal and Reusable Causal State Abstractions for Reinforcement Learning},
  booktitle = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  pages     = {15778--15786},
  publisher = {{AAAI} Press},
  year      = {2024},
  url       = {https://doi.org/10.1609/aaai.v38i14.29507},
  doi       = {10.1609/AAAI.V38I14.29507},
  timestamp = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/WangWXZS24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Venue string corrected locally: the co-located symposium is EAAI 2024 (the upstream export reads "EAAI 2014").
@inproceedings{DBLP:conf/aaai/RahmanCS24,
  author    = {Muhammad Rahman and Jiaxun Cui and Peter Stone},
  editor    = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title     = {Minimum Coverage Sets for Training Robust Ad Hoc Teamwork Agents},
  booktitle = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  pages     = {17523--17530},
  publisher = {{AAAI} Press},
  year      = {2024},
  url       = {https://doi.org/10.1609/aaai.v38i16.29702},
  doi       = {10.1609/AAAI.V38I16.29702},
  timestamp = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/RahmanCS24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Venue string corrected locally: the co-located symposium is EAAI 2024 (the upstream export reads "EAAI 2014").
@inproceedings{DBLP:conf/aaai/KnoxABSS24,
  author    = {W. Bradley Knox and Alessandro Allievi and Holger Banzhaf and Felix Schmitt and Peter Stone},
  editor    = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title     = {Reward (Mis)design for Autonomous Driving (Abstract Reprint)},
  booktitle = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  pages     = {22702},
  publisher = {{AAAI} Press},
  year      = {2024},
  url       = {https://doi.org/10.1609/aaai.v38i20.30602},
  doi       = {10.1609/AAAI.V38I20.30602},
  timestamp = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/KnoxABSS24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-02576,
  author     = {William Yue and Bo Liu and Peter Stone},
  title      = {t-DGR: {A} Trajectory-Based Deep Generative Replay Method for Continual Learning in Decision Making},
  journal    = {CoRR},
  volume     = {abs/2401.02576},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.02576},
  doi        = {10.48550/ARXIV.2401.02576},
  eprinttype = {arXiv},
  eprint     = {2401.02576},
  timestamp  = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-02576.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2401-12497,
  author     = {Zizhao Wang and Caroline Wang and Xuesu Xiao and Yuke Zhu and Peter Stone},
  title      = {Building Minimal and Reusable Causal State Abstractions for Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2401.12497},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2401.12497},
  doi        = {10.48550/ARXIV.2401.12497},
  eprinttype = {arXiv},
  eprint     = {2401.12497},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2401-12497.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2403-01636,
  author     = {Ziping Xu and Zifan Xu and Runxuan Jiang and Peter Stone and Ambuj Tewari},
  title      = {Sample Efficient Myopic Exploration Through Multitask Reinforcement Learning with Diverse Tasks},
  journal    = {CoRR},
  volume     = {abs/2403.01636},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.01636},
  doi        = {10.48550/ARXIV.2403.01636},
  eprinttype = {arXiv},
  eprint     = {2403.01636},
  timestamp  = {Wed, 10 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-01636.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2403-03848,
  author     = {Zifan Xu and Amir Hossain Raj and Xuesu Xiao and Peter Stone},
  title      = {Dexterous Legged Locomotion in Confined 3D Spaces with Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2403.03848},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.03848},
  doi        = {10.48550/ARXIV.2403.03848},
  eprinttype = {arXiv},
  eprint     = {2403.03848},
  timestamp  = {Wed, 03 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-03848.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2403-07869,
  author     = {Shivin Dass and Wensi Ai and Yuqian Jiang and Samik Singh and Jiaheng Hu and Ruohan Zhang and Peter Stone and Ben Abbatematteo and Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n},
  title      = {TeleMoMa: {A} Modular and Versatile Teleoperation System for Mobile Manipulation},
  journal    = {CoRR},
  volume     = {abs/2403.07869},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.07869},
  doi        = {10.48550/ARXIV.2403.07869},
  eprinttype = {arXiv},
  eprint     = {2403.07869},
  timestamp  = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-07869.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2403-11940,
  author     = {Alexander Levine and Peter Stone and Amy Zhang},
  title      = {Multistep Inverse Is Not All You Need},
  journal    = {CoRR},
  volume     = {abs/2403.11940},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.11940},
  doi        = {10.48550/ARXIV.2403.11940},
  eprinttype = {arXiv},
  eprint     = {2403.11940},
  timestamp  = {Mon, 08 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-11940.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2403-17231,
  author     = {Saad Abdul Ghani and Zizhao Wang and Peter Stone and Xuesu Xiao},
  title      = {Dyna-LfLH: Learning Agile Navigation in Dynamic Environments from Learned Hallucination},
  journal    = {CoRR},
  volume     = {abs/2403.17231},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.17231},
  doi        = {10.48550/ARXIV.2403.17231},
  eprinttype = {arXiv},
  eprint     = {2403.17231},
  timestamp  = {Wed, 10 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-17231.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/KnoxABSS23,
  author    = {W. Bradley Knox and Alessandro Allievi and Holger Banzhaf and Felix Schmitt and Peter Stone},
  title     = {Reward (Mis)design for autonomous driving},
  journal   = {Artif. Intell.},
  volume    = {316},
  pages     = {103829},
  year      = {2023},
  url       = {https://doi.org/10.1016/j.artint.2022.103829},
  doi       = {10.1016/J.ARTINT.2022.103829},
  timestamp = {Sat, 13 May 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ai/KnoxABSS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/arobots/ZhangASTSZ23,
  author    = {Xiaohan Zhang and Saeid Amiri and Jivko Sinapov and Jesse Thomason and Peter Stone and Shiqi Zhang},
  title     = {Multimodal embodied attribute learning by robots for object-centric action policies},
  journal   = {Auton. Robots},
  volume    = {47},
  number    = {5},
  pages     = {505--528},
  year      = {2023},
  url       = {https://doi.org/10.1007/s10514-023-10098-5},
  doi       = {10.1007/S10514-023-10098-5},
  timestamp = {Thu, 31 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/arobots/ZhangASTSZ23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/BakerNAAABBBBDDDDEFGHIKKKKKLLLMMNPPR23,
  author    = {Megan M. Baker and Alexander New and Mario Aguilar{-}Simon and Ziad Al{-}Halah and S{\'{e}}bastien M. R. Arnold and Eseoghene Ben{-}Iwhiwhu and Andrew P. Brna and Ethan Brooks and Ryan C. Brown and Zachary Daniels and Anurag Reddy Daram and Fabien Delattre and Ryan Dellana and Eric Eaton and Haotian Fu and Kristen Grauman and Jesse Hostetler and Shariq Iqbal and Cassandra Kent and Nicholas Ketz and Soheil Kolouri and George Konidaris and Dhireesha Kudithipudi and Erik G. Learned{-}Miller and Seungwon Lee and Michael Littman and Sandeep Madireddy and Jorge A. Mendez and Eric Q. Nguyen and Christine D. Piatko and Praveen K. Pilly and Aswin Raghavan and Abrar Rahman and Santhosh Kumar Ramakrishnan and Neale Ratzlaff and Andrea Soltoggio and Peter Stone and Indranil Sur and Zhipeng Tang and Saket Tiwari and Kyle Vedder and Felix Wang and Zifan Xu and Angel Yanguas{-}Gil and Harel Yedidsion and Shangqun Yu and Gautam K. Vallabha},
  title     = {A domain-agnostic approach for characterization of lifelong learning systems},
  journal   = {Neural Networks},
  volume    = {160},
  pages     = {274--296},
  year      = {2023},
  url       = {https://doi.org/10.1016/j.neunet.2023.01.007},
  doi       = {10.1016/J.NEUNET.2023.01.007},
  timestamp = {Mon, 09 Oct 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/nn/BakerNAAABBBBDDDDEFGHIKKKKKLLLMMNPPR23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ram/XiaoXWSGRBMCBR23,
  author    = {Xuesu Xiao and Zifan Xu and Garrett Warnell and Peter Stone and Ferran Gebelli Guinjoan and R{\^{o}}mulo T. Rodrigues and Herman Bruyninckx and Hanjaya Mandala and Guilherme Christmann and Jos{\'{e}} Luis Blanco{-}Claraco and Shravan Somashekara Rai},
  title     = {Autonomous Ground Navigation in Highly Constrained Spaces: Lessons Learned From the Second {BARN} Challenge at {ICRA} 2023 [Competitions]},
  journal   = {{IEEE} Robotics Autom. Mag.},
  volume    = {30},
  number    = {4},
  pages     = {91--97},
  year      = {2023},
  url       = {https://doi.org/10.1109/MRA.2023.3322920},
  doi       = {10.1109/MRA.2023.3322920},
  timestamp = {Sat, 13 Jan 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ram/XiaoXWSGRBMCBR23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/BoothKSNSA23,
  author    = {Serena Booth and W. Bradley Knox and Julie Shah and Scott Niekum and Peter Stone and Alessandro Allievi},
  editor    = {Brian Williams and Yiling Chen and Jennifer Neville},
  title     = {The Perils of Trial-and-Error Reward Design: Misdesign through Overfitting and Invalid Task Specifications},
  booktitle = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI} 2023, Thirty-Fifth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February 7-14, 2023},
  pages     = {5920--5929},
  publisher = {{AAAI} Press},
  year      = {2023},
  url       = {https://doi.org/10.1609/aaai.v37i5.25733},
  doi       = {10.1609/AAAI.V37I5.25733},
  timestamp = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/BoothKSNSA23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/0042F0S23,
  author    = {Bo Liu and Yihao Feng and Qiang Liu and Peter Stone},
  editor    = {Brian Williams and Yiling Chen and Jennifer Neville},
  title     = {Metric Residual Network for Sample Efficient Goal-Conditioned Reinforcement Learning},
  booktitle = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI} 2023, Thirty-Fifth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February 7-14, 2023},
  pages     = {8799--8806},
  publisher = {{AAAI} Press},
  year      = {2023},
  url       = {https://doi.org/10.1609/aaai.v37i7.26058},
  doi       = {10.1609/AAAI.V37I7.26058},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/0042F0S23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/WangDLS23,
  author    = {Caroline Wang and Ishan Durugkar and Elad Liebman and Peter Stone},
  editor    = {Brian Williams and Yiling Chen and Jennifer Neville},
  title     = {DM{\({^2}\)}: Decentralized Multi-Agent Reinforcement Learning via Distribution Matching},
  booktitle = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI} 2023, Thirty-Fifth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February 7-14, 2023},
  pages     = {11699--11707},
  publisher = {{AAAI} Press},
  year      = {2023},
  url       = {https://doi.org/10.1609/aaai.v37i10.26382},
  doi       = {10.1609/AAAI.V37I10.26382},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/WangDLS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aips/BajajSS23,
  author    = {Vaibhav Bajaj and Guni Sharon and Peter Stone},
  editor    = {Sven Koenig and Roni Stern and Mauro Vallati},
  title     = {Task Phasing: Automated Curriculum Learning from Demonstrations},
  booktitle = {Proceedings of the Thirty-Third International Conference on Automated Planning and Scheduling, July 8-13, 2023, Prague, Czech Republic},
  pages     = {542--550},
  publisher = {{AAAI} Press},
  year      = {2023},
  url       = {https://doi.org/10.1609/icaps.v33i1.27235},
  doi       = {10.1609/ICAPS.V33I1.27235},
  timestamp = {Wed, 20 Sep 2023 11:58:30 +0200},
  biburl    = {https://dblp.org/rec/conf/aips/BajajSS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/WangWS23,
  author    = {Caroline Wang and Garrett Warnell and Peter Stone},
  editor    = {Noa Agmon and Bo An and Alessandro Ricci and William Yeoh},
  title     = {D-Shape: Demonstration-Shaped Reinforcement Learning via Goal-Conditioning},
  booktitle = {Proceedings of the 2023 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2023, London, United Kingdom, 29 May 2023 - 2 June 2023},
  pages     = {1267--1275},
  publisher = {{ACM}},
  year      = {2023},
  url       = {https://dl.acm.org/doi/10.5555/3545946.3598772},
  doi       = {10.5555/3545946.3598772},
  timestamp = {Tue, 23 May 2023 14:27:14 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/WangWS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/ShperbergLS23,
  author    = {Shahaf S. Shperberg and Bo Liu and Peter Stone},
  editor    = {Noa Agmon and Bo An and Alessandro Ricci and William Yeoh},
  title     = {Relaxed Exploration Constrained Reinforcement Learning},
  booktitle = {Proceedings of the 2023 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2023, London, United Kingdom, 29 May 2023 - 2 June 2023},
  pages     = {2821--2823},
  publisher = {{ACM}},
  year      = {2023},
  url       = {https://dl.acm.org/doi/10.5555/3545946.3599090},
  doi       = {10.5555/3545946.3599090},
  timestamp = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/ShperbergLS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/collas/XuZSMJLS23,
  author    = {Zifan Xu and Yulin Zhang and Shahaf S. Shperberg and Reuth Mirsky and Yuqian Jiang and Bo Liu and Peter Stone},
  editor    = {Sarath Chandar and Razvan Pascanu and Hanie Sedghi and Doina Precup},
  title     = {Model-Based Meta Automatic Curriculum Learning},
  booktitle = {Conference on Lifelong Learning Agents, 22-25 August 2023, McGill University, Montr{\'{e}}al, Qu{\'{e}}bec, Canada},
  series    = {Proceedings of Machine Learning Research},
  volume    = {232},
  pages     = {846--860},
  publisher = {{PMLR}},
  year      = {2023},
  url       = {https://proceedings.mlr.press/v232/xu23a.html},
  timestamp = {Tue, 20 Feb 2024 13:52:18 +0100},
  biburl    = {https://dblp.org/rec/conf/collas/XuZSMJLS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/KarnanYFWBS23,
  author    = {Haresh Karnan and Elvin Yang and Daniel Farkash and Garrett Warnell and Joydeep Biswas and Peter Stone},
  editor    = {Jie Tan and Marc Toussaint and Kourosh Darvish},
  title     = {{STERLING:} Self-Supervised Terrain Representation Learning from Unconstrained Robot Experience},
  booktitle = {Conference on Robot Learning, CoRL 2023, 6-9 November 2023, Atlanta, GA, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {229},
  pages     = {2393--2413},
  publisher = {{PMLR}},
  year      = {2023},
  url       = {https://proceedings.mlr.press/v229/karnan23a.html},
  timestamp = {Tue, 20 Feb 2024 12:11:46 +0100},
  biburl    = {https://dblp.org/rec/conf/corl/KarnanYFWBS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/Zhu0SZ23,
  author    = {Yifeng Zhu and Zhenyu Jiang and Peter Stone and Yuke Zhu},
  editor    = {Jie Tan and Marc Toussaint and Kourosh Darvish},
  title     = {Learning Generalizable Manipulation Policies with Object-Centric 3D Representations},
  booktitle = {Conference on Robot Learning, CoRL 2023, 6-9 November 2023, Atlanta, GA, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {229},
  pages     = {3418--3433},
  publisher = {{PMLR}},
  year      = {2023},
  url       = {https://proceedings.mlr.press/v229/zhu23b.html},
  timestamp = {Tue, 20 Feb 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/corl/Zhu0SZ23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/humanoids/MannemMSM23,
  author    = {Swathi Mannem and William Macke and Peter Stone and Reuth Mirsky},
  title     = {Exploring the Cost of Interruptions in Human-Robot Teaming},
  booktitle = {22nd {IEEE-RAS} International Conference on Humanoid Robots, Humanoids 2023, Austin, TX, USA, December 12-14, 2023},
  pages     = {1--8},
  publisher = {{IEEE}},
  year      = {2023},
  url       = {https://doi.org/10.1109/Humanoids57100.2023.10375236},
  doi       = {10.1109/HUMANOIDS57100.2023.10375236},
  timestamp = {Tue, 09 Jan 2024 15:27:05 +0100},
  biburl    = {https://dblp.org/rec/conf/humanoids/MannemMSM23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/CuiYLLSLLS0T23,
  author    = {Jiaxun Cui and Xiaomeng Yang and Mulong Luo and Geunbae Lee and Peter Stone and Hsien{-}Hsin S. Lee and Benjamin Lee and G. Edward Suh and Wenjie Xiong and Yuandong Tian},
  title     = {{MACTA:} {A} Multi-agent Reinforcement Learning Approach for Cache Timing Attacks and Detection},
  booktitle = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher = {OpenReview.net},
  year      = {2023},
  url       = {https://openreview.net/pdf?id=CDlHZ78-Xzi},
  timestamp = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/CuiYLLSLLS0T23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/XuLXNS23,
  author    = {Zifan Xu and Bo Liu and Xuesu Xiao and Anirudh Nair and Peter Stone},
  title     = {Benchmarking Reinforcement Learning Techniques for Autonomous Navigation},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2023, London, UK, May 29 - June 2, 2023},
  pages     = {9224--9230},
  publisher = {{IEEE}},
  year      = {2023},
  url       = {https://doi.org/10.1109/ICRA48891.2023.10160583},
  doi       = {10.1109/ICRA48891.2023.10160583},
  timestamp = {Tue, 08 Aug 2023 10:24:29 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/XuLXNS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/ParkXWYS23,
  author    = {Jin Soo Park and Xuesu Xiao and Garrett Warnell and Harel Yedidsion and Peter Stone},
  title     = {Learning Perceptual Hallucination for Multi-Robot Navigation in Narrow Hallways},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2023, London, UK, May 29 - June 2, 2023},
  pages     = {10033--10039},
  publisher = {{IEEE}},
  year      = {2023},
  url       = {https://doi.org/10.1109/ICRA48891.2023.10161327},
  doi       = {10.1109/ICRA48891.2023.10161327},
  timestamp = {Tue, 08 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/ParkXWYS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings title expanded from the bare acronym and publisher added, matching the other conference entries in this file.
@inproceedings{DBLP:conf/iros/0002ZDJZS023,
  author    = {Xiaohan Zhang and Yifeng Zhu and Yan Ding and Yuqian Jiang and Yuke Zhu and Peter Stone and Shiqi Zhang},
  title     = {Symbolic State Space Optimization for Long Horizon Mobile Manipulation Planning},
  booktitle = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2023, Detroit, MI, USA, October 1-5, 2023},
  pages     = {866--872},
  publisher = {{IEEE}},
  year      = {2023},
  url       = {https://doi.org/10.1109/IROS55552.2023.10342224},
  doi       = {10.1109/IROS55552.2023.10342224},
  timestamp = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iros/0002ZDJZS023.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings title expanded from the bare acronym and publisher added, matching the other conference entries in this file.
@inproceedings{DBLP:conf/iros/GhonasgiMHSD23,
  author    = {Keya Ghonasgi and Reuth Mirsky and Adrian M. Haith and Peter Stone and Ashish D. Deshpande},
  title     = {A Novel Control Law for Multi-Joint Human-Robot Interaction Tasks While Maintaining Postural Coordination},
  booktitle = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2023, Detroit, MI, USA, October 1-5, 2023},
  pages     = {6110--6116},
  publisher = {{IEEE}},
  year      = {2023},
  url       = {https://doi.org/10.1109/IROS55552.2023.10342501},
  doi       = {10.1109/IROS55552.2023.10342501},
  timestamp = {Fri, 05 Jan 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iros/GhonasgiMHSD23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/AgarwalDSZ23,
  author    = {Siddhant Agarwal and Ishan Durugkar and Peter Stone and Amy Zhang},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {f-Policy Gradients: {A} General Framework for Goal-Conditioned {RL} using f-Divergences},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/27f4d95417bb722201597bf4d67cbacc-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/AgarwalDSZ23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LiuFSL23,
  author    = {Bo Liu and Yihao Feng and Peter Stone and Qiang Liu},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {{FAMO:} Fast Adaptive Multitask Optimization},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/b2fe1ee8d936ac08dd26f2ff58986c8f-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/LiuFSL23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LiuZGFLZS23,
  author    = {Bo Liu and Yifeng Zhu and Chongkai Gao and Yihao Feng and Qiang Liu and Yuke Zhu and Peter Stone},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {{LIBERO:} Benchmarking Knowledge Transfer for Lifelong Robot Learning},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/8c3c666820ea055a77726d66fc7d447f-Abstract-Datasets\_and\_Benchmarks.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/LiuZGFLZS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/WangHSM23,
  author    = {Zizhao Wang and Jiaheng Hu and Peter Stone and Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {{ELDEN:} Exploration via Local Dependencies},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/31ed129feae64a7e44a15b148c15558d-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/WangHSM23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/rss/HuSM23,
  author    = {Jiaheng Hu and Peter Stone and Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n},
  editor    = {Kostas E. Bekris and Kris Hauser and Sylvia L. Herbert and Jingjin Yu},
  title     = {Causal Policy Gradient for Whole-Body Mobile Manipulation},
  booktitle = {Robotics: Science and Systems XIX, Daegu, Republic of Korea, July 10-14, 2023},
  year      = {2023},
  url       = {https://doi.org/10.15607/RSS.2023.XIX.049},
  doi       = {10.15607/RSS.2023.XIX.049},
  timestamp = {Thu, 20 Jul 2023 14:53:22 +0200},
  biburl    = {https://dblp.org/rec/conf/rss/HuSM23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/rss/SungS23,
  author    = {Yoonchang Sung and Peter Stone},
  editor    = {Kostas E. Bekris and Kris Hauser and Sylvia L. Herbert and Jingjin Yu},
  title     = {Motion Planning (In)feasibility Detection using a Prior Roadmap via Path and Cut Search},
  booktitle = {Robotics: Science and Systems XIX, Daegu, Republic of Korea, July 10-14, 2023},
  year      = {2023},
  url       = {https://doi.org/10.15607/RSS.2023.XIX.060},
  doi       = {10.15607/RSS.2023.XIX.060},
  timestamp = {Thu, 20 Jul 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/rss/SungS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Title uses TeX quotation marks (``...'') instead of straight ASCII double quotes so both the opening and closing quotes typeset correctly.
@inproceedings{DBLP:conf/tas/HauserCCHWDGEKH23,
  author    = {Elliott Hauser and Yao{-}Cheng Chan and Parth Chonkar and Geethika Hemkumar and Huihai Wang and Daksh Dua and Shikhar Gupta and Efren Mendoza Enriquez and Tiffany Kao and Justin W. Hart and Reuth Mirsky and Joydeep Biswas and Junfeng Jiao and Peter Stone},
  title     = {``What's That Robot Doing Here?'': Perceptions Of Incidental Encounters With Autonomous Quadruped Robots},
  booktitle = {Proceedings of the First International Symposium on Trustworthy Autonomous Systems, {TAS} 2023, Edinburgh, United Kingdom, July 11-12, 2023},
  pages     = {12:1--12:15},
  publisher = {{ACM}},
  year      = {2023},
  url       = {https://doi.org/10.1145/3597512.3599707},
  doi       = {10.1145/3597512.3599707},
  timestamp = {Fri, 21 Jul 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/tas/HauserCCHWDGEKH23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/uai/Morrill0HWS23,
  author    = {Dustin Morrill and Thomas J. Walsh and Daniel Hernandez and Peter R. Wurman and Peter Stone},
  editor    = {Robin J. Evans and Ilya Shpitser},
  title     = {Composing Efficient, Robust Tests for Policy Selection},
  booktitle = {Uncertainty in Artificial Intelligence, {UAI} 2023, July 31 - 4 August 2023, Pittsburgh, PA, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {216},
  pages     = {1456--1466},
  publisher = {{PMLR}},
  year      = {2023},
  url       = {https://proceedings.mlr.press/v216/morrill23a.html},
  timestamp = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl    = {https://dblp.org/rec/conf/uai/Morrill0HWS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2301-07799,
  author     = {Megan M. Baker and Alexander New and Mario Aguilar{-}Simon and Ziad Al{-}Halah and S{\'{e}}bastien M. R. Arnold and Eseoghene Ben{-}Iwhiwhu and Andrew P. Brna and Ethan Brooks and Ryan C. Brown and Zachary Daniels and Anurag Reddy Daram and Fabien Delattre and Ryan Dellana and Eric Eaton and Haotian Fu and Kristen Grauman and Jesse Hostetler and Shariq Iqbal and Cassandra Kent and Nicholas Ketz and Soheil Kolouri and George Dimitri Konidaris and Dhireesha Kudithipudi and Erik G. Learned{-}Miller and Seungwon Lee and Michael Littman and Sandeep Madireddy and Jorge A. Mendez and Eric Q. Nguyen and Christine D. Piatko and Praveen K. Pilly and Aswin Raghavan and Abrar Rahman and Santhosh Kumar Ramakrishnan and Neale Ratzlaff and Andrea Soltoggio and Peter Stone and Indranil Sur and Zhipeng Tang and Saket Tiwari and Kyle Vedder and Felix Wang and Zifan Xu and Angel Yanguas{-}Gil and Harel Yedidsion and Shangqun Yu and Gautam K. Vallabha},
  title      = {A Domain-Agnostic Approach for Characterization of Lifelong Learning Systems},
  journal    = {CoRR},
  volume     = {abs/2301.07799},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.07799},
  doi        = {10.48550/ARXIV.2301.07799},
  eprinttype = {arXiv},
  eprint     = {2301.07799},
  timestamp  = {Mon, 09 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-07799.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2304-11477,
  author     = {Bo Liu and Yuqian Jiang and Xiaohan Zhang and Qiang Liu and Shiqi Zhang and Joydeep Biswas and Peter Stone},
  title      = {{LLM+P:} Empowering Large Language Models with Optimal Planning Proficiency},
  journal    = {CoRR},
  volume     = {abs/2304.11477},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.11477},
  doi        = {10.48550/ARXIV.2304.11477},
  eprinttype = {arXiv},
  eprint     = {2304.11477},
  timestamp  = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-11477.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-04866,
  author     = {Jiaheng Hu and Peter Stone and Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n},
  title      = {Causal Policy Gradient for Whole-Body Mobile Manipulation},
  journal    = {CoRR},
  volume     = {abs/2305.04866},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.04866},
  doi        = {10.48550/ARXIV.2305.04866},
  eprinttype = {arXiv},
  eprint     = {2305.04866},
  timestamp  = {Fri, 12 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-04866.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-10395,
  author     = {Yoonchang Sung and Peter Stone},
  title      = {Motion Planning (In)feasibility Detection using a Prior Roadmap via Path and Cut Search},
  journal    = {CoRR},
  volume     = {abs/2305.10395},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.10395},
  doi        = {10.48550/ARXIV.2305.10395},
  eprinttype = {arXiv},
  eprint     = {2305.10395},
  timestamp  = {Wed, 24 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-10395.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-03310,
  author     = {Bo Liu and Yifeng Zhu and Chongkai Gao and Yihao Feng and
                Qiang Liu and Yuke Zhu and Peter Stone},
  title      = {{LIBERO:} Benchmarking Knowledge Transfer for Lifelong Robot Learning},
  journal    = {CoRR},
  volume     = {abs/2306.03310},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.03310},
  doi        = {10.48550/ARXIV.2306.03310},
  eprinttype = {arXiv},
  eprint     = {2306.03310},
  timestamp  = {Mon, 31 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-03310.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-03792,
  author     = {Bo Liu and Yihao Feng and Peter Stone and Qiang Liu},
  title      = {{FAMO:} Fast Adaptive Multitask Optimization},
  journal    = {CoRR},
  volume     = {abs/2306.03792},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.03792},
  doi        = {10.48550/ARXIV.2306.03792},
  eprinttype = {arXiv},
  eprint     = {2306.03792},
  timestamp  = {Mon, 31 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-03792.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-07372,
  author     = {Dustin Morrill and Thomas J. Walsh and Daniel Hernandez and
                Peter R. Wurman and Peter Stone},
  title      = {Composing Efficient, Robust Tests for Policy Selection},
  journal    = {CoRR},
  volume     = {abs/2306.07372},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.07372},
  doi        = {10.48550/ARXIV.2306.07372},
  eprinttype = {arXiv},
  eprint     = {2306.07372},
  timestamp  = {Sat, 17 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-07372.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-16740,
  author     = {Anthony G. Francis and Claudia P{\'{e}}rez{-}D'Arpino and
                Chengshu Li and Fei Xia and Alexandre Alahi and Rachid Alami and
                Aniket Bera and Abhijat Biswas and Joydeep Biswas and
                Rohan Chandra and Hao{-}Tien Lewis Chiang and Michael Everett and
                Sehoon Ha and Justin W. Hart and Jonathan P. How and
                Haresh Karnan and Tsang{-}Wei Edward Lee and Luis J. Manso and
                Reuth Mirsky and S{\"{o}}ren Pirk and Phani{-}Teja Singamaneni and
                Peter Stone and Ada V. Taylor and Peter Trautman and Nathan Tsoi and
                Marynel V{\'{a}}zquez and Xuesu Xiao and Peng Xu and
                Naoki Yokoyama and Alexander Toshev and
                Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n},
  title      = {Principles and Guidelines for Evaluating Social Robot Navigation Algorithms},
  journal    = {CoRR},
  volume     = {abs/2306.16740},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.16740},
  doi        = {10.48550/ARXIV.2306.16740},
  eprinttype = {arXiv},
  eprint     = {2306.16740},
  timestamp  = {Mon, 03 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-16740.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-11889,
  author     = {Xiaohan Zhang and Yifeng Zhu and Yan Ding and Yuqian Jiang and
                Yuke Zhu and Peter Stone and Shiqi Zhang},
  title      = {Symbolic State Space Optimization for Long Horizon Mobile Manipulation Planning},
  journal    = {CoRR},
  volume     = {abs/2307.11889},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.11889},
  doi        = {10.48550/ARXIV.2307.11889},
  eprinttype = {arXiv},
  eprint     = {2307.11889},
  timestamp  = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-11889.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2308-03205,
  author     = {Xuesu Xiao and Zifan Xu and Garrett Warnell and Peter Stone and
                Ferran Gebelli Guinjoan and R{\^{o}}mulo T. Rodrigues and
                Herman Bruyninckx and Hanjaya Mandala and Guilherme Christmann and
                Jos{\'{e}} Luis Blanco{-}Claraco and Shravan Somashekara Rai},
  title      = {Autonomous Ground Navigation in Highly Constrained Spaces: Lessons learned from The 2nd {BARN} Challenge at {ICRA} 2023},
  journal    = {CoRR},
  volume     = {abs/2308.03205},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.03205},
  doi        = {10.48550/ARXIV.2308.03205},
  eprinttype = {arXiv},
  eprint     = {2308.03205},
  timestamp  = {Mon, 21 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-03205.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2308-09595,
  author     = {Arrasy Rahman and Jiaxun Cui and Peter Stone},
  title      = {Minimum Coverage Sets for Training Robust Ad Hoc Teamwork Agents},
  journal    = {CoRR},
  volume     = {abs/2308.09595},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.09595},
  doi        = {10.48550/ARXIV.2308.09595},
  eprinttype = {arXiv},
  eprint     = {2308.09595},
  timestamp  = {Fri, 25 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-09595.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2308-10966,
  author     = {Rohan Chandra and Vrushabh Zinage and Efstathios Bakolas and
                Joydeep Biswas and Peter Stone},
  title      = {Decentralized Multi-Robot Social Navigation in Constrained Environments via Game-Theoretic Control Barrier Functions},
  journal    = {CoRR},
  volume     = {abs/2308.10966},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.10966},
  doi        = {10.48550/ARXIV.2308.10966},
  eprinttype = {arXiv},
  eprint     = {2308.10966},
  timestamp  = {Wed, 30 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-10966.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2308-14269,
  author     = {Elad Liebman and Peter Stone},
  title      = {Utilizing Mood-Inducing Background Music in Human-Robot Interaction},
  journal    = {CoRR},
  volume     = {abs/2308.14269},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.14269},
  doi        = {10.48550/ARXIV.2308.14269},
  eprinttype = {arXiv},
  eprint     = {2308.14269},
  timestamp  = {Fri, 01 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-14269.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-08897,
  author     = {Yoonchang Sung and Rahul Shome and Peter Stone},
  title      = {Asynchronous Task Plan Refinement for Multi-Robot Task and Motion Planning},
  journal    = {CoRR},
  volume     = {abs/2309.08897},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.08897},
  doi        = {10.48550/ARXIV.2309.08897},
  eprinttype = {arXiv},
  eprint     = {2309.08897},
  timestamp  = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-08897.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-09912,
  author     = {Haresh Karnan and Elvin Yang and Garrett Warnell and
                Joydeep Biswas and Peter Stone},
  title      = {Wait, That Feels Familiar: Learning to Extrapolate Human Preferences for Preference Aligned Path Planning},
  journal    = {CoRR},
  volume     = {abs/2309.09912},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.09912},
  doi        = {10.48550/ARXIV.2309.09912},
  eprinttype = {arXiv},
  eprint     = {2309.09912},
  timestamp  = {Fri, 22 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-09912.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-13466,
  author     = {Amir Hossain Raj and Zichao Hu and Haresh Karnan and
                Rohan Chandra and Amirreza Payandeh and Luisa Mao and
                Peter Stone and Joydeep Biswas and Xuesu Xiao},
  title      = {Targeted Learning: {A} Hybrid Approach to Social Robot Navigation},
  journal    = {CoRR},
  volume     = {abs/2309.13466},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.13466},
  doi        = {10.48550/ARXIV.2309.13466},
  eprinttype = {arXiv},
  eprint     = {2309.13466},
  timestamp  = {Wed, 27 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-13466.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-15302,
  author     = {Haresh Karnan and Elvin Yang and Daniel Farkash and
                Garrett Warnell and Joydeep Biswas and Peter Stone},
  title      = {Self-Supervised Terrain Representation Learning from Unconstrained Robot Experience},
  journal    = {CoRR},
  volume     = {abs/2309.15302},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.15302},
  doi        = {10.48550/ARXIV.2309.15302},
  eprinttype = {arXiv},
  eprint     = {2309.15302},
  timestamp  = {Tue, 17 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-15302.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-02456,
  author     = {W. Bradley Knox and Stephane Hatgis{-}Kessell and
                Sigurdur O. Adalgeirsson and Serena Booth and Anca D. Dragan and
                Peter Stone and Scott Niekum},
  title      = {Learning Optimal Advantage from Preferences and Mistaking it for Reward},
  journal    = {CoRR},
  volume     = {abs/2310.02456},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02456},
  doi        = {10.48550/ARXIV.2310.02456},
  eprinttype = {arXiv},
  eprint     = {2310.02456},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02456.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-06303,
  author     = {Carson Stark and Bohkyung Chun and Casey Charleston and
                Varsha Ravi and Luis Pabon and Surya Sunkari and Tarun Mohan and
                Peter Stone and Justin W. Hart},
  title      = {Dobby: {A} Conversational Service Robot Driven by {GPT-4}},
  journal    = {CoRR},
  volume     = {abs/2310.06303},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.06303},
  doi        = {10.48550/ARXIV.2310.06303},
  eprinttype = {arXiv},
  eprint     = {2310.06303},
  timestamp  = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-06303.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-06794,
  author     = {Siddhant Agarwal and Ishan Durugkar and Peter Stone and Amy Zhang},
  title      = {f-Policy Gradients: {A} General Framework for Goal Conditioned {RL} using f-Divergences},
  journal    = {CoRR},
  volume     = {abs/2310.06794},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.06794},
  doi        = {10.48550/ARXIV.2310.06794},
  eprinttype = {arXiv},
  eprint     = {2310.06794},
  timestamp  = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-06794.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-08702,
  author     = {Jiaheng Hu and Zizhao Wang and Peter Stone and
                Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n},
  title      = {{ELDEN:} Exploration via Local Dependencies},
  journal    = {CoRR},
  volume     = {abs/2310.08702},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.08702},
  doi        = {10.48550/ARXIV.2310.08702},
  eprinttype = {arXiv},
  eprint     = {2310.08702},
  timestamp  = {Wed, 25 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-08702.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-14386,
  author     = {Yifeng Zhu and Zhenyu Jiang and Peter Stone and Yuke Zhu},
  title      = {Learning Generalizable Manipulation Policies with Object-Centric {3D} Representations},
  journal    = {CoRR},
  volume     = {abs/2310.14386},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.14386},
  doi        = {10.48550/ARXIV.2310.14386},
  eprinttype = {arXiv},
  eprint     = {2310.14386},
  timestamp  = {Mon, 30 Oct 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-14386.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2311-00785,
  author     = {Swathi Mannem and William Macke and Peter Stone and Reuth Mirsky},
  title      = {Exploring the Cost of Interruptions in Human-Robot Teaming},
  journal    = {CoRR},
  volume     = {abs/2311.00785},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.00785},
  doi        = {10.48550/ARXIV.2311.00785},
  eprinttype = {arXiv},
  eprint     = {2311.00785},
  timestamp  = {Tue, 07 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-00785.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2311-08783,
  author     = {Sveta Paster and Kantwon Rogers and Gordon Briggs and
                Peter Stone and Reuth Mirsky},
  title      = {{ICRA} Roboethics Challenge 2023: Intelligent Disobedience in an Elderly Care Home},
  journal    = {CoRR},
  volume     = {abs/2311.08783},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.08783},
  doi        = {10.48550/ARXIV.2311.08783},
  eprinttype = {arXiv},
  eprint     = {2311.08783},
  timestamp  = {Tue, 21 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-08783.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2312-04684,
  author     = {Zifan Xu and Haozhu Wang and Dmitriy Bespalov and
                Peter Stone and Yanjun Qi},
  title      = {Latent Skill Discovery for Chain-of-Thought Reasoning},
  journal    = {CoRR},
  volume     = {abs/2312.04684},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2312.04684},
  doi        = {10.48550/ARXIV.2312.04684},
  eprinttype = {arXiv},
  eprint     = {2312.04684},
  timestamp  = {Wed, 03 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2312-04684.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/arobots/XiaoLWS22,
  author     = {Xuesu Xiao and Bo Liu and Garrett Warnell and Peter Stone},
  title      = {Motion planning and control for mobile robot navigation using machine learning: a survey},
  journal    = {Auton. Robots},
  volume     = {46},
  number     = {5},
  pages      = {569--597},
  year       = {2022},
  url        = {https://doi.org/10.1007/s10514-022-10039-8},
  doi        = {10.1007/S10514-022-10039-8},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/arobots/XiaoLWS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/expert/WurmanSS22,
  author     = {Peter R. Wurman and Peter Stone and Michael Spranger},
  title      = {Challenges and Opportunities of Applying Reinforcement Learning to Autonomous Racing},
  journal    = {{IEEE} Intell. Syst.},
  volume     = {37},
  number     = {3},
  pages      = {20--23},
  year       = {2022},
  url        = {https://doi.org/10.1109/MIS.2022.3184427},
  doi        = {10.1109/MIS.2022.3184427},
  timestamp  = {Mon, 08 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/expert/WurmanSS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ior/AlbertCLS22,
  author     = {Michael Albert and Vincent Conitzer and Giuseppe Lopomo and Peter Stone},
  title      = {Mechanism Design for Correlated Valuations: Efficient Methods for Revenue Maximization},
  journal    = {Oper. Res.},
  volume     = {70},
  number     = {1},
  pages      = {562--584},
  year       = {2022},
  url        = {https://doi.org/10.1287/opre.2020.2092},
  doi        = {10.1287/OPRE.2020.2092},
  timestamp  = {Wed, 23 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ior/AlbertCLS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nature/WurmanBKMS0CDE022,
  author     = {Peter R. Wurman and Samuel Barrett and Kenta Kawamoto and
                James MacGlashan and Kaushik Subramanian and Thomas J. Walsh and
                Roberto Capobianco and Alisa Devlic and Franziska Eckert and
                Florian Fuchs and Leilani Gilpin and Piyush Khandelwal and
                Varun Kompella and HaoChih Lin and Patrick MacAlpine and
                Declan Oller and Takuma Seno and Craig Sherstan and
                Michael D. Thomure and Houmehr Aghabozorgi and Leon Barrett and
                Rory Douglas and Dion Whitehead and Peter D{\"{u}}rr and
                Peter Stone and Michael Spranger and Hiroaki Kitano},
  title      = {Outracing champion {Gran Turismo} drivers with deep reinforcement learning},
  journal    = {Nat.},
  volume     = {602},
  number     = {7896},
  pages      = {223--228},
  year       = {2022},
  url        = {https://doi.org/10.1038/s41586-021-04357-7},
  doi        = {10.1038/S41586-021-04357-7},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/nature/WurmanBKMS0CDE022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nca/DuWGST22,
  author     = {Yunshu Du and Garrett Warnell and Assefaw H. Gebremedhin and
                Peter Stone and Matthew E. Taylor},
  title      = {Lucid dreaming for experience replay: refreshing past states with the current policy},
  journal    = {Neural Comput. Appl.},
  volume     = {34},
  number     = {3},
  pages      = {1687--1712},
  year       = {2022},
  url        = {https://doi.org/10.1007/s00521-021-06104-5},
  doi        = {10.1007/S00521-021-06104-5},
  timestamp  = {Wed, 23 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/nca/DuWGST22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ral/ZhuSZ22,
  author     = {Yifeng Zhu and Peter Stone and Yuke Zhu},
  title      = {Bottom-Up Skill Discovery From Unsegmented Demonstrations for Long-Horizon Robot Manipulation},
  journal    = {{IEEE} Robotics Autom. Lett.},
  volume     = {7},
  number     = {2},
  pages      = {4126--4133},
  year       = {2022},
  url        = {https://doi.org/10.1109/LRA.2022.3146589},
  doi        = {10.1109/LRA.2022.3146589},
  timestamp  = {Fri, 01 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ral/ZhuSZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ral/KarnanNXWPTHBS22,
  author     = {Haresh Karnan and Anirudh Nair and Xuesu Xiao and
                Garrett Warnell and S{\"{o}}ren Pirk and Alexander Toshev and
                Justin W. Hart and Joydeep Biswas and Peter Stone},
  title      = {Socially {CompliAnt} Navigation Dataset {(SCAND):} {A} Large-Scale Dataset of Demonstrations for Social Navigation},
  journal    = {{IEEE} Robotics Autom. Lett.},
  volume     = {7},
  number     = {4},
  pages      = {11807--11814},
  year       = {2022},
  url        = {https://doi.org/10.1109/LRA.2022.3184025},
  doi        = {10.1109/LRA.2022.3184025},
  timestamp  = {Mon, 05 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ral/KarnanNXWPTHBS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ram/XiaoXWSWSZRWKBM22,
  author     = {Xuesu Xiao and Zifan Xu and Zizhao Wang and Yunlong Song and
                Garrett Warnell and Peter Stone and Tingnan Zhang and
                Shravan Ravi and Gary Wang and Haresh Karnan and Joydeep Biswas and
                Nicholas Mohammad and Lauren Bramblett and Rahul Peddi and
                Nicola Bezzo and Zhanteng Xie and Philip M. Dames},
  title      = {Autonomous Ground Navigation in Highly Constrained Spaces: Lessons Learned From the Benchmark Autonomous Robot Navigation Challenge at {ICRA} 2022 [Competitions]},
  journal    = {{IEEE} Robotics Autom. Mag.},
  volume     = {29},
  number     = {4},
  pages      = {148--156},
  year       = {2022},
  url        = {https://doi.org/10.1109/MRA.2022.3213466},
  doi        = {10.1109/MRA.2022.3213466},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ram/XiaoXWSWSZRWKBM22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ras/XiaoWXLWDNS22,
  author     = {Xuesu Xiao and Zizhao Wang and Zifan Xu and Bo Liu and
                Garrett Warnell and Gauraang Dhamankar and Anirudh Nair and
                Peter Stone},
  title      = {{APPL:} Adaptive Planner Parameter Learning},
  journal    = {Robotics Auton. Syst.},
  volume     = {154},
  pages      = {104132},
  year       = {2022},
  url        = {https://doi.org/10.1016/j.robot.2022.104132},
  doi        = {10.1016/J.ROBOT.2022.104132},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ras/XiaoWXLWDNS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/collas/Shperberg0AS22,
  author     = {Shahaf S. Shperberg and Bo Liu and Alessandro Allievi and Peter Stone},
  editor     = {Sarath Chandar and Razvan Pascanu and Doina Precup},
  title      = {A Rule-based Shield: Accumulating Safety Rules from Catastrophic Action Effects},
  booktitle  = {Conference on Lifelong Learning Agents, CoLLAs 2022, 22-24 August 2022, McGill University, Montr{\'{e}}al, Qu{\'{e}}bec, Canada},
  series     = {Proceedings of Machine Learning Research},
  volume     = {199},
  pages      = {231--242},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v199/shperberg22a.html},
  timestamp  = {Fri, 17 Feb 2023 16:29:10 +0100},
  biburl     = {https://dblp.org/rec/conf/collas/Shperberg0AS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/collas/LiuLS22,
  author     = {Bo Liu and Qiang Liu and Peter Stone},
  editor     = {Sarath Chandar and Razvan Pascanu and Doina Precup},
  title      = {Continual Learning and Private Unlearning},
  booktitle  = {Conference on Lifelong Learning Agents, CoLLAs 2022, 22-24 August 2022, McGill University, Montr{\'{e}}al, Qu{\'{e}}bec, Canada},
  series     = {Proceedings of Machine Learning Research},
  volume     = {199},
  pages      = {243--254},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v199/liu22a.html},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/collas/LiuLS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/ZhuJSZ22,
  author     = {Yifeng Zhu and Abhishek Joshi and Peter Stone and Yuke Zhu},
  editor     = {Karen Liu and Dana Kulic and Jeffrey Ichnowski},
  title      = {{VIOLA:} Object-Centric Imitation Learning for Vision-Based Robot Manipulation},
  booktitle  = {Conference on Robot Learning, CoRL 2022, 14-18 December 2022, Auckland, New Zealand},
  series     = {Proceedings of Machine Learning Research},
  volume     = {205},
  pages      = {1199--1210},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v205/zhu23a.html},
  timestamp  = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/corl/ZhuJSZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/SungWS22,
  author     = {Yoonchang Sung and Zizhao Wang and Peter Stone},
  editor     = {Karen Liu and Dana Kulic and Jeffrey Ichnowski},
  title      = {Learning to Correct Mistakes: Backjumping in Long-Horizon Task and Motion Planning},
  booktitle  = {Conference on Robot Learning, CoRL 2022, 14-18 December 2022, Auckland, New Zealand},
  series     = {Proceedings of Machine Learning Research},
  volume     = {205},
  pages      = {2115--2124},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v205/sung23a.html},
  timestamp  = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/corl/SungWS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/CuiQ0SZ22,
  author     = {Jiaxun Cui and Hang Qiu and Dian Chen and Peter Stone and Yuke Zhu},
  title      = {Coopernaut: End-to-End Driving with Cooperative Perception for Networked Vehicles},
  booktitle  = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2022, New Orleans, LA, USA, June 18-24, 2022},
  pages      = {17231--17241},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/CVPR52688.2022.01674},
  doi        = {10.1109/CVPR52688.2022.01674},
  timestamp  = {Mon, 13 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/cvpr/CuiQ0SZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eenergy/Nweye0LS22,
  author     = {Kingsley Nweye and Zolt{\'{a}}n Nagy and Bo Liu and Peter Stone},
  editor     = {Sebastian Lehnhoff and David E. Irwin and Dan Wang},
  title      = {Offline training of multi-agent reinforcement agents for grid-interactive buildings control},
  booktitle  = {e-Energy '22: The Thirteenth {ACM} International Conference on Future Energy Systems, Virtual Event, 28 June 2022 - 1 July 2022},
  pages      = {442--443},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3538637.3538752},
  doi        = {10.1145/3538637.3538752},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/eenergy/Nweye0LS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eumas/MirskyCRFMSSA22,
  author     = {Reuth Mirsky and Ignacio Carlucho and Arrasy Rahman and
                Elliot Fosong and William Macke and Mohan Sridharan and
                Peter Stone and Stefano V. Albrecht},
  editor     = {Dorothea Baumeister and J{\"{o}}rg Rothe},
  title      = {A Survey of Ad Hoc Teamwork Research},
  booktitle  = {Multi-Agent Systems - 19th European Conference, {EUMAS} 2022, D{\"{u}}sseldorf, Germany, September 14-16, 2022, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {13442},
  pages      = {275--293},
  publisher  = {Springer},
  year       = {2022},
  url        = {https://doi.org/10.1007/978-3-031-20614-6\_16},
  doi        = {10.1007/978-3-031-20614-6\_16},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/eumas/MirskyCRFMSSA22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/KumarLMS22,
  author     = {Akarsh Kumar and Bo Liu and Risto Miikkulainen and Peter Stone},
  editor     = {Jonathan E. Fieldsend and Markus Wagner},
  title      = {Effective mutation rate adaptation through group elite selection},
  booktitle  = {{GECCO} '22: Genetic and Evolutionary Computation Conference, Boston, Massachusetts, USA, July 9 - 13, 2022},
  pages      = {721--729},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3512290.3528706},
  doi        = {10.1145/3512290.3528706},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/gecco/KumarLMS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/WangXXZS22,
  author     = {Zizhao Wang and Xuesu Xiao and Zifan Xu and Yuke Zhu and Peter Stone},
  editor     = {Kamalika Chaudhuri and Stefanie Jegelka and Le Song and
                Csaba Szepesv{\'{a}}ri and Gang Niu and Sivan Sabato},
  title      = {Causal Dynamics Learning for Task-Independent State Abstraction},
  booktitle  = {International Conference on Machine Learning, {ICML} 2022, 17-23 July 2022, Baltimore, Maryland, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {162},
  pages      = {23151--23180},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v162/wang22ae.html},
  timestamp  = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/WangXXZS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/ZhangZDZS022,
  author     = {Xiaohan Zhang and Yifeng Zhu and Yan Ding and Yuke Zhu and
                Peter Stone and Shiqi Zhang},
  title      = {Visually Grounded Task and Motion Planning for Mobile Manipulation},
  booktitle  = {2022 International Conference on Robotics and Automation, {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages      = {1925--1931},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/ICRA46639.2022.9812055},
  doi        = {10.1109/ICRA46639.2022.9812055},
  timestamp  = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icra/ZhangZDZS022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/KarnanTWS22,
  author     = {Haresh Karnan and Faraz Torabi and Garrett Warnell and Peter Stone},
  title      = {Adversarial Imitation Learning from Video Using a State Observer},
  booktitle  = {2022 International Conference on Robotics and Automation, {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages      = {2452--2458},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/ICRA46639.2022.9811570},
  doi        = {10.1109/ICRA46639.2022.9811570},
  timestamp  = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/KarnanTWS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/HudsonWTS22,
  author     = {Eddy Hudson and Garrett Warnell and Faraz Torabi and Peter Stone},
  title      = {Skeletal Feature Compensation for Imitation Learning with Embodiment Mismatch},
  booktitle  = {2022 International Conference on Robotics and Automation, {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages      = {2482--2488},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/ICRA46639.2022.9812127},
  doi        = {10.1109/ICRA46639.2022.9812127},
  timestamp  = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/HudsonWTS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/KarnanWXS22,
  author     = {Haresh Karnan and Garrett Warnell and Xuesu Xiao and Peter Stone},
  title      = {{VOILA:} Visual-Observation-Only Imitation Learning for Autonomous Navigation},
  booktitle  = {2022 International Conference on Robotics and Automation, {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages      = {2497--2503},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/ICRA46639.2022.9812316},
  doi        = {10.1109/ICRA46639.2022.9812316},
  timestamp  = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/KarnanWXS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/SokarMMPS22,
  author     = {Ghada Sokar and Elena Mocanu and Decebal Constantin Mocanu and
                Mykola Pechenizkiy and Peter Stone},
  editor     = {Luc De Raedt},
  title      = {Dynamic Sparse Training for Deep Reinforcement Learning},
  booktitle  = {Proceedings of the Thirty-First International Joint Conference on Artificial Intelligence, {IJCAI} 2022, Vienna, Austria, 23-29 July 2022},
  pages      = {3437--3443},
  publisher  = {ijcai.org},
  year       = {2022},
  url        = {https://doi.org/10.24963/ijcai.2022/477},
  doi        = {10.24963/IJCAI.2022/477},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ijcai/SokarMMPS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/KarnanSARXWSB22,
  author     = {Haresh Karnan and Kavan Singh Sikand and Pranav Atreya and
                Sadegh Rabiee and Xuesu Xiao and Garrett Warnell and
                Peter Stone and Joydeep Biswas},
  title      = {{VI-IKD:} High-Speed Accurate Off-Road Navigation using Learned Visual-Inertial Inverse Kinodynamics},
  booktitle  = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2022, Kyoto, Japan, October 23-27, 2022},
  pages      = {3294--3301},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/IROS47612.2022.9982060},
  doi        = {10.1109/IROS47612.2022.9982060},
  timestamp  = {Tue, 03 Jan 2023 14:18:21 +0100},
  biburl     = {https://dblp.org/rec/conf/iros/KarnanSARXWSB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/GhonasgiMHSD22,
  author     = {Keya Ghonasgi and Reuth Mirsky and Adrian M. Haith and
                Peter Stone and Ashish D. Deshpande},
  title      = {Quantifying Changes in Kinematic Behavior of a Human-Exoskeleton Interactive System},
  booktitle  = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2022, Kyoto, Japan, October 23-27, 2022},
  pages      = {10734--10739},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/IROS47612.2022.9981032},
  doi        = {10.1109/IROS47612.2022.9981032},
  timestamp  = {Tue, 03 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iros/GhonasgiMHSD22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LiuYWSL22,
  author     = {Bo Liu and Mao Ye and Stephen Wright and Peter Stone and Qiang Liu},
  editor     = {Sanmi Koyejo and S. Mohamed and A. Agarwal and
                Danielle Belgrave and K. Cho and A. Oh},
  title      = {{BOME!} Bilevel Optimization Made Easy: {A} Simple First-Order Approach},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/6dddcff5b115b40c998a08fbd1cea4d7-Abstract-Conference.html},
  timestamp  = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LiuYWSL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/MacGlashanADSSW22,
  author     = {James MacGlashan and Evan Archer and Alisa Devlic and
                Takuma Seno and Craig Sherstan and Peter R. Wurman and
                Peter Stone},
  editor     = {Sanmi Koyejo and S. Mohamed and A. Agarwal and
                Danielle Belgrave and K. Cho and A. Oh},
  title      = {Value Function Decomposition for Iterative Design of Reinforcement Learning Agents},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/4eb2c0adafbe71269f3a772c130f9e53-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/MacGlashanADSSW22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% RoboCup 2022 symposium paper (LNCS 13561). The booktitle uses a plain
% colon between the main title and the subtitle.
@inproceedings{DBLP:conf/robocup/NarayanaswamiTD22,
  author     = {Sai Kiran Narayanaswami and Mauricio Tec and Ishan Durugkar and Siddharth Desai and Bharath Masetty and Sanmit Narvekar and Peter Stone},
  editor     = {Amy Eguchi and Nuno Lau and Maike Paetzel{-}Pr{\"{u}}smann and Thanapat Wanichanon},
  title      = {Towards a Real-Time, Low-Resource, End-to-End Object Detection Pipeline for Robot Soccer},
  booktitle  = {RoboCup 2022: Robot World Cup {XXV} [Bangkok, Thailand, July 11-17, 2022]},
  series     = {Lecture Notes in Computer Science},
  volume     = {13561},
  pages      = {62--74},
  publisher  = {Springer},
  year       = {2022},
  url        = {https://doi.org/10.1007/978-3-031-28469-4\_6},
  doi        = {10.1007/978-3-031-28469-4\_6},
  timestamp  = {Wed, 24 May 2023 15:08:30 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/NarayanaswamiTD22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% SSRR 2022 paper. The benchmark name in the title is braced so that
% styles applying sentence case keep its mixed capitalisation.
@inproceedings{DBLP:conf/ssrr/NairJHXLXS22,
  author     = {Anirudh Nair and Fulin Jiang and Kang Hou and Zifan Xu and Shuozhe Li and Xuesu Xiao and Peter Stone},
  title      = {{DynaBARN:} Benchmarking Metric Ground Navigation in Dynamic Environments},
  booktitle  = {{IEEE} International Symposium on Safety, Security, and Rescue Robotics, {SSRR} 2022, Sevilla, Spain, November 8-10, 2022},
  pages      = {347--352},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SSRR56537.2022.10018758},
  doi        = {10.1109/SSRR56537.2022.10018758},
  timestamp  = {Wed, 08 Feb 2023 22:09:23 +0100},
  biburl     = {https://dblp.org/rec/conf/ssrr/NairJHXLXS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2202-00243,
  author     = {Haresh Karnan and Garrett Warnell and Faraz Torabi and Peter Stone},
  title      = {Adversarial Imitation Learning from Video using a State Observer},
  journal    = {CoRR},
  volume     = {abs/2202.00243},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.00243},
  eprinttype = {arXiv},
  eprint     = {2202.00243},
  timestamp  = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-00243.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2202-09516,
  author     = {Shahaf S. Shperberg and Bo Liu and Peter Stone},
  title      = {Learning a Shield from Catastrophic Action Effects: Never Repeat the Same Mistake},
  journal    = {CoRR},
  volume     = {abs/2202.09516},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.09516},
  eprinttype = {arXiv},
  eprint     = {2202.09516},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-09516.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2202-10450,
  author     = {Reuth Mirsky and Ignacio Carlucho and Arrasy Rahman and Elliot Fosong and William Macke and Mohan Sridharan and Peter Stone and Stefano V. Albrecht},
  title      = {A Survey of Ad Hoc Teamwork: Definitions, Methods, and Open Problems},
  journal    = {CoRR},
  volume     = {abs/2202.10450},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.10450},
  eprinttype = {arXiv},
  eprint     = {2202.10450},
  timestamp  = {Wed, 02 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-10450.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2202-10667,
  author     = {Xiaohan Zhang and Yifeng Zhu and Yan Ding and Yuke Zhu and Peter Stone and Shiqi Zhang},
  title      = {Visually Grounded Task and Motion Planning for Mobile Manipulation},
  journal    = {CoRR},
  volume     = {abs/2202.10667},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.10667},
  eprinttype = {arXiv},
  eprint     = {2202.10667},
  timestamp  = {Mon, 25 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-10667.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2203-12817,
  author     = {Bo Liu and Qiang Liu and Peter Stone},
  title      = {Continual Learning and Private Unlearning},
  journal    = {CoRR},
  volume     = {abs/2203.12817},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.12817},
  doi        = {10.48550/ARXIV.2203.12817},
  eprinttype = {arXiv},
  eprint     = {2203.12817},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-12817.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2203-15041,
  author     = {Haresh Karnan and Anirudh Nair and Xuesu Xiao and Garrett Warnell and S{\"{o}}ren Pirk and Alexander Toshev and Justin W. Hart and Joydeep Biswas and Peter Stone},
  title      = {Socially Compliant Navigation Dataset {(SCAND):} {A} Large-Scale Dataset of Demonstrations for Social Navigation},
  journal    = {CoRR},
  volume     = {abs/2203.15041},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.15041},
  doi        = {10.48550/ARXIV.2203.15041},
  eprinttype = {arXiv},
  eprint     = {2203.15041},
  timestamp  = {Mon, 28 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-15041.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2203-15983,
  author     = {Haresh Karnan and Kavan Singh Sikand and Pranav Atreya and Sadegh Rabiee and Xuesu Xiao and Garrett Warnell and Peter Stone and Joydeep Biswas},
  title      = {{VI-IKD:} High-Speed Accurate Off-Road Navigation using Learned Visual-Inertial Inverse Kinodynamics},
  journal    = {CoRR},
  volume     = {abs/2203.15983},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.15983},
  doi        = {10.48550/ARXIV.2203.15983},
  eprinttype = {arXiv},
  eprint     = {2203.15983},
  timestamp  = {Mon, 04 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-15983.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2204-04817,
  author     = {Akarsh Kumar and Bo Liu and Risto Miikkulainen and Peter Stone},
  title      = {Effective Mutation Rate Adaptation through Group Elite Selection},
  journal    = {CoRR},
  volume     = {abs/2204.04817},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.04817},
  doi        = {10.48550/ARXIV.2204.04817},
  eprinttype = {arXiv},
  eprint     = {2204.04817},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-04817.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2205-02222,
  author     = {Jiaxun Cui and Hang Qiu and Dian Chen and Peter Stone and Yuke Zhu},
  title      = {{COOPERNAUT:} End-to-End Driving with Cooperative Perception for Networked Vehicles},
  journal    = {CoRR},
  volume     = {abs/2205.02222},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.02222},
  doi        = {10.48550/ARXIV.2205.02222},
  eprinttype = {arXiv},
  eprint     = {2205.02222},
  timestamp  = {Mon, 13 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-02222.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint. The method name, including its math superscript, is
% braced as one unit so that styles applying sentence case leave it untouched.
@article{DBLP:journals/corr/abs-2206-00233,
  author     = {Caroline Wang and Ishan Durugkar and Elad Liebman and Peter Stone},
  title      = {{DM\({}^{\mbox{2}}\):} Distributed Multi-Agent Reinforcement Learning for Distribution Matching},
  journal    = {CoRR},
  volume     = {abs/2206.00233},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.00233},
  doi        = {10.48550/ARXIV.2206.00233},
  eprinttype = {arXiv},
  eprint     = {2206.00233},
  timestamp  = {Mon, 13 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-00233.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-02231,
  author     = {W. Bradley Knox and Stephane Hatgis{-}Kessell and Serena Booth and Scott Niekum and Peter Stone and Alessandro Allievi},
  title      = {Models of human preference for learning reward functions},
  journal    = {CoRR},
  volume     = {abs/2206.02231},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.02231},
  doi        = {10.48550/ARXIV.2206.02231},
  eprinttype = {arXiv},
  eprint     = {2206.02231},
  timestamp  = {Mon, 13 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-02231.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-08487,
  author     = {Pranav Atreya and Haresh Karnan and Kavan Singh Sikand and Xuesu Xiao and Garrett Warnell and Sadegh Rabiee and Peter Stone and Joydeep Biswas},
  title      = {High-Speed Accurate Robot Control using Learned Forward Kinodynamics and Non-linear Least Squares Optimization},
  journal    = {CoRR},
  volume     = {abs/2206.08487},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.08487},
  doi        = {10.48550/ARXIV.2206.08487},
  eprinttype = {arXiv},
  eprint     = {2206.08487},
  timestamp  = {Tue, 21 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-08487.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-13452,
  author     = {Zizhao Wang and Xuesu Xiao and Zifan Xu and Yuke Zhu and Peter Stone},
  title      = {Causal Dynamics Learning for Task-Independent State Abstraction},
  journal    = {CoRR},
  volume     = {abs/2206.13452},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.13452},
  doi        = {10.48550/ARXIV.2206.13452},
  eprinttype = {arXiv},
  eprint     = {2206.13452},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-13452.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2206-13901,
  author     = {James MacGlashan and Evan Archer and Alisa Devlic and Takuma Seno and Craig Sherstan and Peter R. Wurman and Peter Stone},
  title      = {Value Function Decomposition for Iterative Design of Reinforcement Learning Agents},
  journal    = {CoRR},
  volume     = {abs/2206.13901},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.13901},
  doi        = {10.48550/ARXIV.2206.13901},
  eprinttype = {arXiv},
  eprint     = {2206.13901},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-13901.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2208-08133,
  author     = {Bo Liu and Yihao Feng and Qiang Liu and Peter Stone},
  title      = {Metric Residual Networks for Sample Efficient Goal-conditioned Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2208.08133},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.08133},
  doi        = {10.48550/ARXIV.2208.08133},
  eprinttype = {arXiv},
  eprint     = {2208.08133},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-08133.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2208-10473,
  author     = {Xuesu Xiao and Zifan Xu and Zizhao Wang and Yunlong Song and Garrett Warnell and Peter Stone and Tingnan Zhang and Shravan Ravi and Gary Wang and Haresh Karnan and Joydeep Biswas and Nicholas Mohammad and Lauren Bramblett and Rahul Peddi and Nicola Bezzo and Zhanteng Xie and Philip M. Dames},
  title      = {Autonomous Ground Navigation in Highly Constrained Spaces: Lessons learned from The {BARN} Challenge at {ICRA} 2022},
  journal    = {CoRR},
  volume     = {abs/2208.10473},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.10473},
  doi        = {10.48550/ARXIV.2208.10473},
  eprinttype = {arXiv},
  eprint     = {2208.10473},
  timestamp  = {Mon, 29 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-10473.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint. The acronym in the title is braced so that styles
% applying sentence case keep its capitals.
@article{DBLP:journals/corr/abs-2209-08709,
  author     = {Mao Ye and Bo Liu and Stephen Wright and Peter Stone and Qiang Liu},
  title      = {{BOME!} Bilevel Optimization Made Easy: {A} Simple First-Order Approach},
  journal    = {CoRR},
  volume     = {abs/2209.08709},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.08709},
  doi        = {10.48550/ARXIV.2209.08709},
  eprinttype = {arXiv},
  eprint     = {2209.08709},
  timestamp  = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-08709.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2209-13641,
  author     = {Jin Soo Park and Xuesu Xiao and Garrett Warnell and Harel Yedidsion and Peter Stone},
  title      = {Learning Perceptual Hallucination for Multi-Robot Navigation in Narrow Hallways},
  journal    = {CoRR},
  volume     = {abs/2209.13641},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.13641},
  doi        = {10.48550/ARXIV.2209.13641},
  eprinttype = {arXiv},
  eprint     = {2209.13641},
  timestamp  = {Thu, 06 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-13641.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-04839,
  author     = {Zifan Xu and Bo Liu and Xuesu Xiao and Anirudh Nair and Peter Stone},
  title      = {Benchmarking Reinforcement Learning Techniques for Autonomous Navigation},
  journal    = {CoRR},
  volume     = {abs/2210.04839},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.04839},
  doi        = {10.48550/ARXIV.2210.04839},
  eprinttype = {arXiv},
  eprint     = {2210.04839},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-04839.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-04852,
  author     = {Zifan Xu and Anirudh Nair and Xuesu Xiao and Peter Stone},
  title      = {Learning Real-world Autonomous Navigation by Self-Supervised Environment Synthesis},
  journal    = {CoRR},
  volume     = {abs/2210.04852},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.04852},
  doi        = {10.48550/ARXIV.2210.04852},
  eprinttype = {arXiv},
  eprint     = {2210.04852},
  timestamp  = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-04852.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-10999,
  author     = {Vaibhav Bajaj and Guni Sharon and Peter Stone},
  title      = {Task Phasing: Automated Curriculum Learning from Demonstrations},
  journal    = {CoRR},
  volume     = {abs/2210.10999},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.10999},
  doi        = {10.48550/ARXIV.2210.10999},
  eprinttype = {arXiv},
  eprint     = {2210.10999},
  timestamp  = {Tue, 25 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-10999.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2210-11339,
  author     = {Yifeng Zhu and Abhishek Joshi and Peter Stone and Yuke Zhu},
  title      = {{VIOLA:} Imitation Learning for Vision-Based Manipulation with Object Proposal Priors},
  journal    = {CoRR},
  volume     = {abs/2210.11339},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.11339},
  doi        = {10.48550/ARXIV.2210.11339},
  eprinttype = {arXiv},
  eprint     = {2210.11339},
  timestamp  = {Tue, 25 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-11339.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint. The method name in the title is braced so that styles
% applying sentence case keep the capital "S" in "D-Shape".
@article{DBLP:journals/corr/abs-2210-14428,
  author     = {Caroline Wang and Garrett Warnell and Peter Stone},
  title      = {{D-Shape:} Demonstration-Shaped Reinforcement Learning via Goal Conditioning},
  journal    = {CoRR},
  volume     = {abs/2210.14428},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.14428},
  doi        = {10.48550/ARXIV.2210.14428},
  eprinttype = {arXiv},
  eprint     = {2210.14428},
  timestamp  = {Mon, 31 Oct 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-14428.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2211-00576,
  author     = {Varun Kompella and Thomas Walsh and Samuel Barrett and Peter R. Wurman and Peter Stone},
  title      = {Event Tables for Efficient Experience Replay},
  journal    = {CoRR},
  volume     = {abs/2211.00576},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.00576},
  doi        = {10.48550/ARXIV.2211.00576},
  eprinttype = {arXiv},
  eprint     = {2211.00576},
  timestamp  = {Tue, 15 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-00576.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2211-04005,
  author     = {Eddy Hudson and Ishan Durugkar and Garrett Warnell and Peter Stone},
  title      = {{ABC:} Adversarial Behavioral Cloning for Offline Mode-Seeking Imitation Learning},
  journal    = {CoRR},
  volume     = {abs/2211.04005},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.04005},
  doi        = {10.48550/ARXIV.2211.04005},
  eprinttype = {arXiv},
  eprint     = {2211.04005},
  timestamp  = {Wed, 09 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-04005.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2211-06318,
  author     = {Peter Stone and Rodney Brooks and Erik Brynjolfsson and Ryan Calo and Oren Etzioni and Greg Hager and Julia Hirschberg and Shivaram Kalyanakrishnan and Ece Kamar and Sarit Kraus and Kevin Leyton{-}Brown and David C. Parkes and William H. Press and AnnaLee Saxenian and Julie Shah and Milind Tambe and Astro Teller},
  title      = {Artificial Intelligence and Life in 2030: The One Hundred Year Study on Artificial Intelligence},
  journal    = {CoRR},
  volume     = {abs/2211.06318},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.06318},
  doi        = {10.48550/ARXIV.2211.06318},
  eprinttype = {arXiv},
  eprint     = {2211.06318},
  timestamp  = {Sat, 17 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-06318.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2211-07847,
  author     = {Yoonchang Sung and Zizhao Wang and Peter Stone},
  title      = {Learning to Correct Mistakes: Backjumping in Long-Horizon Task and Motion Planning},
  journal    = {CoRR},
  volume     = {abs/2211.07847},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.07847},
  doi        = {10.48550/ARXIV.2211.07847},
  eprinttype = {arXiv},
  eprint     = {2211.07847},
  timestamp  = {Wed, 23 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-07847.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2212-08302,
  author     = {Hager Radi and Josiah P. Hanna and Peter Stone and Matthew E. Taylor},
  title      = {Safe Evaluation For Offline Learning: Are We Ready To Deploy?},
  journal    = {CoRR},
  volume     = {abs/2212.08302},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.08302},
  doi        = {10.48550/ARXIV.2212.08302},
  eprinttype = {arXiv},
  eprint     = {2212.08302},
  timestamp  = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-08302.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/aamas/ZhangTWS21,
  author     = {Ruohan Zhang and Faraz Torabi and Garrett Warnell and Peter Stone},
  title      = {Recent advances in leveraging human guidance for sequential decision-making tasks},
  journal    = {Auton. Agents Multi Agent Syst.},
  volume     = {35},
  number     = {2},
  pages      = {31},
  year       = {2021},
  url        = {https://doi.org/10.1007/s10458-021-09514-w},
  doi        = {10.1007/S10458-021-09514-W},
  timestamp  = {Thu, 29 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/aamas/ZhangTWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% JAIR article. The proper noun "Markov" is braced, like the already
% protected "COVID-19", so that styles applying sentence case keep its capital.
@article{DBLP:journals/jair/CapobiancoKASJF21,
  author     = {Roberto Capobianco and Varun Kompella and James Ault and Guni Sharon and Stacy Jong and Spencer J. Fox and Lauren Ancel Meyers and Peter R. Wurman and Peter Stone},
  title      = {Agent-Based {Markov} Modeling for Improved {COVID-19} Mitigation Policies},
  journal    = {J. Artif. Intell. Res.},
  volume     = {71},
  pages      = {953--992},
  year       = {2021},
  url        = {https://doi.org/10.1613/jair.1.12632},
  doi        = {10.1613/JAIR.1.12632},
  timestamp  = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jair/CapobiancoKASJF21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ml/HannaNS21,
  author     = {Josiah P. Hanna and Scott Niekum and Peter Stone},
  title      = {Importance sampling in reinforcement learning with an estimated behavior policy},
  journal    = {Mach. Learn.},
  volume     = {110},
  number     = {6},
  pages      = {1267--1317},
  year       = {2021},
  url        = {https://doi.org/10.1007/s10994-020-05938-9},
  doi        = {10.1007/S10994-020-05938-9},
  timestamp  = {Thu, 05 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ml/HannaNS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ml/HannaDKWS21,
  author     = {Josiah P. Hanna and Siddharth Desai and Haresh Karnan and Garrett Warnell and Peter Stone},
  title      = {Grounded action transformation for sim-to-real reinforcement learning},
  journal    = {Mach. Learn.},
  volume     = {110},
  number     = {9},
  pages      = {2469--2499},
  year       = {2021},
  url        = {https://doi.org/10.1007/s10994-021-05982-z},
  doi        = {10.1007/S10994-021-05982-Z},
  timestamp  = {Thu, 16 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ml/HannaDKWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ral/LiuXS21,
  author     = {Bo Liu and Xuesu Xiao and Peter Stone},
  title      = {A Lifelong Learning Approach to Mobile Robot Navigation},
  journal    = {{IEEE} Robotics Autom. Lett.},
  volume     = {6},
  number     = {2},
  pages      = {1090--1096},
  year       = {2021},
  url        = {https://doi.org/10.1109/LRA.2021.3056373},
  doi        = {10.1109/LRA.2021.3056373},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ral/LiuXS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ral/XiaoLWS21,
  author     = {Xuesu Xiao and Bo Liu and Garrett Warnell and Peter Stone},
  title      = {Toward Agile Maneuvers in Highly Constrained Spaces: Learning From Hallucination},
  journal    = {{IEEE} Robotics Autom. Lett.},
  volume     = {6},
  number     = {2},
  pages      = {1503--1510},
  year       = {2021},
  url        = {https://doi.org/10.1109/LRA.2021.3058927},
  doi        = {10.1109/LRA.2021.3058927},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ral/XiaoLWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ral/XiaoBS21,
  author     = {Xuesu Xiao and Joydeep Biswas and Peter Stone},
  title      = {Learning Inverse Kinodynamics for Accurate High-Speed Off-Road Navigation on Unstructured Terrain},
  journal    = {{IEEE} Robotics Autom. Lett.},
  volume     = {6},
  number     = {3},
  pages      = {6054--6060},
  year       = {2021},
  url        = {https://doi.org/10.1109/LRA.2021.3090023},
  doi        = {10.1109/LRA.2021.3090023},
  timestamp  = {Tue, 13 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ral/XiaoBS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ral/WangXWS21,
  author     = {Zizhao Wang and Xuesu Xiao and Garrett Warnell and Peter Stone},
  title      = {{APPLE:} Adaptive Planner Parameter Learning From Evaluative Feedback},
  journal    = {{IEEE} Robotics Autom. Lett.},
  volume     = {6},
  number     = {4},
  pages      = {7744--7749},
  year       = {2021},
  url        = {https://doi.org/10.1109/lra.2021.3100940},
  doi        = {10.1109/LRA.2021.3100940},
  timestamp  = {Thu, 13 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ral/WangXWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% IEEE Robotics and Automation Magazine competition report. The name
% "RoboCup" is braced so that styles applying sentence case keep its inner capital.
@article{DBLP:journals/ram/StoneITZ21,
  author     = {Peter Stone and Luca Iocchi and Flavio Tonidandel and Changjiu Zhou},
  title      = {{RoboCup} 2021 Worldwide: {A} Successful Robotics Competition During a Pandemic [Competitions]},
  journal    = {{IEEE} Robotics Autom. Mag.},
  volume     = {28},
  number     = {4},
  pages      = {114--119},
  year       = {2021},
  url        = {https://doi.org/10.1109/MRA.2021.3117413},
  doi        = {10.1109/MRA.2021.3117413},
  timestamp  = {Wed, 15 Dec 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ram/StoneITZ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% IEEE TAC article. The acronym "MDPs" is braced so that styles applying
% sentence case do not lowercase it.
@article{DBLP:journals/tac/KoppelWSSR21,
  author     = {Alec Koppel and Garrett Warnell and Ethan Stump and Peter Stone and Alejandro Ribeiro},
  title      = {Policy Evaluation in Continuous {MDPs} With Efficient Kernelized Gradient Temporal Difference},
  journal    = {{IEEE} Trans. Autom. Control.},
  volume     = {66},
  number     = {4},
  pages      = {1856--1863},
  year       = {2021},
  url        = {https://doi.org/10.1109/TAC.2020.3029315},
  doi        = {10.1109/TAC.2020.3029315},
  timestamp  = {Wed, 07 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tac/KoppelWSSR21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/JiangWS21,
  author     = {Yu{-}Sian Jiang and Garrett Warnell and Peter Stone},
  title      = {Goal Blending for Responsive Shared Autonomy in a Navigating Vehicle},
  booktitle  = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9, 2021},
  pages      = {5939--5947},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://doi.org/10.1609/aaai.v35i7.16742},
  doi        = {10.1609/AAAI.V35I7.16742},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/JiangWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/JiangB0STS21,
  author     = {Yuqian Jiang and Suda Bharadwaj and Bo Wu and Rishi Shah and Ufuk Topcu and Peter Stone},
  title      = {Temporal-Logic-Based Reward Shaping for Continuing Reinforcement Learning Tasks},
  booktitle  = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9, 2021},
  pages      = {7995--8003},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://doi.org/10.1609/aaai.v35i9.16975},
  doi        = {10.1609/AAAI.V35I9.16975},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/JiangB0STS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/MackeMS21,
  author     = {William Macke and Reuth Mirsky and Peter Stone},
  title      = {Expected Value of Communication for Planning in Ad Hoc Teamwork},
  booktitle  = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9, 2021},
  pages      = {11290--11298},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://doi.org/10.1609/aaai.v35i13.17346},
  doi        = {10.1609/AAAI.V35I13.17346},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/MackeMS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/CuiZJASNK21,
  author     = {Yuchen Cui and Qiping Zhang and Sahil Jain and Alessandro Allievi and Peter Stone and Scott Niekum and W. Bradley Knox},
  title      = {Demonstration of the {EMPATHIC} Framework for Task Learning from Implicit Human Feedback},
  booktitle  = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9, 2021},
  pages      = {16017--16019},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://doi.org/10.1609/aaai.v35i18.17998},
  doi        = {10.1609/AAAI.V35I18.17998},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/CuiZJASNK21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/MirskyS21,
  author     = {Reuth Mirsky and Peter Stone},
  editor     = {Frank Dignum and Alessio Lomuscio and Ulle Endriss and Ann Now{\'{e}}},
  title      = {The Seeing-Eye Robot Grand Challenge: Rethinking Automated Care},
  booktitle  = {{AAMAS} '21: 20th International Conference on Autonomous Agents and Multiagent Systems, Virtual Event, United Kingdom, May 3-7, 2021},
  pages      = {28--33},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://www.ifaamas.org/Proceedings/aamas2021/pdfs/p28.pdf},
  doi        = {10.5555/3463952.3463959},
  timestamp  = {Wed, 20 Jul 2022 17:03:47 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/MirskyS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/CuiMYGUS21,
  author     = {Jiaxun Cui and William Macke and Harel Yedidsion and Aastha Goyal and Daniel Urieli and Peter Stone},
  editor     = {Frank Dignum and Alessio Lomuscio and Ulle Endriss and Ann Now{\'{e}}},
  title      = {Scalable Multiagent Driving Policies for Reducing Traffic Congestion},
  booktitle  = {{AAMAS} '21: 20th International Conference on Autonomous Agents and Multiagent Systems, Virtual Event, United Kingdom, May 3-7, 2021},
  pages      = {386--394},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://www.ifaamas.org/Proceedings/aamas2021/pdfs/p386.pdf},
  doi        = {10.5555/3463952.3464002},
  timestamp  = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/CuiMYGUS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/SharonASKC21,
  author     = {Guni Sharon and James Ault and Peter Stone and Varun Kompella and Roberto Capobianco},
  editor     = {Frank Dignum and Alessio Lomuscio and Ulle Endriss and Ann Now{\'{e}}},
  title      = {Multiagent Epidemiologic Inference through Realtime Contact Tracing},
  booktitle  = {{AAMAS} '21: 20th International Conference on Autonomous Agents and Multiagent Systems, Virtual Event, United Kingdom, May 3-7, 2021},
  pages      = {1182--1190},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://www.ifaamas.org/Proceedings/aamas2021/pdfs/p1182.pdf},
  doi        = {10.5555/3463952.3464089},
  timestamp  = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/SharonASKC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icarsc/Stone21,
  author     = {Peter Stone},
  editor     = {V{\'{\i}}tor Santos and Nuno Lau and Pedro Neto and Ana Cristina Lopes},
  title      = {Efficient Robot Skill Learning: Grounded Simulation Learning and Imitation Learning from Observation},
  booktitle  = {{IEEE} International Conference on Autonomous Robot Systems and Competitions, {ICARSC} 2021, Santa Maria da Feira, Portugal, April 28-29, 2021},
  pages      = {3},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICARSC52212.2021.9429812},
  doi        = {10.1109/ICARSC52212.2021.9429812},
  timestamp  = {Thu, 20 May 2021 15:25:12 +0200},
  biburl     = {https://dblp.org/rec/conf/icarsc/Stone21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/LiuLSGZA21,
  author     = {Bo Liu and Qiang Liu and Peter Stone and Animesh Garg and Yuke Zhu and Anima Anandkumar},
  editor     = {Marina Meila and Tong Zhang},
  title      = {Coach-Player Multi-agent Reinforcement Learning for Dynamic Team Composition},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {6860--6870},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/liu21m.html},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/LiuLSGZA21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/HolmanASTHS21,
  author     = {Blake Holman and Abrar Anwar and Akash Singh and Mauricio Tec and Justin W. Hart and Peter Stone},
  title      = {Watch Where You're Going! Gaze and Head Orientation as Predictors for Social Robot Navigation},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2021, Xi'an, China, May 30 - June 5, 2021},
  pages      = {3553--3559},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICRA48506.2021.9561286},
  doi        = {10.1109/ICRA48506.2021.9561286},
  timestamp  = {Fri, 22 Oct 2021 19:54:31 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/HolmanASTHS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/WangXLWS21,
  author     = {Zizhao Wang and Xuesu Xiao and Bo Liu and Garrett Warnell and Peter Stone},
  title      = {{APPLI:} Adaptive Planner Parameter Learning From Interventions},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2021, Xi'an, China, May 30 - June 5, 2021},
  pages      = {6079--6085},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICRA48506.2021.9561311},
  doi        = {10.1109/ICRA48506.2021.9561311},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icra/WangXLWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/XuDNXWLWS21,
  author     = {Zifan Xu and Gauraang Dhamankar and Anirudh Nair and Xuesu Xiao and Garrett Warnell and Bo Liu and Zizhao Wang and Peter Stone},
  title      = {{APPLR:} Adaptive Planner Parameter Learning from Reinforcement},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2021, Xi'an, China, May 30 - June 5, 2021},
  pages      = {6086--6092},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICRA48506.2021.9561647},
  doi        = {10.1109/ICRA48506.2021.9561647},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icra/XuDNXWLWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/XiaoLS21,
  author     = {Xuesu Xiao and Bo Liu and Peter Stone},
  title      = {Agile Robot Navigation through Hallucinated Learning and Sober Deployment},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2021, Xi'an, China, May 30 - June 5, 2021},
  pages      = {7316--7322},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICRA48506.2021.9562117},
  doi        = {10.1109/ICRA48506.2021.9562117},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icra/XiaoLS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2021 version; DBLP:journals/corr/abs-2103-05225 has the same title and
% author list as an arXiv record.
@inproceedings{DBLP:conf/icra/YedidsionSXDS21,
  author     = {Harel Yedidsion and Jennifer Suriadinata and Zifan Xu and Stefan Debruyn and Peter Stone},
  title      = {A Scavenger Hunt for Service Robots},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2021, Xi'an, China, May 30 - June 5, 2021},
  pages      = {7774--7780},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICRA48506.2021.9561722},
  doi        = {10.1109/ICRA48506.2021.9561722},
  timestamp  = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/YedidsionSXDS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/LoFST21,
  author     = {Shih{-}Yun Lo and Benito Fernandez and Peter Stone and Andrea Lockerd Thomaz},
  title      = {Towards Safe Motion Planning in Human Workspaces: {A} Robust Multi-agent Approach},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2021, Xi'an, China, May 30 - June 5, 2021},
  pages      = {7929--7935},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICRA48506.2021.9561622},
  doi        = {10.1109/ICRA48506.2021.9561622},
  timestamp  = {Fri, 01 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/LoFST21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/KhandelwalMWS21,
  author     = {Piyush Khandelwal and James MacGlashan and Peter R. Wurman and Peter Stone},
  title      = {Efficient Real-Time Inference in Temporal Convolution Networks},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2021, Xi'an, China, May 30 - June 5, 2021},
  pages      = {13489--13495},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICRA48506.2021.9560784},
  doi        = {10.1109/ICRA48506.2021.9560784},
  timestamp  = {Mon, 25 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/KhandelwalMWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2021 version; DBLP:journals/corr/abs-2108-09793 has the same title and
% author list as an arXiv record.
@inproceedings{DBLP:conf/iros/WangXNUSBTS21,
  author     = {Zizhao Wang and Xuesu Xiao and Alexander J. Nettekoven and Kadhiravan Umasankar and Anika Singh and Sriram Bommakanti and Ufuk Topcu and Peter Stone},
  title      = {From Agile Ground to Aerial Navigation: Learning from Learned Hallucination},
  booktitle  = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2021, Prague, Czech Republic, September 27 - Oct. 1, 2021},
  pages      = {148--153},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/IROS51168.2021.9636402},
  doi        = {10.1109/IROS51168.2021.9636402},
  timestamp  = {Wed, 22 Dec 2021 12:36:19 +0100},
  biburl     = {https://dblp.org/rec/conf/iros/WangXNUSBTS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/GhonasgiMNMHSD21,
  author     = {Keya Ghonasgi and Reuth Mirsky and Sanmit Narvekar and Bharath Masetty and Adrian M. Haith and Peter Stone and Ashish D. Deshpande},
  title      = {Capturing Skill State in Curriculum Learning for Human Skill Acquisition},
  booktitle  = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2021, Prague, Czech Republic, September 27 - Oct. 1, 2021},
  pages      = {771--776},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/IROS51168.2021.9636850},
  doi        = {10.1109/IROS51168.2021.9636850},
  timestamp  = {Wed, 22 Dec 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iros/GhonasgiMNMHSD21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2021 version; DBLP:journals/corr/abs-2104-00163 has the same title and
% author list as an arXiv record.
@inproceedings{DBLP:conf/iros/TorabiWS21,
  author     = {Faraz Torabi and Garrett Warnell and Peter Stone},
  title      = {{DEALIO:} Data-Efficient Adversarial Learning for Imitation from Observation},
  booktitle  = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2021, Prague, Czech Republic, September 27 - Oct. 1, 2021},
  pages      = {2391--2397},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/IROS51168.2021.9636169},
  doi        = {10.1109/IROS51168.2021.9636169},
  timestamp  = {Wed, 22 Dec 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iros/TorabiWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2021 version; DBLP:journals/corr/abs-2105-03721 has the same title and
% author list as an arXiv record.
@inproceedings{DBLP:conf/iros/LiuXS21,
  author     = {Bo Liu and Xuesu Xiao and Peter Stone},
  title      = {Team Orienteering Coverage Planning with Uncertain Reward},
  booktitle  = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2021, Prague, Czech Republic, September 27 - Oct. 1, 2021},
  pages      = {9728--9733},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/IROS51168.2021.9636288},
  doi        = {10.1109/IROS51168.2021.9636288},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iros/LiuXS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 version; DBLP:journals/corr/abs-2105-13345 has the same title and
% author list as an arXiv record.
@inproceedings{DBLP:conf/nips/DurugkarTNS21,
  author     = {Ishan Durugkar and Mauricio Tec and Scott Niekum and Peter Stone},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Adversarial Intrinsic Motivation for Reinforcement Learning},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {8622--8636},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/486c0401c56bf7ec2daa9eba58907da9-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/DurugkarTNS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 version. The title's last word is capitalised ("Learning") so the
% title is consistently Title Case and matches the arXiv record
% DBLP:journals/corr/abs-2110-14048, which has the same author list.
@inproceedings{DBLP:conf/nips/LiuLJSL21,
  author     = {Bo Liu and Xingchao Liu and Xiaojie Jin and Peter Stone and Qiang Liu},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Conflict-Averse Gradient Descent for Multi-task Learning},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {18878--18890},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/9d27fdf2477ffbff837d73ef7ae23db9-Abstract.html},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LiuLJSL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GuoZLZBHS21,
  author     = {Sihang Guo and Ruohan Zhang and Bo Liu and Yifeng Zhu and Dana H. Ballard and Mary M. Hayhoe and Peter Stone},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Machine versus Human Attention in Deep Reinforcement Learning Tasks},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {25370--25385},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/d58e2f077670f4de9cd7963c857f2534-Abstract.html},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/GuoZLZBHS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The proper nouns and the "3D" abbreviation in the title are brace-protected so
% that styles which sentence-case titles do not render them as "austin villa",
% "Robocup" or "3d". All other field values are unchanged.
@inproceedings{DBLP:conf/robocup/MacAlpineLMWS21,
  author     = {Patrick MacAlpine and Bo Liu and William Macke and Caroline Wang and Peter Stone},
  editor     = {Rachid Alami and Joydeep Biswas and Maya Cakmak and Oliver Obst},
  title      = {{UT} {Austin} {Villa}: {RoboCup} 2021 {3D} Simulation League Competition Champions},
  booktitle  = {RoboCup 2021: Robot World Cup {XXIV}},
  series     = {Lecture Notes in Computer Science},
  volume     = {13132},
  pages      = {314--326},
  publisher  = {Springer},
  year       = {2021},
  url        = {https://doi.org/10.1007/978-3-030-98682-7\_26},
  doi        = {10.1007/978-3-030-98682-7\_26},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/robocup/MacAlpineLMWS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssrr/XuXWNS21,
  author     = {Zifan Xu and Xuesu Xiao and Garrett Warnell and Anirudh Nair and Peter Stone},
  title      = {Machine Learning Methods for Local Motion Planning: {A} Study of End-to-End vs. Parameter Learning},
  booktitle  = {{IEEE} International Symposium on Safety, Security, and Rescue Robotics, {SSRR} 2021, New York City, NY, USA, October 25-27, 2021},
  pages      = {217--222},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/SSRR53300.2021.9597689},
  doi        = {10.1109/SSRR53300.2021.9597689},
  timestamp  = {Tue, 23 Nov 2021 16:16:49 +0100},
  biburl     = {https://dblp.org/rec/conf/ssrr/XuXWNS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-08574,
  author     = {Lemeng Wu and Bo Liu and Peter Stone and Qiang Liu},
  title      = {Firefly Neural Architecture Descent: a General Approach for Growing Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2102.08574},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.08574},
  eprinttype = {arXiv},
  eprint     = {2102.08574},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-08574.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-12667,
  author     = {Xuesu Xiao and Joydeep Biswas and Peter Stone},
  title      = {Learning Inverse Kinodynamics for Accurate High-Speed Off-Road Navigation on Unstructured Terrain},
  journal    = {CoRR},
  volume     = {abs/2102.12667},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.12667},
  eprinttype = {arXiv},
  eprint     = {2102.12667},
  timestamp  = {Tue, 02 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-12667.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2103-00058,
  author     = {Jiaxun Cui and William Macke and Harel Yedidsion and Aastha Goyal and Daniel Urieli and Peter Stone},
  title      = {Scalable Multiagent Driving Policies For Reducing Traffic Congestion},
  journal    = {CoRR},
  volume     = {abs/2103.00058},
  year       = {2021},
  url        = {https://arxiv.org/abs/2103.00058},
  eprinttype = {arXiv},
  eprint     = {2103.00058},
  timestamp  = {Thu, 04 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-00058.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2103-01171,
  author     = {William Macke and Reuth Mirsky and Peter Stone},
  title      = {Expected Value of Communication for Planning in Ad Hoc Teamwork},
  journal    = {CoRR},
  volume     = {abs/2103.01171},
  year       = {2021},
  url        = {https://arxiv.org/abs/2103.01171},
  eprinttype = {arXiv},
  eprint     = {2103.01171},
  timestamp  = {Thu, 04 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-01171.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; DBLP:conf/icra/YedidsionSXDS21 has the same title and author
% list as an ICRA 2021 paper.
@article{DBLP:journals/corr/abs-2103-05225,
  author     = {Harel Yedidsion and Jennifer Suriadinata and Zifan Xu and Stefan Debruyn and Peter Stone},
  title      = {A Scavenger Hunt for Service Robots},
  journal    = {CoRR},
  volume     = {abs/2103.05225},
  year       = {2021},
  url        = {https://arxiv.org/abs/2103.05225},
  eprinttype = {arXiv},
  eprint     = {2103.05225},
  timestamp  = {Mon, 15 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-05225.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; DBLP:conf/iros/TorabiWS21 has the same title and author list
% as an IROS 2021 paper.
@article{DBLP:journals/corr/abs-2104-00163,
  author     = {Faraz Torabi and Garrett Warnell and Peter Stone},
  title      = {{DEALIO:} Data-Efficient Adversarial Learning for Imitation from Observation},
  journal    = {CoRR},
  volume     = {abs/2104.00163},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.00163},
  eprinttype = {arXiv},
  eprint     = {2104.00163},
  timestamp  = {Mon, 12 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-00163.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-04159,
  author     = {Harel Yedidsion and Shani Alkoby and Peter Stone},
  title      = {Sequential Online Chore Division for Autonomous Vehicle Convoy Formation},
  journal    = {CoRR},
  volume     = {abs/2104.04159},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.04159},
  eprinttype = {arXiv},
  eprint     = {2104.04159},
  timestamp  = {Tue, 13 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-04159.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-07810,
  author     = {Eddy Hudson and Garrett Warnell and Faraz Torabi and Peter Stone},
  title      = {Skeletal Feature Compensation for Imitation Learning with Embodiment Mismatch},
  journal    = {CoRR},
  volume     = {abs/2104.07810},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.07810},
  eprinttype = {arXiv},
  eprint     = {2104.07810},
  timestamp  = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-07810.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-13906,
  author     = {W. Bradley Knox and Alessandro Allievi and Holger Banzhaf and Felix Schmitt and Peter Stone},
  title      = {Reward (Mis)design for Autonomous Driving},
  journal    = {CoRR},
  volume     = {abs/2104.13906},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.13906},
  eprinttype = {arXiv},
  eprint     = {2104.13906},
  timestamp  = {Tue, 04 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-13906.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; DBLP:conf/iros/LiuXS21 has the same title and author list as
% an IROS 2021 paper.
@article{DBLP:journals/corr/abs-2105-03721,
  author     = {Bo Liu and Xuesu Xiao and Peter Stone},
  title      = {Team Orienteering Coverage Planning with Uncertain Reward},
  journal    = {CoRR},
  volume     = {abs/2105.03721},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.03721},
  eprinttype = {arXiv},
  eprint     = {2105.03721},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-03721.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-03756,
  author     = {Eddy Hudson and Garrett Warnell and Peter Stone},
  title      = {{RAIL:} {A} modular framework for Reinforcement-learning-based Adversarial Imitation Learning},
  journal    = {CoRR},
  volume     = {abs/2105.03756},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.03756},
  eprinttype = {arXiv},
  eprint     = {2105.03756},
  timestamp  = {Fri, 14 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-03756.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-07620,
  author     = {Xuesu Xiao and Zizhao Wang and Zifan Xu and Bo Liu and Garrett Warnell and Gauraang Dhamankar and Anirudh Nair and Peter Stone},
  title      = {{APPL:} Adaptive Planner Parameter Learning},
  journal    = {CoRR},
  volume     = {abs/2105.07620},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.07620},
  eprinttype = {arXiv},
  eprint     = {2105.07620},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-07620.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; DBLP:conf/icml/LiuLSGZA21 appears to be the ICML 2021 version
% (title differs only in capitalisation; the last author is listed there as
% Anima Anandkumar).
@article{DBLP:journals/corr/abs-2105-08692,
  author     = {Bo Liu and Qiang Liu and Peter Stone and Animesh Garg and Yuke Zhu and Animashree Anandkumar},
  title      = {Coach-Player Multi-Agent Reinforcement Learning for Dynamic Team Composition},
  journal    = {CoRR},
  volume     = {abs/2105.08692},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.08692},
  eprinttype = {arXiv},
  eprint     = {2105.08692},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-08692.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-09371,
  author     = {Haresh Karnan and Garrett Warnell and Xuesu Xiao and Peter Stone},
  title      = {{VOILA:} Visual-Observation-Only Imitation Learning for Autonomous Navigation},
  journal    = {CoRR},
  volume     = {abs/2105.09371},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.09371},
  eprinttype = {arXiv},
  eprint     = {2105.09371},
  timestamp  = {Mon, 31 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-09371.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; DBLP:conf/nips/DurugkarTNS21 has the same title and author list
% as a NeurIPS 2021 paper.
@article{DBLP:journals/corr/abs-2105-13345,
  author     = {Ishan Durugkar and Mauricio Tec and Scott Niekum and Peter Stone},
  title      = {Adversarial Intrinsic Motivation for Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2105.13345},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.13345},
  eprinttype = {arXiv},
  eprint     = {2105.13345},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-13345.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-04217,
  author     = {Ghada Sokar and Elena Mocanu and Decebal Constantin Mocanu and Mykola Pechenizkiy and Peter Stone},
  title      = {Dynamic Sparse Training for Deep Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2106.04217},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.04217},
  eprinttype = {arXiv},
  eprint     = {2106.04217},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-04217.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-12113,
  author     = {Reuth Mirsky and Xuesu Xiao and Justin W. Hart and Peter Stone},
  title      = {Prevention and Resolution of Conflicts in Social Navigation - a Survey},
  journal    = {CoRR},
  volume     = {abs/2106.12113},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.12113},
  eprinttype = {arXiv},
  eprint     = {2106.12113},
  timestamp  = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-12113.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2107-04001,
  author     = {Justin W. Hart and Reuth Mirsky and Xuesu Xiao and Peter Stone},
  title      = {Incorporating Gaze into Social Navigation},
  journal    = {CoRR},
  volume     = {abs/2107.04001},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.04001},
  eprinttype = {arXiv},
  eprint     = {2107.04001},
  timestamp  = {Tue, 20 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-04001.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2107-05825,
  author     = {Ruohan Zhang and Faraz Torabi and Garrett Warnell and Peter Stone},
  title      = {Recent Advances in Leveraging Human Guidance for Sequential Decision-Making Tasks},
  journal    = {CoRR},
  volume     = {abs/2107.05825},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.05825},
  eprinttype = {arXiv},
  eprint     = {2107.05825},
  timestamp  = {Wed, 21 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-05825.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; DBLP:conf/iros/WangXNUSBTS21 has the same title and author list
% as an IROS 2021 paper.
@article{DBLP:journals/corr/abs-2108-09793,
  author     = {Zizhao Wang and Xuesu Xiao and Alexander J. Nettekoven and Kadhiravan Umasankar and Anika Singh and Sriram Bommakanti and Ufuk Topcu and Peter Stone},
  title      = {From Agile Ground to Aerial Navigation: Learning from Learned Hallucination},
  journal    = {CoRR},
  volume     = {abs/2108.09793},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.09793},
  eprinttype = {arXiv},
  eprint     = {2108.09793},
  timestamp  = {Fri, 27 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-09793.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2108-09801,
  author     = {Zizhao Wang and Xuesu Xiao and Garrett Warnell and Peter Stone},
  title      = {{APPLE:} Adaptive Planner Parameter Learning from Evaluative Feedback},
  journal    = {CoRR},
  volume     = {abs/2108.09801},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.09801},
  eprinttype = {arXiv},
  eprint     = {2108.09801},
  timestamp  = {Fri, 27 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-09801.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-13841,
  author     = {Yifeng Zhu and Peter Stone and Yuke Zhu},
  title      = {Bottom-Up Skill Discovery from Unsegmented Demonstrations for Long-Horizon Robot Manipulation},
  journal    = {CoRR},
  volume     = {abs/2109.13841},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.13841},
  eprinttype = {arXiv},
  eprint     = {2109.13841},
  timestamp  = {Mon, 04 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-13841.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; DBLP:conf/nips/LiuLJSL21 has the same author list and, up to
% capitalisation, the same title as a NeurIPS 2021 paper.
@article{DBLP:journals/corr/abs-2110-14048,
  author     = {Bo Liu and Xingchao Liu and Xiaojie Jin and Peter Stone and Qiang Liu},
  title      = {Conflict-Averse Gradient Descent for Multi-task Learning},
  journal    = {CoRR},
  volume     = {abs/2110.14048},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.14048},
  eprinttype = {arXiv},
  eprint     = {2110.14048},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-14048.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-03759,
  author     = {Yulin Zhang and William Macke and Jiaxun Cui and Daniel Urieli and Peter Stone},
  title      = {Learning a Robust Multiagent Driving Policy for Traffic Congestion Reduction},
  journal    = {CoRR},
  volume     = {abs/2112.03759},
  year       = {2021},
  url        = {https://arxiv.org/abs/2112.03759},
  eprinttype = {arXiv},
  eprint     = {2112.03759},
  timestamp  = {Mon, 13 Dec 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2112-03759.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article; DBLP:conf/atal/SilvaWCS20 (AAMAS '20, pp. 2165--2167) has the
% same author list and, up to capitalisation, the same title.
@article{DBLP:journals/aamas/SilvaWCS20,
  author     = {Felipe Leno da Silva and Garrett Warnell and Anna Helena Reali Costa and Peter Stone},
  title      = {Agents teaching agents: a survey on inter-agent transfer learning},
  journal    = {Auton. Agents Multi Agent Syst.},
  volume     = {34},
  number     = {1},
  pages      = {9},
  year       = {2020},
  url        = {https://doi.org/10.1007/s10458-019-09430-0},
  doi        = {10.1007/S10458-019-09430-0},
  timestamp  = {Mon, 15 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/aamas/SilvaWCS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/AlbrechtSW20,
  author     = {Stefano V. Albrecht and Peter Stone and Michael P. Wellman},
  title      = {Special issue on autonomous agents modelling other agents: Guest editorial},
  journal    = {Artif. Intell.},
  volume     = {285},
  pages      = {103292},
  year       = {2020},
  url        = {https://doi.org/10.1016/j.artint.2020.103292},
  doi        = {10.1016/J.ARTINT.2020.103292},
  timestamp  = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ai/AlbrechtSW20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The quoted issue title now uses TeX opening/closing quotes (`` and '') instead
% of straight double quotes, which LaTeX typesets as two closing quotes. The
% quoted title is also brace-protected so sentence-casing styles keep its
% capitalisation. All other field values are unchanged.
@article{DBLP:journals/jagi/MonettLTBBGBCCS20,
  author     = {Dagmar Monett and Colin W. P. Lewis and Kristinn R. Th{\'{o}}risson and Joscha Bach and Gianluca Baldassarre and Giovanni Granato and Istvan S. N. Berkeley and Fran{\c{c}}ois Chollet and Matthew Crosby and Henry Shevlin and John F. Sowa and John E. Laird and Shane Legg and Peter Lindes and Tom{\'{a}}s Mikolov and William J. Rapaport and Ra{\'{u}}l Rojas and Marek Rosa and Peter Stone and Richard S. Sutton and Roman V. Yampolskiy and Pei Wang and Roger C. Schank and Aaron Sloman and Alan F. T. Winfield},
  title      = {Special Issue {``On Defining Artificial Intelligence''} - Commentaries and Author's Response},
  journal    = {J. Artif. Gen. Intell.},
  volume     = {11},
  number     = {2},
  pages      = {1--100},
  year       = {2020},
  url        = {https://doi.org/10.2478/jagi-2020-0003},
  doi        = {10.2478/JAGI-2020-0003},
  timestamp  = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jagi/MonettLTBBGBCCS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/ThomasonPSWJYHS20,
  author     = {Jesse Thomason and Aishwarya Padmakumar and Jivko Sinapov and Nick Walker and Yuqian Jiang and Harel Yedidsion and Justin W. Hart and Peter Stone and Raymond J. Mooney},
  title      = {Jointly Improving Parsing and Perception for Natural Language Commands through Human-Robot Dialog},
  journal    = {J. Artif. Intell. Res.},
  volume     = {67},
  pages      = {327--374},
  year       = {2020},
  url        = {https://doi.org/10.1613/jair.1.11485},
  doi        = {10.1613/JAIR.1.11485},
  timestamp  = {Sun, 08 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jair/ThomasonPSWJYHS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/LoZS20,
  author     = {Shih{-}Yun Lo and Shiqi Zhang and Peter Stone},
  title      = {The {PETLON} Algorithm to Plan Efficiently for Task-Level-Optimal Navigation},
  journal    = {J. Artif. Intell. Res.},
  volume     = {69},
  pages      = {471--500},
  year       = {2020},
  url        = {https://doi.org/10.1613/jair.1.12181},
  doi        = {10.1613/JAIR.1.12181},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jair/LoZS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% JMLR article without a DOI, so the url is the only locator; it now uses https
% instead of plain http. All other field values are unchanged.
@article{DBLP:journals/jmlr/NarvekarPLSTS20,
  author     = {Sanmit Narvekar and Bei Peng and Matteo Leonetti and Jivko Sinapov and Matthew E. Taylor and Peter Stone},
  title      = {Curriculum Learning for Reinforcement Learning Domains: {A} Framework and Survey},
  journal    = {J. Mach. Learn. Res.},
  volume     = {21},
  pages      = {181:1--181:50},
  year       = {2020},
  url        = {https://jmlr.org/papers/v21/20-212.html},
  timestamp  = {Sun, 18 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jmlr/NarvekarPLSTS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ral/XiaoLWFS20,
  author     = {Xuesu Xiao and Bo Liu and Garrett Warnell and Jonathan Fink and Peter Stone},
  title      = {{APPLD:} Adaptive Planner Parameter Learning From Demonstration},
  journal    = {{IEEE} Robotics Autom. Lett.},
  volume     = {5},
  number     = {3},
  pages      = {4541--4547},
  year       = {2020},
  url        = {https://doi.org/10.1109/LRA.2020.3002217},
  doi        = {10.1109/LRA.2020.3002217},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ral/XiaoLWFS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ral/PavseTHWS20,
  author     = {Brahma S. Pavse and Faraz Torabi and Josiah Hanna and Garrett Warnell and Peter Stone},
  title      = {{RIDM:} Reinforced Inverse Dynamics Modeling for Learning from a Single Observed Demonstration},
  journal    = {{IEEE} Robotics Autom. Lett.},
  volume     = {5},
  number     = {4},
  pages      = {6262--6269},
  year       = {2020},
  url        = {https://doi.org/10.1109/LRA.2020.3010750},
  doi        = {10.1109/LRA.2020.3010750},
  timestamp  = {Sat, 14 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ral/PavseTHWS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/YedidsionAS20,
  author     = {Harel Yedidsion and Shani Alkoby and Peter Stone},
  editor     = {Amal El Fallah Seghrouchni and Gita Sukthankar and Bo An and Neil Yorke{-}Smith},
  title      = {The Sequential Online Chore Division Problem - Definition and Application},
  booktitle  = {Proceedings of the 19th International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} '20, Auckland, New Zealand, May 9-13, 2020},
  pages      = {2059--2061},
  publisher  = {International Foundation for Autonomous Agents and Multiagent Systems},
  year       = {2020},
  url        = {https://dl.acm.org/doi/10.5555/3398761.3399074},
  doi        = {10.5555/3398761.3399074},
  timestamp  = {Tue, 26 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/YedidsionAS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAMAS '20 proceedings entry (pp. 2165--2167); DBLP:journals/aamas/SilvaWCS20 is
% a journal article with the same author list and, up to capitalisation, the
% same title.
@inproceedings{DBLP:conf/atal/SilvaWCS20,
  author     = {Felipe Leno da Silva and Garrett Warnell and Anna Helena Reali Costa and Peter Stone},
  editor     = {Amal El Fallah Seghrouchni and Gita Sukthankar and Bo An and Neil Yorke{-}Smith},
  title      = {Agents Teaching Agents: {A} Survey on Inter-agent Transfer Learning},
  booktitle  = {Proceedings of the 19th International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} '20, Auckland, New Zealand, May 9-13, 2020},
  pages      = {2165--2167},
  publisher  = {International Foundation for Autonomous Agents and Multiagent Systems},
  year       = {2020},
  url        = {https://dl.acm.org/doi/10.5555/3398761.3399111},
  doi        = {10.5555/3398761.3399111},
  timestamp  = {Tue, 26 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/SilvaWCS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/CuiZKASN20,
  author     = {Yuchen Cui and Qiping Zhang and W. Bradley Knox and Alessandro Allievi and Peter Stone and Scott Niekum},
  editor     = {Jens Kober and Fabio Ramos and Claire J. Tomlin},
  title      = {The {EMPATHIC} Framework for Task Learning from Implicit Human Feedback},
  booktitle  = {4th Conference on Robot Learning, CoRL 2020, 16-18 November 2020, Virtual Event / Cambridge, MA, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {155},
  pages      = {604--626},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v155/cui21a.html},
  timestamp  = {Tue, 18 Oct 2022 08:35:37 +0200},
  biburl     = {https://dblp.org/rec/conf/corl/CuiZKASN20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/ParkTYWKS20,
  author     = {Jin Soo Park and Brian Tsang and Harel Yedidsion and Garrett Warnell and Daehyun Kyoung and Peter Stone},
  editor     = {Jens Kober and Fabio Ramos and Claire J. Tomlin},
  title      = {Learning to Improve Multi-Robot Hallway Navigation},
  booktitle  = {4th Conference on Robot Learning, CoRL 2020, 16-18 November 2020, Virtual Event / Cambridge, MA, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {155},
  pages      = {1883--1895},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v155/park21a.html},
  timestamp  = {Mon, 25 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/corl/ParkTYWKS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper without a DOI, so the url is the only locator; it now uses
% https, matching the other proceedings.mlr.press links in this file. All other
% field values are unchanged.
@inproceedings{DBLP:conf/icml/PavseDHS20,
  author     = {Brahma S. Pavse and Ishan Durugkar and Josiah Hanna and Peter Stone},
  title      = {Reducing Sampling Error in Batch Temporal Difference Learning},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {7543--7552},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v119/pavse20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/PavseDHS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2020 paper.
@inproceedings{DBLP:conf/ijcai/MirskyMWYS20,
  author    = {Reuth Mirsky and William Macke and Andy Wang and Harel Yedidsion and Peter Stone},
  editor    = {Christian Bessiere},
  title     = {A Penny for Your Thoughts: The Value of Communication in Ad Hoc Teamwork},
  booktitle = {Proceedings of the Twenty-Ninth International Joint Conference on Artificial Intelligence, {IJCAI} 2020},
  pages     = {254--260},
  publisher = {ijcai.org},
  year      = {2020},
  url       = {https://doi.org/10.24963/ijcai.2020/36},
  doi       = {10.24963/IJCAI.2020/36},
  timestamp = {Mon, 20 Jul 2020 12:38:52 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/MirskyMWYS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2020 paper.
@inproceedings{DBLP:conf/ijcai/DurugkarLS20,
  author    = {Ishan Durugkar and Elad Liebman and Peter Stone},
  editor    = {Christian Bessiere},
  title     = {Balancing Individual Preferences and Shared Objectives in Multiagent Reinforcement Learning},
  booktitle = {Proceedings of the Twenty-Ninth International Joint Conference on Artificial Intelligence, {IJCAI} 2020},
  pages     = {2505--2511},
  publisher = {ijcai.org},
  year      = {2020},
  url       = {https://doi.org/10.24963/ijcai.2020/347},
  doi       = {10.24963/IJCAI.2020/347},
  timestamp = {Mon, 13 Jul 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/DurugkarLS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2020 paper; an arXiv record with the same title is DBLP:journals/corr/abs-2008-01279.
@inproceedings{DBLP:conf/iros/KarnanDHWS20,
  author    = {Haresh Karnan and Siddharth Desai and Josiah P. Hanna and Garrett Warnell and Peter Stone},
  title     = {Reinforced Grounded Action Transformation for Sim-to-Real Transfer},
  booktitle = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2020, Las Vegas, NV, USA, October 24, 2020 - January 24, 2021},
  pages     = {4397--4402},
  publisher = {{IEEE}},
  year      = {2020},
  url       = {https://doi.org/10.1109/IROS45743.2020.9341149},
  doi       = {10.1109/IROS45743.2020.9341149},
  timestamp = {Tue, 16 Feb 2021 19:07:08 +0100},
  biburl    = {https://dblp.org/rec/conf/iros/KarnanDHWS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2020 paper; an arXiv record with the same title is DBLP:journals/corr/abs-2006-00589.
% The "R" of "R-Learning" is brace-protected so sentence-casing styles keep it capitalised.
@inproceedings{DBLP:conf/iros/ShahJHS20,
  author    = {Rishi Shah and Yuqian Jiang and Justin W. Hart and Peter Stone},
  title     = {Deep {R}-Learning for Continual Area Sweeping},
  booktitle = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2020, Las Vegas, NV, USA, October 24, 2020 - January 24, 2021},
  pages     = {5542--5547},
  publisher = {{IEEE}},
  year      = {2020},
  url       = {https://doi.org/10.1109/IROS45743.2020.9341626},
  doi       = {10.1109/IROS45743.2020.9341626},
  timestamp = {Tue, 16 Feb 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iros/ShahJHS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IROS 2020 paper; an arXiv record with the same title is DBLP:journals/corr/abs-2008-01281.
@inproceedings{DBLP:conf/iros/DesaiKHWS20,
  author    = {Siddharth Desai and Haresh Karnan and Josiah P. Hanna and Garrett Warnell and Peter Stone},
  title     = {Stochastic Grounded Action Transformation for Robot Learning in Simulation},
  booktitle = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2020, Las Vegas, NV, USA, October 24, 2020 - January 24, 2021},
  pages     = {6106--6111},
  publisher = {{IEEE}},
  year      = {2020},
  url       = {https://doi.org/10.1109/IROS45743.2020.9340780},
  doi       = {10.1109/IROS45743.2020.9340780},
  timestamp = {Tue, 16 Feb 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iros/DesaiKHWS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper; this record carries no pages or publisher field.
@inproceedings{DBLP:conf/nips/DesaiDKWHS20,
  author    = {Siddharth Desai and Ishan Durugkar and Haresh Karnan and Garrett Warnell and Josiah Hanna and Peter Stone},
  editor    = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title     = {An Imitation from Observation Approach to Transfer Learning with Dynamics Mismatch},
  booktitle = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper/2020/hash/28f248e9279ac845995c4e9f8af35c2b-Abstract.html},
  timestamp = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/DesaiDKWHS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper; this record carries no pages or publisher field.
@inproceedings{DBLP:conf/nips/WuLS020,
  author    = {Lemeng Wu and Bo Liu and Peter Stone and Qiang Liu},
  editor    = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title     = {Firefly Neural Architecture Descent: a General Approach for Growing Neural Networks},
  booktitle = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper/2020/hash/fdbe012e2e11314b96402b32c0df26b7-Abstract.html},
  timestamp = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/WuLS020.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SIGdial 2020 paper; an arXiv record with the same title is DBLP:journals/corr/abs-2005-09833.
@inproceedings{DBLP:conf/sigdial/LuZSC20,
  author    = {Keting Lu and Shiqi Zhang and Peter Stone and Xiaoping Chen},
  editor    = {Olivier Pietquin and Smaranda Muresan and Vivian Chen and Casey Kennington and David Vandyke and Nina Dethlefs and Koji Inoue and Erik Ekstedt and Stefan Ultes},
  title     = {Learning and Reasoning for Robot Dialog and Navigation Tasks},
  booktitle = {Proceedings of the 21th Annual Meeting of the Special Interest Group on Discourse and Dialogue, SIGdial 2020, 1st virtual meeting, July 1-3, 2020},
  pages     = {107--117},
  publisher = {Association for Computational Linguistics},
  year      = {2020},
  url       = {https://doi.org/10.18653/v1/2020.sigdial-1.14},
  doi       = {10.18653/V1/2020.SIGDIAL-1.14},
  timestamp = {Fri, 12 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/sigdial/LuZSC20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICSR 2020 paper (LNCS volume 12483).
% The doi and url are stored raw, with no backslash before the underscore, because
% verbatim-field handling would otherwise carry the backslash into the link.
@inproceedings{DBLP:conf/socrob/HartMXTMGBOS20,
  author    = {Justin W. Hart and Reuth Mirsky and Xuesu Xiao and Stone Tejeda and Bonny Mahajan and Jamin Goo and Kathryn Baldauf and Sydney Owen and Peter Stone},
  editor    = {Alan R. Wagner and David Feil{-}Seifer and Kerstin Sophie Haring and Silvia Rossi and Thomas Emrys Williams and Hongsheng He and Shuzhi Sam Ge},
  title     = {Using Human-Inspired Signals to Disambiguate Navigational Intentions},
  booktitle = {Social Robotics - 12th International Conference, {ICSR} 2020, Golden, CO, USA, November 14-18, 2020, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {12483},
  pages     = {320--331},
  publisher = {Springer},
  year      = {2020},
  url       = {https://doi.org/10.1007/978-3-030-62056-1_27},
  doi       = {10.1007/978-3-030-62056-1_27},
  timestamp = {Wed, 21 Dec 2022 13:24:29 +0100},
  biburl    = {https://dblp.org/rec/conf/socrob/HartMXTMGBOS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SSRR 2020 paper; an arXiv record with the same title is DBLP:journals/corr/abs-2008-13315.
@inproceedings{DBLP:conf/ssrr/PerilleTXS20,
  author    = {Daniel Perille and Abigail Truong and Xuesu Xiao and Peter Stone},
  title     = {Benchmarking Metric Ground Navigation},
  booktitle = {{IEEE} International Symposium on Safety, Security, and Rescue Robotics, {SSRR} 2020, Abu Dhabi, United Arab Emirates, November 4-6, 2020},
  pages     = {116--121},
  publisher = {{IEEE}},
  year      = {2020},
  url       = {https://doi.org/10.1109/SSRR50563.2020.9292572},
  doi       = {10.1109/SSRR50563.2020.9292572},
  timestamp = {Fri, 30 Apr 2021 12:35:39 +0200},
  biburl    = {https://dblp.org/rec/conf/ssrr/PerilleTXS20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2003.04960, recorded under CoRR.
@article{DBLP:journals/corr/abs-2003-04960,
  author     = {Sanmit Narvekar and Bei Peng and Matteo Leonetti and Jivko Sinapov and Matthew E. Taylor and Peter Stone},
  title      = {Curriculum Learning for Reinforcement Learning Domains: {A} Framework and Survey},
  journal    = {CoRR},
  volume     = {abs/2003.04960},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.04960},
  eprinttype = {arXiv},
  eprint     = {2003.04960},
  timestamp  = {Sun, 18 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-04960.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2004.00116, recorded under CoRR.
@article{DBLP:journals/corr/abs-2004-00116,
  author     = {Xuesu Xiao and Bo Liu and Garrett Warnell and Jonathan Fink and Peter Stone},
  title      = {{APPLD:} Adaptive Planner Parameter Learning from Demonstration},
  journal    = {CoRR},
  volume     = {abs/2004.00116},
  year       = {2020},
  url        = {https://arxiv.org/abs/2004.00116},
  eprinttype = {arXiv},
  eprint     = {2004.00116},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2004-00116.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2004.08672, recorded under CoRR.
% The system name "iCORPP" is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2004-08672,
  author     = {Shiqi Zhang and Peter Stone},
  title      = {{iCORPP}: Interleaved Commonsense Reasoning and Probabilistic Planning on Robots},
  journal    = {CoRR},
  volume     = {abs/2004.08672},
  year       = {2020},
  url        = {https://arxiv.org/abs/2004.08672},
  eprinttype = {arXiv},
  eprint     = {2004.08672},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2004-08672.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2005.09833, recorded under CoRR; a conference record with the same title is DBLP:conf/sigdial/LuZSC20.
@article{DBLP:journals/corr/abs-2005-09833,
  author     = {Keting Lu and Shiqi Zhang and Peter Stone and Xiaoping Chen},
  title      = {Learning and Reasoning for Robot Dialog and Navigation Tasks},
  journal    = {CoRR},
  volume     = {abs/2005.09833},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.09833},
  eprinttype = {arXiv},
  eprint     = {2005.09833},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-09833.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2006.00589, recorded under CoRR; a conference record with the same title is DBLP:conf/iros/ShahJHS20.
% The "R" of "R-Learning" is brace-protected so sentence-casing styles keep it capitalised.
@article{DBLP:journals/corr/abs-2006-00589,
  author     = {Rishi Shah and Yuqian Jiang and Justin W. Hart and Peter Stone},
  title      = {Deep {R}-Learning for Continual Area Sweeping},
  journal    = {CoRR},
  volume     = {abs/2006.00589},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.00589},
  eprinttype = {arXiv},
  eprint     = {2006.00589},
  timestamp  = {Mon, 08 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-00589.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2006.10553, recorded under CoRR.
@article{DBLP:journals/corr/abs-2006-10553,
  author     = {Elad Liebman and Peter Stone},
  title      = {Artificial Musical Intelligence: {A} Survey},
  journal    = {CoRR},
  volume     = {abs/2006.10553},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.10553},
  eprinttype = {arXiv},
  eprint     = {2006.10553},
  timestamp  = {Tue, 23 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-10553.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2007.01498, recorded under CoRR.
@article{DBLP:journals/corr/abs-2007-01498,
  author     = {Yuqian Jiang and Sudarshanan Bharadwaj and Bo Wu and Rishi Shah and Ufuk Topcu and Peter Stone},
  title      = {Temporal-Logic-Based Reward Shaping for Continuing Learning Tasks},
  journal    = {CoRR},
  volume     = {abs/2007.01498},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.01498},
  eprinttype = {arXiv},
  eprint     = {2007.01498},
  timestamp  = {Mon, 06 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-01498.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2007.14479, recorded under CoRR.
@article{DBLP:journals/corr/abs-2007-14479,
  author     = {Xuesu Xiao and Bo Liu and Garrett Warnell and Peter Stone},
  title      = {Toward Agile Maneuvers in Highly Constrained Spaces: Learning from Hallucination},
  journal    = {CoRR},
  volume     = {abs/2007.14479},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.14479},
  eprinttype = {arXiv},
  eprint     = {2007.14479},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-14479.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2007.14486, recorded under CoRR.
@article{DBLP:journals/corr/abs-2007-14486,
  author     = {Bo Liu and Xuesu Xiao and Peter Stone},
  title      = {Lifelong Navigation},
  journal    = {CoRR},
  volume     = {abs/2007.14486},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.14486},
  eprinttype = {arXiv},
  eprint     = {2007.14486},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-14486.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2008.01279, recorded under CoRR; a conference record with the same title is DBLP:conf/iros/KarnanDHWS20.
@article{DBLP:journals/corr/abs-2008-01279,
  author     = {Haresh Karnan and Siddharth Desai and Josiah P. Hanna and Garrett Warnell and Peter Stone},
  title      = {Reinforced Grounded Action Transformation for Sim-to-Real Transfer},
  journal    = {CoRR},
  volume     = {abs/2008.01279},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.01279},
  eprinttype = {arXiv},
  eprint     = {2008.01279},
  timestamp  = {Fri, 07 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-01279.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2008.01281, recorded under CoRR; a conference record with the same title is DBLP:conf/iros/DesaiKHWS20.
@article{DBLP:journals/corr/abs-2008-01281,
  author     = {Siddharth Desai and Haresh Karnan and Josiah P. Hanna and Garrett Warnell and Peter Stone},
  title      = {Stochastic Grounded Action Transformation for Robot Learning in Simulation},
  journal    = {CoRR},
  volume     = {abs/2008.01281},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.01281},
  eprinttype = {arXiv},
  eprint     = {2008.01281},
  timestamp  = {Fri, 07 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-01281.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2008.01594, recorded under CoRR.
@article{DBLP:journals/corr/abs-2008-01594,
  author     = {Siddharth Desai and Ishan Durugkar and Haresh Karnan and Garrett Warnell and Josiah Hanna and Peter Stone},
  title      = {An Imitation from Observation Approach to Sim-to-Real Transfer},
  journal    = {CoRR},
  volume     = {abs/2008.01594},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.01594},
  eprinttype = {arXiv},
  eprint     = {2008.01594},
  timestamp  = {Wed, 14 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-01594.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2008.06738, recorded under CoRR; a conference record with the same title is DBLP:conf/icml/PavseDHS20.
@article{DBLP:journals/corr/abs-2008-06738,
  author     = {Brahma S. Pavse and Ishan Durugkar and Josiah Hanna and Peter Stone},
  title      = {Reducing Sampling Error in Batch Temporal Difference Learning},
  journal    = {CoRR},
  volume     = {abs/2008.06738},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.06738},
  eprinttype = {arXiv},
  eprint     = {2008.06738},
  timestamp  = {Fri, 21 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-06738.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2008.13315, recorded under CoRR; a conference record with the same title is DBLP:conf/ssrr/PerilleTXS20.
@article{DBLP:journals/corr/abs-2008-13315,
  author     = {Daniel Perille and Abigail Truong and Xuesu Xiao and Peter Stone},
  title      = {Benchmarking Metric Ground Navigation},
  journal    = {CoRR},
  volume     = {abs/2008.13315},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.13315},
  eprinttype = {arXiv},
  eprint     = {2008.13315},
  timestamp  = {Wed, 16 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-13315.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2009.13649, recorded under CoRR; a conference record with the same title is DBLP:conf/corl/CuiZKASN20.
@article{DBLP:journals/corr/abs-2009-13649,
  author     = {Yuchen Cui and Qiping Zhang and Alessandro Allievi and Peter Stone and Scott Niekum and W. Bradley Knox},
  title      = {The {EMPATHIC} Framework for Task Learning from Implicit Human Feedback},
  journal    = {CoRR},
  volume     = {abs/2009.13649},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.13649},
  eprinttype = {arXiv},
  eprint     = {2009.13649},
  timestamp  = {Wed, 30 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-13649.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2009.13736, recorded under CoRR.
@article{DBLP:journals/corr/abs-2009-13736,
  author     = {Yunshu Du and Garrett Warnell and Assefaw Hadish Gebremedhin and Peter Stone and Matthew E. Taylor},
  title      = {Lucid Dreaming for Experience Replay: Refreshing Past States with the Current Policy},
  journal    = {CoRR},
  volume     = {abs/2009.13736},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.13736},
  eprinttype = {arXiv},
  eprint     = {2009.13736},
  timestamp  = {Wed, 30 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-13736.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.08098, recorded under CoRR.
@article{DBLP:journals/corr/abs-2010-08098,
  author     = {Xuesu Xiao and Bo Liu and Peter Stone},
  title      = {Agile Robot Navigation through Hallucinated Learning and Sober Deployment},
  journal    = {CoRR},
  volume     = {abs/2010.08098},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.08098},
  eprinttype = {arXiv},
  eprint     = {2010.08098},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-08098.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.09158, recorded under CoRR.
@article{DBLP:journals/corr/abs-2010-09158,
  author     = {Xuesu Xiao and Bo Liu and Peter Stone},
  title      = {Extended Abstract: Motion Planners Learned from Geometric Hallucination},
  journal    = {CoRR},
  volume     = {abs/2010.09158},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.09158},
  eprinttype = {arXiv},
  eprint     = {2010.09158},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-09158.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.10560, recorded under CoRR.
@article{DBLP:journals/corr/abs-2010-10560,
  author     = {Varun Kompella and Roberto Capobianco and Stacy Jong and Jonathan Browne and Spencer J. Fox and Lauren Ancel Meyers and Peter R. Wurman and Peter Stone},
  title      = {Reinforcement Learning for Optimization of {COVID-19} Mitigation policies},
  journal    = {CoRR},
  volume     = {abs/2010.10560},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.10560},
  eprinttype = {arXiv},
  eprint     = {2010.10560},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-10560.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2010.15942, recorded under CoRR.
@article{DBLP:journals/corr/abs-2010-15942,
  author     = {Ruohan Zhang and Bo Liu and Yifeng Zhu and Sihang Guo and Mary M. Hayhoe and Dana H. Ballard and Peter Stone},
  title      = {Human versus Machine Attention in Deep Reinforcement Learning Tasks},
  journal    = {CoRR},
  volume     = {abs/2010.15942},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.15942},
  eprinttype = {arXiv},
  eprint     = {2010.15942},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-15942.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2011.00397, recorded under CoRR.
@article{DBLP:journals/corr/abs-2011-00397,
  author     = {Zifan Xu and Gauraang Dhamankar and Anirudh Nair and Xuesu Xiao and Garrett Warnell and Bo Liu and Zizhao Wang and Peter Stone},
  title      = {{APPLR:} Adaptive Planner Parameter Learning from Reinforcement},
  journal    = {CoRR},
  volume     = {abs/2011.00397},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.00397},
  eprinttype = {arXiv},
  eprint     = {2011.00397},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-00397.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2011.00400, recorded under CoRR.
@article{DBLP:journals/corr/abs-2011-00400,
  author     = {Zizhao Wang and Xuesu Xiao and Bo Liu and Garrett Warnell and Peter Stone},
  title      = {{APPLI:} Adaptive Planner Parameter Learning From Interventions},
  journal    = {CoRR},
  volume     = {abs/2011.00400},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.00400},
  eprinttype = {arXiv},
  eprint     = {2011.00400},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-00400.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2011.13112, recorded under CoRR.
@article{DBLP:journals/corr/abs-2011-13112,
  author     = {Xuesu Xiao and Bo Liu and Garrett Warnell and Peter Stone},
  title      = {Motion Control for Mobile Robot Navigation Using Machine Learning: a Survey},
  journal    = {CoRR},
  volume     = {abs/2011.13112},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.13112},
  eprinttype = {arXiv},
  eprint     = {2011.13112},
  timestamp  = {Wed, 15 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-13112.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Auton. Robots 43(8), 2019.
@article{DBLP:journals/arobots/JiangYZSS19,
  author    = {Yuqian Jiang and Harel Yedidsion and Shiqi Zhang and Guni Sharon and Peter Stone},
  title     = {Multi-robot planning with conflicts and synergies},
  journal   = {Auton. Robots},
  volume    = {43},
  number    = {8},
  pages     = {2011--2032},
  year      = {2019},
  url       = {https://doi.org/10.1007/s10514-019-09848-1},
  doi       = {10.1007/S10514-019-09848-1},
  timestamp = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/arobots/JiangYZSS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Frontiers Inf. Technol. Electron. Eng. 20(3), 2019.
% Both acronyms in the title are brace-protected so sentence-casing styles keep "ASP" uppercase as well as "PDDL".
@article{DBLP:journals/jzusc/JiangZKS19,
  author    = {Yuqian Jiang and Shiqi Zhang and Piyush Khandelwal and Peter Stone},
  title     = {Task planning in robotics: an empirical comparison of {PDDL-} and {ASP}-based systems},
  journal   = {Frontiers Inf. Technol. Electron. Eng.},
  volume    = {20},
  number    = {3},
  pages     = {363--373},
  year      = {2019},
  url       = {https://doi.org/10.1631/FITEE.1800514},
  doi       = {10.1631/FITEE.1800514},
  timestamp = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jzusc/JiangZKS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: MIS Q. 43(3), 2019; this record carries no pages field.
@article{DBLP:journals/misq/LiebmanSS19,
  author    = {Elad Liebman and Maytal Saar{-}Tsechansky and Peter Stone},
  title     = {The Right Music at the Right Time: Adaptive Personalized Playlists Based on Sequence Modeling},
  journal   = {{MIS} Q.},
  volume    = {43},
  number    = {3},
  year      = {2019},
  url       = {https://doi.org/10.25300/misq/2019/14750},
  doi       = {10.25300/MISQ/2019/14750},
  timestamp = {Thu, 30 Nov 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/misq/LiebmanSS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Robotics Autom. Mag. 26(3), 2019.
% "RoboCup" is brace-protected so sentence-casing styles do not turn it into "Robocup".
@article{DBLP:journals/ram/AsadaSVLN19,
  author    = {Minoru Asada and Peter Stone and Manuela Veloso and Daniel D. Lee and Daniele Nardi},
  title     = {{RoboCup}: {A} Treasure Trove of Rich Diversity for Research Issues and Interdisciplinary Connections {[TC} Spotlight]},
  journal   = {{IEEE} Robotics Autom. Mag.},
  volume    = {26},
  number    = {3},
  pages     = {99--102},
  year      = {2019},
  url       = {https://doi.org/10.1109/MRA.2019.2928959},
  doi       = {10.1109/MRA.2019.2928959},
  timestamp = {Mon, 18 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ram/AsadaSVLN19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2019 paper.
@inproceedings{DBLP:conf/aaai/HannaSBS19,
  author    = {Josiah P. Hanna and Guni Sharon and Stephen D. Boyles and Peter Stone},
  title     = {Selecting Compliant Agents for Opt-in Micro-Tolling},
  booktitle = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI} 2019, The Thirty-First Innovative Applications of Artificial Intelligence Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii, USA, January 27 - February 1, 2019},
  pages     = {565--572},
  publisher = {{AAAI} Press},
  year      = {2019},
  url       = {https://doi.org/10.1609/aaai.v33i01.3301565},
  doi       = {10.1609/AAAI.V33I01.3301565},
  timestamp = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/HannaSBS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper: AI Safety workshop co-located with AAAI-19 (CEUR Workshop Proceedings volume 2301).
% The editor with the two-word surname is given in "Last, First" form so both words are parsed as the surname.
% The url is stored raw, with no backslash before the underscore.
@inproceedings{DBLP:conf/aaai/LoAS19,
  author    = {Shih{-}Yun Lo and Shani Alkoby and Peter Stone},
  editor    = {Hu{\'{a}}scar Espinoza and {\'{O}} h{\'{E}}igeartaigh, Se{\'{a}}n and Xiaowei Huang and Jos{\'{e}} Hern{\'{a}}ndez{-}Orallo and Mauricio Castillo{-}Effen},
  title     = {Robust Motion Planning and Safety Benchmarking in Human Workspaces},
  booktitle = {Workshop on Artificial Intelligence Safety 2019 co-located with the Thirty-Third {AAAI} Conference on Artificial Intelligence 2019 (AAAI-19), Honolulu, Hawaii, January 27, 2019},
  series    = {{CEUR} Workshop Proceedings},
  volume    = {2301},
  publisher = {CEUR-WS.org},
  year      = {2019},
  url       = {https://ceur-ws.org/Vol-2301/paper_28.pdf},
  timestamp = {Fri, 10 Mar 2023 16:22:15 +0100},
  biburl    = {https://dblp.org/rec/conf/aaai/LoAS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICAPS 2019 paper.
@inproceedings{DBLP:conf/aips/Jiang0HS19,
  author    = {Yuqian Jiang and Nick Walker and Justin W. Hart and Peter Stone},
  editor    = {J. Benton and Nir Lipovetzky and Eva Onaindia and David E. Smith and Siddharth Srivastava},
  title     = {Open-World Reasoning for Service Robots},
  booktitle = {Proceedings of the Twenty-Ninth International Conference on Automated Planning and Scheduling, {ICAPS} 2019, Berkeley, CA, USA, July 11-15, 2019},
  pages     = {725--733},
  publisher = {{AAAI} Press},
  year      = {2019},
  url       = {https://ojs.aaai.org/index.php/ICAPS/article/view/3541},
  timestamp = {Thu, 10 Aug 2023 15:31:45 +0200},
  biburl    = {https://dblp.org/rec/conf/aips/Jiang0HS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAMAS '19 paper.
@inproceedings{DBLP:conf/atal/NarvekarS19,
  author    = {Sanmit Narvekar and Peter Stone},
  editor    = {Edith Elkind and Manuela Veloso and Noa Agmon and Matthew E. Taylor},
  title     = {Learning Curriculum Policies for Reinforcement Learning},
  booktitle = {Proceedings of the 18th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17, 2019},
  pages     = {25--33},
  publisher = {International Foundation for Autonomous Agents and Multiagent Systems},
  year      = {2019},
  url       = {http://dl.acm.org/citation.cfm?id=3331670},
  timestamp = {Wed, 29 May 2019 16:36:58 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/NarvekarS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAMAS '19 paper.
@inproceedings{DBLP:conf/atal/HannaS19,
  author    = {Josiah P. Hanna and Peter Stone},
  editor    = {Edith Elkind and Manuela Veloso and Noa Agmon and Matthew E. Taylor},
  title     = {Reducing Sampling Error in Policy Gradient Learning},
  booktitle = {Proceedings of the 18th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17, 2019},
  pages     = {1016--1024},
  publisher = {International Foundation for Autonomous Agents and Multiagent Systems},
  year      = {2019},
  url       = {http://dl.acm.org/citation.cfm?id=3331798},
  timestamp = {Wed, 29 May 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/HannaS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAMAS '19 paper.
@inproceedings{DBLP:conf/atal/SharonBAS19,
  author    = {Guni Sharon and Stephen D. Boyles and Shani Alkoby and Peter Stone},
  editor    = {Edith Elkind and Manuela Veloso and Noa Agmon and Matthew E. Taylor},
  title     = {Marginal Cost Pricing with a Fixed Error Factor in Traffic Networks},
  booktitle = {Proceedings of the 18th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17, 2019},
  pages     = {1539--1546},
  publisher = {International Foundation for Autonomous Agents and Multiagent Systems},
  year      = {2019},
  url       = {http://dl.acm.org/citation.cfm?id=3331871},
  timestamp = {Wed, 29 May 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/SharonBAS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAMAS '19 extended abstract.
@inproceedings{DBLP:conf/atal/AlkobyRS19,
  author    = {Shani Alkoby and Avilash Rath and Peter Stone},
  editor    = {Edith Elkind and Manuela Veloso and Noa Agmon and Matthew E. Taylor},
  title     = {Teaching Social Behavior through Human Reinforcement for Ad hoc Teamwork - The {STAR} Framework: Extended Abstract},
  booktitle = {Proceedings of the 18th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17, 2019},
  pages     = {1773--1775},
  publisher = {International Foundation for Autonomous Agents and Multiagent Systems},
  year      = {2019},
  url       = {http://dl.acm.org/citation.cfm?id=3331914},
  timestamp = {Wed, 29 May 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/AlkobyRS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAMAS '19 paper.
@inproceedings{DBLP:conf/atal/MenasheS19,
  author    = {Jacob Menashe and Peter Stone},
  editor    = {Edith Elkind and Manuela Veloso and Noa Agmon and Matthew E. Taylor},
  title     = {Escape Room: {A} Configurable Testbed for Hierarchical Reinforcement Learning},
  booktitle = {Proceedings of the 18th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17, 2019},
  pages     = {2123--2125},
  publisher = {International Foundation for Autonomous Agents and Multiagent Systems},
  year      = {2019},
  url       = {http://dl.acm.org/citation.cfm?id=3332031},
  timestamp = {Wed, 29 May 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/MenasheS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAMAS '19 paper.
@inproceedings{DBLP:conf/atal/TorabiWS19,
  author    = {Faraz Torabi and Garrett Warnell and Peter Stone},
  editor    = {Edith Elkind and Manuela Veloso and Noa Agmon and Matthew E. Taylor},
  title     = {Adversarial Imitation Learning from State-only Demonstrations},
  booktitle = {Proceedings of the 18th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17, 2019},
  pages     = {2229--2231},
  publisher = {International Foundation for Autonomous Agents and Multiagent Systems},
  year      = {2019},
  url       = {http://dl.acm.org/citation.cfm?id=3332067},
  timestamp = {Wed, 29 May 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/TorabiWS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% BRACIS 2019 paper.
@inproceedings{DBLP:conf/bracis/SilvaCS19,
  author    = {Felipe Leno da Silva and Anna Helena Reali Costa and Peter Stone},
  title     = {Building Self-Play Curricula Online by Playing with Expert Agents in Adversarial Games},
  booktitle = {8th Brazilian Conference on Intelligent Systems, {BRACIS} 2019, Salvador, Brazil, October 15-18, 2019},
  pages     = {479--484},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/BRACIS.2019.00090},
  doi       = {10.1109/BRACIS.2019.00090},
  timestamp = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/bracis/SilvaCS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 paper (PMLR volume 97).
% The url uses the https scheme, matching the other PMLR links in this file.
@inproceedings{DBLP:conf/icml/HannaNS19,
  author    = {Josiah Hanna and Scott Niekum and Peter Stone},
  editor    = {Kamalika Chaudhuri and Ruslan Salakhutdinov},
  title     = {Importance Sampling Policy Evaluation with an Estimated Behavior Policy},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {97},
  pages     = {2605--2613},
  publisher = {{PMLR}},
  year      = {2019},
  url       = {https://proceedings.mlr.press/v97/hanna19a.html},
  timestamp = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/HannaNS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2019 paper.
@inproceedings{DBLP:conf/icra/ThomasonPS0JYHS19,
  author    = {Jesse Thomason and Aishwarya Padmakumar and Jivko Sinapov and Nick Walker and Yuqian Jiang and Harel Yedidsion and Justin W. Hart and Peter Stone and Raymond J. Mooney},
  title     = {Improving Grounded Natural Language Understanding through Human-Robot Dialog},
  booktitle = {International Conference on Robotics and Automation, {ICRA} 2019, Montreal, QC, Canada, May 20-24, 2019},
  pages     = {6934--6941},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/ICRA.2019.8794287},
  doi       = {10.1109/ICRA.2019.8794287},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/ThomasonPS0JYHS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2019 paper.
@inproceedings{DBLP:conf/ijcai/RavulaAS19,
  author    = {Manish Ravula and Shani Alkoby and Peter Stone},
  editor    = {Sarit Kraus},
  title     = {Ad Hoc Teamwork With Behavior Switching Agents},
  booktitle = {Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16, 2019},
  pages     = {550--556},
  publisher = {ijcai.org},
  year      = {2019},
  url       = {https://doi.org/10.24963/ijcai.2019/78},
  doi       = {10.24963/IJCAI.2019/78},
  timestamp = {Tue, 20 Aug 2019 16:18:18 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/RavulaAS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/TorabiWS19,
  author     = {Faraz Torabi and Garrett Warnell and Peter Stone},
  editor     = {Sarit Kraus},
  title      = {Imitation Learning from Video by Leveraging Proprioception},
  booktitle  = {Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16, 2019},
  pages      = {3585--3591},
  publisher  = {ijcai.org},
  year       = {2019},
  url        = {https://doi.org/10.24963/ijcai.2019/497},
  doi        = {10.24963/IJCAI.2019/497},
  timestamp  = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/TorabiWS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/TorabiWS19a,
  author     = {Faraz Torabi and Garrett Warnell and Peter Stone},
  editor     = {Sarit Kraus},
  title      = {Recent Advances in Imitation Learning from Observation},
  booktitle  = {Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16, 2019},
  pages      = {6325--6331},
  publisher  = {ijcai.org},
  year       = {2019},
  url        = {https://doi.org/10.24963/ijcai.2019/882},
  doi        = {10.24963/IJCAI.2019/882},
  timestamp  = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/TorabiWS19a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/ZhangTGBS19,
  author     = {Ruohan Zhang and Faraz Torabi and Lin Guan and Dana H. Ballard and Peter Stone},
  editor     = {Sarit Kraus},
  title      = {Leveraging Human Guidance for Deep Reinforcement Learning Tasks},
  booktitle  = {Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16, 2019},
  pages      = {6339--6346},
  publisher  = {ijcai.org},
  year       = {2019},
  url        = {https://doi.org/10.24963/ijcai.2019/884},
  doi        = {10.24963/IJCAI.2019/884},
  timestamp  = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/ZhangTGBS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/JiangYZS19,
  author     = {Yuqian Jiang and Fangkai Yang and Shiqi Zhang and Peter Stone},
  title      = {Task-Motion Planning with Reinforcement Learning for Adaptable Mobile Service Robots},
  booktitle  = {2019 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2019, Macau, SAR, China, November 3-8, 2019},
  pages      = {7529--7534},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/IROS40897.2019.8967680},
  doi        = {10.1109/IROS40897.2019.8967680},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iros/JiangYZS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% RoboCup 2019 champion paper (LNCS 11531). Proper nouns in the title are
% braced so sentence-casing bibliography styles keep their capitalisation.
@inproceedings{DBLP:conf/robocup/MacAlpineTPS19,
  author     = {Patrick MacAlpine and Faraz Torabi and Brahma S. Pavse and Peter Stone},
  editor     = {Stephan K. Chalup and Tim Niem{\"{u}}ller and Jackrit Suthakorn and Mary{-}Anne Williams},
  title      = {{UT} {Austin} {Villa}: {RoboCup} 2019 {3D} Simulation League Competition and Technical Challenge Champions},
  booktitle  = {RoboCup 2019: Robot World Cup {XXIII} [Sydney, NSW, Australia, July 8, 2019]},
  series     = {Lecture Notes in Computer Science},
  volume     = {11531},
  pages      = {540--552},
  publisher  = {Springer},
  year       = {2019},
  url        = {https://doi.org/10.1007/978-3-030-35699-6\_44},
  doi        = {10.1007/978-3-030-35699-6\_44},
  timestamp  = {Thu, 12 Dec 2019 08:32:25 +0100},
  biburl     = {https://dblp.org/rec/conf/robocup/MacAlpineTPS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/socrob/YedidsionDSCHSM19,
  author     = {Harel Yedidsion and Jacqueline Deans and Connor Sheehan and Mahathi Chillara and Justin W. Hart and Peter Stone and Raymond J. Mooney},
  editor     = {Miguel A. Salichs and Shuzhi Sam Ge and Emilia Ivanova Barakova and John{-}John Cabibihan and Alan R. Wagner and {\'{A}}lvaro Castro Gonz{\'{a}}lez and Hongsheng He},
  title      = {Optimal Use of Verbal Instructions for Multi-robot Human Navigation Guidance},
  booktitle  = {Social Robotics - 11th International Conference, {ICSR} 2019, Madrid, Spain, November 26-29, 2019, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {11876},
  pages      = {133--143},
  publisher  = {Springer},
  year       = {2019},
  url        = {https://doi.org/10.1007/978-3-030-35888-4\_13},
  doi        = {10.1007/978-3-030-35888-4\_13},
  timestamp  = {Mon, 25 Nov 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/socrob/YedidsionDSCHSM19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1903-00122,
  author     = {Jesse Thomason and Aishwarya Padmakumar and Jivko Sinapov and Nick Walker and Yuqian Jiang and Harel Yedidsion and Justin W. Hart and Peter Stone and Raymond J. Mooney},
  title      = {Improving Grounded Natural Language Understanding through Human-Robot Dialog},
  journal    = {CoRR},
  volume     = {abs/1903.00122},
  year       = {2019},
  url        = {http://arxiv.org/abs/1903.00122},
  eprinttype = {arXiv},
  eprint     = {1903.00122},
  timestamp  = {Sat, 30 Mar 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1903-00122.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-09335,
  author     = {Faraz Torabi and Garrett Warnell and Peter Stone},
  title      = {Imitation Learning from Video by Leveraging Proprioception},
  journal    = {CoRR},
  volume     = {abs/1905.09335},
  year       = {2019},
  url        = {http://arxiv.org/abs/1905.09335},
  eprinttype = {arXiv},
  eprint     = {1905.09335},
  timestamp  = {Wed, 29 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-09335.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-13566,
  author     = {Faraz Torabi and Garrett Warnell and Peter Stone},
  title      = {Recent Advances in Imitation Learning from Observation},
  journal    = {CoRR},
  volume     = {abs/1905.13566},
  year       = {2019},
  url        = {http://arxiv.org/abs/1905.13566},
  eprinttype = {arXiv},
  eprint     = {1905.13566},
  timestamp  = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-13566.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-07372,
  author     = {Brahma S. Pavse and Faraz Torabi and Josiah P. Hanna and Garrett Warnell and Peter Stone},
  title      = {{RIDM:} Reinforced Inverse Dynamics Modeling for Learning from a Single Observed Demonstration},
  journal    = {CoRR},
  volume     = {abs/1906.07372},
  year       = {2019},
  url        = {http://arxiv.org/abs/1906.07372},
  eprinttype = {arXiv},
  eprint     = {1906.07372},
  timestamp  = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-07372.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-07374,
  author     = {Faraz Torabi and Sean Geiger and Garrett Warnell and Peter Stone},
  title      = {Sample-efficient Adversarial Imitation Learning from Observation},
  journal    = {CoRR},
  volume     = {abs/1906.07374},
  year       = {2019},
  url        = {http://arxiv.org/abs/1906.07374},
  eprinttype = {arXiv},
  eprint     = {1906.07374},
  timestamp  = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-07374.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-11064,
  author     = {Stefano V. Albrecht and Peter Stone},
  title      = {Reasoning about Hypothetical Agent Behaviours and their Parameters},
  journal    = {CoRR},
  volume     = {abs/1906.11064},
  year       = {2019},
  url        = {http://arxiv.org/abs/1906.11064},
  eprinttype = {arXiv},
  eprint     = {1906.11064},
  timestamp  = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-11064.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1907-02300,
  author     = {Nick Walker and Yuqian Jiang and Maya Cakmak and Peter Stone},
  title      = {Desiderata for Planning Systems in General-Purpose Service Robots},
  journal    = {CoRR},
  volume     = {abs/1907.02300},
  year       = {2019},
  url        = {http://arxiv.org/abs/1907.02300},
  eprinttype = {arXiv},
  eprint     = {1907.02300},
  timestamp  = {Mon, 08 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-02300.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv team report (1909.06529). The team name in the title is braced so
% sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-1909-06529,
  author     = {Rishi Shah and Yuqian Jiang and Haresh Karnan and Gilberto Briscoe{-}Martinez and Dominick Mulder and Ryan Gupta and Rachel Schlossman and Marika Murphy and Justin W. Hart and Luis Sentis and Peter Stone},
  title      = {Solving Service Robot Tasks: {UT} {Austin} {Villa@Home} 2019 Team Report},
  journal    = {CoRR},
  volume     = {abs/1909.06529},
  year       = {2019},
  url        = {http://arxiv.org/abs/1909.06529},
  eprinttype = {arXiv},
  eprint     = {1909.06529},
  timestamp  = {Mon, 23 Sep 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1909-06529.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-06560,
  author     = {Justin W. Hart and Reuth Mirsky and Stone Tejeda and Bonny Mahajan and Jamin Goo and Kathryn Baldauf and Sydney Owen and Peter Stone},
  title      = {Unclogging Our Arteries: Using Human-Inspired Signals to Disambiguate Navigational Intentions},
  journal    = {CoRR},
  volume     = {abs/1909.06560},
  year       = {2019},
  url        = {http://arxiv.org/abs/1909.06560},
  eprinttype = {arXiv},
  eprint     = {1909.06560},
  timestamp  = {Tue, 24 Sep 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1909-06560.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-09906,
  author     = {Ruohan Zhang and Faraz Torabi and Lin Guan and Dana H. Ballard and Peter Stone},
  title      = {Leveraging Human Guidance for Deep Reinforcement Learning Tasks},
  journal    = {CoRR},
  volume     = {abs/1909.09906},
  year       = {2019},
  url        = {http://arxiv.org/abs/1909.09906},
  eprinttype = {arXiv},
  eprint     = {1909.09906},
  timestamp  = {Fri, 27 Sep 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1909-09906.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/MacAlpineS18,
  author     = {Patrick MacAlpine and Peter Stone},
  title      = {Overlapping layered learning},
  journal    = {Artif. Intell.},
  volume     = {254},
  pages      = {21--43},
  year       = {2018},
  url        = {https://doi.org/10.1016/j.artint.2017.09.001},
  doi        = {10.1016/J.ARTINT.2017.09.001},
  timestamp  = {Mon, 27 Nov 2017 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ai/MacAlpineS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/AlbrechtS18,
  author     = {Stefano V. Albrecht and Peter Stone},
  title      = {Autonomous agents modelling other agents: {A} comprehensive survey and open problems},
  journal    = {Artif. Intell.},
  volume     = {258},
  pages      = {66--95},
  year       = {2018},
  url        = {https://doi.org/10.1016/j.artint.2018.01.002},
  doi        = {10.1016/J.ARTINT.2018.01.002},
  timestamp  = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ai/AlbrechtS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cacm/GroszS18,
  author     = {Barbara J. Grosz and Peter Stone},
  title      = {A century-long commitment to assessing artificial intelligence and its impact on society},
  journal    = {Commun. {ACM}},
  volume     = {61},
  number     = {12},
  pages      = {68--73},
  year       = {2018},
  url        = {https://doi.org/10.1145/3198470},
  doi        = {10.1145/3198470},
  timestamp  = {Mon, 26 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/cacm/GroszS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/finr/OssmyHMHSA18,
  author     = {Ori Ossmy and Justine E. Hoch and Patrick MacAlpine and Shohan Hasan and Peter Stone and Karen E. Adolph},
  title      = {Variety Wins: Soccer-Playing Robots and Infant Walking},
  journal    = {Frontiers Neurorobotics},
  volume     = {12},
  pages      = {19},
  year       = {2018},
  url        = {https://doi.org/10.3389/fnbot.2018.00019},
  doi        = {10.3389/FNBOT.2018.00019},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/finr/OssmyHMHSA18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI-18 workshop paper (AAAI Technical Report WS-18).
% booktitle: the duplicated article "of the The" is reduced to "of the".
@inproceedings{DBLP:conf/aaai/LiebmanZS18,
  author     = {Elad Liebman and Eric Zavesky and Peter Stone},
  title      = {Autonomous Model Management via Reinforcement Learning},
  booktitle  = {The Workshops of the Thirty-Second {AAAI} Conference on Artificial Intelligence, New Orleans, Louisiana, USA, February 2-7, 2018},
  series     = {{AAAI} Technical Report},
  volume     = {{WS-18}},
  pages      = {348--355},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://aaai.org/ocs/index.php/WS/AAAIW18/paper/view/17099},
  timestamp  = {Mon, 04 Sep 2023 16:46:41 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/LiebmanZS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI-18 workshop paper (AAAI Technical Report WS-18).
% booktitle: the duplicated article "of the The" is reduced to "of the".
@inproceedings{DBLP:conf/aaai/JiangWS18,
  author     = {Yu{-}Sian Jiang and Garrett Warnell and Peter Stone},
  title      = {{DIPD:} Gaze-Based Intention Inference in Dynamic Environments},
  booktitle  = {The Workshops of the Thirty-Second {AAAI} Conference on Artificial Intelligence, New Orleans, Louisiana, USA, February 2-7, 2018},
  series     = {{AAAI} Technical Report},
  volume     = {{WS-18}},
  pages      = {614--621},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://aaai.org/ocs/index.php/WS/AAAIW18/paper/view/17353},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/JiangWS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI-18 main-track paper. The mixed-case acronym that opens the title is
% braced so sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/aaai/ChenASHSMS18,
  author     = {Haipeng Chen and Bo An and Guni Sharon and Josiah P. Hanna and Peter Stone and Chunyan Miao and Yeng Chai Soh},
  editor     = {Sheila A. McIlraith and Kilian Q. Weinberger},
  title      = {{DyETC:} Dynamic Electronic Toll Collection for Traffic Congestion Alleviation},
  booktitle  = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence, (AAAI-18), the 30th innovative Applications of Artificial Intelligence (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February 2-7, 2018},
  pages      = {757--765},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://doi.org/10.1609/aaai.v32i1.11337},
  doi        = {10.1609/AAAI.V32I1.11337},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/ChenASHSMS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SharonARBS18,
  author     = {Guni Sharon and Michael Albert and Tarun Rambha and Stephen D. Boyles and Peter Stone},
  editor     = {Sheila A. McIlraith and Kilian Q. Weinberger},
  title      = {Traffic Optimization for a Mixture of Self-Interested and Compliant Agents},
  booktitle  = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence, (AAAI-18), the 30th innovative Applications of Artificial Intelligence (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February 2-7, 2018},
  pages      = {1202--1209},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://doi.org/10.1609/aaai.v32i1.11444},
  doi        = {10.1609/AAAI.V32I1.11444},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/SharonARBS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/WarnellWLS18,
  author     = {Garrett Warnell and Nicholas R. Waytowich and Vernon Lawhern and Peter Stone},
  editor     = {Sheila A. McIlraith and Kilian Q. Weinberger},
  title      = {Deep {TAMER:} Interactive Agent Shaping in High-Dimensional State Spaces},
  booktitle  = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence, (AAAI-18), the 30th innovative Applications of Artificial Intelligence (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February 2-7, 2018},
  pages      = {1545--1554},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://doi.org/10.1609/aaai.v32i1.11485},
  doi        = {10.1609/AAAI.V32I1.11485},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/WarnellWLS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/ThomasonSMS18,
  author     = {Jesse Thomason and Jivko Sinapov and Raymond J. Mooney and Peter Stone},
  editor     = {Sheila A. McIlraith and Kilian Q. Weinberger},
  title      = {Guiding Exploratory Behaviors for Multi-Modal Grounding of Linguistic Descriptions},
  booktitle  = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence, (AAAI-18), the 30th innovative Applications of Artificial Intelligence (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February 2-7, 2018},
  pages      = {5520--5527},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://doi.org/10.1609/aaai.v32i1.11966},
  doi        = {10.1609/AAAI.V32I1.11966},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/ThomasonSMS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/DurugkarS18,
  author     = {Ishan Durugkar and Peter Stone},
  editor     = {Sheila A. McIlraith and Kilian Q. Weinberger},
  title      = {Adversarial Goal Generation for Intrinsic Motivation},
  booktitle  = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence, (AAAI-18), the 30th innovative Applications of Artificial Intelligence (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February 2-7, 2018},
  pages      = {8073--8074},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://doi.org/10.1609/aaai.v32i1.12195},
  doi        = {10.1609/AAAI.V32I1.12195},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/DurugkarS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/AmiriWZSTS18,
  author     = {Saeid Amiri and Suhua Wei and Shiqi Zhang and Jivko Sinapov and Jesse Thomason and Peter Stone},
  title      = {Robot Behavioral Exploration and Multi-modal Perception using Dynamically Constructed Controllers},
  booktitle  = {2018 {AAAI} Spring Symposia, Stanford University, Palo Alto, California, USA, March 26-28, 2018},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://aaai.org/ocs/index.php/SSS/SSS18/paper/view/17581},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaaiss/AmiriWZSTS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/HannaS18,
  author     = {Josiah P. Hanna and Peter Stone},
  title      = {Towards a Data Efficient Off-Policy Policy Gradient},
  booktitle  = {2018 {AAAI} Spring Symposia, Stanford University, Palo Alto, California, USA, March 26-28, 2018},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://aaai.org/ocs/index.php/SSS/SSS18/paper/view/17578},
  timestamp  = {Tue, 08 Jan 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/aaaiss/HannaS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/MenasheS18,
  author     = {Jacob Menashe and Peter Stone},
  title      = {State Abstraction Synthesis for Discrete Models of Continuous Domains},
  booktitle  = {2018 {AAAI} Spring Symposia, Stanford University, Palo Alto, California, USA, March 26-28, 2018},
  publisher  = {{AAAI} Press},
  year       = {2018},
  url        = {https://aaai.org/ocs/index.php/SSS/SSS18/paper/view/17576},
  timestamp  = {Tue, 08 Jan 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/aaaiss/MenasheS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/LoZS18,
  author     = {Shih{-}Yun Lo and Shiqi Zhang and Peter Stone},
  editor     = {Elisabeth Andr{\'{e}} and Sven Koenig and Mehdi Dastani and Gita Sukthankar},
  title      = {{PETLON:} Planning Efficiently for Task-Level-Optimal Navigation},
  booktitle  = {Proceedings of the 17th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2018, Stockholm, Sweden, July 10-15, 2018},
  pages      = {220--228},
  publisher  = {International Foundation for Autonomous Agents and Multiagent Systems Richland, SC, {USA} / {ACM}},
  year       = {2018},
  url        = {http://dl.acm.org/citation.cfm?id=3237422},
  timestamp  = {Sat, 30 Sep 2023 09:34:53 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/LoZS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/LiebmanZS18,
  author     = {Elad Liebman and Eric Zavesky and Peter Stone},
  editor     = {Elisabeth Andr{\'{e}} and Sven Koenig and Mehdi Dastani and Gita Sukthankar},
  title      = {A Stitch in Time - Autonomous Model Management via Reinforcement Learning},
  booktitle  = {Proceedings of the 17th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2018, Stockholm, Sweden, July 10-15, 2018},
  pages      = {990--998},
  publisher  = {International Foundation for Autonomous Agents and Multiagent Systems Richland, SC, {USA} / {ACM}},
  year       = {2018},
  url        = {http://dl.acm.org/citation.cfm?id=3237846},
  timestamp  = {Mon, 16 Jul 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/LiebmanZS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MirzaeiSBGS18,
  author     = {Hamid Mirzaei and Guni Sharon and Stephen D. Boyles and Tony Givargis and Peter Stone},
  editor     = {Elisabeth Andr{\'{e}} and Sven Koenig and Mehdi Dastani and Gita Sukthankar},
  title      = {Link-based Parameterized Micro-tolling Scheme for Optimal Traffic Management},
  booktitle  = {Proceedings of the 17th International Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2018, Stockholm, Sweden, July 10-15, 2018},
  pages      = {2013--2015},
  publisher  = {International Foundation for Autonomous Agents and Multiagent Systems Richland, SC, {USA} / {ACM}},
  year       = {2018},
  url        = {http://dl.acm.org/citation.cfm?id=3238055},
  timestamp  = {Mon, 16 Jul 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/MirzaeiSBGS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/PadmakumarSM18,
  author     = {Aishwarya Padmakumar and Peter Stone and Raymond J. Mooney},
  editor     = {Ellen Riloff and David Chiang and Julia Hockenmaier and Jun'ichi Tsujii},
  title      = {Learning a Policy for Opportunistic Active Learning},
  booktitle  = {Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages      = {1347--1357},
  publisher  = {Association for Computational Linguistics},
  year       = {2018},
  url        = {https://doi.org/10.18653/v1/d18-1165},
  doi        = {10.18653/V1/D18-1165},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/PadmakumarSM18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icmi/JiangWS18,
  author     = {Yu{-}Sian Jiang and Garrett Warnell and Peter Stone},
  editor     = {Sidney K. D'Mello and Panayiotis G. Georgiou and Stefan Scherer and Emily Mower Provost and Mohammad Soleymani and Marcelo Worsley},
  title      = {Inferring User Intention using Gaze in Vehicles},
  booktitle  = {Proceedings of the 2018 on International Conference on Multimodal Interaction, {ICMI} 2018, Boulder, CO, USA, October 16-20, 2018},
  pages      = {298--306},
  publisher  = {{ACM}},
  year       = {2018},
  url        = {https://doi.org/10.1145/3242969.3243018},
  doi        = {10.1145/3242969.3243018},
  timestamp  = {Tue, 15 Oct 2019 08:40:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icmi/JiangWS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/AmiriWZSTS18,
  author     = {Saeid Amiri and Suhua Wei and Shiqi Zhang and Jivko Sinapov and Jesse Thomason and Peter Stone},
  editor     = {J{\'{e}}r{\^{o}}me Lang},
  title      = {Multi-modal Predicate Identification using Dynamically Learned Robot Controllers},
  booktitle  = {Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence, {IJCAI} 2018, July 13-19, 2018, Stockholm, Sweden},
  pages      = {4638--4645},
  publisher  = {ijcai.org},
  year       = {2018},
  url        = {https://doi.org/10.24963/ijcai.2018/645},
  doi        = {10.24963/IJCAI.2018/645},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/AmiriWZSTS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/TorabiWS18,
  author     = {Faraz Torabi and Garrett Warnell and Peter Stone},
  editor     = {J{\'{e}}r{\^{o}}me Lang},
  title      = {Behavioral Cloning from Observation},
  booktitle  = {Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence, {IJCAI} 2018, July 13-19, 2018, Stockholm, Sweden},
  pages      = {4950--4957},
  publisher  = {ijcai.org},
  year       = {2018},
  url        = {https://doi.org/10.24963/ijcai.2018/687},
  doi        = {10.24963/IJCAI.2018/687},
  timestamp  = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/TorabiWS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/HartSKWBJS18,
  author     = {Justin W. Hart and Rishi Shah and Sean Kirmani and Nick Walker and Kathryn Baldauf and Nathan John and Peter Stone},
  title      = {{PRISM:} Pose Registration for Integrated Semantic Mapping},
  booktitle  = {2018 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2018, Madrid, Spain, October 1-5, 2018},
  pages      = {896--902},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.1109/IROS.2018.8593681},
  doi        = {10.1109/IROS.2018.8593681},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/iros/HartSKWBJS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isaim/BuiniSBGS18,
  author     = {Hamid Mirzaei Buini and Guni Sharon and Stephen D. Boyles and Tony Givargis and Peter Stone},
  title      = {Enhanced Delta-tolling: Traffic Optimization via Policy Gradient Reinforcement Learning},
  booktitle  = {International Symposium on Artificial Intelligence and Mathematics, {ISAIM} 2018, Fort Lauderdale, Florida, USA, January 3-5, 2018},
  year       = {2018},
  url        = {https://isaim2018.cs.ou.edu/papers/ISAIM2018\_Traffic\_Buini\_etal.pdf},
  timestamp  = {Wed, 20 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/isaim/BuiniSBGS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isaim/SharonARBS18,
  author     = {Guni Sharon and Michael Albert and Tarun Rambha and Stephen D. Boyles and Peter Stone},
  title      = {Traffic Optimization For a Mixture of Self-interested and Compliant Agents},
  booktitle  = {International Symposium on Artificial Intelligence and Mathematics, {ISAIM} 2018, Fort Lauderdale, Florida, USA, January 3-5, 2018},
  year       = {2018},
  url        = {https://isaim2018.cs.ou.edu/papers/ISAIM2018\_Traffic\_Sharon\_etal.pdf},
  timestamp  = {Wed, 20 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/isaim/SharonARBS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/LiebmanWS18,
  author     = {Elad Liebman and Corey N. White and Peter Stone},
  editor     = {Emilia G{\'{o}}mez and Xiao Hu and Eric Humphrey and Emmanouil Benetos},
  title      = {On the Impact of Music on Decision Making in Cooperative Tasks},
  booktitle  = {Proceedings of the 19th International Society for Music Information Retrieval Conference, {ISMIR} 2018, Paris, France, September 23-27, 2018},
  pages      = {695--701},
  year       = {2018},
  url        = {http://ismir2018.ircam.fr/doc/pdfs/298\_Paper.pdf},
  timestamp  = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ismir/LiebmanWS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/itsc/MirzaeiSBGS18,
  author     = {Hamid Mirzaei and Guni Sharon and Stephen D. Boyles and Tony Givargis and Peter Stone},
  editor     = {Wei{-}Bin Zhang and Alexandre M. Bayen and Javier J. S{\'{a}}nchez Medina and Matthew J. Barth},
  title      = {Enhanced Delta-tolling: Traffic Optimization via Policy Gradient Reinforcement Learning},
  booktitle  = {21st International Conference on Intelligent Transportation Systems, {ITSC} 2018, Maui, HI, USA, November 4-7, 2018},
  pages      = {47--52},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.1109/ITSC.2018.8569737},
  doi        = {10.1109/ITSC.2018.8569737},
  timestamp  = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl     = {https://dblp.org/rec/conf/itsc/MirzaeiSBGS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ro-man/FernandezJKHSS18,
  author     = {Rolando Fernandez and Nathan John and Sean Kirmani and Justin W. Hart and Jivko Sinapov and Peter Stone},
  title      = {Passive Demonstrations of Light-Based Robot Signals for Improved Human Interpretability},
  booktitle  = {27th {IEEE} International Symposium on Robot and Human Interactive Communication, {RO-MAN} 2018, Nanjing, China, August 27-31, 2018},
  pages      = {234--239},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.1109/ROMAN.2018.8525728},
  doi        = {10.1109/ROMAN.2018.8525728},
  timestamp  = {Wed, 16 Oct 2019 14:14:50 +0200},
  biburl     = {https://dblp.org/rec/conf/ro-man/FernandezJKHSS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ro-man/JiangWMS18,
  author     = {Yu{-}Sian Jiang and Garrett Warnell and Eduardo Munera and Peter Stone},
  title      = {A Study of Human-Robot Copilot Systems for En-route Destination Changing},
  booktitle  = {27th {IEEE} International Symposium on Robot and Human Interactive Communication, {RO-MAN} 2018, Nanjing, China, August 27-31, 2018},
  pages      = {997--1004},
  publisher  = {{IEEE}},
  year       = {2018},
  url        = {https://doi.org/10.1109/ROMAN.2018.8525701},
  doi        = {10.1109/ROMAN.2018.8525701},
  timestamp  = {Tue, 13 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ro-man/JiangWMS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% RoboCup 2018 champion paper (LNCS 11374). Proper nouns in the title are
% braced so sentence-casing bibliography styles keep their capitalisation.
@inproceedings{DBLP:conf/robocup/MacAlpineTPSS18,
  author     = {Patrick MacAlpine and Faraz Torabi and Brahma S. Pavse and John Sigmon and Peter Stone},
  editor     = {Dirk Holz and Katie Genter and Maarouf Saad and Oskar von Stryk},
  title      = {{UT} {Austin} {Villa}: {RoboCup} 2018 {3D} Simulation League Champions},
  booktitle  = {RoboCup 2018: Robot World Cup {XXII} [Montreal, QC, Canada, June 18-22, 2018]},
  series     = {Lecture Notes in Computer Science},
  volume     = {11374},
  pages      = {462--475},
  publisher  = {Springer},
  year       = {2018},
  url        = {https://doi.org/10.1007/978-3-030-27544-0\_38},
  doi        = {10.1007/978-3-030-27544-0\_38},
  timestamp  = {Tue, 06 Aug 2019 14:04:46 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/MacAlpineTPSS18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (1804.08229). The acronyms in the title are braced so
% sentence-casing bibliography styles do not lowercase them.
@article{DBLP:journals/corr/abs-1804-08229,
  author     = {Yuqian Jiang and Shiqi Zhang and Piyush Khandelwal and Peter Stone},
  title      = {An Empirical Comparison of {PDDL}-based and {ASP}-based Task Planners},
  journal    = {CoRR},
  volume     = {abs/1804.08229},
  year       = {2018},
  url        = {http://arxiv.org/abs/1804.08229},
  eprinttype = {arXiv},
  eprint     = {1804.08229},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1804-08229.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1805-01954,
  author     = {Faraz Torabi and Garrett Warnell and Peter Stone},
  title      = {Behavioral Cloning from Observation},
  journal    = {CoRR},
  volume     = {abs/1805.01954},
  year       = {2018},
  url        = {http://arxiv.org/abs/1805.01954},
  eprinttype = {arXiv},
  eprint     = {1805.01954},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1805-01954.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-01347,
  author     = {Josiah Hanna and Scott Niekum and Peter Stone},
  title      = {Importance Sampling Policy Evaluation with an Estimated Behavior Policy},
  journal    = {CoRR},
  volume     = {abs/1806.01347},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.01347},
  eprinttype = {arXiv},
  eprint     = {1806.01347},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-01347.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1807-06158,
  author     = {Faraz Torabi and Garrett Warnell and Peter Stone},
  title      = {Generative Adversarial Imitation from Observation},
  journal    = {CoRR},
  volume     = {abs/1807.06158},
  year       = {2018},
  url        = {http://arxiv.org/abs/1807.06158},
  eprinttype = {arXiv},
  eprint     = {1807.06158},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1807-06158.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1808-07899,
  author     = {Barbara J. Grosz and Peter Stone},
  title      = {A Century Long Commitment to Assessing Artificial Intelligence and its Impact on Society},
  journal    = {CoRR},
  volume     = {abs/1808.07899},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.07899},
  eprinttype = {arXiv},
  eprint     = {1808.07899},
  timestamp  = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-07899.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1808-10009,
  author     = {Aishwarya Padmakumar and Peter Stone and Raymond J. Mooney},
  title      = {Learning a Policy for Opportunistic Active Learning},
  journal    = {CoRR},
  volume     = {abs/1808.10009},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.10009},
  eprinttype = {arXiv},
  eprint     = {1808.10009},
  timestamp  = {Mon, 03 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-10009.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1809-05676,
  author     = {Prabhat Nagarajan and Garrett Warnell and Peter Stone},
  title      = {Deterministic Implementations for Reproducibility in Deep Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1809.05676},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.05676},
  eprinttype = {arXiv},
  eprint     = {1809.05676},
  timestamp  = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-05676.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1809-07880,
  author     = {Shani Alkoby and Avilash Rath and Peter Stone},
  title      = {Ad hoc Teamwork and Moral Feedback as a Framework for Safe Agent Behavior},
  journal    = {CoRR},
  volume     = {abs/1809.07880},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.07880},
  eprinttype = {arXiv},
  eprint     = {1809.07880},
  timestamp  = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-07880.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1809-08793,
  author     = {Minkyu Kim and Miguel Arduengo and Nick Walker and Yuqian Jiang and Justin W. Hart and Peter Stone and Luis Sentis},
  title      = {An Architecture for Person-Following using Active Target Search},
  journal    = {CoRR},
  volume     = {abs/1809.08793},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.08793},
  eprinttype = {arXiv},
  eprint     = {1809.08793},
  timestamp  = {Mon, 25 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-08793.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1809-11074,
  author     = {Keting Lu and Shiqi Zhang and Peter Stone and Xiaoping Chen},
  title      = {Robot Representing and Reasoning with Knowledge from Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1809.11074},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.11074},
  eprinttype = {arXiv},
  eprint     = {1809.11074},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-11074.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the mixed-case competition name is braced so sentence-casing styles
% keep its capitals.
@article{DBLP:journals/corr/abs-1810-02919,
  author     = {Justin W. Hart and Harel Yedidsion and Yuqian Jiang and Nick Walker and Rishi Shah and Jesse Thomason and Aishwarya Padmakumar and Rolando Fernandez and Jivko Sinapov and Raymond J. Mooney and Peter Stone},
  title      = {Interaction and Autonomy in {RoboCup@Home} and Building-Wide Intelligence},
  journal    = {CoRR},
  volume     = {abs/1810.02919},
  year       = {2018},
  url        = {http://arxiv.org/abs/1810.02919},
  eprinttype = {arXiv},
  eprint     = {1810.02919},
  timestamp  = {Mon, 25 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-02919.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1811-03563,
  author     = {Yuqian Jiang and Nick Walker and Minkyu Kim and Nicolas Brissonneau and Daniel S. Brown and Justin W. Hart and Scott Niekum and Luis Sentis and Peter Stone},
  title      = {{LAAIR:} {A} Layered Architecture for Autonomous Interactive Robots},
  journal    = {CoRR},
  volume     = {abs/1811.03563},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.03563},
  eprinttype = {arXiv},
  eprint     = {1811.03563},
  timestamp  = {Mon, 25 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-03563.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1811-08955,
  author     = {Yuqian Jiang and Fangkai Yang and Shiqi Zhang and Peter Stone},
  title      = {Integrating Task-Motion Planning with Reinforcement Learning for Robust Decision Making in Mobile Robots},
  journal    = {CoRR},
  volume     = {abs/1811.08955},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.08955},
  eprinttype = {arXiv},
  eprint     = {1811.08955},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-08955.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1812-00285,
  author     = {Sanmit Narvekar and Peter Stone},
  title      = {Learning Curriculum Policies for Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1812.00285},
  year       = {2018},
  url        = {http://arxiv.org/abs/1812.00285},
  eprinttype = {arXiv},
  eprint     = {1812.00285},
  timestamp  = {Tue, 01 Jan 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1812-00285.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1812-09521,
  author     = {Jacob Menashe and Peter Stone},
  title      = {Escape Room: {A} Configurable Testbed for Hierarchical Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1812.09521},
  year       = {2018},
  url        = {http://arxiv.org/abs/1812.09521},
  eprinttype = {arXiv},
  eprint     = {1812.09521},
  timestamp  = {Wed, 02 Jan 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1812-09521.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/aamas/AlbrechtLS17,
  author     = {Stefano V. Albrecht and Somchaya Liemhetcharat and Peter Stone},
  title      = {Special issue on multiagent interaction without prior coordination: guest editorial},
  journal    = {Auton. Agents Multi Agent Syst.},
  volume     = {31},
  number     = {4},
  pages      = {765--766},
  year       = {2017},
  url        = {https://doi.org/10.1007/s10458-016-9358-0},
  doi        = {10.1007/S10458-016-9358-0},
  timestamp  = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/aamas/AlbrechtLS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: "RoboCup" is braced so sentence-casing styles keep its capitals.
% Journal article; DBLP:conf/atal/GenterLS17 is a separate 2-page conference
% record with nearly the same title, so both are kept.
@article{DBLP:journals/aamas/GenterLS17,
  author     = {Katie Genter and Tim Laue and Peter Stone},
  title      = {Three years of the {RoboCup} standard platform league drop-in player competition - Creating and maintaining a large scale ad hoc teamwork robotics competition},
  journal    = {Auton. Agents Multi Agent Syst.},
  volume     = {31},
  number     = {4},
  pages      = {790--820},
  year       = {2017},
  url        = {https://doi.org/10.1007/s10458-016-9353-5},
  doi        = {10.1007/S10458-016-9353-5},
  timestamp  = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/aamas/GenterLS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ai/BarrettRKS17,
  author     = {Samuel Barrett and Avi Rosenfeld and Sarit Kraus and Peter Stone},
  title      = {Making friends on the fly: Cooperating with new teammates},
  journal    = {Artif. Intell.},
  volume     = {242},
  pages      = {132--171},
  year       = {2017},
  url        = {https://doi.org/10.1016/j.artint.2016.10.005},
  doi        = {10.1016/J.ARTINT.2016.10.005},
  timestamp  = {Thu, 28 Dec 2017 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ai/BarrettRKS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ai/HesterS17,
  author     = {Todd Hester and Peter Stone},
  title      = {Intrinsically motivated model learning for developing curious robots},
  journal    = {Artif. Intell.},
  volume     = {247},
  pages      = {170--186},
  year       = {2017},
  url        = {https://doi.org/10.1016/j.artint.2015.05.002},
  doi        = {10.1016/J.ARTINT.2015.05.002},
  timestamp  = {Fri, 28 Apr 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ai/HesterS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/expert/AuBDS17,
  author     = {Tsz{-}Chiu Au and Bikramjit Banerjee and Prithviraj Dasgupta and Peter Stone},
  title      = {Multirobot Systems},
  journal    = {{IEEE} Intell. Syst.},
  volume     = {32},
  number     = {6},
  pages      = {3--5},
  year       = {2017},
  url        = {https://doi.org/10.1109/MIS.2017.4531221},
  doi        = {10.1109/MIS.2017.4531221},
  timestamp  = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/expert/AuBDS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the mixed-case name "BWIBots" is braced; as the first word only its
% initial letter would otherwise survive sentence-casing styles.
@article{DBLP:journals/ijrr/KhandelwalZSLTY17,
  author     = {Piyush Khandelwal and Shiqi Zhang and Jivko Sinapov and Matteo Leonetti and Jesse Thomason and Fangkai Yang and Ilaria Gori and Maxwell Svetlik and Priyanka Khante and Vladimir Lifschitz and J. K. Aggarwal and Raymond J. Mooney and Peter Stone},
  title      = {{BWIBots}: {A} platform for bridging the gap between {AI} and human-robot interaction research},
  journal    = {Int. J. Robotics Res.},
  volume     = {36},
  number     = {5-7},
  pages      = {635--659},
  year       = {2017},
  url        = {https://doi.org/10.1177/0278364916688949},
  doi        = {10.1177/0278364916688949},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ijrr/KhandelwalZSLTY17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tnn/HausknechtLMS17,
  author     = {Matthew J. Hausknecht and Wen{-}Ke Li and Michael D. Mauk and Peter Stone},
  title      = {Machine Learning Capabilities of a Simulated Cerebellum},
  journal    = {{IEEE} Trans. Neural Networks Learn. Syst.},
  volume     = {28},
  number     = {3},
  pages      = {510--522},
  year       = {2017},
  url        = {https://doi.org/10.1109/TNNLS.2015.2512838},
  doi        = {10.1109/TNNLS.2015.2512838},
  timestamp  = {Mon, 09 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/tnn/HausknechtLMS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/AlbertCS17,
  author     = {Michael Albert and Vincent Conitzer and Peter Stone},
  editor     = {Satinder Singh and Shaul Markovitch},
  title      = {Automated Design of Robust Mechanisms},
  booktitle  = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages      = {298--304},
  publisher  = {{AAAI} Press},
  year       = {2017},
  url        = {https://doi.org/10.1609/aaai.v31i1.10574},
  doi        = {10.1609/AAAI.V31I1.10574},
  timestamp  = {Mon, 04 Sep 2023 14:40:32 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/AlbertCS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/SvetlikLSSWS17,
  author     = {Maxwell Svetlik and Matteo Leonetti and Jivko Sinapov and Rishi Shah and Nick Walker and Peter Stone},
  editor     = {Satinder Singh and Shaul Markovitch},
  title      = {Automatic Curriculum Graph Generation for Reinforcement Learning Agents},
  booktitle  = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages      = {2590--2596},
  publisher  = {{AAAI} Press},
  year       = {2017},
  url        = {https://doi.org/10.1609/aaai.v31i1.10933},
  doi        = {10.1609/AAAI.V31I1.10933},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/SvetlikLSSWS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Not a duplicate: DBLP:conf/aaai/HannaS17a has the same authors, title and
% proceedings but different pages and DOI. This is the 7-page record.
@inproceedings{DBLP:conf/aaai/HannaS17,
  author     = {Josiah P. Hanna and Peter Stone},
  editor     = {Satinder Singh and Shaul Markovitch},
  title      = {Grounded Action Transformation for Robot Learning in Simulation},
  booktitle  = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages      = {3834--3840},
  publisher  = {{AAAI} Press},
  year       = {2017},
  url        = {https://doi.org/10.1609/aaai.v31i1.11044},
  doi        = {10.1609/AAAI.V31I1.11044},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/HannaS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: "(PO)MDPs" is braced so sentence-casing styles do not lowercase the
% acronym.
@inproceedings{DBLP:conf/aaai/ZhangKS17,
  author     = {Shiqi Zhang and Piyush Khandelwal and Peter Stone},
  editor     = {Satinder Singh and Shaul Markovitch},
  title      = {Dynamically Constructed {(PO)MDPs} for Adaptive Robot Planning},
  booktitle  = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages      = {3855--3863},
  publisher  = {{AAAI} Press},
  year       = {2017},
  url        = {https://doi.org/10.1609/aaai.v31i1.11042},
  doi        = {10.1609/AAAI.V31I1.11042},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/ZhangKS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the proper noun "Monte Carlo" is braced so sentence-casing styles
% keep its capitals.
% NOTE(review): the DOI id 19100 is far out of sequence with the other AAAI
% 2017 records in this file; confirm the issue part (v31i1) against doi.org.
@inproceedings{DBLP:conf/aaai/LiebmanKSS17,
  author     = {Elad Liebman and Piyush Khandelwal and Maytal Saar{-}Tsechansky and Peter Stone},
  editor     = {Satinder Singh and Shaul Markovitch},
  title      = {Designing Better Playlists with {Monte Carlo} Tree Search},
  booktitle  = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages      = {4715--4720},
  publisher  = {{AAAI} Press},
  year       = {2017},
  url        = {https://doi.org/10.1609/aaai.v31i1.19100},
  doi        = {10.1609/AAAI.V31I1.19100},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/LiebmanKSS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Not a duplicate: DBLP:conf/aaai/HannaS17 has the same authors, title and
% proceedings but different pages and DOI. This is the 2-page record.
@inproceedings{DBLP:conf/aaai/HannaS17a,
  author     = {Josiah P. Hanna and Peter Stone},
  editor     = {Satinder Singh and Shaul Markovitch},
  title      = {Grounded Action Transformation for Robot Learning in Simulation},
  booktitle  = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages      = {4931--4932},
  publisher  = {{AAAI} Press},
  year       = {2017},
  url        = {https://doi.org/10.1609/aaai.v31i1.11124},
  doi        = {10.1609/AAAI.V31I1.11124},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/HannaS17a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Not a duplicate: DBLP:conf/atal/HannaSN17 has the same authors and title
% but is a 9-page record in the AAMAS 2017 proceedings. This is the 2-page
% AAAI record.
@inproceedings{DBLP:conf/aaai/HannaSN17,
  author     = {Josiah P. Hanna and Peter Stone and Scott Niekum},
  editor     = {Satinder Singh and Shaul Markovitch},
  title      = {Bootstrapping with Models: Confidence Intervals for Off-Policy Evaluation},
  booktitle  = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  pages      = {4933--4934},
  publisher  = {{AAAI} Press},
  year       = {2017},
  url        = {https://doi.org/10.1609/aaai.v31i1.11123},
  doi        = {10.1609/AAAI.V31I1.11123},
  timestamp  = {Sat, 21 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/HannaSN17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/AlbertCS17,
  author     = {Michael Albert and Vincent Conitzer and Peter Stone},
  editor     = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title      = {Mechanism Design with Unknown Correlated Distributions: Can We Learn Optimal Mechanisms?},
  booktitle  = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages      = {69--77},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {http://dl.acm.org/citation.cfm?id=3091141},
  timestamp  = {Wed, 27 Sep 2017 07:24:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/AlbertCS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% doi/url hold the raw identifier (no LaTeX escaping of the underscore) so
% resolver links built from these verbatim fields stay valid.
@inproceedings{DBLP:conf/atal/SharonS17,
  author     = {Guni Sharon and Peter Stone},
  editor     = {Gita Sukthankar and Juan A. Rodr{\'{\i}}guez{-}Aguilar},
  title      = {A Protocol for Mixed Autonomous and Human-Operated Vehicles at Intersections},
  booktitle  = {Autonomous Agents and Multiagent Systems - {AAMAS} 2017 Workshops, Best Papers, S{\~{a}}o Paulo, Brazil, May 8-12, 2017, Revised Selected Papers},
  series     = {Lecture Notes in Computer Science},
  volume     = {10642},
  pages      = {151--167},
  publisher  = {Springer},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-3-319-71682-4_10},
  doi        = {10.1007/978-3-319-71682-4_10},
  timestamp  = {Mon, 05 Feb 2024 20:34:11 +0100},
  biburl     = {https://dblp.org/rec/conf/atal/SharonS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% doi/url hold the raw identifier (no LaTeX escaping of the underscore) so
% resolver links built from these verbatim fields stay valid.
@inproceedings{DBLP:conf/atal/MacAlpineS17,
  author     = {Patrick MacAlpine and Peter Stone},
  editor     = {Gita Sukthankar and Juan A. Rodr{\'{\i}}guez{-}Aguilar},
  title      = {Evaluating Ad Hoc Teamwork Performance in Drop-In Player Challenges},
  booktitle  = {Autonomous Agents and Multiagent Systems - {AAMAS} 2017 Workshops, Best Papers, S{\~{a}}o Paulo, Brazil, May 8-12, 2017, Revised Selected Papers},
  series     = {Lecture Notes in Computer Science},
  volume     = {10642},
  pages      = {168--186},
  publisher  = {Springer},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-3-319-71682-4_11},
  doi        = {10.1007/978-3-319-71682-4_11},
  timestamp  = {Thu, 30 Nov 2017 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/atal/MacAlpineS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/ZhangJSS17,
  author     = {Shiqi Zhang and Yuqian Jiang and Guni Sharon and Peter Stone},
  editor     = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title      = {Multirobot Symbolic Planning under Temporal Uncertainty},
  booktitle  = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages      = {501--510},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {http://dl.acm.org/citation.cfm?id=3091199},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/ZhangJSS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: "RoboCup" is braced so sentence-casing styles keep its capitals.
% 2-page conference record; DBLP:journals/aamas/GenterLS17 is the separate
% journal article with nearly the same title, so both are kept.
@inproceedings{DBLP:conf/atal/GenterLS17,
  author     = {Katie Genter and Tim Laue and Peter Stone},
  editor     = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title      = {Three Years of the {RoboCup} Standard Platform League Drop-In Player Competition: Creating and Maintaining a Large Scale Ad Hoc Teamwork Robotics Competition},
  booktitle  = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages      = {520--521},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {http://dl.acm.org/citation.cfm?id=3091201},
  timestamp  = {Thu, 14 Dec 2017 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/atal/GenterLS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Not a duplicate: DBLP:conf/aaai/HannaSN17 has the same authors and title
% but is a 2-page record in the AAAI 2017 proceedings. This is the 9-page
% AAMAS record.
@inproceedings{DBLP:conf/atal/HannaSN17,
  author     = {Josiah P. Hanna and Peter Stone and Scott Niekum},
  editor     = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title      = {Bootstrapping with Models: Confidence Intervals for Off-Policy Evaluation},
  booktitle  = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages      = {538--546},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {http://dl.acm.org/citation.cfm?id=3091205},
  timestamp  = {Thu, 11 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/HannaSN17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/AlbrechtS17,
  author     = {Stefano V. Albrecht and Peter Stone},
  editor     = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title      = {Reasoning about Hypothetical Agent Behaviours and their Parameters},
  booktitle  = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages      = {547--555},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {http://dl.acm.org/citation.cfm?id=3091206},
  timestamp  = {Thu, 11 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/AlbrechtS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/KhandelwalS17,
  author     = {Piyush Khandelwal and Peter Stone},
  editor     = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title      = {Multi-Robot Human Guidance: Human Experiments and Multiple Concurrent Requests},
  booktitle  = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages      = {1369--1377},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {http://dl.acm.org/citation.cfm?id=3091314},
  timestamp  = {Thu, 11 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/KhandelwalS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/GenterS17,
  author     = {Katie Genter and Peter Stone},
  editor     = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title      = {Agent Behaviors for Joining and Leaving a Flock},
  booktitle  = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages      = {1553--1555},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {http://dl.acm.org/citation.cfm?id=3091359},
  timestamp  = {Thu, 11 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/GenterS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/LiebmanZS17,
  author     = {Elad Liebman and Eric Zavesky and Peter Stone},
  editor     = {Kate Larson and Michael Winikoff and Sanmay Das and Edmund H. Durfee},
  title      = {Autonomous Model Management via Reinforcement Learning: Extended Abstract},
  booktitle  = {Proceedings of the 16th Conference on Autonomous Agents and MultiAgent Systems, {AAMAS} 2017, S{\~{a}}o Paulo, Brazil, May 8-12, 2017},
  pages      = {1601--1603},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {http://dl.acm.org/citation.cfm?id=3091376},
  timestamp  = {Thu, 11 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/LiebmanZS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/corl/ThomasonPSHSM17,
  author     = {Jesse Thomason and Aishwarya Padmakumar and Jivko Sinapov and Justin W. Hart and Peter Stone and Raymond J. Mooney},
  title      = {Opportunistic Active Learning for Grounding Natural Language Descriptions},
  booktitle  = {1st Annual Conference on Robot Learning, CoRL 2017, Mountain View, California, USA, November 13-15, 2017, Proceedings},
  series     = {Proceedings of Machine Learning Research},
  volume     = {78},
  pages      = {67--76},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v78/thomason17a.html},
  timestamp  = {Wed, 03 Apr 2019 18:17:24 +0200},
  biburl     = {https://dblp.org/rec/conf/corl/ThomasonPSHSM17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% doi/url hold the raw identifier (no LaTeX escaping of the underscore) so
% resolver links built from these verbatim fields stay valid.
@inproceedings{DBLP:conf/eumas/TuylsS17,
  author     = {Karl Tuyls and Peter Stone},
  editor     = {Francesco Belardinelli and Estefania Argente},
  title      = {Multiagent Learning Paradigms},
  booktitle  = {Multi-Agent Systems and Agreement Technologies - 15th European Conference, {EUMAS} 2017, and 5th International Conference, {AT} 2017, {\'{E}}vry, France, December 14-15, 2017, Revised Selected Papers},
  series     = {Lecture Notes in Computer Science},
  volume     = {10767},
  pages      = {3--21},
  publisher  = {Springer},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-3-030-01713-2_1},
  doi        = {10.1007/978-3-030-01713-2_1},
  timestamp  = {Tue, 21 Mar 2023 20:59:05 +0100},
  biburl     = {https://dblp.org/rec/conf/eumas/TuylsS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the system name "CC-Log" is braced; as the first word only its
% initial letter would otherwise survive sentence-casing styles.
% The source record carries no pages field.
@inproceedings{DBLP:conf/hotstorage/GonzalezCSS17,
  author     = {Santiago Gonzalez and Vijay Chidambaram and Jivko Sinapov and Peter Stone},
  title      = {{CC-Log}: Drastically Reducing Storage Requirements for Robots Using Classification and Compression},
  booktitle  = {9th {USENIX} Workshop on Hot Topics in Storage and File Systems, HotStorage 2017, Santa Clara, CA, USA, July 10-11, 2017},
  publisher  = {{USENIX} Association},
  year       = {2017},
  url        = {https://www.usenix.org/conference/hotstorage17/program/presentation/gonzalez},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/hotstorage/GonzalezCSS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Not a duplicate: DBLP:journals/corr/HannaTSN17 is the arXiv record with the
% same authors and title. This is the ICML 2017 proceedings record.
@inproceedings{DBLP:conf/icml/HannaTSN17,
  author     = {Josiah P. Hanna and Philip S. Thomas and Peter Stone and Scott Niekum},
  editor     = {Doina Precup and Yee Whye Teh},
  title      = {Data-Efficient Policy Evaluation Through Behavior Policy Search},
  booktitle  = {Proceedings of the 34th International Conference on Machine Learning, {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series     = {Proceedings of Machine Learning Research},
  volume     = {70},
  pages      = {1394--1403},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v70/hanna17a.html},
  timestamp  = {Wed, 29 May 2019 08:41:45 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/HannaTSN17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ijcai/NarvekarSS17,
  author     = {Sanmit Narvekar and Jivko Sinapov and Peter Stone},
  editor     = {Carles Sierra},
  title      = {Autonomous Task Sequencing for Customized Curriculum Design in Reinforcement Learning},
  booktitle  = {Proceedings of the Twenty-Sixth International Joint Conference on Artificial Intelligence, {IJCAI} 2017, Melbourne, Australia, August 19-25, 2017},
  pages      = {2536--2542},
  publisher  = {ijcai.org},
  year       = {2017},
  url        = {https://doi.org/10.24963/ijcai.2017/353},
  doi        = {10.24963/IJCAI.2017/353},
  timestamp  = {Tue, 20 Aug 2019 16:16:54 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/NarvekarSS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iros/LuZSC17,
  author     = {Dongcai Lu and Shiqi Zhang and Peter Stone and Xiaoping Chen},
  title      = {Leveraging commonsense reasoning and multimodal perception for robot spoken dialog systems},
  booktitle  = {2017 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2017, Vancouver, BC, Canada, September 24-28, 2017},
  pages      = {6582--6588},
  publisher  = {{IEEE}},
  year       = {2017},
  url        = {https://doi.org/10.1109/IROS.2017.8206570},
  doi        = {10.1109/IROS.2017.8206570},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iros/LuZSC17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: "RoboCup" is braced so sentence-casing styles keep its capitals.
% doi/url hold the raw identifier (no LaTeX escaping of the underscore) so
% resolver links stay valid.
@inproceedings{DBLP:conf/robocup/MenasheKGHLNZS17,
  author     = {Jacob Menashe and Josh Kelle and Katie Genter and Josiah Hanna and Elad Liebman and Sanmit Narvekar and Ruohan Zhang and Peter Stone},
  editor     = {Hidehisa Akiyama and Oliver Obst and Claude Sammut and Flavio Tonidandel},
  title      = {Fast and Precise Black and White Ball Detection for {RoboCup} Soccer},
  booktitle  = {RoboCup 2017: Robot World Cup {XXI} [Nagoya, Japan, July 27-31, 2017]},
  series     = {Lecture Notes in Computer Science},
  volume     = {11175},
  pages      = {45--58},
  publisher  = {Springer},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-3-030-00308-1_4},
  doi        = {10.1007/978-3-030-00308-1_4},
  timestamp  = {Wed, 25 Sep 2019 18:10:19 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/MenasheKGHLNZS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: team name, competition name and "3D" are braced so sentence-casing
% styles keep their capitals. doi/url hold the raw identifier (no LaTeX
% escaping of the underscore) so resolver links stay valid.
@inproceedings{DBLP:conf/robocup/MacAlpineS17,
  author     = {Patrick MacAlpine and Peter Stone},
  editor     = {Hidehisa Akiyama and Oliver Obst and Claude Sammut and Flavio Tonidandel},
  title      = {{UT} {Austin} {Villa}: {RoboCup} 2017 {3D} Simulation League Competition and Technical Challenges Champions},
  booktitle  = {RoboCup 2017: Robot World Cup {XXI} [Nagoya, Japan, July 27-31, 2017]},
  series     = {Lecture Notes in Computer Science},
  volume     = {11175},
  pages      = {473--485},
  publisher  = {Springer},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-3-030-00308-1_39},
  doi        = {10.1007/978-3-030-00308-1_39},
  timestamp  = {Wed, 12 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/MacAlpineS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% doi/url hold the raw identifier (no LaTeX escaping of the underscore) so
% resolver links built from these verbatim fields stay valid.
@incollection{DBLP:reference/ml/Stone17,
  author     = {Peter Stone},
  editor     = {Claude Sammut and Geoffrey I. Webb},
  title      = {Q-Learning},
  booktitle  = {Encyclopedia of Machine Learning and Data Mining},
  pages      = {1033},
  publisher  = {Springer},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-1-4899-7687-1_689},
  doi        = {10.1007/978-1-4899-7687-1_689},
  timestamp  = {Wed, 12 Jul 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/reference/ml/Stone17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% doi/url hold the raw identifier (no LaTeX escaping of the underscore) so
% resolver links built from these verbatim fields stay valid.
@incollection{DBLP:reference/ml/Stone17a,
  author     = {Peter Stone},
  editor     = {Claude Sammut and Geoffrey I. Webb},
  title      = {Reinforcement Learning},
  booktitle  = {Encyclopedia of Machine Learning and Data Mining},
  pages      = {1088--1090},
  publisher  = {Springer},
  year       = {2017},
  url        = {https://doi.org/10.1007/978-1-4899-7687-1_720},
  doi        = {10.1007/978-1-4899-7687-1_720},
  timestamp  = {Wed, 12 Jul 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/reference/ml/Stone17a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Not a duplicate: DBLP:conf/icml/HannaTSN17 is the ICML 2017 proceedings
% record with the same authors and title. This is the arXiv record.
@article{DBLP:journals/corr/HannaTSN17,
  author     = {Josiah P. Hanna and Philip S. Thomas and Peter Stone and Scott Niekum},
  title      = {Data-Efficient Policy Evaluation Through Behavior Policy Search},
  journal    = {CoRR},
  volume     = {abs/1706.03469},
  year       = {2017},
  url        = {http://arxiv.org/abs/1706.03469},
  eprinttype = {arXiv},
  eprint     = {1706.03469},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/HannaTSN17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/MocanuMSNGL17,
  author     = {Decebal Constantin Mocanu and Elena Mocanu and Peter Stone and Phuong H. Nguyen and Madeleine Gibescu and Antonio Liotta},
  title      = {Evolutionary Training of Sparse Artificial Neural Networks: {A} Network Science Perspective},
  journal    = {CoRR},
  volume     = {abs/1707.04780},
  year       = {2017},
  url        = {http://arxiv.org/abs/1707.04780},
  eprinttype = {arXiv},
  eprint     = {1707.04780},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/MocanuMSNGL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1709-08071,
  author     = {Stefano V. Albrecht and Peter Stone},
  title      = {Autonomous Agents Modelling Other Agents: {A} Comprehensive Survey and Open Problems},
  journal    = {CoRR},
  volume     = {abs/1709.08071},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.08071},
  eprinttype = {arXiv},
  eprint     = {1709.08071},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-08071.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1709-09569,
  author     = {Guni Sharon and Michael Albert and Tarun Rambha and Stephen D. Boyles and Peter Stone},
  title      = {Traffic Optimization For a Mixture of Self-interested and Compliant Agents},
  journal    = {CoRR},
  volume     = {abs/1709.09569},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.09569},
  eprinttype = {arXiv},
  eprint     = {1709.09569},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-09569.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1709-10163,
  author     = {Garrett Warnell and Nicholas R. Waytowich and Vernon Lawhern and Peter Stone},
  title      = {Deep {TAMER:} Interactive Agent Shaping in High-Dimensional State Spaces},
  journal    = {CoRR},
  volume     = {abs/1709.10163},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.10163},
  eprinttype = {arXiv},
  eprint     = {1709.10163},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-10163.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/LeonettiIS16,
  author     = {Matteo Leonetti and Luca Iocchi and Peter Stone},
  title      = {A synthesis of automated planning and reinforcement learning for efficient, robust decision-making},
  journal    = {Artif. Intell.},
  volume     = {241},
  pages      = {103--130},
  year       = {2016},
  url        = {https://doi.org/10.1016/j.artint.2016.07.004},
  doi        = {10.1016/J.ARTINT.2016.07.004},
  timestamp  = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ai/LeonettiIS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Team name "UT Austin Villa" is braced word by word so sentence-casing styles keep its capitals.
@article{DBLP:journals/expert/GenterMMHLNZS16,
  author     = {Katie Genter and Patrick MacAlpine and Jacob Menashe and Josiah Hanna and Elad Liebman and Sanmit Narvekar and Ruohan Zhang and Peter Stone},
  title      = {{UT} {Austin} {Villa}: Project-Driven Research in {AI} and Robotics},
  journal    = {{IEEE} Intell. Syst.},
  volume     = {31},
  number     = {2},
  pages      = {94--101},
  year       = {2016},
  url        = {https://doi.org/10.1109/MIS.2016.35},
  doi        = {10.1109/MIS.2016.35},
  timestamp  = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/expert/GenterMMHLNZS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/UrieliS16,
  author     = {Daniel Urieli and Peter Stone},
  editor     = {Dale Schuurmans and Michael P. Wellman},
  title      = {Autonomous Electricity Trading Using Time-of-Use Tariffs in a Competitive Market},
  booktitle  = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence, February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages      = {345--352},
  publisher  = {{AAAI} Press},
  year       = {2016},
  url        = {https://doi.org/10.1609/aaai.v30i1.10012},
  doi        = {10.1609/AAAI.V30I1.10012},
  timestamp  = {Mon, 04 Sep 2023 15:08:28 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/UrieliS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "RoboCup" is braced so sentence-casing styles do not lower-case its inner capital.
@inproceedings{DBLP:conf/aaai/Stone16,
  author     = {Peter Stone},
  editor     = {Dale Schuurmans and Michael P. Wellman},
  title      = {What's Hot at {RoboCup}},
  booktitle  = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence, February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages      = {4346--4348},
  publisher  = {{AAAI} Press},
  year       = {2016},
  url        = {https://doi.org/10.1609/aaai.v30i1.9871},
  doi        = {10.1609/AAAI.V30I1.9871},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/Stone16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Acronym "MDP" is braced so sentence-casing styles keep it upper-case.
@inproceedings{DBLP:conf/aaai/UrieliS16a,
  author     = {Daniel Urieli and Peter Stone},
  editor     = {Enrico Pontelli and Alex Rogers and Sylvie Thi{\'{e}}baux and Tran Cao Son},
  title      = {An {MDP}-Based Winning Approach to Autonomous Power Trading: Formalization and Empirical Analysis},
  booktitle  = {{AI} for Smart Grids and Smart Buildings, Papers from the 2016 {AAAI} Workshop, Phoenix, Arizona, USA, February 12, 2016},
  series     = {{AAAI} Technical Report},
  volume     = {{WS-16-04}},
  publisher  = {{AAAI} Press},
  year       = {2016},
  url        = {http://www.aaai.org/ocs/index.php/WS/AAAIW16/paper/view/12641},
  timestamp  = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/UrieliS16a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/Stone16,
  author     = {Peter Stone},
  editor     = {Catholijn M. Jonker and Stacy Marsella and John Thangarajah and Karl Tuyls},
  title      = {Autonomous Learning Agents: Layered Learning and Ad Hoc Teamwork},
  booktitle  = {Proceedings of the 2016 International Conference on Autonomous Agents {\&} Multiagent Systems, Singapore, May 9-13, 2016},
  pages      = {2},
  publisher  = {{ACM}},
  year       = {2016},
  url        = {http://dl.acm.org/citation.cfm?id=2936927},
  timestamp  = {Fri, 20 May 2016 20:33:29 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/Stone16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/NarvekarSLS16,
  author     = {Sanmit Narvekar and Jivko Sinapov and Matteo Leonetti and Peter Stone},
  editor     = {Catholijn M. Jonker and Stacy Marsella and John Thangarajah and Karl Tuyls},
  title      = {Source Task Creation for Curriculum Learning},
  booktitle  = {Proceedings of the 2016 International Conference on Autonomous Agents {\&} Multiagent Systems, Singapore, May 9-13, 2016},
  pages      = {566--574},
  publisher  = {{ACM}},
  year       = {2016},
  url        = {http://dl.acm.org/citation.cfm?id=2937007},
  timestamp  = {Fri, 20 May 2016 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/NarvekarSLS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterS16,
  author     = {Katie Genter and Peter Stone},
  editor     = {Catholijn M. Jonker and Stacy Marsella and John Thangarajah and Karl Tuyls},
  title      = {Adding Influencing Agents to a Flock},
  booktitle  = {Proceedings of the 2016 International Conference on Autonomous Agents {\&} Multiagent Systems, Singapore, May 9-13, 2016},
  pages      = {615--623},
  publisher  = {{ACM}},
  year       = {2016},
  url        = {http://dl.acm.org/citation.cfm?id=2937015},
  timestamp  = {Fri, 20 May 2016 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/GenterS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Acronym "MDP" is braced so sentence-casing styles keep it upper-case.
@inproceedings{DBLP:conf/atal/UrieliS16,
  author     = {Daniel Urieli and Peter Stone},
  editor     = {Catholijn M. Jonker and Stacy Marsella and John Thangarajah and Karl Tuyls},
  title      = {An {MDP}-Based Winning Approach to Autonomous Power Trading: Formalization and Empirical Analysis},
  booktitle  = {Proceedings of the 2016 International Conference on Autonomous Agents {\&} Multiagent Systems, Singapore, May 9-13, 2016},
  pages      = {827--835},
  publisher  = {{ACM}},
  year       = {2016},
  url        = {http://dl.acm.org/citation.cfm?id=2937045},
  timestamp  = {Fri, 20 May 2016 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/UrieliS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/MacAlpineLS16,
  author     = {Patrick MacAlpine and Elad Liebman and Peter Stone},
  editor     = {Tobias Friedrich and Frank Neumann and Andrew M. Sutton},
  title      = {Adaptation of Surrogate Tasks for Bipedal Walk Optimization},
  booktitle  = {Genetic and Evolutionary Computation Conference, {GECCO} 2016, Denver, CO, USA, July 20-24, 2016, Companion Material Proceedings},
  pages      = {1275--1276},
  publisher  = {{ACM}},
  year       = {2016},
  url        = {https://doi.org/10.1145/2908961.2931712},
  doi        = {10.1145/2908961.2931712},
  timestamp  = {Tue, 06 Nov 2018 11:06:40 +0100},
  biburl     = {https://dblp.org/rec/conf/gecco/MacAlpineLS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/humanoids/KimJSS16,
  author     = {Donghyun Kim and Steven Jens Jorgensen and Peter Stone and Luis Sentis},
  title      = {Dynamic behaviors on the {NAO} robot with closed-loop whole body operational space control},
  booktitle  = {16th {IEEE-RAS} International Conference on Humanoid Robots, Humanoids 2016, Cancun, Mexico, November 15-17, 2016},
  pages      = {1121--1128},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/HUMANOIDS.2016.7803411},
  doi        = {10.1109/HUMANOIDS.2016.7803411},
  timestamp  = {Wed, 16 Oct 2019 14:14:50 +0200},
  biburl     = {https://dblp.org/rec/conf/humanoids/KimJSS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Booktitle ordinal corrected from "33nd" to "33rd"; "Monte Carlo" braced to survive sentence-casing styles.
@inproceedings{DBLP:conf/icml/KhandelwalLNS16,
  author     = {Piyush Khandelwal and Elad Liebman and Scott Niekum and Peter Stone},
  editor     = {Maria{-}Florina Balcan and Kilian Q. Weinberger},
  title      = {On the Analysis of Complex Backup Strategies in {Monte} {Carlo} Tree Search},
  booktitle  = {Proceedings of the 33rd International Conference on Machine Learning, {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series     = {{JMLR} Workshop and Conference Proceedings},
  volume     = {48},
  pages      = {1319--1328},
  publisher  = {JMLR.org},
  year       = {2016},
  url        = {http://proceedings.mlr.press/v48/khandelwal16.html},
  timestamp  = {Wed, 29 May 2019 08:41:46 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/KhandelwalLNS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/SharonHRASB16,
  author     = {Guni Sharon and Josiah Hanna and Tarun Rambha and Michael Albert and Peter Stone and Stephen D. Boyles},
  editor     = {Ana L{\'{u}}cia C. Bazzan and Franziska Kl{\"{u}}gl and Sascha Ossowski and Giuseppe Vizzari},
  title      = {Delta-Tolling: Adaptive Tolling for Optimizing Traffic Throughput},
  booktitle  = {Proceedings of the Ninth International Workshop on Agents in Traffic and Transportation {(ATT} 2016) co-located with the 25th International Joint Conference On Artificial Intelligence {(IJCAI} 2016), New York, USA, July 10, 2016},
  series     = {{CEUR} Workshop Proceedings},
  volume     = {1678},
  publisher  = {CEUR-WS.org},
  year       = {2016},
  url        = {https://ceur-ws.org/Vol-1678/paper1.pdf},
  timestamp  = {Fri, 10 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ijcai/SharonHRASB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/SinapovKSS16,
  author     = {Jivko Sinapov and Priyanka Khante and Maxwell Svetlik and Peter Stone},
  editor     = {Subbarao Kambhampati},
  title      = {Learning to Order Objects Using Haptic and Proprioceptive Exploratory Behaviors},
  booktitle  = {Proceedings of the Twenty-Fifth International Joint Conference on Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July 2016},
  pages      = {3462--3468},
  publisher  = {{IJCAI/AAAI} Press},
  year       = {2016},
  url        = {http://www.ijcai.org/Abstract/16/489},
  timestamp  = {Tue, 20 Aug 2019 16:19:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/SinapovKSS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Straight ASCII quotes around the game name replaced by a braced LaTeX quote pair, which also keeps "I Spy" capitalised.
@inproceedings{DBLP:conf/ijcai/ThomasonSSSM16,
  author     = {Jesse Thomason and Jivko Sinapov and Maxwell Svetlik and Peter Stone and Raymond J. Mooney},
  editor     = {Subbarao Kambhampati},
  title      = {Learning Multi-Modal Grounded Linguistic Semantics by Playing {``I Spy''}},
  booktitle  = {Proceedings of the Twenty-Fifth International Joint Conference on Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July 2016},
  pages      = {3477--3483},
  publisher  = {{IJCAI/AAAI} Press},
  year       = {2016},
  url        = {http://www.ijcai.org/Abstract/16/491},
  timestamp  = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/ThomasonSSSM16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/ZhangLCS16,
  author     = {Shiqi Zhang and Dongcai Lu and Xiaoping Chen and Peter Stone},
  editor     = {Subbarao Kambhampati},
  title      = {Robot Scavenger Hunt: {A} Standardized Framework for Evaluating Intelligent Mobile Robots},
  booktitle  = {Proceedings of the Twenty-Fifth International Joint Conference on Artificial Intelligence, {IJCAI} 2016, New York, NY, USA, 9-15 July 2016},
  pages      = {4276--4277},
  publisher  = {{IJCAI/AAAI} Press},
  year       = {2016},
  url        = {http://www.ijcai.org/Abstract/16/658},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/ZhangLCS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/LiebmanSW16,
  author     = {Elad Liebman and Peter Stone and Corey N. White},
  editor     = {Michael I. Mandel and Johanna Devaney and Douglas Turnbull and George Tzanetakis},
  title      = {Impact of Music on Decision Making in Quantitative Tasks},
  booktitle  = {Proceedings of the 17th International Society for Music Information Retrieval Conference, {ISMIR} 2016, New York City, United States, August 7-11, 2016},
  pages      = {661--667},
  year       = {2016},
  url        = {https://wp.nyu.edu/ismir2016/wp-content/uploads/sites/2294/2016/07/272\_Paper.pdf},
  timestamp  = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ismir/LiebmanSW16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Team name, "RoboCup" and "3D" are braced so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/robocup/MacAlpineS16,
  author     = {Patrick MacAlpine and Peter Stone},
  editor     = {Sven Behnke and Raymond Sheh and Sanem Sariel and Daniel D. Lee},
  title      = {{UT} {Austin} {Villa} {RoboCup} {3D} Simulation Base Code Release},
  booktitle  = {RoboCup 2016: Robot World Cup {XX} [Leipzig, Germany, June 30 - July 4, 2016]},
  series     = {Lecture Notes in Computer Science},
  volume     = {9776},
  pages      = {135--143},
  publisher  = {Springer},
  year       = {2016},
  url        = {https://doi.org/10.1007/978-3-319-68792-6\_11},
  doi        = {10.1007/978-3-319-68792-6\_11},
  timestamp  = {Tue, 14 May 2019 10:00:53 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/MacAlpineS16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineS16a,
  author     = {Patrick MacAlpine and Peter Stone},
  editor     = {Sven Behnke and Raymond Sheh and Sanem Sariel and Daniel D. Lee},
  title      = {Prioritized Role Assignment for Marking},
  booktitle  = {RoboCup 2016: Robot World Cup {XX} [Leipzig, Germany, June 30 - July 4, 2016]},
  series     = {Lecture Notes in Computer Science},
  volume     = {9776},
  pages      = {306--318},
  publisher  = {Springer},
  year       = {2016},
  url        = {https://doi.org/10.1007/978-3-319-68792-6\_25},
  doi        = {10.1007/978-3-319-68792-6\_25},
  timestamp  = {Thu, 02 Nov 2017 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/robocup/MacAlpineS16a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Team name, "RoboCup" and "3D" are braced so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/robocup/MacAlpineS16b,
  author     = {Patrick MacAlpine and Peter Stone},
  editor     = {Sven Behnke and Raymond Sheh and Sanem Sariel and Daniel D. Lee},
  title      = {{UT} {Austin} {Villa}: {RoboCup} 2016 {3D} Simulation League Competition and Technical Challenges Champions},
  booktitle  = {RoboCup 2016: Robot World Cup {XX} [Leipzig, Germany, June 30 - July 4, 2016]},
  series     = {Lecture Notes in Computer Science},
  volume     = {9776},
  pages      = {515--528},
  publisher  = {Springer},
  year       = {2016},
  url        = {https://doi.org/10.1007/978-3-319-68792-6\_43},
  doi        = {10.1007/978-3-319-68792-6\_43},
  timestamp  = {Thu, 02 Nov 2017 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/robocup/MacAlpineS16b.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/HausknechtS15a,
  author     = {Matthew J. Hausknecht and Peter Stone},
  editor     = {Yoshua Bengio and Yann LeCun},
  title      = {Deep Reinforcement Learning in Parameterized Action Space},
  booktitle  = {4th International Conference on Learning Representations, {ICLR} 2016, San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year       = {2016},
  url        = {http://arxiv.org/abs/1511.04143},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/HausknechtS15a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HannaSN16,
  author     = {Josiah P. Hanna and Peter Stone and Scott Niekum},
  title      = {High Confidence Off-Policy Evaluation with Models},
  journal    = {CoRR},
  volume     = {abs/1606.06126},
  year       = {2016},
  url        = {http://arxiv.org/abs/1606.06126},
  eprinttype = {arXiv},
  eprint     = {1606.06126},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/HannaSN16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MocanuVESL16,
  author     = {Decebal Constantin Mocanu and Maria Torres Vega and Eric Eaton and Peter Stone and Antonio Liotta},
  title      = {Online Contrastive Divergence with Generative Replay: Experience Replay without Storing Data},
  journal    = {CoRR},
  volume     = {abs/1610.05555},
  year       = {2016},
  url        = {http://arxiv.org/abs/1610.05555},
  eprinttype = {arXiv},
  eprint     = {1610.05555},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/MocanuVESL16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aai/LiebmanCS15,
  author     = {Elad Liebman and Benny Chor and Peter Stone},
  title      = {Representative Selection in Nonmetric Datasets},
  journal    = {Appl. Artif. Intell.},
  volume     = {29},
  number     = {8},
  pages      = {807--838},
  year       = {2015},
  url        = {https://doi.org/10.1080/08839514.2015.1071092},
  doi        = {10.1080/08839514.2015.1071092},
  timestamp  = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/aai/LiebmanCS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/KnoxS15,
  author     = {W. Bradley Knox and Peter Stone},
  title      = {Framing reinforcement learning from human reward: Reward positivity, temporal discounting, episodicity, and performance},
  journal    = {Artif. Intell.},
  volume     = {225},
  pages      = {24--50},
  year       = {2015},
  url        = {https://doi.org/10.1016/j.artint.2015.03.009},
  doi        = {10.1016/J.ARTINT.2015.03.009},
  timestamp  = {Sat, 27 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ai/KnoxS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "Isbell, Jr., Charles L." uses the "Last, Jr, First" form: written as "Charles L. Isbell Jr."
% BibTeX takes "Jr." as the surname. "AI" in the title is braced to survive sentence-casing styles.
@article{DBLP:journals/aimatters/EatonDGGIKLRRSW15,
  author     = {Eric Eaton and Tom Dietterich and Maria L. Gini and Barbara J. Grosz and Isbell, Jr., Charles L. and Subbarao Kambhampati and Michael L. Littman and Francesca Rossi and Stuart Russell and Peter Stone and Toby Walsh and Michael J. Wooldridge},
  title      = {Who speaks for {AI}?},
  journal    = {{AI} Matters},
  volume     = {2},
  number     = {2},
  pages      = {4--14},
  year       = {2015},
  url        = {https://doi.org/10.1145/2847557.2847559},
  doi        = {10.1145/2847557.2847559},
  timestamp  = {Tue, 23 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/aimatters/EatonDGGIKLRRSW15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Place name "Australia" is braced so sentence-casing styles keep its capital.
@article{DBLP:journals/cea/HigginsMLPS15,
  author     = {Andrew J. Higgins and Stephen McFallan and Luis Laredo and Di Prestwidge and Peter Stone},
  title      = {{TRANSIT} - {A} model for simulating infrastructure and policy interventions in agriculture logistics: Application to the northern {Australia} beef industry},
  journal    = {Comput. Electron. Agric.},
  volume     = {114},
  pages      = {32--42},
  year       = {2015},
  url        = {https://doi.org/10.1016/j.compag.2015.03.018},
  doi        = {10.1016/J.COMPAG.2015.03.018},
  timestamp  = {Mon, 03 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/cea/HigginsMLPS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/ZhangS15,
  author     = {Shiqi Zhang and Peter Stone},
  editor     = {Blai Bonet and Sven Koenig},
  title      = {{CORPP:} Commonsense Reasoning and Probabilistic Planning, as Applied to Dialog with a Mobile Robot},
  booktitle  = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence, January 25-30, 2015, Austin, Texas, {USA}},
  pages      = {1394--1400},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {https://doi.org/10.1609/aaai.v29i1.9385},
  doi        = {10.1609/AAAI.V29I1.9385},
  timestamp  = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/ZhangS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/BarrettS15,
  author     = {Samuel Barrett and Peter Stone},
  editor     = {Blai Bonet and Sven Koenig},
  title      = {Cooperating with Unknown Teammates in Complex Domains: {A} Robot Soccer Case Study of Ad Hoc Teamwork},
  booktitle  = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence, January 25-30, 2015, Austin, Texas, {USA}},
  pages      = {2010--2016},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {https://doi.org/10.1609/aaai.v29i1.9428},
  doi        = {10.1609/AAAI.V29I1.9428},
  timestamp  = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/BarrettS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/MacAlpinePS15,
  author     = {Patrick MacAlpine and Eric Price and Peter Stone},
  editor     = {Blai Bonet and Sven Koenig},
  title      = {{SCRAM:} Scalable Collision-avoiding Role Assignment with Minimal-Makespan for Formational Positioning},
  booktitle  = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence, January 25-30, 2015, Austin, Texas, {USA}},
  pages      = {2096--2102},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {https://doi.org/10.1609/aaai.v29i1.9424},
  doi        = {10.1609/AAAI.V29I1.9424},
  timestamp  = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/MacAlpinePS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Team name, "RoboCup" and "3D" are braced so sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/aaai/MacAlpineDS15,
  author     = {Patrick MacAlpine and Mike Depinet and Peter Stone},
  editor     = {Blai Bonet and Sven Koenig},
  title      = {{UT} {Austin} {Villa} 2014: {RoboCup} {3D} Simulation League Champion via Overlapping Layered Learning},
  booktitle  = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence, January 25-30, 2015, Austin, Texas, {USA}},
  pages      = {2842--2848},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {https://doi.org/10.1609/aaai.v29i1.9540},
  doi        = {10.1609/AAAI.V29I1.9540},
  timestamp  = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/MacAlpineDS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/GenterS15,
  author     = {Katie Genter and Peter Stone},
  editor     = {Blai Bonet and Sven Koenig},
  title      = {Placing Influencing Agents in a Flock},
  booktitle  = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence, January 25-30, 2015, Austin, Texas, {USA}},
  pages      = {4160--4161},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {https://doi.org/10.1609/aaai.v29i1.9743},
  doi        = {10.1609/AAAI.V29I1.9743},
  timestamp  = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/GenterS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Brand name "Atari" is braced so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/aaai/HausknechtS15,
  author     = {Matthew J. Hausknecht and Peter Stone},
  editor     = {Michael Bowling and Marc G. Bellemare and Erik Talvitie and Joel Veness and Marlos C. Machado},
  title      = {The Impact of Determinism on Learning {Atari} 2600 Games},
  booktitle  = {Learning for General Competency in Video Games, Papers from the 2015 {AAAI} Workshop, Austin, Texas, USA, January 26, 2015},
  series     = {{AAAI} Technical Report},
  volume     = {{WS-15-10}},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {http://aaai.org/ocs/index.php/WS/AAAIW15/paper/view/9564},
  timestamp  = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/HausknechtS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "Q" and "MDPs" are braced so sentence-casing styles do not produce "q-learning" or "mdps".
@inproceedings{DBLP:conf/aaaifs/HausknechtS15,
  author     = {Matthew J. Hausknecht and Peter Stone},
  title      = {Deep Recurrent {Q}-Learning for Partially Observable {MDPs}},
  booktitle  = {2015 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 12-14, 2015},
  pages      = {29--37},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {http://www.aaai.org/ocs/index.php/FSS/FSS15/paper/view/11673},
  timestamp  = {Wed, 14 Nov 2018 16:20:12 +0100},
  biburl     = {https://dblp.org/rec/conf/aaaifs/HausknechtS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaifs/UrieliS15,
  author     = {Daniel Urieli and Peter Stone},
  title      = {Autonomous Electricity Trading Using Time-Of-Use Tariffs in a Competitive Market},
  booktitle  = {2015 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 12-14, 2015},
  pages      = {91--92},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {http://www.aaai.org/ocs/index.php/FSS/FSS15/paper/view/11715},
  timestamp  = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/aaaifs/UrieliS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/ZhangS15,
  author     = {Shiqi Zhang and Peter Stone},
  title      = {{CORPP:} Commonsense Reasoning and Probabilistic Planning, as Applied to Dialog with a Mobile Robot},
  booktitle  = {2015 {AAAI} Spring Symposia, Stanford University, Palo Alto, California, USA, March 22-25, 2015},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {http://www.aaai.org/ocs/index.php/SSS/SSS15/paper/view/10260},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaaiss/ZhangS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterZS15,
  author     = {Katie Genter and Shun Zhang and Peter Stone},
  editor     = {Gerhard Weiss and Pinar Yolum and Rafael H. Bordini and Edith Elkind},
  title      = {Determining Placements of Influencing Agents in a Flock},
  booktitle  = {Proceedings of the 2015 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages      = {247--255},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {http://dl.acm.org/citation.cfm?id=2772914},
  timestamp  = {Tue, 08 Mar 2022 10:12:47 +0100},
  biburl     = {https://dblp.org/rec/conf/atal/GenterZS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/LiebmanSS15,
  author     = {Elad Liebman and Maytal Saar{-}Tsechansky and Peter Stone},
  editor     = {Gerhard Weiss and Pinar Yolum and Rafael H. Bordini and Edith Elkind},
  title      = {{DJ-MC:} {A} Reinforcement-Learning Agent for Music Playlist Recommendation},
  booktitle  = {Proceedings of the 2015 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages      = {591--599},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {http://dl.acm.org/citation.cfm?id=2772954},
  timestamp  = {Fri, 15 May 2015 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/LiebmanSS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/SinapovNLS15,
  author     = {Jivko Sinapov and Sanmit Narvekar and Matteo Leonetti and Peter Stone},
  editor     = {Gerhard Weiss and Pinar Yolum and Rafael H. Bordini and Edith Elkind},
  title      = {Learning Inter-Task Transferability in the Absence of Target Task Samples},
  booktitle  = {Proceedings of the 2015 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages      = {725--733},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {http://dl.acm.org/citation.cfm?id=2773247},
  timestamp  = {Fri, 15 May 2015 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/SinapovNLS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "Monte Carlo" is braced so sentence-casing styles keep both capitals.
@inproceedings{DBLP:conf/atal/MenasheS15,
  author     = {Jacob Menashe and Peter Stone},
  editor     = {Gerhard Weiss and Pinar Yolum and Rafael H. Bordini and Edith Elkind},
  title      = {{Monte} {Carlo} Hierarchical Model Learning},
  booktitle  = {Proceedings of the 2015 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages      = {771--779},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {http://dl.acm.org/citation.cfm?id=2773252},
  timestamp  = {Fri, 15 May 2015 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/MenasheS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/KhandelwalBS15,
  author     = {Piyush Khandelwal and Samuel Barrett and Peter Stone},
  editor     = {Gerhard Weiss and Pinar Yolum and Rafael H. Bordini and Edith Elkind},
  title      = {Leading the Way: An Efficient Multi-robot Guidance System},
  booktitle  = {Proceedings of the 2015 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages      = {1625--1633},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {http://dl.acm.org/citation.cfm?id=2773358},
  timestamp  = {Fri, 15 May 2015 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/KhandelwalBS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/FangST15,
  author     = {Fei Fang and Peter Stone and Milind Tambe},
  editor     = {Gerhard Weiss and Pinar Yolum and Rafael H. Bordini and Edith Elkind},
  title      = {Defender Strategies In Domains Involving Frequent Adversary Interaction},
  booktitle  = {Proceedings of the 2015 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages      = {1663--1664},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {http://dl.acm.org/citation.cfm?id=2773374},
  timestamp  = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/atal/FangST15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "RoboCup" is braced so sentence-casing styles do not lower-case it.
@inproceedings{DBLP:conf/atal/GenterLS15,
  author     = {Katie Genter and Tim Laue and Peter Stone},
  editor     = {Gerhard Weiss and Pinar Yolum and Rafael H. Bordini and Edith Elkind},
  title      = {The {RoboCup} 2014 {SPL} Drop-in Player Competition: Encouraging Teamwork without Pre-coordination},
  booktitle  = {Proceedings of the 2015 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages      = {1745--1746},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {http://dl.acm.org/citation.cfm?id=2773415},
  timestamp  = {Thu, 14 Dec 2017 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/atal/GenterLS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% "Monte Carlo" is braced so sentence-casing styles keep both capitals.
@inproceedings{DBLP:conf/atal/MenasheS15a,
  author     = {Jacob Menashe and Peter Stone},
  editor     = {Gerhard Weiss and Pinar Yolum and Rafael H. Bordini and Edith Elkind},
  title      = {{Monte} {Carlo} Hierarchical Model Learning: (Doctoral Consortium)},
  booktitle  = {Proceedings of the 2015 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages      = {1985--1986},
  publisher  = {{ACM}},
  year       = {2015},
  url        = {http://dl.acm.org/citation.cfm?id=2773538},
  timestamp  = {Fri, 15 May 2015 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/MenasheS15a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/ThomasonZMS15,
  author     = {Jesse Thomason and Shiqi Zhang and Raymond J. Mooney and Peter Stone},
  editor     = {Qiang Yang and Michael J. Wooldridge},
  title      = {Learning to Interpret Natural Language Commands through Human-Robot Dialog},
  booktitle  = {Proceedings of the Twenty-Fourth International Joint Conference on Artificial Intelligence, {IJCAI} 2015, Buenos Aires, Argentina, July 25-31, 2015},
  pages      = {1923--1929},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {http://ijcai.org/Abstract/15/273},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/ijcai/ThomasonZMS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/FangST15,
  author     = {Fei Fang and Peter Stone and Milind Tambe},
  editor     = {Qiang Yang and Michael J. Wooldridge},
  title      = {When Security Games Go Green: Designing Defender Strategies to Prevent Poaching and Illegal Fishing},
  booktitle  = {Proceedings of the Twenty-Fourth International Joint Conference on Artificial Intelligence, {IJCAI} 2015, Buenos Aires, Argentina, July 25-31, 2015},
  pages      = {2589--2595},
  publisher  = {{AAAI} Press},
  year       = {2015},
  url        = {http://ijcai.org/Abstract/15/367},
  timestamp  = {Wed, 07 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ijcai/FangST15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% League name "RoboCup Standard Platform League" is braced word by word so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/iros/GenterLS15,
  author     = {Katie Genter and Tim Laue and Peter Stone},
  title      = {Benchmarking robot cooperation without pre-coordination in the {RoboCup} {Standard} {Platform} {League} drop-in player competition},
  booktitle  = {2015 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2015, Hamburg, Germany, September 28 - October 2, 2015},
  pages      = {3415--3420},
  publisher  = {{IEEE}},
  year       = {2015},
  url        = {https://doi.org/10.1109/IROS.2015.7353853},
  doi        = {10.1109/IROS.2015.7353853},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/iros/GenterLS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/LiebmanSW15,
  author     = {Elad Liebman and Peter Stone and Corey N. White},
  editor     = {Meinard M{\"{u}}ller and Frans Wiering},
  title      = {How Music Alters Decision Making - Impact of Music Stimuli on Emotional Classification},
  booktitle  = {Proceedings of the 16th International Society for Music Information Retrieval Conference, {ISMIR} 2015, M{\'{a}}laga, Spain, October 26-30, 2015},
  pages      = {793--799},
  year       = {2015},
  url        = {http://ismir2015.uma.es/articles/293\_Paper.pdf},
  timestamp  = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ismir/LiebmanSW15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% LPNMR 2015 paper. Title: the language name BC is brace-protected for case only;
% presentational emphasis markup was dropped so the bibliography style controls formatting.
@inproceedings{DBLP:conf/lpnmr/ZhangYKS15,
  author     = {Shiqi Zhang and Fangkai Yang and Piyush Khandelwal and Peter Stone},
  editor     = {Francesco Calimeri and Giovambattista Ianni and Miroslaw Truszczynski},
  title      = {Mobile Robot Planning Using Action Language {BC} with an Abstraction Hierarchy},
  booktitle  = {Logic Programming and Nonmonotonic Reasoning - 13th International Conference, {LPNMR} 2015, Lexington, KY, USA, September 27-30, 2015. Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {9345},
  pages      = {502--516},
  publisher  = {Springer},
  year       = {2015},
  url        = {https://doi.org/10.1007/978-3-319-23264-5\_42},
  doi        = {10.1007/978-3-319-23264-5\_42},
  timestamp  = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/lpnmr/ZhangYKS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineHLS15,
  author     = {Patrick MacAlpine and Josiah Hanna and Jason Liang and Peter Stone},
  editor     = {Lu{\'{\i}}s Almeida and Jianmin Ji and Gerald Steinbauer and Sean Luke},
  title      = {{UT} Austin Villa: RoboCup 2015 3D Simulation League Competition and Technical Challenges Champions},
  booktitle  = {RoboCup 2015: Robot World Cup {XIX} [papers from the 19th Annual RoboCup International Symposium, Hefei, China, July 23, 2015]},
  series     = {Lecture Notes in Computer Science},
  volume     = {9513},
  pages      = {118--131},
  publisher  = {Springer},
  year       = {2015},
  url        = {https://doi.org/10.1007/978-3-319-29339-4\_10},
  doi        = {10.1007/978-3-319-29339-4\_10},
  timestamp  = {Thu, 14 Jan 2021 15:08:30 +0100},
  biburl     = {https://dblp.org/rec/conf/robocup/MacAlpineHLS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/LeottauRMS15,
  author     = {David Leonardo Leottau and Javier Ruiz{-}del{-}Solar and Patrick MacAlpine and Peter Stone},
  editor     = {Lu{\'{\i}}s Almeida and Jianmin Ji and Gerald Steinbauer and Sean Luke},
  title      = {A Study of Layered Learning Strategies Applied to Individual Behaviors in Robot Soccer},
  booktitle  = {RoboCup 2015: Robot World Cup {XIX} [papers from the 19th Annual RoboCup International Symposium, Hefei, China, July 23, 2015]},
  series     = {Lecture Notes in Computer Science},
  volume     = {9513},
  pages      = {290--302},
  publisher  = {Springer},
  year       = {2015},
  url        = {https://doi.org/10.1007/978-3-319-29339-4\_24},
  doi        = {10.1007/978-3-319-29339-4\_24},
  timestamp  = {Tue, 04 Feb 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/robocup/LeottauRMS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/socrob/GoriSKSA15,
  author     = {Ilaria Gori and Jivko Sinapov and Priyanka Khante and Peter Stone and J. K. Aggarwal},
  editor     = {Adriana Tapus and Elisabeth Andr{\'{e}} and Jean{-}Claude Martin and Fran{\c{c}}ois Ferland and Mehdi Ammi},
  title      = {Robot-Centric Activity Recognition 'in the Wild'},
  booktitle  = {Social Robotics - 7th International Conference, {ICSR} 2015, Paris, France, October 26-30, 2015, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {9388},
  pages      = {224--234},
  publisher  = {Springer},
  year       = {2015},
  url        = {https://doi.org/10.1007/978-3-319-25554-5\_23},
  doi        = {10.1007/978-3-319-25554-5\_23},
  timestamp  = {Sat, 30 Sep 2023 09:57:07 +0200},
  biburl     = {https://dblp.org/rec/conf/socrob/GoriSKSA15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LiebmanCS15,
  author     = {Elad Liebman and Benny Chor and Peter Stone},
  title      = {Representative Selection in Non Metric Datasets},
  journal    = {CoRR},
  volume     = {abs/1502.07428},
  year       = {2015},
  url        = {http://arxiv.org/abs/1502.07428},
  eprinttype = {arXiv},
  eprint     = {1502.07428},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LiebmanCS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HausknechtS15,
  author     = {Matthew J. Hausknecht and Peter Stone},
  title      = {Deep Recurrent Q-Learning for Partially Observable MDPs},
  journal    = {CoRR},
  volume     = {abs/1507.06527},
  year       = {2015},
  url        = {http://arxiv.org/abs/1507.06527},
  eprinttype = {arXiv},
  eprint     = {1507.06527},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/HausknechtS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aamas/ChakrabortyS14,
  author     = {Doran Chakraborty and Peter Stone},
  title      = {Multiagent learning in the presence of memory-bounded agents},
  journal    = {Auton. Agents Multi Agent Syst.},
  volume     = {28},
  number     = {2},
  pages      = {182--213},
  year       = {2014},
  url        = {https://doi.org/10.1007/s10458-013-9222-4},
  doi        = {10.1007/S10458-013-9222-4},
  timestamp  = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/aamas/ChakrabortyS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/NardiNRSSV14,
  author     = {Daniele Nardi and Itsuki Noda and A. Fernando Ribeiro and Peter Stone and Oskar von Stryk and Manuela M. Veloso},
  title      = {RoboCup Soccer Leagues},
  journal    = {{AI} Mag.},
  volume     = {35},
  number     = {3},
  pages      = {77--85},
  year       = {2014},
  url        = {https://doi.org/10.1609/aimag.v35i3.2549},
  doi        = {10.1609/AIMAG.V35I3.2549},
  timestamp  = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/aim/NardiNRSSV14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aimatters/StoneMGB14,
  author     = {Peter Stone and Patrick MacAlpine and Katie Genter and Samuel Barrett},
  title      = {Drop-in games at RoboCup},
  journal    = {{AI} Matters},
  volume     = {1},
  number     = {1},
  pages      = {20--22},
  year       = {2014},
  url        = {https://doi.org/10.1145/2639475.2655756},
  doi        = {10.1145/2639475.2655756},
  timestamp  = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/aimatters/StoneMGB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tciaig/HausknechtLMS14,
  author     = {Matthew J. Hausknecht and Joel Lehman and Risto Miikkulainen and Peter Stone},
  title      = {A Neuroevolution Approach to General Atari Game Playing},
  journal    = {{IEEE} Trans. Comput. Intell. {AI} Games},
  volume     = {6},
  number     = {4},
  pages      = {355--366},
  year       = {2014},
  url        = {https://doi.org/10.1109/TCIAIG.2013.2294713},
  doi        = {10.1109/TCIAIG.2013.2294713},
  timestamp  = {Wed, 13 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tciaig/HausknechtLMS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2014 paper. The conference date range in booktitle had a stray space
% before the hyphen ("27 -31"); it is written here as "27-31".
@inproceedings{DBLP:conf/aaai/UrieliS14,
  author     = {Daniel Urieli and Peter Stone},
  editor     = {Carla E. Brodley and Peter Stone},
  title      = {TacTex'13: {A} Champion Adaptive Power Trading Agent},
  booktitle  = {Proceedings of the Twenty-Eighth {AAAI} Conference on Artificial Intelligence, July 27-31, 2014, Qu{\'{e}}bec City, Qu{\'{e}}bec, Canada},
  pages      = {465--471},
  publisher  = {{AAAI} Press},
  year       = {2014},
  url        = {https://doi.org/10.1609/aaai.v28i1.8767},
  doi        = {10.1609/AAAI.V28I1.8767},
  timestamp  = {Mon, 04 Sep 2023 15:06:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/UrieliS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaifs/KhandelwalS14,
  author     = {Piyush Khandelwal and Peter Stone},
  title      = {Leading the Way: An Efficient Multi-Robot Guidance System},
  booktitle  = {2014 {AAAI} Fall Symposia, Arlington, Virginia, USA, November 13-15, 2014},
  publisher  = {{AAAI} Press},
  year       = {2014},
  url        = {http://www.aaai.org/ocs/index.php/FSS/FSS14/paper/view/9181},
  timestamp  = {Wed, 14 Nov 2018 17:08:03 +0100},
  biburl     = {https://dblp.org/rec/conf/aaaifs/KhandelwalS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/KhandelwalS14,
  author     = {Piyush Khandelwal and Peter Stone},
  title      = {Multi-Robot Human Guidance Using Topological Graphs},
  booktitle  = {2014 {AAAI} Spring Symposia, Stanford University, Palo Alto, California, USA, March 24-26, 2014},
  publisher  = {{AAAI} Press},
  year       = {2014},
  url        = {http://www.aaai.org/ocs/index.php/SSS/SSS14/paper/view/7726},
  timestamp  = {Wed, 14 Nov 2018 14:23:12 +0100},
  biburl     = {https://dblp.org/rec/conf/aaaiss/KhandelwalS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/YangKLS14,
  author     = {Fangkai Yang and Piyush Khandelwal and Matteo Leonetti and Peter Stone},
  title      = {Planning in Answer Set Programming while Learning Action Costs for Mobile Robots},
  booktitle  = {2014 {AAAI} Spring Symposia, Stanford University, Palo Alto, California, USA, March 24-26, 2014},
  publisher  = {{AAAI} Press},
  year       = {2014},
  url        = {http://www.aaai.org/ocs/index.php/SSS/SSS14/paper/view/7727},
  timestamp  = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/aaaiss/YangKLS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aips/KhandelwalYLLS14,
  author     = {Piyush Khandelwal and Fangkai Yang and Matteo Leonetti and Vladimir Lifschitz and Peter Stone},
  editor     = {Steve A. Chien and Minh Binh Do and Alan Fern and Wheeler Ruml},
  title      = {Planning in Action Language {BC} while Learning Action Costs for Mobile Robots},
  booktitle  = {Proceedings of the Twenty-Fourth International Conference on Automated Planning and Scheduling, {ICAPS} 2014, Portsmouth, New Hampshire, USA, June 21-26, 2014},
  publisher  = {{AAAI}},
  year       = {2014},
  url        = {http://www.aaai.org/ocs/index.php/ICAPS/ICAPS14/paper/view/7940},
  timestamp  = {Thu, 19 Nov 2015 08:52:28 +0100},
  biburl     = {https://dblp.org/rec/conf/aips/KhandelwalYLLS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/antsw/GenterS14,
  author     = {Katie Long Genter and Peter Stone},
  editor     = {Marco Dorigo and Mauro Birattari and Simon Garnier and Heiko Hamann and Marco Antonio Montes de Oca and Christine Solnon and Thomas St{\"{u}}tzle},
  title      = {Influencing a Flock via Ad Hoc Teamwork},
  booktitle  = {Swarm Intelligence - 9th International Conference, {ANTS} 2014, Brussels, Belgium, September 10-12, 2014. Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {8667},
  pages      = {110--121},
  publisher  = {Springer},
  year       = {2014},
  url        = {https://doi.org/10.1007/978-3-319-09952-1\_10},
  doi        = {10.1007/978-3-319-09952-1\_10},
  timestamp  = {Tue, 21 Mar 2023 20:56:33 +0100},
  biburl     = {https://dblp.org/rec/conf/antsw/GenterS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/AgmonBS14,
  author     = {Noa Agmon and Samuel Barrett and Peter Stone},
  editor     = {Ana L. C. Bazzan and Michael N. Huhns and Alessio Lomuscio and Paul Scerri},
  title      = {Modeling uncertainty in leading ad hoc teams},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages      = {397--404},
  publisher  = {{IFAAMAS/ACM}},
  year       = {2014},
  url        = {http://dl.acm.org/citation.cfm?id=2615797},
  timestamp  = {Thu, 25 Sep 2014 07:46:15 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/AgmonBS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/BarrettAHKS14,
  author     = {Samuel Barrett and Noa Agmon and Noam Hazon and Sarit Kraus and Peter Stone},
  editor     = {Ana L. C. Bazzan and Michael N. Huhns and Alessio Lomuscio and Paul Scerri},
  title      = {Communicating with unknown teammates},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages      = {1433--1434},
  publisher  = {{IFAAMAS/ACM}},
  year       = {2014},
  url        = {http://dl.acm.org/citation.cfm?id=2617509},
  timestamp  = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/BarrettAHKS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/UrieliS14,
  author     = {Daniel Urieli and Peter Stone},
  editor     = {Ana L. C. Bazzan and Michael N. Huhns and Alessio Lomuscio and Paul Scerri},
  title      = {TacTex'13: a champion adaptive power trading agent},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages      = {1447--1448},
  publisher  = {{IFAAMAS/ACM}},
  year       = {2014},
  url        = {http://dl.acm.org/citation.cfm?id=2617516},
  timestamp  = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/UrieliS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/AuZS14,
  author     = {Tsz{-}Chiu Au and Shun Zhang and Peter Stone},
  editor     = {Ana L. C. Bazzan and Michael N. Huhns and Alessio Lomuscio and Paul Scerri},
  title      = {Semi-autonomous intersection management},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages      = {1451--1452},
  publisher  = {{IFAAMAS/ACM}},
  year       = {2014},
  url        = {http://dl.acm.org/citation.cfm?id=2617518},
  timestamp  = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/AuZS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MacAlpineGBS14,
  author     = {Patrick MacAlpine and Katie Long Genter and Samuel Barrett and Peter Stone},
  editor     = {Ana L. C. Bazzan and Michael N. Huhns and Alessio Lomuscio and Paul Scerri},
  title      = {The RoboCup 2013 drop-in player challenges: a testbed for ad hoc teamwork},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages      = {1461--1462},
  publisher  = {{IFAAMAS/ACM}},
  year       = {2014},
  url        = {http://dl.acm.org/citation.cfm?id=2617523},
  timestamp  = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/MacAlpineGBS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/MacAlpinePS14,
  author     = {Patrick MacAlpine and Eric Price and Peter Stone},
  editor     = {Ana L. C. Bazzan and Michael N. Huhns and Alessio Lomuscio and Paul Scerri},
  title      = {{SCRAM:} scalable collision-avoiding role assignment with minimal-makespan for formational positioning},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages      = {1463--1464},
  publisher  = {{IFAAMAS/ACM}},
  year       = {2014},
  url        = {http://dl.acm.org/citation.cfm?id=2617524},
  timestamp  = {Tue, 26 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/MacAlpinePS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterS14,
  author     = {Katie Genter and Peter Stone},
  editor     = {Ana L. C. Bazzan and Michael N. Huhns and Alessio Lomuscio and Paul Scerri},
  title      = {Orienting a flock via ad hoc teamwork},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '14, Paris, France, May 5-9, 2014},
  pages      = {1543--1544},
  publisher  = {{IFAAMAS/ACM}},
  year       = {2014},
  url        = {http://dl.acm.org/citation.cfm?id=2616053},
  timestamp  = {Thu, 25 Sep 2014 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/GenterS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ecai/BarrettAHKS14,
  author     = {Samuel Barrett and Noa Agmon and Noam Hazon and Sarit Kraus and Peter Stone},
  editor     = {Torsten Schaub and Gerhard Friedrich and Barry O'Sullivan},
  title      = {Communicating with Unknown Teammates},
  booktitle  = {{ECAI} 2014 - 21st European Conference on Artificial Intelligence, 18-22 August 2014, Prague, Czech Republic - Including Prestigious Applications of Intelligent Systems {(PAIS} 2014)},
  series     = {Frontiers in Artificial Intelligence and Applications},
  volume     = {263},
  pages      = {45--50},
  publisher  = {{IOS} Press},
  year       = {2014},
  url        = {https://doi.org/10.3233/978-1-61499-419-0-45},
  doi        = {10.3233/978-1-61499-419-0-45},
  timestamp  = {Mon, 19 Jun 2023 16:36:09 +0200},
  biburl     = {https://dblp.org/rec/conf/ecai/BarrettAHKS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/MacAlpineGBS14,
  author     = {Patrick MacAlpine and Katie Genter and Samuel Barrett and Peter Stone},
  title      = {The RoboCup 2013 drop-in player challenges: Experiments in ad hoc teamwork},
  booktitle  = {2014 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2014, Chicago, IL, USA, September 14-18, 2014},
  pages      = {382--387},
  publisher  = {{IEEE}},
  year       = {2014},
  url        = {https://doi.org/10.1109/IROS.2014.6942588},
  doi        = {10.1109/IROS.2014.6942588},
  timestamp  = {Tue, 05 Sep 2023 15:07:47 +0200},
  biburl     = {https://dblp.org/rec/conf/iros/MacAlpineGBS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% RoboCup 2014 symposium paper. The bracketed symposium note in booktitle was cut off
% after the day, leaving an unclosed bracket; the year and closing bracket are restored.
% NOTE(review): the day of the month is kept as given - confirm against the publisher record.
@inproceedings{DBLP:conf/robocup/MacAlpineDLS14,
  author     = {Patrick MacAlpine and Mike Depinet and Jason Liang and Peter Stone},
  editor     = {Reinaldo A. C. Bianchi and H. Levent Akin and Subramanian Ramamoorthy and Komei Sugiura},
  title      = {{UT} Austin Villa: RoboCup 2014 3D Simulation League Competition and Technical Challenge Champions},
  booktitle  = {RoboCup 2014: Robot World Cup {XVIII} [papers from the 18th Annual RoboCup International Symposium, Jo{\~{a}}o Pessoa, Brazil, July 15, 2014]},
  series     = {Lecture Notes in Computer Science},
  volume     = {8992},
  pages      = {33--46},
  publisher  = {Springer},
  year       = {2014},
  url        = {https://doi.org/10.1007/978-3-319-18615-3\_3},
  doi        = {10.1007/978-3-319-18615-3\_3},
  timestamp  = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/MacAlpineDLS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% RoboCup 2014 symposium paper. The bracketed symposium note in booktitle was cut off
% after the day, leaving an unclosed bracket; the year and closing bracket are restored.
% NOTE(review): the day of the month is kept as given - confirm against the publisher record.
@inproceedings{DBLP:conf/robocup/DepinetMS14,
  author     = {Mike Depinet and Patrick MacAlpine and Peter Stone},
  editor     = {Reinaldo A. C. Bianchi and H. Levent Akin and Subramanian Ramamoorthy and Komei Sugiura},
  title      = {Keyframe Sampling, Optimization, and Behavior Integration: Towards Long-Distance Kicking in the RoboCup 3D Simulation League},
  booktitle  = {RoboCup 2014: Robot World Cup {XVIII} [papers from the 18th Annual RoboCup International Symposium, Jo{\~{a}}o Pessoa, Brazil, July 15, 2014]},
  series     = {Lecture Notes in Computer Science},
  volume     = {8992},
  pages      = {571--582},
  publisher  = {Springer},
  year       = {2014},
  url        = {https://doi.org/10.1007/978-3-319-18615-3\_47},
  doi        = {10.1007/978-3-319-18615-3\_47},
  timestamp  = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/DepinetMS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2014 proceedings volume. The conference date range in the title had a stray
% space before the hyphen ("27 -31"); it is written here as "27-31".
@proceedings{DBLP:conf/aaai/2014,
  editor     = {Carla E. Brodley and Peter Stone},
  title      = {Proceedings of the Twenty-Eighth {AAAI} Conference on Artificial Intelligence, July 27-31, 2014, Qu{\'{e}}bec City, Qu{\'{e}}bec, Canada},
  publisher  = {{AAAI} Press},
  year       = {2014},
  url        = {https://ojs.aaai.org/index.php/AAAI/issue/view/305},
  isbn       = {978-1-57735-661-5},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/2014.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LiebmanS14,
  author     = {Elad Liebman and Peter Stone},
  title      = {{DJ-MC:} {A} Reinforcement-Learning Agent for Music Playlist Recommendation},
  journal    = {CoRR},
  volume     = {abs/1401.1880},
  year       = {2014},
  url        = {http://arxiv.org/abs/1401.1880},
  eprinttype = {arXiv},
  eprint     = {1401.1880},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LiebmanS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ai/StoneKKRA13,
  author     = {Peter Stone and Gal A. Kaminka and Sarit Kraus and Jeffrey S. Rosenschein and Noa Agmon},
  title      = {Teaching and leading an ad hoc teammate: Collaboration without pre-coordination},
  journal    = {Artif. Intell.},
  volume     = {203},
  pages      = {35--65},
  year       = {2013},
  url        = {https://doi.org/10.1016/j.artint.2013.07.003},
  doi        = {10.1016/J.ARTINT.2013.07.003},
  timestamp  = {Sat, 27 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/ai/StoneKKRA13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/HesterS13,
  author     = {Todd Hester and Peter Stone},
  title      = {{TEXPLORE:} real-time sample-efficient reinforcement learning for robots},
  journal    = {Mach. Learn.},
  volume     = {90},
  number     = {3},
  pages      = {385--429},
  year       = {2013},
  url        = {https://doi.org/10.1007/s10994-012-5322-7},
  doi        = {10.1007/S10994-012-5322-7},
  timestamp  = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ml/HesterS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/LiHSM13,
  author     = {Wen{-}Ke Li and Matthew J. Hausknecht and Peter Stone and Michael D. Mauk},
  title      = {Using a million cell simulation of the cerebellum: Network scaling and task generality},
  journal    = {Neural Networks},
  volume     = {47},
  pages      = {95--102},
  year       = {2013},
  url        = {https://doi.org/10.1016/j.neunet.2012.11.005},
  doi        = {10.1016/J.NEUNET.2012.11.005},
  timestamp  = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/nn/LiHSM13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/BarrettSKR13,
  author     = {Samuel Barrett and Peter Stone and Sarit Kraus and Avi Rosenfeld},
  editor     = {Marie desJardins and Michael L. Littman},
  title      = {Teamwork with Limited Knowledge of Teammates},
  booktitle  = {Proceedings of the Twenty-Seventh {AAAI} Conference on Artificial Intelligence, July 14-18, 2013, Bellevue, Washington, {USA}},
  pages      = {102--108},
  publisher  = {{AAAI} Press},
  year       = {2013},
  url        = {https://doi.org/10.1609/aaai.v27i1.8659},
  doi        = {10.1609/AAAI.V27I1.8659},
  timestamp  = {Mon, 04 Sep 2023 15:56:33 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/BarrettSKR13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/FarchyBMS13,
  author     = {Alon Farchy and Samuel Barrett and Patrick MacAlpine and Peter Stone},
  editor     = {Maria L. Gini and Onn Shehory and Takayuki Ito and Catholijn M. Jonker},
  title      = {Humanoid robots learning to walk faster: from the real world to simulation and back},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages      = {39--46},
  publisher  = {{IFAAMAS}},
  year       = {2013},
  url        = {http://dl.acm.org/citation.cfm?id=2484930},
  timestamp  = {Thu, 09 Sep 2021 16:09:54 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/FarchyBMS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/GenterAS13,
  author     = {Katie Long Genter and Noa Agmon and Peter Stone},
  editor     = {Maria L. Gini and Onn Shehory and Takayuki Ito and Catholijn M. Jonker},
  title      = {Ad hoc teamwork for leading a flock},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages      = {531--538},
  publisher  = {{IFAAMAS}},
  year       = {2013},
  url        = {http://dl.acm.org/citation.cfm?id=2485005},
  timestamp  = {Fri, 28 Jun 2013 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/GenterAS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/HesterLS13,
  author     = {Todd Hester and Manuel Lopes and Peter Stone},
  editor     = {Maria L. Gini and Onn Shehory and Takayuki Ito and Catholijn M. Jonker},
  title      = {Learning exploration strategies in model-based reinforcement learning},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages      = {1069--1076},
  publisher  = {{IFAAMAS}},
  year       = {2013},
  url        = {http://dl.acm.org/citation.cfm?id=2485088},
  timestamp  = {Thu, 18 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/HesterLS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/ChakrabortyS13,
  author     = {Doran Chakraborty and Peter Stone},
  editor     = {Maria L. Gini and Onn Shehory and Takayuki Ito and Catholijn M. Jonker},
  title      = {Cooperating with a markovian ad hoc teammate},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages      = {1085--1092},
  publisher  = {{IFAAMAS}},
  year       = {2013},
  url        = {http://dl.acm.org/citation.cfm?id=2485091},
  timestamp  = {Fri, 28 Jun 2013 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/ChakrabortyS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/UrieliS13,
  author     = {Daniel Urieli and Peter Stone},
  editor     = {Maria L. Gini and Onn Shehory and Takayuki Ito and Catholijn M. Jonker},
  title      = {A learning agent for heat-pump thermostat control},
  booktitle  = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages      = {1093--1100},
  publisher  = {{IFAAMAS}},
  year       = {2013},
  url        = {http://dl.acm.org/citation.cfm?id=2485092},
  timestamp  = {Fri, 28 Jun 2013 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/atal/UrieliS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/itsc/CarlinoBS13,
  author     = {Dustin Carlino and Stephen D. Boyles and Peter Stone},
  title      = {Auction-based autonomous intersection management},
  booktitle  = {16th International {IEEE} Conference on Intelligent Transportation Systems, {ITSC} 2013, The Hague, The Netherlands, October 6-9, 2013},
  pages      = {529--534},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/ITSC.2013.6728285},
  doi        = {10.1109/ITSC.2013.6728285},
  timestamp  = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl     = {https://dblp.org/rec/conf/itsc/CarlinoBS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iui/KnoxSB13,
  author     = {W. Bradley Knox and Peter Stone and Cynthia Breazeal},
  editor     = {Jihie Kim and Jeffrey Nichols and Pedro A. Szekely},
  title      = {Teaching agents with human feedback: a demonstration of the {TAMER} framework},
  booktitle  = {18th International Conference on Intelligent User Interfaces, {IUI} '13, Santa Monica, CA, USA, March 19-22, 2013, Companion Volume},
  pages      = {65--66},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2451176.2451201},
  doi        = {10.1145/2451176.2451201},
  timestamp  = {Sun, 26 Nov 2023 00:57:51 +0100},
  biburl     = {https://dblp.org/rec/conf/iui/KnoxSB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iui/KnoxS13,
  author     = {W. Bradley Knox and Peter Stone},
  editor     = {Jihie Kim and Jeffrey Nichols and Pedro A. Szekely},
  title      = {Learning non-myopically from human-generated reward},
  booktitle  = {18th International Conference on Intelligent User Interfaces, {IUI} 2013, Santa Monica, CA, USA, March 19-22, 2013},
  pages      = {191--202},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2449396.2449422},
  doi        = {10.1145/2449396.2449422},
  timestamp  = {Sun, 26 Nov 2023 00:57:51 +0100},
  biburl     = {https://dblp.org/rec/conf/iui/KnoxS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/UrieliS13,
  author     = {Daniel Urieli and Peter Stone},
  editor     = {Hendrik Blockeel and Kristian Kersting and Siegfried Nijssen and Filip Zelezn{\'{y}}},
  title      = {Model-Selection for Non-parametric Function Approximation in Continuous Control Problems: {A} Case Study in a Smart Energy System},
  booktitle  = {Machine Learning and Knowledge Discovery in Databases - European Conference, {ECML} {PKDD} 2013, Prague, Czech Republic, September 23-27, 2013, Proceedings, Part {I}},
  series     = {Lecture Notes in Computer Science},
  volume     = {8188},
  pages      = {65--80},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-642-40988-2\_5},
  doi        = {10.1007/978-3-642-40988-2\_5},
  timestamp  = {Tue, 21 Mar 2023 21:00:11 +0100},
  biburl     = {https://dblp.org/rec/conf/pkdd/UrieliS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/HesterS13,
  author     = {Todd Hester and Peter Stone},
  editor     = {Sven Behnke and Manuela M. Veloso and Arnoud Visser and Rong Xiong},
  title      = {The Open-Source {TEXPLORE} Code Release for Reinforcement Learning on Robots},
  booktitle  = {RoboCup 2013: Robot World Cup {XVII} [papers from the 17th Annual RoboCup International Symposium, Eindhoven, The Netherlands, July 1, 2013]},
  series     = {Lecture Notes in Computer Science},
  volume     = {8371},
  pages      = {536--543},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-662-44468-9\_47},
  doi        = {10.1007/978-3-662-44468-9\_47},
  timestamp  = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/HesterS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/BarrettGHHKMS13,
  author     = {Samuel Barrett and Katie Long Genter and Yuchen He and Todd Hester and Piyush Khandelwal and Jacob Menashe and Peter Stone},
  editor     = {Sven Behnke and Manuela M. Veloso and Arnoud Visser and Rong Xiong},
  title      = {The 2012 {UT} Austin Villa Code Release},
  booktitle  = {RoboCup 2013: Robot World Cup {XVII} [papers from the 17th Annual RoboCup International Symposium, Eindhoven, The Netherlands, July 1, 2013]},
  series     = {Lecture Notes in Computer Science},
  volume     = {8371},
  pages      = {552--559},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-662-44468-9\_49},
  doi        = {10.1007/978-3-662-44468-9\_49},
  timestamp  = {Wed, 28 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/BarrettGHHKMS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/socrob/KnoxSB13,
  author     = {W. Bradley Knox and Peter Stone and Cynthia Breazeal},
  editor     = {Guido Herrmann and Martin J. Pearson and Alexander Lenz and Paul Bremner and Adam Spiers and Ute Leonards},
  title      = {Training a Robot via Human Feedback: {A} Case Study},
  booktitle  = {Social Robotics - 5th International Conference, {ICSR} 2013, Bristol, UK, October 27-29, 2013, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {8239},
  pages      = {460--470},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-319-02675-6\_46},
  doi        = {10.1007/978-3-319-02675-6\_46},
  timestamp  = {Thu, 14 Oct 2021 10:29:56 +0200},
  biburl     = {https://dblp.org/rec/conf/socrob/KnoxSB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/robocup/2012,
  editor     = {Xiaoping Chen and Peter Stone and Luis Enrique Sucar and Tijn van der Zant},
  title      = {RoboCup 2012: Robot Soccer World Cup {XVI} [papers from the 16th Annual RoboCup International Symposium, Mexico City, Mexico, June 18-24, 2012]},
  series     = {Lecture Notes in Computer Science},
  volume     = {7500},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-642-39250-4},
  doi        = {10.1007/978-3-642-39250-4},
  isbn       = {978-3-642-39249-8},
  timestamp  = {Tue, 14 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/robocup/2012.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/SonenbergSTY12,
  author    = {Liz Sonenberg and Peter Stone and Kagan Tumer and Pinar Yolum},
  title     = {Ten Years of {AAMAS:} Introduction to the Special Issue},
  journal   = {{AI} Mag.},
  volume    = {33},
  number    = {3},
  pages     = {11--13},
  year      = {2012},
  url       = {https://doi.org/10.1609/aimag.v33i3.2423},
  doi       = {10.1609/AIMAG.V33I3.2423},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/SonenbergSTY12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijsr/KnoxGLMS12,
  author    = {W. Bradley Knox and Brian D. Glass and Bradley C. Love and W. Todd Maddox and Peter Stone},
  title     = {How Humans Teach Agents - {A} New Experimental Perspective},
  journal   = {Int. J. Soc. Robotics},
  volume    = {4},
  number    = {4},
  pages     = {409--421},
  year      = {2012},
  url       = {https://doi.org/10.1007/s12369-012-0163-x},
  doi       = {10.1007/S12369-012-0163-X},
  timestamp = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijsr/KnoxGLMS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/MacAlpineBS12,
  author    = {Patrick MacAlpine and Francisco Barrera and Peter Stone},
  editor    = {Ariel Felner and Nathan R. Sturtevant and Kostas E. Bekris and Roni Stern},
  title     = {Positioning to Win: {A} Dynamic Role Assignment and Formation Positioning System},
  booktitle = {Multiagent Pathfinding, Papers from the 2012 {AAAI} Workshop, MAPF@AAAI 2012, Toronto, Ontario, Canada, July 22, 2012},
  series    = {{AAAI} Technical Report},
  volume    = {{WS-12-10}},
  publisher = {{AAAI} Press},
  year      = {2012},
  url       = {http://www.aaai.org/ocs/index.php/WS/AAAIW12/paper/view/5220},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/MacAlpineBS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% RoboCup and 3D in title are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/aaai/MacAlpineBUVS12,
  author    = {Patrick MacAlpine and Samuel Barrett and Daniel Urieli and Victor Vu and Peter Stone},
  editor    = {J{\"{o}}rg Hoffmann and Bart Selman},
  title     = {Design and Optimization of an Omnidirectional Humanoid Walk: {A} Winning Approach at the {RoboCup} 2011 {3D} Simulation Competition},
  booktitle = {Proceedings of the Twenty-Sixth {AAAI} Conference on Artificial Intelligence, July 22-26, 2012, Toronto, Ontario, Canada},
  pages     = {1047--1053},
  publisher = {{AAAI} Press},
  year      = {2012},
  url       = {https://doi.org/10.1609/aaai.v26i1.8317},
  doi       = {10.1609/AAAI.V26I1.8317},
  timestamp = {Mon, 04 Sep 2023 15:56:47 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/MacAlpineBUVS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaaiss/HesterS12,
  author    = {Todd Hester and Peter Stone},
  title     = {{TEXPLORE:} Real-Time Sample-Efficient Reinforcement Learning for Robots},
  booktitle = {Designing Intelligent Robots, Papers from the 2012 {AAAI} Spring Symposium, Palo Alto, California, USA, March 26-28, 2012},
  series    = {{AAAI} Technical Report},
  volume    = {{SS-12-02}},
  publisher = {{AAAI}},
  year      = {2012},
  url       = {http://www.aaai.org/ocs/index.php/SSS/SSS12/paper/view/4271},
  timestamp = {Wed, 25 Sep 2013 15:48:48 +0200},
  biburl    = {https://dblp.org/rec/conf/aaaiss/HesterS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Team name, RoboCup and 3D in title are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/aamas/MacAlpineUBKBLSVS12,
  author    = {Patrick MacAlpine and Daniel Urieli and Samuel Barrett and Shivaram Kalyanakrishnan and Francisco Barrera and Adrian Lopez{-}Mobilia and Nicolae Stiurca and Victor Vu and Peter Stone},
  editor    = {Wiebe van der Hoek and Lin Padgham and Vincent Conitzer and Michael Winikoff},
  title     = {{UT} {Austin} {Villa} 2011: a champion agent in the {RoboCup} {3D} soccer simulation competition},
  booktitle = {International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages     = {129--136},
  publisher = {{IFAAMAS}},
  year      = {2012},
  url       = {http://dl.acm.org/citation.cfm?id=2343594},
  timestamp = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aamas/MacAlpineUBKBLSVS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aamas/AgmonS12,
  author    = {Noa Agmon and Peter Stone},
  editor    = {Wiebe van der Hoek and Lin Padgham and Vincent Conitzer and Michael Winikoff},
  title     = {Leading ad hoc agents in joint action settings with multiple teammates},
  booktitle = {International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages     = {341--348},
  publisher = {{IFAAMAS}},
  year      = {2012},
  url       = {http://dl.acm.org/citation.cfm?id=2343625},
  timestamp = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aamas/AgmonS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aamas/BarrettS12,
  author    = {Samuel Barrett and Peter Stone},
  editor    = {Wiebe van der Hoek and Lin Padgham and Vincent Conitzer and Michael Winikoff},
  title     = {An analysis framework for ad hoc teamwork tasks},
  booktitle = {International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages     = {357--364},
  publisher = {{IFAAMAS}},
  year      = {2012},
  url       = {http://dl.acm.org/citation.cfm?id=2343627},
  timestamp = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aamas/BarrettS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aamas/KnoxS12,
  author    = {W. Bradley Knox and Peter Stone},
  editor    = {Wiebe van der Hoek and Lin Padgham and Vincent Conitzer and Michael Winikoff},
  title     = {Reinforcement learning from simultaneous human and {MDP} reward},
  booktitle = {International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages     = {475--482},
  publisher = {{IFAAMAS}},
  year      = {2012},
  url       = {http://dl.acm.org/citation.cfm?id=2343644},
  timestamp = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aamas/KnoxS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aamas/GenterAS12,
  author    = {Katie Long Genter and Noa Agmon and Peter Stone},
  editor    = {Wiebe van der Hoek and Lin Padgham and Vincent Conitzer and Michael Winikoff},
  title     = {Role selection in ad hoc teamwork},
  booktitle = {International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2012, Valencia, Spain, June 4-8, 2012 {(3} Volumes)},
  pages     = {1251--1252},
  publisher = {{IFAAMAS}},
  year      = {2012},
  url       = {http://dl.acm.org/citation.cfm?id=2343948},
  timestamp = {Thu, 19 Mar 2015 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aamas/GenterAS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Mixed-case system names in title are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/gecco/HausknechtKMS12,
  author    = {Matthew J. Hausknecht and Piyush Khandelwal and Risto Miikkulainen and Peter Stone},
  editor    = {Terence Soule and Jason H. Moore},
  title     = {{HyperNEAT-GGP}: a {hyperNEAT-based} atari general game player},
  booktitle = {Genetic and Evolutionary Computation Conference, {GECCO} '12, Philadelphia, PA, USA, July 7-11, 2012},
  pages     = {217--224},
  publisher = {{ACM}},
  year      = {2012},
  url       = {https://doi.org/10.1145/2330163.2330195},
  doi       = {10.1145/2330163.2330195},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/gecco/HausknechtKMS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccps/FokHGASJV12,
  author    = {Chien{-}Liang Fok and Maykel Hanna and Seth Gee and Tsz{-}Chiu Au and Peter Stone and Christine Julien and Sriram Vishwanath},
  title     = {A Platform for Evaluating Autonomous Intersection Management Policies},
  booktitle = {2012 {IEEE/ACM} Third International Conference on Cyber-Physical Systems, {ICCPS} 2012, Beijing, China, April 17-19, 2012},
  pages     = {87--96},
  publisher = {{IEEE} Computer Society},
  year      = {2012},
  url       = {https://doi.org/10.1109/ICCPS.2012.17},
  doi       = {10.1109/ICCPS.2012.17},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iccps/FokHGASJV12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icdl-epirob/HesterS12,
  author    = {Todd Hester and Peter Stone},
  title     = {Intrinsically motivated model learning for a developing curious agent},
  booktitle = {2012 {IEEE} International Conference on Development and Learning and Epigenetic Robotics, {ICDL-EPIROB} 2012, San Diego, CA, USA, November 7-9, 2012},
  pages     = {1--6},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/DevLrn.2012.6400802},
  doi       = {10.1109/DEVLRN.2012.6400802},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icdl-epirob/HesterS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/KalyanakrishnanTAS12,
  author    = {Shivaram Kalyanakrishnan and Ambuj Tewari and Peter Auer and Peter Stone},
  title     = {{PAC} Subset Selection in Stochastic Multi-armed Bandits},
  booktitle = {Proceedings of the 29th International Conference on Machine Learning, {ICML} 2012, Edinburgh, Scotland, UK, June 26 - July 1, 2012},
  publisher = {icml.cc / Omnipress},
  year      = {2012},
  url       = {http://icml.cc/2012/papers/359.pdf},
  timestamp = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/KalyanakrishnanTAS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/HesterQS12,
  author    = {Todd Hester and Michael J. Quinlan and Peter Stone},
  title     = {{RTMBA:} {A} Real-Time Model-Based Reinforcement Learning Architecture for robot control},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2012, 14-18 May, 2012, St. Paul, Minnesota, {USA}},
  pages     = {85--90},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ICRA.2012.6225072},
  doi       = {10.1109/ICRA.2012.6225072},
  timestamp = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/HesterQS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/AgmonFESJV12,
  author    = {Noa Agmon and Chien{-}Liang Fok and Yehuda Emaliah and Peter Stone and Christine Julien and Sriram Vishwanath},
  title     = {On coordination in practical multi-robot patrol},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2012, 14-18 May, 2012, St. Paul, Minnesota, {USA}},
  pages     = {650--656},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ICRA.2012.6224708},
  doi       = {10.1109/ICRA.2012.6224708},
  timestamp = {Sun, 03 Dec 2017 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icra/AgmonFESJV12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/AuQS12,
  author    = {Tsz{-}Chiu Au and Michael J. Quinlan and Peter Stone},
  title     = {Setpoint scheduling for autonomous vehicle controllers},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2012, 14-18 May, 2012, St. Paul, Minnesota, {USA}},
  pages     = {2055--2060},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ICRA.2012.6225232},
  doi       = {10.1109/ICRA.2012.6225232},
  timestamp = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/AuQS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/AuFVJS12,
  author    = {Tsz{-}Chiu Au and Chien{-}Liang Fok and Sriram Vishwanath and Christine Julien and Peter Stone},
  title     = {Evasion planning for autonomous vehicles at intersections},
  booktitle = {2012 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2012, Vilamoura, Algarve, Portugal, October 7-12, 2012},
  pages     = {1541--1546},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/IROS.2012.6385936},
  doi       = {10.1109/IROS.2012.6385936},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/iros/AuFVJS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% RoboCup in title is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/iros/VelosoS12,
  author    = {Manuela M. Veloso and Peter Stone},
  title     = {Video: {RoboCup} robot soccer history 1997 - 2011},
  booktitle = {2012 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2012, Vilamoura, Algarve, Portugal, October 7-12, 2012},
  pages     = {5452--5453},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/IROS.2012.6386302},
  doi       = {10.1109/IROS.2012.6386302},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iros/VelosoS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/itsc/CarlinoDKS12,
  author    = {Dustin Carlino and Mike Depinet and Piyush Khandelwal and Peter Stone},
  title     = {Approximately Orchestrated Routing and Transportation Analyzer: Large-scale traffic simulation for autonomous vehicles},
  booktitle = {15th International {IEEE} Conference on Intelligent Transportation Systems, {ITSC} 2012, Anchorage, AK, USA, September 16-19, 2012},
  pages     = {334--339},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ITSC.2012.6338701},
  doi       = {10.1109/ITSC.2012.6338701},
  timestamp = {Wed, 16 Oct 2019 14:14:57 +0200},
  biburl    = {https://dblp.org/rec/conf/itsc/CarlinoDKS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ro-man/KnoxS12,
  author    = {W. Bradley Knox and Peter Stone},
  title     = {Reinforcement learning from human reward: Discounting in episodic tasks},
  booktitle = {The 21st {IEEE} International Symposium on Robot and Human Interactive Communication, {IEEE} {RO-MAN} 2012, Paris, France, September 9-13, 2012},
  pages     = {878--885},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ROMAN.2012.6343862},
  doi       = {10.1109/ROMAN.2012.6343862},
  timestamp = {Wed, 16 Oct 2019 14:14:50 +0200},
  biburl    = {https://dblp.org/rec/conf/ro-man/KnoxS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Team name in title is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/robocup/BarrettGHHKMS12,
  author    = {Samuel Barrett and Katie Long Genter and Yuchen He and Todd Hester and Piyush Khandelwal and Jacob Menashe and Peter Stone},
  editor    = {Xiaoping Chen and Peter Stone and Luis Enrique Sucar and Tijn van der Zant},
  title     = {{UT} {Austin} {Villa} 2012: Standard Platform League World Champions},
  booktitle = {RoboCup 2012: Robot Soccer World Cup {XVI} [papers from the 16th Annual RoboCup International Symposium, Mexico City, Mexico, June 18-24, 2012]},
  series    = {Lecture Notes in Computer Science},
  volume    = {7500},
  pages     = {36--47},
  publisher = {Springer},
  year      = {2012},
  url       = {https://doi.org/10.1007/978-3-642-39250-4\_4},
  doi       = {10.1007/978-3-642-39250-4\_4},
  timestamp = {Wed, 28 Jul 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/BarrettGHHKMS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Team name, RoboCup and 3D in title are brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/robocup/MacAlpineCLS12,
  author    = {Patrick MacAlpine and Nick Collins and Adrian Lopez{-}Mobilia and Peter Stone},
  editor    = {Xiaoping Chen and Peter Stone and Luis Enrique Sucar and Tijn van der Zant},
  title     = {{UT} {Austin} {Villa}: {RoboCup} 2012 {3D} Simulation League Champion},
  booktitle = {RoboCup 2012: Robot Soccer World Cup {XVI} [papers from the 16th Annual RoboCup International Symposium, Mexico City, Mexico, June 18-24, 2012]},
  series    = {Lecture Notes in Computer Science},
  volume    = {7500},
  pages     = {77--88},
  publisher = {Springer},
  year      = {2012},
  url       = {https://doi.org/10.1007/978-3-642-39250-4\_8},
  doi       = {10.1007/978-3-642-39250-4\_8},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/MacAlpineCLS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/MacAlpineBS12,
  author    = {Patrick MacAlpine and Francisco Barrera and Peter Stone},
  editor    = {Xiaoping Chen and Peter Stone and Luis Enrique Sucar and Tijn van der Zant},
  title     = {Positioning to Win: {A} Dynamic Role Assignment and Formation Positioning System},
  booktitle = {RoboCup 2012: Robot Soccer World Cup {XVI} [papers from the 16th Annual RoboCup International Symposium, Mexico City, Mexico, June 18-24, 2012]},
  series    = {Lecture Notes in Computer Science},
  volume    = {7500},
  pages     = {190--201},
  publisher = {Springer},
  year      = {2012},
  url       = {https://doi.org/10.1007/978-3-642-39250-4\_18},
  doi       = {10.1007/978-3-642-39250-4\_18},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/MacAlpineBS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:books/sp/12/HesterS12,
  author    = {Todd Hester and Peter Stone},
  editor    = {Marco A. Wiering and Martijn van Otterlo},
  title     = {Learning and Using Models},
  booktitle = {Reinforcement Learning},
  series    = {Adaptation, Learning, and Optimization},
  volume    = {12},
  pages     = {111--141},
  publisher = {Springer},
  year      = {2012},
  url       = {https://doi.org/10.1007/978-3-642-27645-3\_4},
  doi       = {10.1007/978-3-642-27645-3\_4},
  timestamp = {Tue, 29 Dec 2020 18:14:51 +0100},
  biburl    = {https://dblp.org/rec/books/sp/12/HesterS12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1201-6583,
  author     = {Tobias Jung and Daniel Polani and Peter Stone},
  title      = {Empowerment for Continuous Agent-Environment Systems},
  journal    = {CoRR},
  volume     = {abs/1201.6583},
  year       = {2012},
  url        = {http://arxiv.org/abs/1201.6583},
  eprinttype = {arXiv},
  eprint     = {1201.6583},
  timestamp  = {Fri, 19 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1201-6583.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Gaussian and RMAX-like in title are brace-protected so sentence-casing styles keep their capitalisation.
@article{DBLP:journals/corr/abs-1201-6604,
  author     = {Tobias Jung and Peter Stone},
  title      = {{Gaussian} Processes for Sample Efficient Reinforcement Learning with {RMAX-like} Exploration},
  journal    = {CoRR},
  volume     = {abs/1201.6604},
  year       = {2012},
  url        = {http://arxiv.org/abs/1201.6604},
  eprinttype = {arXiv},
  eprint     = {1201.6604},
  timestamp  = {Fri, 19 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1201-6604.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Bayesian in title is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-1201-6615,
  author     = {Tobias Jung and Peter Stone},
  title      = {Feature Selection for Value Function Approximation Using {Bayesian} Model Selection},
  journal    = {CoRR},
  volume     = {abs/1201.6615},
  year       = {2012},
  url        = {http://arxiv.org/abs/1201.6615},
  eprinttype = {arXiv},
  eprint     = {1201.6615},
  timestamp  = {Fri, 19 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1201-6615.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/adb/JungPS11,
  author    = {Tobias Jung and Daniel Polani and Peter Stone},
  title     = {Empowerment for continuous agent - environment systems},
  journal   = {Adapt. Behav.},
  volume    = {19},
  number    = {1},
  pages     = {16--39},
  year      = {2011},
  url       = {https://doi.org/10.1177/1059712310392389},
  doi       = {10.1177/1059712310392389},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/adb/JungPS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aim/TaylorS11,
  author    = {Matthew E. Taylor and Peter Stone},
  title     = {An Introduction to Intertask Transfer for Reinforcement Learning},
  journal   = {{AI} Mag.},
  volume    = {32},
  number    = {1},
  pages     = {15--34},
  year      = {2011},
  url       = {https://doi.org/10.1609/aimag.v32i1.2329},
  doi       = {10.1609/AIMAG.V32I1.2329},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/TaylorS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/KalyanakrishnanS11,
  author    = {Shivaram Kalyanakrishnan and Peter Stone},
  title     = {Characterizing reinforcement learning methods through parameterized learning problems},
  journal   = {Mach. Learn.},
  volume    = {84},
  number    = {1-2},
  pages     = {205--247},
  year      = {2011},
  url       = {https://doi.org/10.1007/s10994-011-5251-x},
  doi       = {10.1007/S10994-011-5251-X},
  timestamp = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ml/KalyanakrishnanS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigecom/PardoeS11,
  author    = {David Pardoe and Peter Stone},
  title     = {Designing adaptive trading agents},
  journal   = {SIGecom Exch.},
  volume    = {10},
  number    = {2},
  pages     = {37--39},
  year      = {2011},
  url       = {https://doi.org/10.1145/1998549.1998557},
  doi       = {10.1145/1998549.1998557},
  timestamp = {Thu, 04 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/sigecom/PardoeS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/AgmonS11,
  author    = {Noa Agmon and Peter Stone},
  title     = {Leading Multiple Ad Hoc Teammates in Joint Action Settings},
  booktitle = {Interactive Decision Theory and Game Theory, Papers from the 2011 {AAAI} Workshop, San Francisco, California, USA, August 8, 2011},
  series    = {{AAAI} Technical Report},
  volume    = {{WS-11-13}},
  publisher = {{AAAI}},
  year      = {2011},
  url       = {http://www.aaai.org/ocs/index.php/WS/AAAIW11/paper/view/3805},
  timestamp = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/AgmonS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/LinKABS11,
  author    = {Raz Lin and Sarit Kraus and Noa Agmon and Samuel Barrett and Peter Stone},
  editor    = {Wolfram Burgard and Dan Roth},
  title     = {Comparing Agents' Success against People in Security Domains},
  booktitle = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages     = {809--814},
  publisher = {{AAAI} Press},
  year      = {2011},
  url       = {https://doi.org/10.1609/aaai.v25i1.7940},
  doi       = {10.1609/AAAI.V25I1.7940},
  timestamp = {Mon, 04 Sep 2023 16:05:54 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/LinKABS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/AgmonUS11,
  author    = {Noa Agmon and Daniel Urieli and Peter Stone},
  editor    = {Wolfram Burgard and Dan Roth},
  title     = {Multiagent Patrol Generalized to Complex Environmental Conditions},
  booktitle = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages     = {1090--1095},
  publisher = {{AAAI} Press},
  year      = {2011},
  url       = {https://doi.org/10.1609/aaai.v25i1.7988},
  doi       = {10.1609/AAAI.V25I1.7988},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/AgmonUS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/AuSS11,
  author    = {Tsz{-}Chiu Au and Neda Shahidi and Peter Stone},
  editor    = {Wolfram Burgard and Dan Roth},
  title     = {Enforcing Liveness in Autonomous Traffic Management},
  booktitle = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages     = {1317--1322},
  publisher = {{AAAI} Press},
  year      = {2011},
  url       = {https://doi.org/10.1609/aaai.v25i1.7807},
  doi       = {10.1609/AAAI.V25I1.7807},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/AuSS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/BarrettS11,
  author    = {Samuel Barrett and Peter Stone},
  editor    = {Wolfram Burgard and Dan Roth},
  title     = {Ad Hoc Teamwork in Variations of the Pursuit Domain},
  booktitle = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages     = {1758--1759},
  publisher = {{AAAI} Press},
  year      = {2011},
  url       = {https://doi.org/10.1609/aaai.v25i1.8054},
  doi       = {10.1609/AAAI.V25I1.8054},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/BarrettS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/GenterAS11,
  author    = {Katie Long Genter and Noa Agmon and Peter Stone},
  editor    = {Wolfram Burgard and Dan Roth},
  title     = {Role-Based Ad Hoc Teamwork},
  booktitle = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages     = {1782--1783},
  publisher = {{AAAI} Press},
  year      = {2011},
  url       = {https://doi.org/10.1609/aaai.v25i1.8057},
  doi       = {10.1609/AAAI.V25I1.8057},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/GenterAS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/GenterAS11a,
  author    = {Katie Long Genter and Noa Agmon and Peter Stone},
  title     = {Role-Based Ad Hoc Teamwork},
  booktitle = {Plan, Activity, and Intent Recognition, Papers from the 2011 {AAAI} Workshop, San Francisco, California, USA, August 07, 2011},
  series    = {{AAAI} Technical Report},
  volume    = {{WS-11-16}},
  publisher = {{AAAI}},
  year      = {2011},
  url       = {http://www.aaai.org/ocs/index.php/WS/AAAIW11/paper/view/3967},
  timestamp = {Tue, 05 Sep 2023 08:59:27 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/GenterAS11a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Technical-report number is carried in series/volume, as in the other AAAI symposium and workshop entries.
@inproceedings{DBLP:conf/aaaiss/KnoxSS11,
  author    = {W. Bradley Knox and Adam Bradley Setapen and Peter Stone},
  title     = {Reinforcement Learning with Human Feedback in Mountain Car},
  booktitle = {Help Me Help You: Bridging the Gaps in Human-Agent Collaboration, Papers from the 2011 {AAAI} Spring Symposium, Stanford, California, USA, March 21-23, 2011},
  series    = {{AAAI} Technical Report},
  volume    = {{SS-11-05}},
  publisher = {{AAAI}},
  year      = {2011},
  url       = {http://www.aaai.org/ocs/index.php/SSS/SSS11/paper/view/2487},
  timestamp = {Tue, 14 Feb 2012 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aaaiss/KnoxSS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): workshop name is spelled "Interaction" in booktitle; confirm against the publisher record if exact title fidelity matters.
@inproceedings{DBLP:conf/admi/Stone11,
  author    = {Peter Stone},
  editor    = {Longbing Cao and Ana L. C. Bazzan and Andreas L. Symeonidis and Vladimir Gorodetsky and Gerhard Weiss and Philip S. Yu},
  title     = {Intersections of the Future: Using Fully Autonomous Vehicles},
  booktitle = {Agents and Data Mining Interaction - 7th International Workshop on Agents and Data Mining Interaction, {ADMI} 2011, Taipei, Taiwan, May 2-6, 2011, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {7103},
  pages     = {3},
  publisher = {Springer},
  year      = {2011},
  url       = {https://doi.org/10.1007/978-3-642-27609-5\_1},
  doi       = {10.1007/978-3-642-27609-5\_1},
  timestamp = {Tue, 08 Mar 2022 10:12:50 +0100},
  biburl    = {https://dblp.org/rec/conf/admi/Stone11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/adprl/KalyanakrishnanS11,
  author    = {Shivaram Kalyanakrishnan and Peter Stone},
  title     = {On learning with imperfect representations},
  booktitle = {2011 {IEEE} Symposium on Adaptive Dynamic Programming And Reinforcement Learning, {ADPRL} 2011, Paris, France, April 12-14, 2011},
  pages     = {17--24},
  publisher = {{IEEE}},
  year      = {2011},
  url       = {https://doi.org/10.1109/ADPRL.2011.5967379},
  doi       = {10.1109/ADPRL.2011.5967379},
  timestamp = {Wed, 16 Oct 2019 14:14:48 +0200},
  biburl    = {https://dblp.org/rec/conf/adprl/KalyanakrishnanS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/adprl/WhitesonTTS11,
  author    = {Shimon Whiteson and Brian Tanner and Matthew E. Taylor and Peter Stone},
  title     = {Protecting against evaluation overfitting in empirical reinforcement learning},
  booktitle = {2011 {IEEE} Symposium on Adaptive Dynamic Programming And Reinforcement Learning, {ADPRL} 2011, Paris, France, April 12-14, 2011},
  pages     = {120--127},
  publisher = {{IEEE}},
  year      = {2011},
  url       = {https://doi.org/10.1109/ADPRL.2011.5967363},
  doi       = {10.1109/ADPRL.2011.5967363},
  timestamp = {Thu, 15 Jun 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/adprl/WhitesonTTS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/ScerriKVMSTDFCDK11,
  author    = {Paul Scerri and Balajee Kannan and Prasanna Velagapudi and Kate Macarthur and Peter Stone and Matthew E. Taylor and John Dolan and Alessandro Farinelli and Archie C. Chapman and Bernadine Dias and George Kantor},
  editor    = {Francien Dechesne and Hiromitsu Hattori and Adriaan ter Mors and Jose M. Such and Danny Weyns and Frank Dignum},
  title     = {Flood Disaster Mitigation: {A} Real-World Challenge Problem for Multi-agent Unmanned Surface Vehicles},
  booktitle = {Advanced Agent Technology - {AAMAS} 2011 Workshops, AMPLE, AOSE, ARMS, DOCM3AS, ITMAS, Taipei, Taiwan, May 2-6, 2011. Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {7068},
  pages     = {252--269},
  publisher = {Springer},
  year      = {2011},
  url       = {https://doi.org/10.1007/978-3-642-27216-5\_16},
  doi       = {10.1007/978-3-642-27216-5\_16},
  timestamp = {Mon, 15 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/ScerriKVMSTDFCDK11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% url holds only the stable ACM citation id (no per-session CFID/CFTOKEN query parameters).
@inproceedings{DBLP:conf/atal/BarrettSK11,
  author    = {Samuel Barrett and Peter Stone and Sarit Kraus},
  editor    = {Liz Sonenberg and Peter Stone and Kagan Tumer and Pinar Yolum},
  title     = {Empirical evaluation of ad hoc teamwork in the pursuit domain},
  booktitle = {10th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages     = {567--574},
  publisher = {{IFAAMAS}},
  year      = {2011},
  url       = {http://dl.acm.org/citation.cfm?id=2031698},
  timestamp = {Fri, 18 Nov 2011 09:09:28 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/BarrettSK11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% url holds only the stable ACM citation id (no per-session CFID/CFTOKEN query parameters).
% 3D in title is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/atal/UrieliMKBS11,
  author    = {Daniel Urieli and Patrick MacAlpine and Shivaram Kalyanakrishnan and Yinon Bentor and Peter Stone},
  editor    = {Liz Sonenberg and Peter Stone and Kagan Tumer and Pinar Yolum},
  title     = {On optimizing interdependent skills: a case study in simulated {3D} humanoid robot soccer},
  booktitle = {10th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages     = {769--776},
  publisher = {{IFAAMAS}},
  year      = {2011},
  url       = {http://dl.acm.org/citation.cfm?id=2031727},
  timestamp = {Fri, 18 Nov 2011 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/UrieliMKBS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% url holds only the stable ACM citation id (no per-session CFID/CFTOKEN query parameters).
@inproceedings{DBLP:conf/atal/PardoeS11,
  author    = {David Pardoe and Peter Stone},
  editor    = {Liz Sonenberg and Peter Stone and Kagan Tumer and Pinar Yolum},
  title     = {A particle filter for bid estimation in ad auctions with periodic ranking observations},
  booktitle = {10th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages     = {887--894},
  publisher = {{IFAAMAS}},
  year      = {2011},
  url       = {http://dl.acm.org/citation.cfm?id=2031744},
  timestamp = {Fri, 18 Nov 2011 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/PardoeS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% url holds only the stable ACM citation id (no per-session CFID/CFTOKEN query parameters).
@inproceedings{DBLP:conf/atal/AgmonUS11,
  author    = {Noa Agmon and Daniel Urieli and Peter Stone},
  editor    = {Liz Sonenberg and Peter Stone and Kagan Tumer and Pinar Yolum},
  title     = {Ship patrol: multiagent patrol under complex environmental conditions},
  booktitle = {10th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages     = {1103--1104},
  publisher = {{IFAAMAS}},
  year      = {2011},
  url       = {http://dl.acm.org/citation.cfm?id=2034439},
  timestamp = {Fri, 18 Nov 2011 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/AgmonUS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/ShahidiAS11,
  author    = {Neda Shahidi and Tsz{-}Chiu Au and Peter Stone},
  editor    = {Liz Sonenberg and Peter Stone and Kagan Tumer and Pinar Yolum},
  title     = {Batch reservations in autonomous intersection management},
  booktitle = {10th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3},
  pages     = {1225--1226},
  publisher = {{IFAAMAS}},
  year      = {2011},
  url       = {https://dl.acm.org/citation.cfm?id=2034498},
  timestamp = {Fri, 18 Nov 2011 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/ShahidiAS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ewrl/Stone11, author = {Peter Stone}, editor = {Scott Sanner and Marcus Hutter}, title = {Invited Talk: {PRISM} - Practical {RL:} Representation, Interaction, Synthesis, and Mortality}, booktitle = {Recent Advances in Reinforcement Learning - 9th European Workshop, {EWRL} 2011, Athens, Greece, September 9-11, 2011, Revised Selected Papers}, series = {Lecture Notes in Computer Science}, volume = {7188}, pages = {3}, publisher = {Springer}, year = {2011}, url = {https://doi.org/10.1007/978-3-642-29946-9\_3}, doi = {10.1007/978-3-642-29946-9\_3}, timestamp = {Tue, 14 May 2019 10:00:48 +0200}, biburl = {https://dblp.org/rec/conf/ewrl/Stone11.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/icml/ChakrabortyS11, author = {Doran Chakraborty and Peter Stone}, editor = {Lise Getoor and Tobias Scheffer}, title = {Structure Learning in Ergodic Factored MDPs without Knowledge of the Transition Function's In-Degree}, booktitle = {Proceedings of the 28th International Conference on Machine Learning, {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011}, pages = {737--744}, publisher = {Omnipress}, year = {2011}, url = {https://icml.cc/2011/papers/418\_icmlpaper.pdf}, timestamp = {Wed, 03 Apr 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/icml/ChakrabortyS11.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/iros/HausknechtAS11, author = {Matthew J. Hausknecht and Tsz{-}Chiu Au and Peter Stone}, title = {Autonomous Intersection Management: Multi-intersection optimization}, booktitle = {2011 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, {IROS} 2011, San Francisco, CA, USA, September 25-30, 2011}, pages = {4581--4586}, publisher = {{IEEE}}, year = {2011}, url = {https://doi.org/10.1109/IROS.2011.6094668}, doi = {10.1109/IROS.2011.6094668}, timestamp = {Wed, 16 Oct 2019 14:14:51 +0200}, biburl = {https://dblp.org/rec/conf/iros/HausknechtAS11.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/itsc/HausknechtASFW11, author = {Matthew J. Hausknecht and Tsz{-}Chiu Au and Peter Stone and David Fajardo and S. Travis Waller}, title = {Dynamic lane reversal in traffic management}, booktitle = {14th International {IEEE} Conference on Intelligent Transportation Systems, {ITSC} 2011, Washington, DC, USA, October 5-7, 2011}, pages = {1929--1934}, publisher = {{IEEE}}, year = {2011}, url = {https://doi.org/10.1109/ITSC.2011.6082932}, doi = {10.1109/ITSC.2011.6082932}, timestamp = {Wed, 16 Oct 2019 14:14:57 +0200}, biburl = {https://dblp.org/rec/conf/itsc/HausknechtASFW11.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/robocup/BaiCMUBS11, author = {Aijun Bai and Xiaoping Chen and Patrick MacAlpine and Daniel Urieli and Samuel Barrett and Peter Stone}, editor = {Thomas R{\"{o}}fer and Norbert Michael Mayer and Jesus Savage and Uluc Saranli}, title = {WrightEagle and {UT} Austin Villa: RoboCup 2011 Simulation League Champions}, booktitle = {RoboCup 2011: Robot Soccer World Cup {XV} [papers from the 15th Annual RoboCup International Symposium, Istanbul, Turkey, July 2011]}, series = {Lecture Notes in Computer Science}, volume = {7416}, pages = {1--12}, publisher = {Springer}, year = {2011}, url = {https://doi.org/10.1007/978-3-642-32060-6\_1}, doi = {10.1007/978-3-642-32060-6\_1}, timestamp = {Tue, 20 Aug 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/robocup/BaiCMUBS11.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/robocup/KhandelwalS11, author = {Piyush Khandelwal and Peter Stone}, editor = {Thomas R{\"{o}}fer and Norbert Michael Mayer and Jesus Savage and Uluc Saranli}, title = {A Low Cost Ground Truth Detection System for RoboCup Using the Kinect}, booktitle = {RoboCup 2011: Robot Soccer World Cup {XV} [papers from the 15th Annual RoboCup International Symposium, Istanbul, Turkey, July 2011]}, series = {Lecture Notes in Computer Science}, volume = {7416}, pages = {515--527}, publisher = {Springer}, year = {2011}, url = {https://doi.org/10.1007/978-3-642-32060-6\_44}, doi = {10.1007/978-3-642-32060-6\_44}, timestamp = {Tue, 20 Aug 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/robocup/KhandelwalS11.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@proceedings{DBLP:conf/atal/2011, editor = {Liz Sonenberg and Peter Stone and Kagan Tumer and Pinar Yolum}, title = {10th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2011), Taipei, Taiwan, May 2-6, 2011, Volume 1-3}, publisher = {{IFAAMAS}}, year = {2011}, isbn = {978-0-9826571-5-7}, timestamp = {Fri, 18 Nov 2011 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/atal/2011.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@article{DBLP:journals/corr/abs-1105-1749, author = {Todd Hester and Michael J. Quinlan and Peter Stone}, title = {A Real-Time Model-Based Reinforcement Learning Architecture for Robot Control}, journal = {CoRR}, volume = {abs/1105.1749}, year = {2011}, url = {http://arxiv.org/abs/1105.1749}, eprinttype = {arXiv}, eprint = {1105.1749}, timestamp = {Wed, 25 Aug 2021 01:00:00 +0200}, biburl = {https://dblp.org/rec/journals/corr/abs-1105-1749.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@article{DBLP:journals/corr/abs-1106-0678, author = {Michael J. Kearns and Michael L. Littman and Satinder Singh and Peter Stone}, title = {ATTac-2000: An Adaptive Autonomous Bidding Agent}, journal = {CoRR}, volume = {abs/1106.0678}, year = {2011}, url = {http://arxiv.org/abs/1106.0678}, eprinttype = {arXiv}, eprint = {1106.0678}, timestamp = {Tue, 19 Apr 2022 01:00:00 +0200}, biburl = {https://dblp.org/rec/journals/corr/abs-1106-0678.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@article{DBLP:journals/corr/abs-1106-5270, author = {J{\'{a}}nos A. Csirik and Michael L. Littman and David A. McAllester and Robert E. Schapire and Peter Stone}, title = {Decision-Theoretic Bidding Based on Learned Density Models in Simultaneous, Interacting Auctions}, journal = {CoRR}, volume = {abs/1106.5270}, year = {2011}, url = {http://arxiv.org/abs/1106.5270}, eprinttype = {arXiv}, eprint = {1106.5270}, timestamp = {Mon, 13 Aug 2018 01:00:00 +0200}, biburl = {https://dblp.org/rec/journals/corr/abs-1106-5270.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@article{DBLP:journals/aamas/WhitesonTS10, author = {Shimon Whiteson and Matthew E. Taylor and Peter Stone}, title = {Critical factors in the empirical performance of temporal difference and evolutionary methods for reinforcement learning}, journal = {Auton. Agents Multi Agent Syst.}, volume = {21}, number = {1}, pages = {1--35}, year = {2010}, url = {https://doi.org/10.1007/s10458-009-9100-2}, doi = {10.1007/S10458-009-9100-2}, timestamp = {Fri, 13 Mar 2020 00:00:00 +0100}, biburl = {https://dblp.org/rec/journals/aamas/WhitesonTS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@article{DBLP:journals/ijauc/WildstromSW10, author = {Jonathan Wildstrom and Peter Stone and Emmett Witchel}, title = {Autonomous return on investment analysis of additional processing resources}, journal = {Int. J. Auton. Comput.}, volume = {1}, number = {3}, pages = {280--296}, year = {2010}, url = {https://doi.org/10.1504/IJAC.2010.033010}, doi = {10.1504/IJAC.2010.033010}, timestamp = {Thu, 18 Jun 2020 01:00:00 +0200}, biburl = {https://dblp.org/rec/journals/ijauc/WildstromSW10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@article{DBLP:journals/informs/PardoeSSKT10, author = {David Pardoe and Peter Stone and Maytal Saar{-}Tsechansky and Tayfun Keskin and Kerem Tomak}, title = {Adaptive Auction Mechanism Design and the Incorporation of Prior Knowledge}, journal = {{INFORMS} J. Comput.}, volume = {22}, number = {3}, pages = {353--370}, year = {2010}, url = {https://doi.org/10.1287/ijoc.1090.0353}, doi = {10.1287/IJOC.1090.0353}, timestamp = {Sun, 15 Mar 2020 00:00:00 +0100}, biburl = {https://dblp.org/rec/journals/informs/PardoeSSKT10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/aaai/AuS10, author = {Tsz{-}Chiu Au and Peter Stone}, title = {Motion Planning Algorithms for Autonomous Intersection Management}, booktitle = {Bridging the Gap Between Task and Motion Planning, Papers from the 2010 {AAAI} Workshop, Atlanta, Georgia, USA, July 11, 2010}, series = {{AAAI} Technical Report}, volume = {{WS-10-01}}, publisher = {{AAAI}}, year = {2010}, url = {http://aaai.org/ocs/index.php/WS/AAAIW10/paper/view/2053}, timestamp = {Tue, 05 Sep 2023 08:59:27 +0200}, biburl = {https://dblp.org/rec/conf/aaai/AuS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/aaai/StoneKKR10, author = {Peter Stone and Gal A. Kaminka and Sarit Kraus and Jeffrey S. Rosenschein}, editor = {Maria Fox and David Poole}, title = {Ad Hoc Autonomous Agent Teams: Collaboration without Pre-Coordination}, booktitle = {Proceedings of the Twenty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI} 2010, Atlanta, Georgia, USA, July 11-15, 2010}, pages = {1504--1509}, publisher = {{AAAI} Press}, year = {2010}, url = {https://doi.org/10.1609/aaai.v24i1.7529}, doi = {10.1609/AAAI.V24I1.7529}, timestamp = {Mon, 04 Sep 2023 16:23:45 +0200}, biburl = {https://dblp.org/rec/conf/aaai/StoneKKR10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/KnoxS10, author = {W. Bradley Knox and Peter Stone}, editor = {Wiebe van der Hoek and Gal A. Kaminka and Yves Lesp{\'{e}}rance and Michael Luck and Sandip Sen}, title = {Combining manual feedback with subsequent {MDP} reward signals for reinforcement learning}, booktitle = {9th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3}, pages = {5--12}, publisher = {{IFAAMAS}}, year = {2010}, url = {https://dl.acm.org/citation.cfm?id=1838208}, timestamp = {Fri, 30 Nov 2018 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/atal/KnoxS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/StoneK10, author = {Peter Stone and Sarit Kraus}, editor = {Wiebe van der Hoek and Gal A. Kaminka and Yves Lesp{\'{e}}rance and Michael Luck and Sandip Sen}, title = {To teach or not to teach?: decision making under uncertainty in ad hoc teams}, booktitle = {9th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3}, pages = {117--124}, publisher = {{IFAAMAS}}, year = {2010}, url = {https://dl.acm.org/citation.cfm?id=1838223}, timestamp = {Fri, 30 Nov 2018 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/atal/StoneK10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/PardoeCS10, author = {David Pardoe and Doran Chakraborty and Peter Stone}, editor = {Wiebe van der Hoek and Gal A. Kaminka and Yves Lesp{\'{e}}rance and Michael Luck and Sandip Sen}, title = {TacTex09: a champion bidding agent for ad auctions}, booktitle = {9th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3}, pages = {1273--1280}, publisher = {{IFAAMAS}}, year = {2010}, url = {https://dl.acm.org/citation.cfm?id=1838372}, timestamp = {Fri, 30 Nov 2018 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/atal/PardoeCS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/SetapenQS10, author = {Adam Setapen and Michael J. Quinlan and Peter Stone}, editor = {Wiebe van der Hoek and Gal A. Kaminka and Yves Lesp{\'{e}}rance and Michael Luck and Sandip Sen}, title = {MARIOnET: motion acquisition for robots through iterative online evaluative training}, booktitle = {9th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3}, pages = {1435--1436}, publisher = {{IFAAMAS}}, year = {2010}, url = {https://dl.acm.org/citation.cfm?id=1838419}, timestamp = {Wed, 25 Aug 2021 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/atal/SetapenQS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/ChakrabortyS10, author = {Doran Chakraborty and Peter Stone}, editor = {Wiebe van der Hoek and Gal A. Kaminka and Yves Lesp{\'{e}}rance and Michael Luck and Sandip Sen}, title = {Online model learning in adversarial Markov decision processes}, booktitle = {9th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3}, pages = {1583--1584}, publisher = {{IFAAMAS}}, year = {2010}, url = {https://dl.acm.org/citation.cfm?id=1838492}, timestamp = {Fri, 30 Nov 2018 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/atal/ChakrabortyS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/KnoxS10a, author = {W. Bradley Knox and Peter Stone}, editor = {Wiebe van der Hoek and Gal A. Kaminka and Yves Lesp{\'{e}}rance and Michael Luck and Sandip Sen}, title = {Training a Tetris agent via interactive shaping: a demonstration of the {TAMER} framework}, booktitle = {9th International Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2010), Toronto, Canada, May 10-14, 2010, Volume 1-3}, pages = {1767--1768}, publisher = {{IFAAMAS}}, year = {2010}, url = {https://dl.acm.org/citation.cfm?id=1838541}, timestamp = {Fri, 30 Nov 2018 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/atal/KnoxS10a.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/icdl/HesterS10, author = {Todd Hester and Peter Stone}, editor = {Benjamin Kuipers and Thomas R. Shultz and Alexander Stoytchev and Chen Yu}, title = {Real time targeted exploration in large domains}, booktitle = {2010 {IEEE} 9th International Conference on Development and Learning, {ICDL} 2010, Ann Arbor, MI, USA, August 18-21, 2010}, pages = {191--196}, publisher = {{IEEE}}, year = {2010}, url = {https://doi.org/10.1109/DEVLRN.2010.5578845}, doi = {10.1109/DEVLRN.2010.5578845}, timestamp = {Thu, 29 Jul 2021 12:02:58 +0200}, biburl = {https://dblp.org/rec/conf/icdl/HesterS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/icml/ChakrabortyS10, author = {Doran Chakraborty and Peter Stone}, editor = {Johannes F{\"{u}}rnkranz and Thorsten Joachims}, title = {Convergence, Targeted Optimality, and Safety in Multiagent Learning}, booktitle = {Proceedings of the 27th International Conference on Machine Learning (ICML-10), June 21-24, 2010, Haifa, Israel}, pages = {191--198}, publisher = {Omnipress}, year = {2010}, url = {https://icml.cc/Conferences/2010/papers/453.pdf}, timestamp = {Wed, 03 Apr 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/icml/ChakrabortyS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/icml/KalyanakrishnanS10, author = {Shivaram Kalyanakrishnan and Peter Stone}, editor = {Johannes F{\"{u}}rnkranz and Thorsten Joachims}, title = {Efficient Selection of Multiple Bandit Arms: Theory and Practice}, booktitle = {Proceedings of the 27th International Conference on Machine Learning (ICML-10), June 21-24, 2010, Haifa, Israel}, pages = {511--518}, publisher = {Omnipress}, year = {2010}, url = {https://icml.cc/Conferences/2010/papers/410.pdf}, timestamp = {Wed, 03 Apr 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/icml/KalyanakrishnanS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/icml/PardoeS10, author = {David Pardoe and Peter Stone}, editor = {Johannes F{\"{u}}rnkranz and Thorsten Joachims}, title = {Boosting for Regression Transfer}, booktitle = {Proceedings of the 27th International Conference on Machine Learning (ICML-10), June 21-24, 2010, Haifa, Israel}, pages = {863--870}, publisher = {Omnipress}, year = {2010}, url = {https://icml.cc/Conferences/2010/papers/330.pdf}, timestamp = {Wed, 03 Apr 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/icml/PardoeS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/icra/HesterQS10, author = {Todd Hester and Michael J. Quinlan and Peter Stone}, title = {Generalized model learning for Reinforcement Learning on a humanoid robot}, booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2010, Anchorage, Alaska, USA, 3-7 May 2010}, pages = {2369--2374}, publisher = {{IEEE}}, year = {2010}, url = {https://doi.org/10.1109/ROBOT.2010.5509181}, doi = {10.1109/ROBOT.2010.5509181}, timestamp = {Wed, 25 Aug 2021 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/icra/HesterQS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/iros/QuinlanAZSS10, author = {Michael J. Quinlan and Tsz{-}Chiu Au and Jesse Zhu and Nicolae Stiurca and Peter Stone}, title = {Bringing simulation to life: {A} mixed reality autonomous intersection}, booktitle = {2010 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 18-22, 2010, Taipei, Taiwan}, pages = {6083--6088}, publisher = {{IEEE}}, year = {2010}, url = {https://doi.org/10.1109/IROS.2010.5651993}, doi = {10.1109/IROS.2010.5651993}, timestamp = {Thu, 14 Oct 2021 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/iros/QuinlanAZSS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/pkdd/JungS10, author = {Tobias Jung and Peter Stone}, editor = {Jos{\'{e}} L. Balc{\'{a}}zar and Francesco Bonchi and Aristides Gionis and Mich{\`{e}}le Sebag}, title = {Gaussian Processes for Sample Efficient Reinforcement Learning with RMAX-Like Exploration}, booktitle = {Machine Learning and Knowledge Discovery in Databases, European Conference, {ECML} {PKDD} 2010, Barcelona, Spain, September 20-24, 2010, Proceedings, Part {I}}, series = {Lecture Notes in Computer Science}, volume = {6321}, pages = {601--616}, publisher = {Springer}, year = {2010}, url = {https://doi.org/10.1007/978-3-642-15880-3\_44}, doi = {10.1007/978-3-642-15880-3\_44}, timestamp = {Fri, 19 Jul 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/pkdd/JungS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/robocup/HausknechtS10, author = {Matthew J. Hausknecht and Peter Stone}, editor = {Javier Ruiz{-}del{-}Solar and Eric Chown and Paul{-}Gerhard Pl{\"{o}}ger}, title = {Learning Powerful Kicks on the Aibo {ERS-7:} The Quest for a Striker}, booktitle = {RoboCup 2010: Robot Soccer World Cup {XIV} [papers from the 14th annual RoboCup International Symposium, Singapore, June 25, 2010]}, series = {Lecture Notes in Computer Science}, volume = {6556}, pages = {254--265}, publisher = {Springer}, year = {2010}, url = {https://doi.org/10.1007/978-3-642-20217-9\_22}, doi = {10.1007/978-3-642-20217-9\_22}, timestamp = {Tue, 20 Aug 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/robocup/HausknechtS10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@incollection{DBLP:books/daglib/p/NodaSYK10, author = {Itsuki Noda and Peter Stone and Tomohisa Yamashita and Koichi Kurumatani}, editor = {Hideyuki Nakashima and Hamid K. Aghajan and Juan Carlos Augusto}, title = {Multi-Agent Social Simulation}, booktitle = {Handbook of Ambient Intelligence and Smart Environments}, pages = {703--729}, publisher = {Springer}, year = {2010}, url = {https://doi.org/10.1007/978-0-387-93808-0\_26}, doi = {10.1007/978-0-387-93808-0\_26}, timestamp = {Tue, 16 May 2017 14:01:34 +0200}, biburl = {https://dblp.org/rec/books/daglib/p/NodaSYK10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@incollection{DBLP:reference/ml/Stone10, author = {Peter Stone}, editor = {Claude Sammut and Geoffrey I. Webb}, title = {Q-Learning}, booktitle = {Encyclopedia of Machine Learning}, pages = {819}, publisher = {Springer}, year = {2010}, url = {https://doi.org/10.1007/978-0-387-30164-8\_683}, doi = {10.1007/978-0-387-30164-8\_683}, timestamp = {Wed, 14 Nov 2018 10:51:34 +0100}, biburl = {https://dblp.org/rec/reference/ml/Stone10.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@incollection{DBLP:reference/ml/Stone10a, author = {Peter Stone}, editor = {Claude Sammut and Geoffrey I. Webb}, title = {Reinforcement Learning}, booktitle = {Encyclopedia of Machine Learning}, pages = {849--851}, publisher = {Springer}, year = {2010}, url = {https://doi.org/10.1007/978-0-387-30164-8\_714}, doi = {10.1007/978-0-387-30164-8\_714}, timestamp = {Wed, 12 Jul 2017 01:00:00 +0200}, biburl = {https://dblp.org/rec/reference/ml/Stone10a.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@article{DBLP:journals/jmlr/TaylorS09, author = {Matthew E. Taylor and Peter Stone}, title = {Transfer Learning for Reinforcement Learning Domains: {A} Survey}, journal = {J. Mach. Learn. Res.}, volume = {10}, pages = {1633--1685}, year = {2009}, url = {https://dl.acm.org/doi/10.5555/1577069.1755839}, doi = {10.5555/1577069.1755839}, timestamp = {Thu, 02 Jun 2022 01:00:00 +0200}, biburl = {https://dblp.org/rec/journals/jmlr/TaylorS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@article{DBLP:journals/ras/SridharanS09, author = {Mohan Sridharan and Peter Stone}, title = {Color learning and illumination invariance on mobile robots: {A} survey}, journal = {Robotics Auton. Syst.}, volume = {57}, number = {6-7}, pages = {629--644}, year = {2009}, url = {https://doi.org/10.1016/j.robot.2009.01.004}, doi = {10.1016/J.ROBOT.2009.01.004}, timestamp = {Mon, 24 Feb 2020 00:00:00 +0100}, biburl = {https://dblp.org/rec/journals/ras/SridharanS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/aaaiss/FaselQS09, author = {Ian R. Fasel and Michael J. Quinlan and Peter Stone}, title = {A Task Specification Language for Bootstrap Learning}, booktitle = {Agents that Learn from Human Teachers, Papers from the 2009 {AAAI} Spring Symposium, Technical Report SS-09-01, Stanford, California, USA, March 23-25, 2009}, pages = {48--55}, publisher = {{AAAI}}, year = {2009}, url = {http://www.aaai.org/Library/Symposia/Spring/2009/ss09-01-008.php}, timestamp = {Wed, 25 Aug 2021 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/aaaiss/FaselQS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/aaaiss/KnoxFS09, author = {W. Bradley Knox and Ian R. Fasel and Peter Stone}, title = {Design Principles for Creating Human-Shapable Agents}, booktitle = {Agents that Learn from Human Teachers, Papers from the 2009 {AAAI} Spring Symposium, Technical Report SS-09-01, Stanford, California, USA, March 23-25, 2009}, pages = {79--86}, publisher = {{AAAI}}, year = {2009}, url = {http://www.aaai.org/Library/Symposia/Spring/2009/ss09-01-012.php}, timestamp = {Thu, 14 Apr 2016 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/aaaiss/KnoxFS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/amec/StoneKR09, author = {Peter Stone and Gal A. Kaminka and Jeffrey S. Rosenschein}, editor = {Esther David and Enrico H. Gerding and David Sarne and Onn Shehory}, title = {Leading a Best-Response Teammate in an Ad Hoc Team}, booktitle = {Agent-Mediated Electronic Commerce. Designing Trading Strategies and Mechanisms for Electronic Markets - {AAMAS} Workshop, {AMEC} 2009, Budapest, Hungary, May 12, 2009, and {IJCAI} Workshop, {TADA} 2009, Pasadena, CA, USA, July 13, 2009, Selected and Revised Papers}, series = {Lecture Notes in Business Information Processing}, volume = {59}, pages = {132--146}, publisher = {Springer}, year = {2009}, url = {https://doi.org/10.1007/978-3-642-15117-0\_10}, doi = {10.1007/978-3-642-15117-0\_10}, timestamp = {Thu, 07 Jul 2022 17:31:33 +0200}, biburl = {https://dblp.org/rec/conf/amec/StoneKR09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/HesterS09, author = {Todd Hester and Peter Stone}, editor = {Carles Sierra and Cristiano Castelfranchi and Keith S. Decker and Jaime Sim{\~{a}}o Sichman}, title = {Generalized model learning for reinforcement learning in factored domains}, booktitle = {8th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2009), Budapest, Hungary, May 10-15, 2009, Volume 2}, pages = {717--724}, publisher = {{IFAAMAS}}, year = {2009}, url = {https://dl.acm.org/citation.cfm?id=1558111}, timestamp = {Fri, 30 Nov 2018 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/atal/HesterS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/KalyanakrishnanS09, author = {Shivaram Kalyanakrishnan and Peter Stone}, editor = {Carles Sierra and Cristiano Castelfranchi and Keith S. Decker and Jaime Sim{\~{a}}o Sichman}, title = {An empirical analysis of value function-based and policy search reinforcement learning}, booktitle = {8th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2009), Budapest, Hungary, May 10-15, 2009, Volume 2}, pages = {749--756}, publisher = {{IFAAMAS}}, year = {2009}, url = {https://dl.acm.org/citation.cfm?id=1558115}, timestamp = {Fri, 30 Nov 2018 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/atal/KalyanakrishnanS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/FaselQS09, author = {Ian R. Fasel and Michael J. Quinlan and Peter Stone}, editor = {Carles Sierra and Cristiano Castelfranchi and Keith S. Decker and Jaime Sim{\~{a}}o Sichman}, title = {A task specification language for bootstrap learning}, booktitle = {8th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2009), Budapest, Hungary, May 10-15, 2009, Volume 2}, pages = {1169--1170}, publisher = {{IFAAMAS}}, year = {2009}, url = {https://dl.acm.org/citation.cfm?id=1558195}, timestamp = {Wed, 25 Aug 2021 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/atal/FaselQS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/atal/KalyanakrishnanS09a, author = {Shivaram Kalyanakrishnan and Peter Stone}, editor = {Carles Sierra and Cristiano Castelfranchi and Keith S. Decker and Jaime Sim{\~{a}}o Sichman}, title = {Learning complementary multiagent behaviors: a case study}, booktitle = {8th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2009), Budapest, Hungary, May 10-15, 2009, Volume 2}, pages = {1359--1360}, publisher = {{IFAAMAS}}, year = {2009}, url = {https://dl.acm.org/citation.cfm?id=1558293}, timestamp = {Fri, 30 Nov 2018 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/atal/KalyanakrishnanS09a.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/iros/DjeuQS09, author = {Peter Djeu and Michael J. Quinlan and Peter Stone}, title = {Improving particle filter performance using {SSE} instructions}, booktitle = {2009 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 11-15, 2009, St. Louis, MO, {USA}}, pages = {3480--3485}, publisher = {{IEEE}}, year = {2009}, url = {https://doi.org/10.1109/IROS.2009.5354190}, doi = {10.1109/IROS.2009.5354190}, timestamp = {Wed, 25 Aug 2021 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/iros/DjeuQS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/kcap/KnoxS09, author = {W. Bradley Knox and Peter Stone}, editor = {Yolanda Gil and Natasha Fridman Noy}, title = {Interactively shaping agents via human reinforcement: the {TAMER} framework}, booktitle = {Proceedings of the 5th International Conference on Knowledge Capture {(K-CAP} 2009), September 1-4, 2009, Redondo Beach, California, {USA}}, pages = {9--16}, publisher = {{ACM}}, year = {2009}, url = {https://doi.org/10.1145/1597735.1597738}, doi = {10.1145/1597735.1597738}, timestamp = {Tue, 06 Nov 2018 00:00:00 +0100}, biburl = {https://dblp.org/rec/conf/kcap/KnoxS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/pkdd/JongS09, author = {Nicholas K. Jong and Peter Stone}, editor = {Wray L. Buntine and Marko Grobelnik and Dunja Mladenic and John Shawe{-}Taylor}, title = {Compositional Models for Reinforcement Learning}, booktitle = {Machine Learning and Knowledge Discovery in Databases, European Conference, {ECML} {PKDD} 2009, Bled, Slovenia, September 7-11, 2009, Proceedings, Part {I}}, series = {Lecture Notes in Computer Science}, volume = {5781}, pages = {644--659}, publisher = {Springer}, year = {2009}, url = {https://doi.org/10.1007/978-3-642-04180-8\_59}, doi = {10.1007/978-3-642-04180-8\_59}, timestamp = {Tue, 14 May 2019 10:00:47 +0200}, biburl = {https://dblp.org/rec/conf/pkdd/JongS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/pkdd/JungS09, author = {Tobias Jung and Peter Stone}, editor = {Wray L. Buntine and Marko Grobelnik and Dunja Mladenic and John Shawe{-}Taylor}, title = {Feature Selection for Value Function Approximation Using Bayesian Model Selection}, booktitle = {Machine Learning and Knowledge Discovery in Databases, European Conference, {ECML} {PKDD} 2009, Bled, Slovenia, September 7-11, 2009, Proceedings, Part {I}}, series = {Lecture Notes in Computer Science}, volume = {5781}, pages = {660--675}, publisher = {Springer}, year = {2009}, url = {https://doi.org/10.1007/978-3-642-04180-8\_60}, doi = {10.1007/978-3-642-04180-8\_60}, timestamp = {Fri, 19 Jul 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/pkdd/JungS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/robocup/KalyanakrishnanHQBS09, author = {Shivaram Kalyanakrishnan and Todd Hester and Michael J. Quinlan and Yinon Bentor and Peter Stone}, editor = {Jacky Baltes and Michail G. Lagoudakis and Tadashi Naruse and Saeed Shiry Ghidary}, title = {Three Humanoid Soccer Platforms: Comparison and Synthesis}, booktitle = {RoboCup 2009: Robot Soccer World Cup {XIII} [papers from the 13th annual RoboCup International Symposium, Graz, Austria, June 29 - July 5, 2009]}, series = {Lecture Notes in Computer Science}, volume = {5949}, pages = {140--152}, publisher = {Springer}, year = {2009}, url = {https://doi.org/10.1007/978-3-642-11876-0\_13}, doi = {10.1007/978-3-642-11876-0\_13}, timestamp = {Wed, 25 Aug 2021 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/robocup/KalyanakrishnanHQBS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
@inproceedings{DBLP:conf/robocup/KalyanakrishnanS09, author = {Shivaram Kalyanakrishnan and Peter Stone}, editor = {Jacky Baltes and Michail G. Lagoudakis and Tadashi Naruse and Saeed Shiry Ghidary}, title = {Learning Complementary Multiagent Behaviors: {A} Case Study}, booktitle = {RoboCup 2009: Robot Soccer World Cup {XIII} [papers from the 13th annual RoboCup International Symposium, Graz, Austria, June 29 - July 5, 2009]}, series = {Lecture Notes in Computer Science}, volume = {5949}, pages = {153--165}, publisher = {Springer}, year = {2009}, url = {https://doi.org/10.1007/978-3-642-11876-0\_14}, doi = {10.1007/978-3-642-11876-0\_14}, timestamp = {Tue, 20 Aug 2019 01:00:00 +0200}, biburl = {https://dblp.org/rec/conf/robocup/KalyanakrishnanS09.bib}, bibsource = {dblp computer science bibliography, https://dblp.org} }
% Dresner, Stone and Van Middlesworth, chapter in an IGI Global edited book (2009), pp. 193--217.
@incollection{DBLP:books/igi/09/DresnerSM09,
  author    = {Kurt M. Dresner and Peter Stone and Mark Van Middlesworth},
  editor    = {Ana L. C. Bazzan and Franziska Kl{\"{u}}gl},
  title     = {An Unmanaged Intersection Protocol and Improved Intersection Safety for Autonomous Vehicles},
  booktitle = {Multi-Agent Systems for Traffic and Transportation Engineering},
  pages     = {193--217},
  publisher = {{IGI} Global},
  year      = {2009},
  url       = {https://doi.org/10.4018/978-1-60566-226-8.ch009},
  doi       = {10.4018/978-1-60566-226-8.CH009},
  timestamp = {Mon, 16 Sep 2019 14:43:09 +0200},
  biburl    = {https://dblp.org/rec/books/igi/09/DresnerSM09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stronger and Stone, Int. J. Artif. Intell. Tools 17(1), 2008, pp. 159--174.
% The subtitle's leading article is capitalised and written as a braced single letter,
% as in the other "Title: A Subtitle" entries of this file.
@article{DBLP:journals/ijait/StrongerS08,
  author    = {Daniel Stronger and Peter Stone},
  title     = {Polynomial Regression with Automated Degree: {A} Function Approximator for Autonomous Agents},
  journal   = {Int. J. Artif. Intell. Tools},
  volume    = {17},
  number    = {1},
  pages     = {159--174},
  year      = {2008},
  url       = {https://doi.org/10.1142/S0218213008003820},
  doi       = {10.1142/S0218213008003820},
  timestamp = {Tue, 12 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijait/StrongerS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Parry, Parry, Dorji and Stone, Int. J. Heal. Inf. Syst. Informatics 3(3), 2008, pp. 1--15.
@article{DBLP:journals/ijhisi/ParryPDS08,
  author    = {David Parry and Emma Parry and Phurb Dorji and Peter Stone},
  title     = {Open Source Software: {A} Key Component of E-Health in Developing Nations},
  journal   = {Int. J. Heal. Inf. Syst. Informatics},
  volume    = {3},
  number    = {3},
  pages     = {1--15},
  year      = {2008},
  url       = {https://doi.org/10.4018/jhisi.2008070101},
  doi       = {10.4018/JHISI.2008070101},
  timestamp = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijhisi/ParryPDS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Dresner and Stone, J. Artif. Intell. Res. 31, 2008, pp. 591--656.
@article{DBLP:journals/jair/DresnerS08,
  author    = {Kurt M. Dresner and Peter Stone},
  title     = {A Multiagent Approach to Autonomous Intersection Management},
  journal   = {J. Artif. Intell. Res.},
  volume    = {31},
  pages     = {591--656},
  year      = {2008},
  url       = {https://doi.org/10.1613/jair.2502},
  doi       = {10.1613/JAIR.2502},
  timestamp = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jair/DresnerS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Wellman, Greenwald and Stone, SIGecom Exch. 7(2), 2008.
% NOTE(review): the record carries no pages field -- confirm against the publisher if page data is needed.
@article{DBLP:journals/sigecom/WellmanGS08,
  author    = {Michael P. Wellman and Amy Greenwald and Peter Stone},
  title     = {Book announcement: autonomous bidding agents},
  journal   = {SIGecom Exch.},
  volume    = {7},
  number    = {2},
  year      = {2008},
  url       = {https://doi.org/10.1145/1399589.1399591},
  doi       = {10.1145/1399589.1399591},
  timestamp = {Thu, 04 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/sigecom/WellmanGS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor, Kuhlmann and Stone, AGI 2008 (Frontiers in Artificial Intelligence and Applications 171), pp. 326--337.
% The subtitle's first word is capitalised to match the Title Case used by the rest of the title.
@inproceedings{DBLP:conf/agi/TaylorKS08,
  author    = {Matthew E. Taylor and Gregory Kuhlmann and Peter Stone},
  editor    = {Pei Wang and Ben Goertzel and Stan Franklin},
  title     = {Transfer Learning and Intelligence: An Argument and Approach},
  booktitle = {Artificial General Intelligence 2008, Proceedings of the First {AGI} Conference, {AGI} 2008, March 1-3, 2008, University of Memphis, Memphis, TN, {USA}},
  series    = {Frontiers in Artificial Intelligence and Applications},
  volume    = {171},
  pages     = {326--337},
  publisher = {{IOS} Press},
  year      = {2008},
  url       = {http://www.booksonline.iospress.nl/Content/View.aspx?piid=8319},
  timestamp = {Thu, 24 Aug 2017 11:33:04 +0200},
  biburl    = {https://dblp.org/rec/conf/agi/TaylorKS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Pardoe and Stone, AMEC/TADA 2008 revised selected papers (Lecture Notes in Business Information Processing 44), pp. 175--189.
% "USA" in booktitle is brace-protected, matching the acronym protection used elsewhere in this file.
@inproceedings{DBLP:conf/amec/PardoeS08,
  author    = {David Pardoe and Peter Stone},
  editor    = {Wolfgang Ketter and Han La Poutr{\'{e}} and Norman M. Sadeh and Onn Shehory and William E. Walsh},
  title     = {The 2007 {TAC} {SCM} Prediction Challenge},
  booktitle = {Agent-Mediated Electronic Commerce and Trading Agent Design and Analysis - {AAMAS} Workshop, {AMEC} 2008, Estoril, Portugal, May 12-16, 2008, and {AAAI} Workshop, {TADA} 2008, Chicago, IL, {USA}, July 14, 2008, Revised Selected Papers},
  series    = {Lecture Notes in Business Information Processing},
  volume    = {44},
  pages     = {175--189},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-642-15237-5\_13},
  doi       = {10.1007/978-3-642-15237-5\_13},
  timestamp = {Tue, 22 Jan 2019 08:41:34 +0100},
  biburl    = {https://dblp.org/rec/conf/amec/PardoeS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor, Kuhlmann and Stone, AAMAS 2008, Volume 1, pp. 283--290.
@inproceedings{DBLP:conf/atal/TaylorKS08,
  author    = {Matthew E. Taylor and Gregory Kuhlmann and Peter Stone},
  editor    = {Lin Padgham and David C. Parkes and J{\"{o}}rg P. M{\"{u}}ller and Simon Parsons},
  title     = {Autonomous transfer for reinforcement learning},
  booktitle = {7th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2008), Estoril, Portugal, May 12-16, 2008, Volume 1},
  pages     = {283--290},
  publisher = {{IFAAMAS}},
  year      = {2008},
  url       = {https://dl.acm.org/citation.cfm?id=1402427},
  timestamp = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/TaylorKS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Jong, Hester and Stone, AAMAS 2008, Volume 1, pp. 299--306.
@inproceedings{DBLP:conf/atal/JongHS08,
  author    = {Nicholas K. Jong and Todd Hester and Peter Stone},
  editor    = {Lin Padgham and David C. Parkes and J{\"{o}}rg P. M{\"{u}}ller and Simon Parsons},
  title     = {The utility of temporal abstraction in reinforcement learning},
  booktitle = {7th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2008), Estoril, Portugal, May 12-16, 2008, Volume 1},
  pages     = {299--306},
  publisher = {{IFAAMAS}},
  year      = {2008},
  url       = {https://dl.acm.org/citation.cfm?id=1402429},
  timestamp = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/JongHS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Dresner and Stone, AAMAS 2008, Volume 3, pp. 1393--1396.
@inproceedings{DBLP:conf/atal/DresnerS08,
  author    = {Kurt M. Dresner and Peter Stone},
  editor    = {Lin Padgham and David C. Parkes and J{\"{o}}rg P. M{\"{u}}ller and Simon Parsons},
  title     = {Mitigating catastrophic failure at intersections of autonomous vehicles},
  booktitle = {7th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2008), Estoril, Portugal, May 12-16, 2008, Volume 3},
  pages     = {1393--1396},
  publisher = {{IFAAMAS}},
  year      = {2008},
  url       = {https://dl.acm.org/citation.cfm?id=1402881},
  timestamp = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/DresnerS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Van Middlesworth, Dresner and Stone, AAMAS 2008, Volume 3, pp. 1413--1416.
@inproceedings{DBLP:conf/atal/MiddlesworthDS08,
  author    = {Mark Van Middlesworth and Kurt M. Dresner and Peter Stone},
  editor    = {Lin Padgham and David C. Parkes and J{\"{o}}rg P. M{\"{u}}ller and Simon Parsons},
  title     = {Replacing the stop sign: unmanaged intersection control for autonomous vehicles},
  booktitle = {7th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2008), Estoril, Portugal, May 12-16, 2008, Volume 3},
  pages     = {1413--1416},
  publisher = {{IFAAMAS}},
  year      = {2008},
  url       = {https://dl.acm.org/citation.cfm?id=1402886},
  timestamp = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/MiddlesworthDS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Wildstrom, Stone and Witchel, ICAC 2008, pp. 182--191.
@inproceedings{DBLP:conf/icac/WildstromSW08,
  author    = {Jonathan Wildstrom and Peter Stone and Emmett Witchel},
  editor    = {John Strassner and Simon A. Dobson and Jos{\'{e}} A. B. Fortes and Kumar K. Goswami},
  title     = {{CARVE:} {A} Cognitive Agent for Resource Value Estimation},
  booktitle = {2008 International Conference on Autonomic Computing, {ICAC} 2008, June 2-6, 2008, Chicago, Illinois, {USA}},
  pages     = {182--191},
  publisher = {{IEEE} Computer Society},
  year      = {2008},
  url       = {https://doi.org/10.1109/ICAC.2008.27},
  doi       = {10.1109/ICAC.2008.27},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icac/WildstromSW08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Reisinger, Stone and Miikkulainen, ICML 2008 (ACM International Conference Proceeding Series 307), pp. 816--823.
% "Bayesian" is brace-protected so sentence-casing styles keep its capital letter.
@inproceedings{DBLP:conf/icml/ReisingerSM08,
  author    = {Joseph Reisinger and Peter Stone and Risto Miikkulainen},
  editor    = {William W. Cohen and Andrew McCallum and Sam T. Roweis},
  title     = {Online kernel selection for {Bayesian} reinforcement learning},
  booktitle = {Machine Learning, Proceedings of the Twenty-Fifth International Conference {(ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  series    = {{ACM} International Conference Proceeding Series},
  volume    = {307},
  pages     = {816--823},
  publisher = {{ACM}},
  year      = {2008},
  url       = {https://doi.org/10.1145/1390156.1390259},
  doi       = {10.1145/1390156.1390259},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/ReisingerSM08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Knox, Lee and Stone, ICRA 2008 video contribution, pp. 1785--1786.
% Proper nouns in the title (Segway, Austin, Villa, the competition name) are brace-protected
% so sentence-casing styles do not lowercase them; spelling is left exactly as exported.
@inproceedings{DBLP:conf/icra/KnoxLS08,
  author    = {W. Bradley Knox and Juhyun Lee and Peter Stone},
  title     = {Person recognition on a {Segway} Robot: {A} video of {UT} {Austin} {Villa} {Robocup@Home} 2007 finals demonstration},
  booktitle = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA} 2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages     = {1785--1786},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {https://doi.org/10.1109/ROBOT.2008.4543466},
  doi       = {10.1109/ROBOT.2008.4543466},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/KnoxLS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stronger and Stone, ICRA 2008, pp. 2104--2109.
@inproceedings{DBLP:conf/icra/StrongerS08,
  author    = {Daniel Stronger and Peter Stone},
  title     = {Maximum likelihood estimation of sensor and action model functions on a mobile robot},
  booktitle = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA} 2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages     = {2104--2109},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {https://doi.org/10.1109/ROBOT.2008.4543517},
  doi       = {10.1109/ROBOT.2008.4543517},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/StrongerS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Lee and Stone, ICRA 2008, pp. 2577--2582.
@inproceedings{DBLP:conf/icra/LeeS08,
  author    = {Juhyun Lee and Peter Stone},
  title     = {Person tracking on a mobile robot with heterogeneous inter-characteristic feedback},
  booktitle = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA} 2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages     = {2577--2582},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {https://doi.org/10.1109/ROBOT.2008.4543601},
  doi       = {10.1109/ROBOT.2008.4543601},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/LeeS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Hester and Stone, ICRA 2008, pp. 2764--2769.
% "Monte Carlo" is brace-protected so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/icra/HesterS08,
  author    = {Todd Hester and Peter Stone},
  title     = {Negative information and line observations for {Monte Carlo} localization},
  booktitle = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA} 2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages     = {2764--2769},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {https://doi.org/10.1109/ROBOT.2008.4543629},
  doi       = {10.1109/ROBOT.2008.4543629},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/HesterS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Chakraborty and Stone, ECML/PKDD 2008, Part I (Lecture Notes in Computer Science 5211), pp. 211--226.
@inproceedings{DBLP:conf/pkdd/ChakrabortyS08,
  author    = {Doran Chakraborty and Peter Stone},
  editor    = {Walter Daelemans and Bart Goethals and Katharina Morik},
  title     = {Online Multiagent Learning against Memory Bounded Adversaries},
  booktitle = {Machine Learning and Knowledge Discovery in Databases, European Conference, {ECML/PKDD} 2008, Antwerp, Belgium, September 15-19, 2008, Proceedings, Part {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {5211},
  pages     = {211--226},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-540-87479-9\_32},
  doi       = {10.1007/978-3-540-87479-9\_32},
  timestamp = {Mon, 28 Aug 2023 21:17:29 +0200},
  biburl    = {https://dblp.org/rec/conf/pkdd/ChakrabortyS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor, Jong and Stone, ECML/PKDD 2008, Part II (Lecture Notes in Computer Science 5212), pp. 488--505.
@inproceedings{DBLP:conf/pkdd/TaylorJS08,
  author    = {Matthew E. Taylor and Nicholas K. Jong and Peter Stone},
  editor    = {Walter Daelemans and Bart Goethals and Katharina Morik},
  title     = {Transferring Instances for Model-Based Reinforcement Learning},
  booktitle = {Machine Learning and Knowledge Discovery in Databases, European Conference, {ECML/PKDD} 2008, Antwerp, Belgium, September 15-19, 2008, Proceedings, Part {II}},
  series    = {Lecture Notes in Computer Science},
  volume    = {5212},
  pages     = {488--505},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-540-87481-2\_32},
  doi       = {10.1007/978-3-540-87481-2\_32},
  timestamp = {Tue, 14 May 2019 10:00:47 +0200},
  biburl    = {https://dblp.org/rec/conf/pkdd/TaylorJS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Knox, Lee and Stone, RoboCup 2008 symposium volume (Lecture Notes in Computer Science 5399), pp. 519--531.
% "Segway" is brace-protected so sentence-casing styles keep the product name capitalised.
@inproceedings{DBLP:conf/robocup/KnoxLS08,
  author    = {W. Bradley Knox and Juhyun Lee and Peter Stone},
  editor    = {Luca Iocchi and Hitoshi Matsubara and Alfredo Weitzenfeld and Changjiu Zhou},
  title     = {Domestic Interaction on a {Segway} Base},
  booktitle = {RoboCup 2008: Robot Soccer World Cup {XII} [papers from the 12th annual RoboCup International Symposium, Suzhou, China, July 15-18, 2008]},
  series    = {Lecture Notes in Computer Science},
  volume    = {5399},
  pages     = {519--531},
  publisher = {Springer},
  year      = {2008},
  url       = {https://doi.org/10.1007/978-3-642-02921-9\_45},
  doi       = {10.1007/978-3-642-02921-9\_45},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/KnoxLS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Sridharan and Stone, VISAPP International Workshop on Robotic Perception 2008, pp. 43--52.
% The record has no url or doi field.
@inproceedings{DBLP:conf/visapp/SridharanS08a,
  author    = {Mohan Sridharan and Peter Stone},
  editor    = {Luca Iocchi and Domenico G. Sorrenti},
  title     = {Comparing Two Action Planning Approaches for Color Learning on a Mobile Robot},
  booktitle = {Proceedings of the {VISAPP} International Workshop on Robotic Perception, in conjunction with {VISIGRAPP} 2008, Funchal, Madeira, Portugal, January 2008},
  pages     = {43--52},
  publisher = {{INSTICC} - Institute for Systems and Technologies of Information, Control and Communication},
  year      = {2008},
  timestamp = {Sun, 07 Sep 2008 13:06:48 +0200},
  biburl    = {https://dblp.org/rec/conf/visapp/SridharanS08a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Sridharan and Stone, VISAPP 2008, Volume 2, pp. 682--685.
% The record has no url or doi field.
@inproceedings{DBLP:conf/visapp/SridharanS08,
  author    = {Mohan Sridharan and Peter Stone},
  editor    = {Alpesh Ranchordas and Helder Ara{\'{u}}jo},
  title     = {Long-Term vs. Greedy Action Planning for Color Learning on a Mobile Robot},
  booktitle = {{VISAPP} 2008: Proceedings of the Third International Conference on Computer Vision Theory and Applications, Funchal, Madeira, Portugal, January 22-25, 2008 - Volume 2},
  pages     = {682--685},
  publisher = {{INSTICC} - Institute for Systems and Technologies of Information, Control and Communication},
  year      = {2008},
  timestamp = {Mon, 15 Jun 2015 19:00:07 +0200},
  biburl    = {https://dblp.org/rec/conf/visapp/SridharanS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Wellman, Greenwald and Stone, book published by MIT Press, 2007.
@book{DBLP:books/daglib/0018264,
  author    = {Michael P. Wellman and Amy Greenwald and Peter Stone},
  title     = {Autonomous bidding agents - strategies and lessons from the trading agent competition},
  publisher = {{MIT} Press},
  year      = {2007},
  isbn      = {978-0-262-23260-9},
  timestamp = {Thu, 09 Feb 2012 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/books/daglib/0018264.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone, book in the Synthesis Lectures on Artificial Intelligence and Machine Learning series, 2007.
@book{DBLP:series/synthesis/2007Stone,
  author    = {Peter Stone},
  title     = {Intelligent Autonomous Robotics: {A} Robot Soccer Case Study},
  series    = {Synthesis Lectures on Artificial Intelligence and Machine Learning},
  publisher = {Morgan {\&} Claypool Publishers},
  year      = {2007},
  url       = {https://doi.org/10.2200/S00090ED1V01Y200705AIM001},
  doi       = {10.2200/S00090ED1V01Y200705AIM001},
  isbn      = {978-3-031-00416-2},
  timestamp = {Tue, 17 Oct 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/series/synthesis/2007Stone.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Whiteson, Taylor and Stone, Adapt. Behav. 15(1), 2007, pp. 33--50.
@article{DBLP:journals/adb/WhitesonTS07,
  author    = {Shimon Whiteson and Matthew E. Taylor and Peter Stone},
  title     = {Empirical Studies in Action Selection with Reinforcement Learning},
  journal   = {Adapt. Behav.},
  volume    = {15},
  number    = {1},
  pages     = {33--50},
  year      = {2007},
  url       = {https://doi.org/10.1177/1059712306076253},
  doi       = {10.1177/1059712306076253},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/adb/WhitesonTS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone, Artif. Intell. 171(7), 2007, pp. 402--405.
% The title is two sentences; "It" is brace-protected because sentence-casing styles
% only preserve capitals at the start of the title and after a colon, not after a full stop.
@article{DBLP:journals/ai/Stone07,
  author    = {Peter Stone},
  title     = {Multiagent learning is not the answer. {It} is the question},
  journal   = {Artif. Intell.},
  volume    = {171},
  number    = {7},
  pages     = {402--405},
  year      = {2007},
  url       = {https://doi.org/10.1016/j.artint.2006.12.005},
  doi       = {10.1016/J.ARTINT.2006.12.005},
  timestamp = {Sat, 27 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ai/Stone07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Sridharan and Stone, Auton. Robots 23(3), 2007, pp. 161--182.
@article{DBLP:journals/arobots/SridharanS07,
  author    = {Mohan Sridharan and Peter Stone},
  title     = {Structure-based color learning on a mobile robot under changing illumination},
  journal   = {Auton. Robots},
  volume    = {23},
  number    = {3},
  pages     = {161--182},
  year      = {2007},
  url       = {https://doi.org/10.1007/s10514-007-9038-7},
  doi       = {10.1007/S10514-007-9038-7},
  timestamp = {Thu, 18 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/arobots/SridharanS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor, Stone and Liu, J. Mach. Learn. Res. 8, 2007, pp. 2125--2167.
@article{DBLP:journals/jmlr/TaylorSL07,
  author    = {Matthew E. Taylor and Peter Stone and Yaxin Liu},
  title     = {Transfer Learning via Inter-Task Mappings for Temporal Difference Learning},
  journal   = {J. Mach. Learn. Res.},
  volume    = {8},
  pages     = {2125--2167},
  year      = {2007},
  url       = {https://dl.acm.org/doi/10.5555/1314498.1314569},
  doi       = {10.5555/1314498.1314569},
  timestamp = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/TaylorSL07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor, Whiteson and Stone, Twenty-Second AAAI Conference (2007), pp. 1675--1678.
@inproceedings{DBLP:conf/aaai/TaylorWS07,
  author    = {Matthew E. Taylor and Shimon Whiteson and Peter Stone},
  title     = {Temporal Difference and Policy Search Methods for Reinforcement Learning: An Empirical Comparison},
  booktitle = {Proceedings of the Twenty-Second {AAAI} Conference on Artificial Intelligence, July 22-26, 2007, Vancouver, British Columbia, Canada},
  pages     = {1675--1678},
  publisher = {{AAAI} Press},
  year      = {2007},
  url       = {http://www.aaai.org/Library/AAAI/2007/aaai07-271.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/TaylorWS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor and Stone, Twenty-Second AAAI Conference (2007), pp. 1906--1907.
@inproceedings{DBLP:conf/aaai/TaylorS07,
  author    = {Matthew E. Taylor and Peter Stone},
  title     = {Representation Transfer via Elaboration},
  booktitle = {Proceedings of the Twenty-Second {AAAI} Conference on Artificial Intelligence, July 22-26, 2007, Vancouver, British Columbia, Canada},
  pages     = {1906--1907},
  publisher = {{AAAI} Press},
  year      = {2007},
  url       = {http://www.aaai.org/Library/AAAI/2007/aaai07-328.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/TaylorS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor and Stone, 2007 AAAI Fall Symposium (AAAI Technical Report FS-07-03), pp. 78--85.
% "USA" in booktitle is brace-protected, matching the acronym protection used elsewhere in this file.
@inproceedings{DBLP:conf/aaaifs/TaylorS07,
  author    = {Matthew E. Taylor and Peter Stone},
  editor    = {Clayton T. Morrison and Tim Oates},
  title     = {Representation Transfer for Reinforcement Learning},
  booktitle = {Computational Approaches to Representation Change during Learning and Development, Papers from the 2007 {AAAI} Fall Symposium, Arlington, Virginia, {USA}, November 9-11, 2007},
  series    = {{AAAI} Technical Report},
  volume    = {{FS-07-03}},
  pages     = {78--85},
  publisher = {{AAAI} Press},
  year      = {2007},
  url       = {https://www.aaai.org/Library/Symposia/Fall/2007/fs07-03-015.php},
  timestamp = {Sun, 16 Oct 2022 14:19:55 +0200},
  biburl    = {https://dblp.org/rec/conf/aaaifs/TaylorS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Pardoe and Stone, AMEC/TADA 2007 selected and revised papers (Lecture Notes in Business Information Processing 13), pp. 30--45.
@inproceedings{DBLP:conf/atal/PardoeS07a,
  author    = {David Pardoe and Peter Stone},
  editor    = {John Collins and Peyman Faratin and Simon Parsons and Juan A. Rodr{\'{\i}}guez{-}Aguilar and Norman M. Sadeh and Onn Shehory and Elizabeth Sklar},
  title     = {Adapting Price Predictions in {TAC} {SCM}},
  booktitle = {Agent-Mediated Electronic Commerce and Trading Agent Design and Analysis, {AAMAS} 2007 Workshop, {AMEC} 2007, Honolulu, Hawaii, May 14, 2007, and {AAAI} 2007 Workshop, {TADA} 2007, Vancouver, Canada, July 23, 2007, Selected and Revised Papers},
  series    = {Lecture Notes in Business Information Processing},
  volume    = {13},
  pages     = {30--45},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-88713-3\_3},
  doi       = {10.1007/978-3-540-88713-3\_3},
  timestamp = {Tue, 23 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/PardoeS07a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor, Whiteson and Stone, AAMAS 2007; the pages field holds the single number 37.
% "USA" in booktitle is brace-protected, matching the acronym protection used elsewhere in this file.
@inproceedings{DBLP:conf/atal/TaylorWS07,
  author    = {Matthew E. Taylor and Shimon Whiteson and Peter Stone},
  editor    = {Edmund H. Durfee and Makoto Yokoo and Michael N. Huhns and Onn Shehory},
  title     = {Transfer via inter-task mappings in policy search reinforcement learning},
  booktitle = {6th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2007), Honolulu, Hawaii, {USA}, May 14-18, 2007},
  pages     = {37},
  publisher = {{IFAAMAS}},
  year      = {2007},
  url       = {https://doi.org/10.1145/1329125.1329170},
  doi       = {10.1145/1329125.1329170},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/TaylorWS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Kalyanakrishnan and Stone, AAMAS 2007; the pages field holds the single number 94.
% "USA" in booktitle is brace-protected, matching the acronym protection used elsewhere in this file.
@inproceedings{DBLP:conf/atal/KalyanakrishnanS07,
  author    = {Shivaram Kalyanakrishnan and Peter Stone},
  editor    = {Edmund H. Durfee and Makoto Yokoo and Michael N. Huhns and Onn Shehory},
  title     = {Batch reinforcement learning in a complex domain},
  booktitle = {6th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2007), Honolulu, Hawaii, {USA}, May 14-18, 2007},
  pages     = {94},
  publisher = {{IFAAMAS}},
  year      = {2007},
  url       = {https://doi.org/10.1145/1329125.1329241},
  doi       = {10.1145/1329125.1329241},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/KalyanakrishnanS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Jong and Stone, AAMAS 2007; the pages field holds the single number 95.
% "USA" in booktitle is brace-protected, matching the acronym protection used elsewhere in this file.
@inproceedings{DBLP:conf/atal/JongS07,
  author    = {Nicholas K. Jong and Peter Stone},
  editor    = {Edmund H. Durfee and Makoto Yokoo and Michael N. Huhns and Onn Shehory},
  title     = {Model-based function approximation in reinforcement learning},
  booktitle = {6th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2007), Honolulu, Hawaii, {USA}, May 14-18, 2007},
  pages     = {95},
  publisher = {{IFAAMAS}},
  year      = {2007},
  url       = {https://doi.org/10.1145/1329125.1329242},
  doi       = {10.1145/1329125.1329242},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/JongS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Pardoe and Stone, AAMAS 2007; the pages field holds the single number 98.
% "USA" in booktitle is brace-protected, matching the acronym protection used elsewhere in this file.
@inproceedings{DBLP:conf/atal/PardoeS07,
  author    = {David Pardoe and Peter Stone},
  editor    = {Edmund H. Durfee and Makoto Yokoo and Michael N. Huhns and Onn Shehory},
  title     = {Adapting in agent-based markets: a study from {TAC} {SCM}},
  booktitle = {6th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2007), Honolulu, Hawaii, {USA}, May 14-18, 2007},
  pages     = {98},
  publisher = {{IFAAMAS}},
  year      = {2007},
  url       = {https://doi.org/10.1145/1329125.1329246},
  doi       = {10.1145/1329125.1329246},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/PardoeS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor and Stone, AAMAS 2007; the pages field holds the single number 100.
% "USA" in booktitle is brace-protected, matching the acronym protection used elsewhere in this file.
@inproceedings{DBLP:conf/atal/TaylorS07,
  author    = {Matthew E. Taylor and Peter Stone},
  editor    = {Edmund H. Durfee and Makoto Yokoo and Michael N. Huhns and Onn Shehory},
  title     = {Towards reinforcement learning representation transfer},
  booktitle = {6th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2007), Honolulu, Hawaii, {USA}, May 14-18, 2007},
  pages     = {100},
  publisher = {{IFAAMAS}},
  year      = {2007},
  url       = {https://doi.org/10.1145/1329125.1329248},
  doi       = {10.1145/1329125.1329248},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/TaylorS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Ahmadi, Taylor and Stone, AAMAS 2007; the pages field holds the single number 186.
% "USA" in booktitle is brace-protected, matching the acronym protection used elsewhere in this file.
@inproceedings{DBLP:conf/atal/AhmadiTS07,
  author    = {Mazda Ahmadi and Matthew E. Taylor and Peter Stone},
  editor    = {Edmund H. Durfee and Makoto Yokoo and Michael N. Huhns and Onn Shehory},
  title     = {{IFSA:} incremental feature-set augmentation for reinforcement learning tasks},
  booktitle = {6th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2007), Honolulu, Hawaii, {USA}, May 14-18, 2007},
  pages     = {186},
  publisher = {{IFAAMAS}},
  year      = {2007},
  url       = {https://doi.org/10.1145/1329125.1329351},
  doi       = {10.1145/1329125.1329351},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/AhmadiTS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Kuhlmann and Stone, ECML 2007 (Lecture Notes in Computer Science 4701), pp. 188--200.
@inproceedings{DBLP:conf/ecml/KuhlmannS07,
  author    = {Gregory Kuhlmann and Peter Stone},
  editor    = {Joost N. Kok and Jacek Koronacki and Ram{\'{o}}n L{\'{o}}pez de M{\'{a}}ntaras and Stan Matwin and Dunja Mladenic and Andrzej Skowron},
  title     = {Graph-Based Domain Mapping for Transfer Learning in General Games},
  booktitle = {Machine Learning: {ECML} 2007, 18th European Conference on Machine Learning, Warsaw, Poland, September 17-21, 2007, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4701},
  pages     = {188--200},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-74958-5\_20},
  doi       = {10.1007/978-3-540-74958-5\_20},
  timestamp = {Tue, 14 May 2019 10:00:54 +0200},
  biburl    = {https://dblp.org/rec/conf/ecml/KuhlmannS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Wildstrom, Stone and Witchel, ICAC 2007; the pages field holds the single number 15.
% "ICAC" and "USA" in booktitle are brace-protected, matching the ICAC 2008 entry of this file.
@inproceedings{DBLP:conf/icac/WildstromSW07,
  author    = {Jonathan Wildstrom and Peter Stone and Emmett Witchel},
  title     = {Autonomous Return on Investment Analysis of Additional Processing Resources},
  booktitle = {Fourth International Conference on Autonomic Computing ({ICAC}'07), Jacksonville, Florida, {USA}, June 11-15, 2007},
  pages     = {15},
  publisher = {{IEEE} Computer Society},
  year      = {2007},
  url       = {https://doi.org/10.1109/ICAC.2007.11},
  doi       = {10.1109/ICAC.2007.11},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icac/WildstromSW07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Taylor and Stone, ICML 2007 (ACM International Conference Proceeding Series 227), pp. 879--886.
% "USA" in booktitle is brace-protected, matching the acronym protection used elsewhere in this file.
@inproceedings{DBLP:conf/icml/TaylorS07,
  author    = {Matthew E. Taylor and Peter Stone},
  editor    = {Zoubin Ghahramani},
  title     = {Cross-domain transfer for reinforcement learning},
  booktitle = {Machine Learning, Proceedings of the Twenty-Fourth International Conference {(ICML} 2007), Corvallis, Oregon, {USA}, June 20-24, 2007},
  series    = {{ACM} International Conference Proceeding Series},
  volume    = {227},
  pages     = {879--886},
  publisher = {{ACM}},
  year      = {2007},
  url       = {https://doi.org/10.1145/1273496.1273607},
  doi       = {10.1145/1273496.1273607},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/TaylorS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stronger and Stone, ICRA 2007, pp. 3915--3920.
@inproceedings{DBLP:conf/icra/StrongerS07,
  author    = {Daniel Stronger and Peter Stone},
  title     = {A Comparison of Two Approaches for Vision and Self-Localization on a Mobile Robot},
  booktitle = {2007 {IEEE} International Conference on Robotics and Automation, {ICRA} 2007, 10-14 April 2007, Roma, Italy},
  pages     = {3915--3920},
  publisher = {{IEEE}},
  year      = {2007},
  url       = {https://doi.org/10.1109/ROBOT.2007.364079},
  doi       = {10.1109/ROBOT.2007.364079},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/StrongerS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone, IJCAI 2007, pp. 12--30.
% The record has no publisher or doi field.
@inproceedings{DBLP:conf/ijcai/Stone07,
  author    = {Peter Stone},
  editor    = {Manuela M. Veloso},
  title     = {Learning and Multiagent Reasoning for Autonomous Agents},
  booktitle = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages     = {12--30},
  year      = {2007},
  url       = {http://ijcai.org/Proceedings/07/Papers/002.pdf},
  timestamp = {Tue, 20 Aug 2019 16:17:11 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/Stone07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Banerjee and Stone, IJCAI 2007, pp. 672--677.
% The record has no publisher or doi field.
@inproceedings{DBLP:conf/ijcai/BanerjeeS07,
  author    = {Bikramjit Banerjee and Peter Stone},
  editor    = {Manuela M. Veloso},
  title     = {General Game Learning Using Knowledge Transfer},
  booktitle = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages     = {672--677},
  year      = {2007},
  url       = {http://ijcai.org/Proceedings/07/Papers/107.pdf},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/BanerjeeS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Wildstrom, Stone, Witchel and Dahlin, IJCAI 2007, pp. 1113--1118.
% The record has no publisher or doi field.
@inproceedings{DBLP:conf/ijcai/WildstromSWD07,
  author    = {Jonathan Wildstrom and Peter Stone and Emmett Witchel and Michael Dahlin},
  editor    = {Manuela M. Veloso},
  title     = {Machine Learning for On-Line Hardware Reconfiguration},
  booktitle = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages     = {1113--1118},
  year      = {2007},
  url       = {http://ijcai.org/Proceedings/07/Papers/180.pdf},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/WildstromSWD07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Dresner and Stone, IJCAI 2007, pp. 1263--1268.
% The record has no publisher or doi field.
@inproceedings{DBLP:conf/ijcai/DresnerS07,
  author    = {Kurt M. Dresner and Peter Stone},
  editor    = {Manuela M. Veloso},
  title     = {Sharing the Road: Autonomous Vehicles Meet Human Drivers},
  booktitle = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages     = {1263--1268},
  year      = {2007},
  url       = {http://ijcai.org/Proceedings/07/Papers/204.pdf},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/DresnerS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Sridharan and Stone, IJCAI 2007, pp. 2212--2217.
% The record has no publisher or doi field.
@inproceedings{DBLP:conf/ijcai/SridharanS07,
  author    = {Mohan Sridharan and Peter Stone},
  editor    = {Manuela M. Veloso},
  title     = {Color Learning on a Mobile Robot: Towards Full Autonomy under Changing Illumination},
  booktitle = {{IJCAI} 2007, Proceedings of the 20th International Joint Conference on Artificial Intelligence, Hyderabad, India, January 6-12, 2007},
  pages     = {2212--2217},
  year      = {2007},
  url       = {http://ijcai.org/Proceedings/07/Papers/356.pdf},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/SridharanS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Sridharan and Stone, 2007 IEEE/RSJ International Conference on Intelligent Robots and Systems, pp. 1671--1676.
@inproceedings{DBLP:conf/iros/SridharanS07,
  author    = {Mohan Sridharan and Peter Stone},
  title     = {Global action selection for illumination invariant color modeling},
  booktitle = {2007 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 29 - November 2, 2007, Sheraton Hotel and Marina, San Diego, California, {USA}},
  pages     = {1671--1676},
  publisher = {{IEEE}},
  year      = {2007},
  url       = {https://doi.org/10.1109/IROS.2007.4399203},
  doi       = {10.1109/IROS.2007.4399203},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/iros/SridharanS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/AhmadiS07,
  author    = {Mazda Ahmadi and Peter Stone},
  editor    = {Ubbo Visser and Fernando Ribeiro and Takeshi Ohashi and Frank Dellaert},
  title     = {Instance-Based Action Models for Fast Action Planning},
  booktitle = {RoboCup 2007: Robot Soccer World Cup XI, July 9-10, 2007, Atlanta, GA, {USA}},
  series    = {Lecture Notes in Computer Science},
  volume    = {5001},
  pages     = {1--16},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-68847-1\_1},
  doi       = {10.1007/978-3-540-68847-1\_1},
  timestamp = {Sat, 30 Sep 2023 09:55:24 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/AhmadiS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/KalyanakrishnanSL07,
  author    = {Shivaram Kalyanakrishnan and Peter Stone and Yaxin Liu},
  editor    = {Ubbo Visser and Fernando Ribeiro and Takeshi Ohashi and Frank Dellaert},
  title     = {Model-Based Reinforcement Learning in a Complex Domain},
  booktitle = {RoboCup 2007: Robot Soccer World Cup XI, July 9-10, 2007, Atlanta, GA, {USA}},
  series    = {Lecture Notes in Computer Science},
  volume    = {5001},
  pages     = {171--183},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-68847-1\_15},
  doi       = {10.1007/978-3-540-68847-1\_15},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/KalyanakrishnanSL07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/GrasemannSS07,
  author    = {Uli Grasemann and Daniel Stronger and Peter Stone},
  editor    = {Ubbo Visser and Fernando Ribeiro and Takeshi Ohashi and Frank Dellaert},
  title     = {A Neural Network-Based Approach to Robot Motion Control},
  booktitle = {RoboCup 2007: Robot Soccer World Cup XI, July 9-10, 2007, Atlanta, GA, {USA}},
  series    = {Lecture Notes in Computer Science},
  volume    = {5001},
  pages     = {480--487},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-68847-1\_51},
  doi       = {10.1007/978-3-540-68847-1\_51},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/GrasemannSS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sara/JongS07,
  author    = {Nicholas K. Jong and Peter Stone},
  editor    = {Ian Miguel and Wheeler Ruml},
  title     = {Model-Based Exploration in Continuous State Spaces},
  booktitle = {Abstraction, Reformulation, and Approximation, 7th International Symposium, {SARA} 2007, Whistler, Canada, July 18-21, 2007, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {4612},
  pages     = {258--272},
  publisher = {Springer},
  year      = {2007},
  url       = {https://doi.org/10.1007/978-3-540-73580-9\_21},
  doi       = {10.1007/978-3-540-73580-9\_21},
  timestamp = {Tue, 14 May 2019 10:00:38 +0200},
  biburl    = {https://dblp.org/rec/conf/sara/JongS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/aamas/IsbellKSSSK06,
  author    = {Isbell, Jr., Charles Lee and Michael J. Kearns and Satinder Singh and Christian R. Shelton and Peter Stone and David P. Kormann},
  title     = {Cobot in {LambdaMOO}: An Adaptive Social Statistics Agent},
  journal   = {Auton. Agents Multi Agent Syst.},
  volume    = {13},
  number    = {3},
  pages     = {327--354},
  year      = {2006},
  url       = {https://doi.org/10.1007/s10458-006-0005-z},
  doi       = {10.1007/S10458-006-0005-Z},
  timestamp = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aamas/IsbellKSSSK06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/connection/StrongerS06,
  author    = {Daniel Stronger and Peter Stone},
  title     = {Towards autonomous sensor and actuator model induction on a mobile robot},
  journal   = {Connect. Sci.},
  volume    = {18},
  number    = {2},
  pages     = {97--119},
  year      = {2006},
  url       = {https://doi.org/10.1080/09540090600768690},
  doi       = {10.1080/09540090600768690},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/connection/StrongerS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/WhitesonS06,
  author    = {Shimon Whiteson and Peter Stone},
  title     = {Evolutionary Function Approximation for Reinforcement Learning},
  journal   = {J. Mach. Learn. Res.},
  volume    = {7},
  pages     = {877--917},
  year      = {2006},
  url       = {http://jmlr.org/papers/v7/whiteson06a.html},
  timestamp = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/WhitesonS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ras/StoneSSKKFJ06,
  author    = {Peter Stone and Mohan Sridharan and Daniel Stronger and Gregory Kuhlmann and Nate Kohl and Peggy Fidelman and Nicholas K. Jong},
  title     = {From pixels to multi-robot decision-making: {A} study in uncertainty},
  journal   = {Robotics Auton. Syst.},
  volume    = {54},
  number    = {11},
  pages     = {933--943},
  year      = {2006},
  url       = {https://doi.org/10.1016/j.robot.2006.05.010},
  doi       = {10.1016/J.ROBOT.2006.05.010},
  timestamp = {Mon, 24 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ras/StoneSSKKFJ06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ACMicec/PardoeSST06,
  author    = {David Pardoe and Peter Stone and Maytal Saar{-}Tsechansky and Kerem Tomak},
  editor    = {Mark S. Fox and Bruce Spencer},
  title     = {Adaptive mechanism design: a metalearning approach},
  booktitle = {Proceedings of the 8th International Conference on Electronic Commerce: The new e-commerce - Innovations for Conquering Current Barriers, Obstacles and Limitations to Conducting Successful Business on the Internet, 2006, Fredericton, New Brunswick, Canada, August 13-16, 2006},
  series    = {{ACM} International Conference Proceeding Series},
  volume    = {156},
  pages     = {92--102},
  publisher = {{ACM}},
  year      = {2006},
  url       = {https://doi.org/10.1145/1151454.1151480},
  doi       = {10.1145/1151454.1151480},
  timestamp = {Tue, 06 Apr 2021 12:12:56 +0200},
  biburl    = {https://dblp.org/rec/conf/ACMicec/PardoeSST06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/LiuS06,
  author    = {Yaxin Liu and Peter Stone},
  title     = {Value-Function-Based Transfer for Reinforcement Learning Using Structure Mapping},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {415--420},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-066.php},
  timestamp = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/LiuS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/WhitesonS06,
  author    = {Shimon Whiteson and Peter Stone},
  title     = {Sample-Efficient Evolutionary Function Approximation for Reinforcement Learning},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {518--523},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-083.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/WhitesonS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/AhmadiS06,
  author    = {Mazda Ahmadi and Peter Stone},
  title     = {Keeping in Touch: Maintaining Biconnected Structure by Homogeneous Robots},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {580--585},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-093.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/AhmadiS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/KuhlmannS06,
  author    = {Gregory Kuhlmann and Peter Stone},
  title     = {Automatic Heuristic Construction in a Complete General Game Player},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {1457--1462},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-229.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/KuhlmannS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/KuhlmannKS06,
  author    = {Gregory Kuhlmann and William B. Knox and Peter Stone},
  title     = {Know Thine Enemy: {A} Champion {RoboCup} Coach Agent},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {1463--1468},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-230.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/KuhlmannKS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/PardoeS06,
  author    = {David Pardoe and Peter Stone},
  title     = {{TacTex-05}: {A} Champion Supply Chain Management Agent},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {1489--1494},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-234.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/PardoeS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/DresnerS06,
  author    = {Kurt M. Dresner and Peter Stone},
  title     = {Traffic Intersections of the Future},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {1593--1596},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-258.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/DresnerS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/AhmadiS06a,
  author    = {Mazda Ahmadi and Peter Stone},
  title     = {Biconnected Structure for Multi-Robot Systems},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {1853},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-305.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/AhmadiS06a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/DresnerS06a,
  author    = {Kurt M. Dresner and Peter Stone},
  title     = {Making Autonomous Intersection Management Backwards-Compatible},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {1865--1866},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-311.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/DresnerS06a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/KuhlmannS06a,
  author    = {Gregory Kuhlmann and Peter Stone},
  title     = {Automatic Heuristic Construction for General Game Playing},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {1883--1884},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-320.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/KuhlmannS06a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/StrongerS06,
  author    = {Daniel Stronger and Peter Stone},
  title     = {Expectation-Based Vision for Self-Localization on a Legged Robot},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {1899--1900},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-328.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/StrongerS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/TaylorS06,
  author    = {Matthew E. Taylor and Peter Stone},
  title     = {Inter-Task Action Correlation for Reinforcement Learning Tasks},
  booktitle = {Proceedings, The Twenty-First National Conference on Artificial Intelligence and the Eighteenth Innovative Applications of Artificial Intelligence Conference, July 16-20, 2006, Boston, Massachusetts, {USA}},
  pages     = {1901--1903},
  publisher = {{AAAI} Press},
  year      = {2006},
  url       = {http://www.aaai.org/Library/AAAI/2006/aaai06-329.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/TaylorS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aips/PardoeS06,
  author    = {David Pardoe and Peter Stone},
  editor    = {Derek Long and Stephen F. Smith and Daniel Borrajo and Lee McCluskey},
  title     = {Predictive Planning for Supply Chain Management},
  booktitle = {Proceedings of the Sixteenth International Conference on Automated Planning and Scheduling, {ICAPS} 2006, Cumbria, UK, June 6-10, 2006},
  pages     = {21--30},
  publisher = {{AAAI}},
  year      = {2006},
  url       = {http://www.aaai.org/Library/ICAPS/2006/icaps06-003.php},
  timestamp = {Fri, 05 Feb 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aips/PardoeS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/PardoeSM06,
  author    = {David Pardoe and Peter Stone and Van Middlesworth, Mark},
  editor    = {Maria Fasli and Onn Shehory},
  title     = {{TacTex-05}: An Adaptive Agent for {TAC} {SCM}},
  booktitle = {Agent-Mediated Electronic Commerce. Automated Negotiation and Strategy Design for Electronic Markets, {AAMAS} 2006 Workshop, {TADA/AMEC} 2006, Hakodate, Japan, May 9, 2006, Selected and Revised Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {4452},
  pages     = {46--61},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/978-3-540-72502-2\_4},
  doi       = {10.1007/978-3-540-72502-2\_4},
  timestamp = {Tue, 14 May 2019 10:00:54 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/PardoeSM06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dars/AhmadiS06,
  author    = {Mazda Ahmadi and Peter Stone},
  editor    = {Maria L. Gini and Richard M. Voyles},
  title     = {A Distributed Biconnectivity Check},
  booktitle = {Distributed Autonomous Robotic Systems 7, Proceedings of the 8th International Symposium on Distributed Autonomous Robotic Systems, {DARS} 2006, Minneapolis, Minnesota, USA, 2006},
  pages     = {1--10},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/4-431-35881-1\_1},
  doi       = {10.1007/4-431-35881-1\_1},
  timestamp = {Fri, 26 Jul 2019 10:09:14 +0200},
  biburl    = {https://dblp.org/rec/conf/dars/AhmadiS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/TaylorWS06,
  author    = {Matthew E. Taylor and Shimon Whiteson and Peter Stone},
  editor    = {Mike Cattolico},
  title     = {Comparing evolutionary and temporal difference methods in a reinforcement learning domain},
  booktitle = {Genetic and Evolutionary Computation Conference, {GECCO} 2006, Proceedings, Seattle, Washington, USA, July 8-12, 2006},
  pages     = {1321--1328},
  publisher = {{ACM}},
  year      = {2006},
  url       = {https://doi.org/10.1145/1143997.1144202},
  doi       = {10.1145/1143997.1144202},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/gecco/TaylorWS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/WhitesonS06,
  author    = {Shimon Whiteson and Peter Stone},
  editor    = {Mike Cattolico},
  title     = {On-line evolutionary computation for reinforcement learning in stochastic domains},
  booktitle = {Genetic and Evolutionary Computation Conference, {GECCO} 2006, Proceedings, Seattle, Washington, USA, July 8-12, 2006},
  pages     = {1577--1584},
  publisher = {{ACM}},
  year      = {2006},
  url       = {https://doi.org/10.1145/1143997.1144252},
  doi       = {10.1145/1143997.1144252},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/gecco/WhitesonS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/SubramanianRSK06,
  author    = {Harish Subramanian and Subramanian Ramamoorthy and Peter Stone and Benjamin Kuipers},
  editor    = {Mike Cattolico},
  title     = {Designing safe, profitable automated stock trading agents using evolutionary algorithms},
  booktitle = {Genetic and Evolutionary Computation Conference, {GECCO} 2006, Proceedings, Seattle, Washington, USA, July 8-12, 2006},
  pages     = {1777--1784},
  publisher = {{ACM}},
  year      = {2006},
  url       = {https://doi.org/10.1145/1143997.1144285},
  doi       = {10.1145/1143997.1144285},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/gecco/SubramanianRSK06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icarcv/SridharanS06,
  author    = {Mohan Sridharan and Peter Stone},
  title     = {Autonomous Planned Color Learning on a Mobile Robot Without Labeled Data},
  booktitle = {Ninth International Conference on Control, Automation, Robotics and Vision, {ICARCV} 2006, Singapore, 5-8 December 2006, Proceedings},
  pages     = {1--6},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/ICARCV.2006.345403},
  doi       = {10.1109/ICARCV.2006.345403},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icarcv/SridharanS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/AhmadiS06,
  author    = {Mazda Ahmadi and Peter Stone},
  title     = {A Multi-robot System for Continuous Area Sweeping Tasks},
  booktitle = {Proceedings of the 2006 {IEEE} International Conference on Robotics and Automation, {ICRA} 2006, May 15-19, 2006, Orlando, Florida, {USA}},
  pages     = {1724--1729},
  publisher = {{IEEE}},
  year      = {2006},
  url       = {https://doi.org/10.1109/ROBOT.2006.1641955},
  doi       = {10.1109/ROBOT.2006.1641955},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/AhmadiS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ictai/StrongerS06,
  author    = {Daniel Stronger and Peter Stone},
  title     = {Polynomial Regression with Automated Degree: {A} Function Approximator for Autonomous Agents},
  booktitle = {18th {IEEE} International Conference on Tools with Artificial Intelligence {(ICTAI} 2006), 13-15 November 2006, Arlington, VA, {USA}},
  pages     = {474--480},
  publisher = {{IEEE} Computer Society},
  year      = {2006},
  url       = {https://doi.org/10.1109/ICTAI.2006.96},
  doi       = {10.1109/ICTAI.2006.96},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/ictai/StrongerS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/FidelmanS06,
  author    = {Peggy Fidelman and Peter Stone},
  editor    = {Gerhard Lakemeyer and Elizabeth Sklar and Domenico G. Sorrenti and Tomoichi Takahashi},
  title     = {The Chin Pinch: {A} Case Study in Skill Learning on a Legged Robot},
  booktitle = {RoboCup 2006: Robot Soccer World Cup {X}},
  series    = {Lecture Notes in Computer Science},
  volume    = {4434},
  pages     = {59--71},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/978-3-540-74024-7\_6},
  doi       = {10.1007/978-3-540-74024-7\_6},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/FidelmanS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/KalyanakrishnanLS06,
  author    = {Shivaram Kalyanakrishnan and Yaxin Liu and Peter Stone},
  editor    = {Gerhard Lakemeyer and Elizabeth Sklar and Domenico G. Sorrenti and Tomoichi Takahashi},
  title     = {Half Field Offense in {RoboCup} Soccer: {A} Multiagent Reinforcement Learning Case Study},
  booktitle = {RoboCup 2006: Robot Soccer World Cup {X}},
  series    = {Lecture Notes in Computer Science},
  volume    = {4434},
  pages     = {72--85},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/978-3-540-74024-7\_7},
  doi       = {10.1007/978-3-540-74024-7\_7},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/KalyanakrishnanLS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/SaggarDKS06,
  author    = {Manish Saggar and Thomas D'Silva and Nate Kohl and Peter Stone},
  editor    = {Gerhard Lakemeyer and Elizabeth Sklar and Domenico G. Sorrenti and Tomoichi Takahashi},
  title     = {Autonomous Learning of Stable Quadruped Locomotion},
  booktitle = {RoboCup 2006: Robot Soccer World Cup {X}},
  series    = {Lecture Notes in Computer Science},
  volume    = {4434},
  pages     = {98--109},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/978-3-540-74024-7\_9},
  doi       = {10.1007/978-3-540-74024-7\_9},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/SaggarDKS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/StrongerS06,
  author    = {Daniel Stronger and Peter Stone},
  editor    = {Gerhard Lakemeyer and Elizabeth Sklar and Domenico G. Sorrenti and Tomoichi Takahashi},
  title     = {Selective Visual Attention for Object Detection on a Legged Robot},
  booktitle = {RoboCup 2006: Robot Soccer World Cup {X}},
  series    = {Lecture Notes in Computer Science},
  volume    = {4434},
  pages     = {158--170},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/978-3-540-74024-7\_14},
  doi       = {10.1007/978-3-540-74024-7\_14},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StrongerS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/robocup/SridharanS06,
  author    = {Mohan Sridharan and Peter Stone},
  editor    = {Gerhard Lakemeyer and Elizabeth Sklar and Domenico G. Sorrenti and Tomoichi Takahashi},
  title     = {Autonomous Planned Color Learning on a Legged Robot},
  booktitle = {RoboCup 2006: Robot Soccer World Cup {X}},
  series    = {Lecture Notes in Computer Science},
  volume    = {4434},
  pages     = {270--278},
  publisher = {Springer},
  year      = {2006},
  url       = {https://doi.org/10.1007/978-3-540-74024-7\_23},
  doi       = {10.1007/978-3-540-74024-7\_23},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/SridharanS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/atal/2006,
  editor    = {Hideyuki Nakashima and Michael P. Wellman and Gerhard Weiss and Peter Stone},
  title     = {5th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2006), Hakodate, Japan, May 8-12, 2006},
  publisher = {{ACM}},
  year      = {2006},
  isbn      = {1-59593-303-4},
  timestamp = {Tue, 08 Mar 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/2006.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/adb/StoneSK05,
  author    = {Peter Stone and Richard S. Sutton and Gregory Kuhlmann},
  title     = {Reinforcement Learning for {RoboCup} Soccer Keepaway},
  journal   = {Adapt. Behav.},
  volume    = {13},
  number    = {3},
  pages     = {165--188},
  year      = {2005},
  url       = {https://doi.org/10.1177/105971230501300301},
  doi       = {10.1177/105971230501300301},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/adb/StoneSK05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/dss/LittmanS05,
  author    = {Michael L. Littman and Peter Stone},
  title     = {A polynomial-time {Nash} equilibrium algorithm for repeated games},
  journal   = {Decis. Support Syst.},
  volume    = {39},
  number    = {1},
  pages     = {55--66},
  year      = {2005},
  url       = {https://doi.org/10.1016/j.dss.2004.08.007},
  doi       = {10.1016/J.DSS.2004.08.007},
  timestamp = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/dss/LittmanS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ecr/StoneG05,
  author    = {Peter Stone and Amy Greenwald},
  title     = {The First International Trading Agent Competition: Autonomous Bidding Agents},
  journal   = {Electron. Commer. Res.},
  volume    = {5},
  number    = {2},
  pages     = {229--265},
  year      = {2005},
  url       = {https://doi.org/10.1007/s10660-005-6158-z},
  doi       = {10.1007/S10660-005-6158-Z},
  timestamp = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ecr/StoneG05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/WhitesonKMS05,
  author    = {Shimon Whiteson and Nate Kohl and Risto Miikkulainen and Peter Stone},
  title     = {Evolving Soccer Keepaway Players Through Task Decomposition},
  journal   = {Mach. Learn.},
  volume    = {59},
  number    = {1-2},
  pages     = {5--30},
  year      = {2005},
  url       = {https://doi.org/10.1007/s10994-005-0460-9},
  doi       = {10.1007/S10994-005-0460-9},
  timestamp = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ml/WhitesonKMS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigecom/PardoeS05,
  author    = {David Pardoe and Peter Stone},
  title     = {Developing adaptive auction mechanisms},
  journal   = {SIGecom Exch.},
  volume    = {5},
  number    = {3},
  pages     = {1--10},
  year      = {2005},
  url       = {https://doi.org/10.1145/1120680.1120682},
  doi       = {10.1145/1120680.1120682},
  timestamp = {Thu, 04 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/sigecom/PardoeS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/TaylorSL05,
  author    = {Matthew E. Taylor and Peter Stone and Yaxin Liu},
  editor    = {Manuela M. Veloso and Subbarao Kambhampati},
  title     = {Value Functions for {RL}-Based Behavior Transfer: {A} Comparative Study},
  booktitle = {Proceedings, The Twentieth National Conference on Artificial Intelligence and the Seventeenth Innovative Applications of Artificial Intelligence Conference, July 9-13, 2005, Pittsburgh, Pennsylvania, {USA}},
  pages     = {880--885},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2005},
  url       = {http://www.aaai.org/Library/AAAI/2005/aaai05-139.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/TaylorSL05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SherstovS05,
  author    = {Alexander A. Sherstov and Peter Stone},
  editor    = {Manuela M. Veloso and Subbarao Kambhampati},
  title     = {Improving Action Selection in {MDP}'s via Knowledge Transfer},
  booktitle = {Proceedings, The Twentieth National Conference on Artificial Intelligence and the Seventeenth Innovative Applications of Artificial Intelligence Conference, July 9-13, 2005, Pittsburgh, Pennsylvania, {USA}},
  pages     = {1024--1029},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2005},
  url       = {http://www.aaai.org/Library/AAAI/2005/aaai05-162.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/SherstovS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SridharanS05,
  author    = {Mohan Sridharan and Peter Stone},
  editor    = {Manuela M. Veloso and Subbarao Kambhampati},
  title     = {Autonomous Color Learning on a Mobile Robot},
  booktitle = {Proceedings, The Twentieth National Conference on Artificial Intelligence and the Seventeenth Innovative Applications of Artificial Intelligence Conference, July 9-13, 2005, Pittsburgh, Pennsylvania, {USA}},
  pages     = {1318--1323},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2005},
  url       = {http://www.aaai.org/Library/AAAI/2005/aaai05-209.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/SridharanS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/TaylorS05,
  author    = {Matthew E. Taylor and Peter Stone},
  editor    = {Frank Dignum and Virginia Dignum and Sven Koenig and Sarit Kraus and Munindar P. Singh and Michael J. Wooldridge},
  title     = {Behavior transfer for value-function-based reinforcement learning},
  booktitle = {4th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2005), July 25-29, 2005, Utrecht, The Netherlands},
  pages     = {53--59},
  publisher = {{ACM}},
  year      = {2005},
  url       = {https://doi.org/10.1145/1082473.1082482},
  doi       = {10.1145/1082473.1082482},
  timestamp = {Fri, 26 Apr 2019 14:26:42 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/TaylorS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/atal/DresnerS05,
  author    = {Kurt M. Dresner and Peter Stone},
  editor    = {Frank Dignum and Virginia Dignum and Sven Koenig and Sarit Kraus and Munindar P. Singh and Michael J. Wooldridge},
  title     = {Multiagent traffic management: an improved intersection control mechanism},
  booktitle = {4th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2005), July 25-29, 2005, Utrecht, The Netherlands},
  pages     = {471--477},
  publisher = {{ACM}},
  year      = {2005},
  url       = {https://doi.org/10.1145/1082473.1082545},
  doi       = {10.1145/1082473.1082545},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/DresnerS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/gecco/WhitesonSSMK05,
  author    = {Shimon Whiteson and Peter Stone and Kenneth O. Stanley and Risto Miikkulainen and Nate Kohl},
  editor    = {Hans{-}Georg Beyer and Una{-}May O'Reilly},
  title     = {Automatic feature selection in neuroevolution},
  booktitle = {Genetic and Evolutionary Computation Conference, {GECCO} 2005, Proceedings, Washington DC, USA, June 25-29, 2005},
  pages     = {1225--1232},
  publisher = {{ACM}},
  year      = {2005},
  url       = {https://doi.org/10.1145/1068009.1068210},
  doi       = {10.1145/1068009.1068210},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/gecco/WhitesonSSMK05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icac/WildstromSWMD05,
  author    = {Jonathan Wildstrom and Peter Stone and Emmett Witchel and Raymond J. Mooney and Michael Dahlin},
  title     = {Towards Self-Configuring Hardware for Distributed Computer Systems},
  booktitle = {Second International Conference on Autonomic Computing {(ICAC} 2005), 13-16 June 2005, Seattle, WA, {USA}},
  pages     = {241--249},
  publisher = {{IEEE} Computer Society},
  year      = {2005},
  url       = {https://doi.org/10.1109/ICAC.2005.63},
  doi       = {10.1109/ICAC.2005.63},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icac/WildstromSWMD05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "Monte Carlo" is braced in the title so that sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/icra/SridharanKS05,
  author    = {Mohan Sridharan and
               Gregory Kuhlmann and
               Peter Stone},
  title     = {Practical Vision-Based {Monte Carlo} Localization on a Legged Robot},
  booktitle = {Proceedings of the 2005 {IEEE} International Conference on Robotics
               and Automation, {ICRA} 2005, April 18-22, 2005, Barcelona, Spain},
  pages     = {3366--3371},
  publisher = {{IEEE}},
  year      = {2005},
  url       = {https://doi.org/10.1109/ROBOT.2005.1570630},
  doi       = {10.1109/ROBOT.2005.1570630},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/SridharanKS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/StrongerS05,
  author    = {Daniel Stronger and
               Peter Stone},
  title     = {Simultaneous Calibration of Action and Sensor Models on a Mobile Robot},
  booktitle = {Proceedings of the 2005 {IEEE} International Conference on Robotics
               and Automation, {ICRA} 2005, April 18-22, 2005, Barcelona, Spain},
  pages     = {4563--4568},
  publisher = {{IEEE}},
  year      = {2005},
  url       = {https://doi.org/10.1109/ROBOT.2005.1570823},
  doi       = {10.1109/ROBOT.2005.1570823},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/StrongerS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ijcai/JongS05,
  author    = {Nicholas K. Jong and
               Peter Stone},
  editor    = {Leslie Pack Kaelbling and
               Alessandro Saffiotti},
  title     = {State Abstraction Discovery from Irrelevant State Variables},
  booktitle = {IJCAI-05, Proceedings of the Nineteenth International Joint Conference
               on Artificial Intelligence, Edinburgh, Scotland, UK, July 30 - August
               5, 2005},
  pages     = {752--757},
  publisher = {Professional Book Center},
  year      = {2005},
  url       = {http://ijcai.org/Proceedings/05/Papers/1655.pdf},
  timestamp = {Tue, 20 Aug 2019 16:16:29 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/JongS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iros/SridharanS05,
  author    = {Mohan Sridharan and
               Peter Stone},
  title     = {Real-time vision on a mobile robot platform},
  booktitle = {2005 {IEEE/RSJ} International Conference on Intelligent Robots and
               Systems, Edmonton, Alberta, Canada, August 2-6, 2005},
  pages     = {2148--2153},
  publisher = {{IEEE}},
  year      = {2005},
  url       = {https://doi.org/10.1109/IROS.2005.1545540},
  doi       = {10.1109/IROS.2005.1545540},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/iros/SridharanS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Editor "'t Hoen" is written in "von Last, First" form so the particle is not folded
% into the given names. doi/url store the raw identifier (unescaped "_"); this assumes
% a style that typesets them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/lamas/AhmadiS05,
  author    = {Mazda Ahmadi and
               Peter Stone},
  editor    = {Karl Tuyls and
               't Hoen, Pieter Jan and
               Katja Verbeeck and
               Sandip Sen},
  title     = {Multi-robot Learning for Continuous Area Sweeping},
  booktitle = {Learning and Adaption in Multi-Agent Systems, First International
               Workshop, {LAMAS} 2005, Utrecht, The Netherlands, July 25, 2005, Revised
               Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3898},
  pages     = {47--70},
  publisher = {Springer},
  year      = {2005},
  url       = {https://doi.org/10.1007/11691839_2},
  doi       = {10.1007/11691839_2},
  timestamp = {Tue, 14 May 2019 10:00:47 +0200},
  biburl    = {https://dblp.org/rec/conf/lamas/AhmadiS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Editor "'t Hoen" is written in "von Last, First" form so the particle is not folded
% into the given names. doi/url store the raw identifier (unescaped "_"); this assumes
% a style that typesets them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/lamas/DresnerS05,
  author    = {Kurt M. Dresner and
               Peter Stone},
  editor    = {Karl Tuyls and
               't Hoen, Pieter Jan and
               Katja Verbeeck and
               Sandip Sen},
  title     = {Multiagent Traffic Management: Opportunities for Multiagent Learning},
  booktitle = {Learning and Adaption in Multi-Agent Systems, First International
               Workshop, {LAMAS} 2005, Utrecht, The Netherlands, July 25, 2005, Revised
               Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3898},
  pages     = {129--138},
  publisher = {Springer},
  year      = {2005},
  url       = {https://doi.org/10.1007/11691839_7},
  doi       = {10.1007/11691839_7},
  timestamp = {Wed, 24 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/lamas/DresnerS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/robocup/StoneKTL05,
  author    = {Peter Stone and
               Gregory Kuhlmann and
               Matthew E. Taylor and
               Yaxin Liu},
  editor    = {Ansgar Bredenfeld and
               Adam Jacoff and
               Itsuki Noda and
               Yasutake Takahashi},
  title     = {Keepaway Soccer: From Machine Learning Testbed to Benchmark},
  booktitle = {RoboCup 2005: Robot Soccer World Cup {IX}},
  series    = {Lecture Notes in Computer Science},
  volume    = {4020},
  pages     = {93--105},
  publisher = {Springer},
  year      = {2005},
  url       = {https://doi.org/10.1007/11780519_9},
  doi       = {10.1007/11780519_9},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneKTL05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% "RoboCup" is braced in the title so that sentence-casing styles keep its capitals.
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/robocup/SridharanS05,
  author    = {Mohan Sridharan and
               Peter Stone},
  editor    = {Ansgar Bredenfeld and
               Adam Jacoff and
               Itsuki Noda and
               Yasutake Takahashi},
  title     = {Towards Eliminating Manual Color Calibration at {RoboCup}},
  booktitle = {RoboCup 2005: Robot Soccer World Cup {IX}},
  series    = {Lecture Notes in Computer Science},
  volume    = {4020},
  pages     = {673--681},
  publisher = {Springer},
  year      = {2005},
  url       = {https://doi.org/10.1007/11780519_68},
  doi       = {10.1007/11780519_68},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/SridharanS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/sara/SherstovS05,
  author    = {Alexander A. Sherstov and
               Peter Stone},
  editor    = {Jean{-}Daniel Zucker and
               Lorenza Saitta},
  title     = {Function Approximation via Tile Coding: Automating Parameter Choice},
  booktitle = {Abstraction, Reformulation and Approximation, 6th International Symposium,
               {SARA} 2005, Airth Castle, Scotland, UK, July 26-29, 2005, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {3607},
  pages     = {194--205},
  publisher = {Springer},
  year      = {2005},
  url       = {https://doi.org/10.1007/11527862_14},
  doi       = {10.1007/11527862_14},
  timestamp = {Tue, 14 May 2019 10:00:38 +0200},
  biburl    = {https://dblp.org/rec/conf/sara/SherstovS05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/eaai/WhitesonS04,
  author    = {Shimon Whiteson and
               Peter Stone},
  title     = {Adaptive job routing and scheduling},
  journal   = {Eng. Appl. Artif. Intell.},
  volume    = {17},
  number    = {7},
  pages     = {855--869},
  year      = {2004},
  url       = {https://doi.org/10.1016/j.engappai.2004.08.027},
  doi       = {10.1016/J.ENGAPPAI.2004.08.027},
  timestamp = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/eaai/WhitesonS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% "RoboCup" is braced in the title so that sentence-casing styles keep its capitals.
@article{DBLP:journals/jeric/SklarPS04,
  author    = {Elizabeth Sklar and
               Simon Parsons and
               Peter Stone},
  title     = {Using {RoboCup} in university-level computer science education},
  journal   = {{ACM} J. Educ. Resour. Comput.},
  volume    = {4},
  number    = {2},
  pages     = {4},
  year      = {2004},
  url       = {https://doi.org/10.1145/1071620.1071624},
  doi       = {10.1145/1071620.1071624},
  timestamp = {Sun, 17 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jeric/SklarPS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% The agent name "TacTex-03" is braced so that sentence-casing styles keep its capitals.
@article{DBLP:journals/sigecom/PardoeS04,
  author    = {David Pardoe and
               Peter Stone},
  title     = {{TacTex-03}: a supply chain management agent},
  journal   = {SIGecom Exch.},
  volume    = {4},
  number    = {3},
  pages     = {19--28},
  year      = {2004},
  url       = {https://doi.org/10.1145/1120701.1120705},
  doi       = {10.1145/1120701.1120705},
  timestamp = {Thu, 04 Jun 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/sigecom/PardoeS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/KohlS04,
  author    = {Nate Kohl and
               Peter Stone},
  editor    = {Deborah L. McGuinness and
               George Ferguson},
  title     = {Machine Learning for Fast Quadrupedal Locomotion},
  booktitle = {Proceedings of the Nineteenth National Conference on Artificial Intelligence,
               Sixteenth Conference on Innovative Applications of Artificial Intelligence,
               July 25-29, 2004, San Jose, California, {USA}},
  pages     = {611--616},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2004},
  url       = {http://www.aaai.org/Library/AAAI/2004/aaai04-097.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/KohlS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/WhitesonS04,
  author    = {Shimon Whiteson and
               Peter Stone},
  editor    = {Deborah L. McGuinness and
               George Ferguson},
  title     = {Towards Autonomic Computing: Adaptive Job Routing and Scheduling},
  booktitle = {Proceedings of the Nineteenth National Conference on Artificial Intelligence,
               Sixteenth Conference on Innovative Applications of Artificial Intelligence,
               July 25-29, 2004, San Jose, California, {USA}},
  pages     = {916--922},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2004},
  timestamp = {Wed, 21 Jul 2004 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/WhitesonS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/amec/PardoeS04,
  author    = {David Pardoe and
               Peter Stone},
  editor    = {Peyman Faratin and
               Juan A. Rodr{\'{\i}}guez{-}Aguilar},
  title     = {Bidding for Customer Orders in {TAC} {SCM}},
  booktitle = {Agent-Mediated Electronic Commerce VI, Theories for and Engineering
               of Distributed Mechanisms and Systems, {AAMAS} 2004 Workshop, {AMEC}
               2004, New York, NY, USA, July 19, 2004, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3435},
  pages     = {143--157},
  publisher = {Springer},
  year      = {2004},
  url       = {https://doi.org/10.1007/11575726_11},
  doi       = {10.1007/11575726_11},
  timestamp = {Tue, 14 May 2019 10:00:39 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/PardoeS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/amec/SherstovS04,
  author    = {Alexander A. Sherstov and
               Peter Stone},
  editor    = {Peyman Faratin and
               Juan A. Rodr{\'{\i}}guez{-}Aguilar},
  title     = {Three Automated Stock-Trading Agents: {A} Comparative Study},
  booktitle = {Agent-Mediated Electronic Commerce VI, Theories for and Engineering
               of Distributed Mechanisms and Systems, {AAMAS} 2004 Workshop, {AMEC}
               2004, New York, NY, USA, July 19, 2004, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3435},
  pages     = {173--187},
  publisher = {Springer},
  year      = {2004},
  url       = {https://doi.org/10.1007/11575726_13},
  doi       = {10.1007/11575726_13},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/SherstovS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/DresnerS04,
  author    = {Kurt M. Dresner and
               Peter Stone},
  title     = {Multiagent Traffic Management: {A} Reservation-Based Intersection Control Mechanism},
  booktitle = {3rd International Joint Conference on Autonomous Agents and Multiagent
               Systems {(AAMAS} 2004), 19-23 August 2004, New York, NY, {USA}},
  pages     = {530--537},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  url       = {https://doi.ieeecomputersociety.org/10.1109/AAMAS.2004.10121},
  doi       = {10.1109/AAMAS.2004.10121},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/DresnerS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/PardoeS04,
  author    = {David Pardoe and
               Peter Stone},
  title     = {Agent-Based Supply Chain Management: Bidding for Customer Orders},
  booktitle = {3rd International Joint Conference on Autonomous Agents and Multiagent
               Systems {(AAMAS} 2004), 19-23 August 2004, New York, NY, {USA}},
  pages     = {1442--1443},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  url       = {https://doi.ieeecomputersociety.org/10.1109/AAMAS.2004.10276},
  doi       = {10.1109/AAMAS.2004.10276},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/PardoeS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/crv/SridharanS04,
  author    = {Mohan Sridharan and
               Peter Stone},
  title     = {Towards On-Board Color Constancy on Mobile Robots},
  booktitle = {1st Canadian Conference on Computer and Robot Vision {(CRV} 2004)
               17-19 May 2004, London, Ontario, Canada},
  pages     = {130--137},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  url       = {https://doi.org/10.1109/CCCRV.2004.1301436},
  doi       = {10.1109/CCCRV.2004.1301436},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/crv/SridharanS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icac/WhitesonS04,
  author    = {Shimon Whiteson and
               Peter Stone},
  title     = {Towards Autonomic Computing: Adaptive Network Routing and Scheduling},
  booktitle = {1st International Conference on Autonomic Computing {(ICAC} 2004),
               17-19 May 2004, New York, NY, {USA}},
  pages     = {286--287},
  publisher = {{IEEE} Computer Society},
  year      = {2004},
  url       = {https://doi.ieeecomputersociety.org/10.1109/ICAC.2004.62},
  doi       = {10.1109/ICAC.2004.62},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icac/WhitesonS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/KohlS04,
  author    = {Nate Kohl and
               Peter Stone},
  title     = {Policy Gradient Reinforcement Learning for Fast Quadrupedal Locomotion},
  booktitle = {Proceedings of the 2004 {IEEE} International Conference on Robotics
               and Automation, {ICRA} 2004, April 26 - May 1, 2004, New Orleans,
               LA, {USA}},
  pages     = {2619--2624},
  publisher = {{IEEE}},
  year      = {2004},
  url       = {https://doi.org/10.1109/ROBOT.2004.1307456},
  doi       = {10.1109/ROBOT.2004.1307456},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/KohlS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/isbi/WahleOVBBRCSMCFS04,
  author    = {Andreas Wahle and
               Mark E. Olszewski and
               Sarah C. Vigmostad and
               Kathleen Braddy and
               Theresa Brennan and
               James D. Rossen and
               Krishnan B. Chandran and
               Milan Sonka and
               Rub{\'{e}}n Medina and
               A. Coskun and
               Charles Feldman and
               Peter Stone},
  title     = {Quantitative Analysis of Circumferential Plaque Distribution in Human
               Coronary Arteries in Relation to Local Vessel Curvature},
  booktitle = {Proceedings of the 2004 {IEEE} International Symposium on Biomedical
               Imaging: From Nano to Macro, Arlington, VA, USA, 15-18 April 2004},
  pages     = {531--534},
  publisher = {{IEEE}},
  year      = {2004},
  url       = {https://doi.org/10.1109/ISBI.2004.1398592},
  doi       = {10.1109/ISBI.2004.1398592},
  timestamp = {Sat, 28 Oct 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/isbi/WahleOVBBRCSMCFS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/robocup/SridharanS04,
  author    = {Mohan Sridharan and
               Peter Stone},
  editor    = {Daniele Nardi and
               Martin A. Riedmiller and
               Claude Sammut and
               Jos{\'{e}} Santos{-}Victor},
  title     = {Towards Illumination Invariance in the Legged League},
  booktitle = {RoboCup 2004: Robot Soccer World Cup {VIII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3276},
  pages     = {196--208},
  publisher = {Springer},
  year      = {2004},
  url       = {https://doi.org/10.1007/978-3-540-32256-6_16},
  doi       = {10.1007/978-3-540-32256-6_16},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/SridharanS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/robocup/StrongerS04,
  author    = {Daniel Stronger and
               Peter Stone},
  editor    = {Daniele Nardi and
               Martin A. Riedmiller and
               Claude Sammut and
               Jos{\'{e}} Santos{-}Victor},
  title     = {A Model-Based Approach to Robot Joint Control},
  booktitle = {RoboCup 2004: Robot Soccer World Cup {VIII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3276},
  pages     = {297--309},
  publisher = {Springer},
  year      = {2004},
  url       = {https://doi.org/10.1007/978-3-540-32256-6_24},
  doi       = {10.1007/978-3-540-32256-6_24},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StrongerS04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% The team name "UT Austin Villa" is braced as a whole so that sentence-casing styles
% keep its capitals. doi/url store the raw identifier (unescaped "_"); this assumes a
% style that typesets them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/robocup/KuhlmannSL04,
  author    = {Gregory Kuhlmann and
               Peter Stone and
               Justin Lallinger},
  editor    = {Daniele Nardi and
               Martin A. Riedmiller and
               Claude Sammut and
               Jos{\'{e}} Santos{-}Victor},
  title     = {The {UT Austin Villa} 2003 Champion Simulator Coach: {A} Machine Learning Approach},
  booktitle = {RoboCup 2004: Robot Soccer World Cup {VIII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3276},
  pages     = {636--644},
  publisher = {Springer},
  year      = {2004},
  url       = {https://doi.org/10.1007/978-3-540-32256-6_61},
  doi       = {10.1007/978-3-540-32256-6_61},
  timestamp = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/KuhlmannSL04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% The software names "RoboCup Soccer Server" and "CMUnited" are braced so that
% sentence-casing styles keep their capitals.
@article{DBLP:journals/aamas/NodaS03,
  author    = {Itsuki Noda and
               Peter Stone},
  title     = {The {RoboCup Soccer Server} and {CMUnited} Clients: Implemented Infrastructure
               for {MAS} Research},
  journal   = {Auton. Agents Multi Agent Syst.},
  volume    = {7},
  number    = {1-2},
  pages     = {101--120},
  year      = {2003},
  url       = {https://doi.org/10.1023/A:1024128904944},
  doi       = {10.1023/A:1024128904944},
  timestamp = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/aamas/NodaS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% The event name "Trading Agent Competition" is braced so that sentence-casing styles
% keep its capitals.
@article{DBLP:journals/electronicmarkets/WellmanGSW03,
  author    = {Michael P. Wellman and
               Amy Greenwald and
               Peter Stone and
               Peter R. Wurman},
  title     = {The 2001 {Trading Agent Competition}},
  journal   = {Electron. Mark.},
  volume    = {13},
  number    = {1},
  pages     = {4--12},
  year      = {2003},
  url       = {https://doi.org/10.1080/1019678032000062212},
  doi       = {10.1080/1019678032000062212},
  timestamp = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/electronicmarkets/WellmanGSW03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/expert/GreenwaldJS03,
  author    = {Amy Greenwald and
               Nicholas R. Jennings and
               Peter Stone},
  title     = {Guest Editors' Introduction: Agents and Markets},
  journal   = {{IEEE} Intell. Syst.},
  volume    = {18},
  number    = {6},
  pages     = {12--14},
  year      = {2003},
  url       = {https://doi.org/10.1109/MIS.2003.1249164},
  doi       = {10.1109/MIS.2003.1249164},
  timestamp = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/expert/GreenwaldJS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jair/StoneSLCM03,
  author    = {Peter Stone and
               Robert E. Schapire and
               Michael L. Littman and
               J{\'{a}}nos A. Csirik and
               David A. McAllester},
  title     = {Decision-Theoretic Bidding Based on Learned Density Models in Simultaneous,
               Interacting Auctions},
  journal   = {J. Artif. Intell. Res.},
  volume    = {19},
  pages     = {209--242},
  year      = {2003},
  url       = {https://doi.org/10.1613/jair.1200},
  doi       = {10.1613/JAIR.1200},
  timestamp = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jair/StoneSLCM03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/ACMicec/YuS03,
  author    = {Ronggang Yu and
               Peter Stone},
  editor    = {Norman M. Sadeh and
               Mary Jo Dively and
               Robert J. Kauffman and
               Yannis Labrou and
               Onn Shehory and
               Rahul Telang and
               Lorrie Faith Cranor},
  title     = {Performance analysis of a counter-intuitive automated stock-trading agent},
  booktitle = {Proceedings of the 5th International Conference on Electronic Commerce,
               {ICEC} 2003, Pittsburgh, Pennsylvania, USA, September 30 - October
               03, 2003},
  series    = {{ACM} International Conference Proceeding Series},
  volume    = {50},
  pages     = {40--46},
  publisher = {{ACM}},
  year      = {2003},
  url       = {https://doi.org/10.1145/948005.948011},
  doi       = {10.1145/948005.948011},
  timestamp = {Tue, 06 Apr 2021 12:12:56 +0200},
  biburl    = {https://dblp.org/rec/conf/ACMicec/YuS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% "Ronggang Yu" follows the spelling used in DBLP:conf/ACMicec/YuS03.
% NOTE(review): given names were expanded from "Y. Feng" / "Rong Yu"; confirm against
% the publisher record.
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/amec/FengYS03,
  author    = {Yi Feng and
               Ronggang Yu and
               Peter Stone},
  editor    = {Peyman Faratin and
               David C. Parkes and
               Juan A. Rodr{\'{\i}}guez{-}Aguilar and
               William E. Walsh},
  title     = {Two Stock-Trading Agents: Market Making and Technical Analysis},
  booktitle = {Agent-Mediated Electronic Commerce V, Designing Mechanisms and Systems,
               {AAMAS} 2003 Workshop, {AMEC} 2003, Melbourne, Australia, July 15,
               2003, Revised Selected Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {3048},
  pages     = {18--36},
  publisher = {Springer},
  year      = {2003},
  url       = {https://doi.org/10.1007/978-3-540-25947-3_2},
  doi       = {10.1007/978-3-540-25947-3_2},
  timestamp = {Sat, 14 Sep 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/FengYS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/WhitesonS03,
  author    = {Shimon Whiteson and
               Peter Stone},
  title     = {Concurrent layered learning},
  booktitle = {The Second International Joint Conference on Autonomous Agents {\&}
               Multiagent Systems, {AAMAS} 2003, July 14-18, 2003, Melbourne, Victoria,
               Australia, Proceedings},
  pages     = {193--200},
  publisher = {{ACM}},
  year      = {2003},
  url       = {https://doi.org/10.1145/860575.860607},
  doi       = {10.1145/860575.860607},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/WhitesonS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/gecco/WhitesonKMS03,
  author    = {Shimon Whiteson and
               Nate Kohl and
               Risto Miikkulainen and
               Peter Stone},
  editor    = {Erick Cant{\'{u}}{-}Paz and
               James A. Foster and
               Kalyanmoy Deb and
               Lawrence Davis and
               Rajkumar Roy and
               Una{-}May O'Reilly and
               Hans{-}Georg Beyer and
               Russell K. Standish and
               Graham Kendall and
               Stewart W. Wilson and
               Mark Harman and
               Joachim Wegener and
               Dipankar Dasgupta and
               Mitchell A. Potter and
               Alan C. Schultz and
               Kathryn A. Dowsland and
               Natasa Jonoska and
               Julian F. Miller},
  title     = {Evolving Keepaway Soccer Players through Task Decomposition},
  booktitle = {Genetic and Evolutionary Computation - {GECCO} 2003, Genetic and Evolutionary
               Computation Conference, Chicago, IL, USA, July 12-16, 2003. Proceedings,
               Part {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2723},
  pages     = {356--368},
  publisher = {Springer},
  year      = {2003},
  url       = {https://doi.org/10.1007/3-540-45105-6_41},
  doi       = {10.1007/3-540-45105-6_41},
  timestamp = {Tue, 14 May 2019 10:00:35 +0200},
  biburl    = {https://dblp.org/rec/conf/gecco/WhitesonKMS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/SinghLJPS03,
  author    = {Satinder Singh and
               Michael L. Littman and
               Nicholas K. Jong and
               David Pardoe and
               Peter Stone},
  editor    = {Tom Fawcett and
               Nina Mishra},
  title     = {Learning Predictive State Representations},
  booktitle = {Machine Learning, Proceedings of the Twentieth International Conference
               {(ICML} 2003), August 21-24, 2003, Washington, DC, {USA}},
  pages     = {712--719},
  publisher = {{AAAI} Press},
  year      = {2003},
  url       = {http://www.aaai.org/Library/ICML/2003/icml03-093.php},
  timestamp = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/SinghLJPS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% "RoboCup" is braced in the title so that sentence-casing styles keep its capitals.
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/robocup/Stone03,
  author    = {Peter Stone},
  editor    = {Daniel Polani and
               Brett Browning and
               Andrea Bonarini and
               Kazuo Yoshida},
  title     = {{RoboCup} as an Introduction to {CS} Research},
  booktitle = {RoboCup 2003: Robot Soccer World Cup {VII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3020},
  pages     = {284--295},
  publisher = {Springer},
  year      = {2003},
  url       = {https://doi.org/10.1007/978-3-540-25940-4_25},
  doi       = {10.1007/978-3-540-25940-4_25},
  timestamp = {Tue, 14 May 2019 10:00:53 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/Stone03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% "RoboCup" is braced in the title so that sentence-casing styles keep its capitals.
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/robocup/SklarPS03,
  author    = {Elizabeth Sklar and
               Simon Parsons and
               Peter Stone},
  editor    = {Daniel Polani and
               Brett Browning and
               Andrea Bonarini and
               Kazuo Yoshida},
  title     = {{RoboCup} in Higher Education: {A} Preliminary Report},
  booktitle = {RoboCup 2003: Robot Soccer World Cup {VII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3020},
  pages     = {296--307},
  publisher = {Springer},
  year      = {2003},
  url       = {https://doi.org/10.1007/978-3-540-25940-4_26},
  doi       = {10.1007/978-3-540-25940-4_26},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/SklarPS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/robocup/KuhlmannS03,
  author    = {Gregory Kuhlmann and
               Peter Stone},
  editor    = {Daniel Polani and
               Brett Browning and
               Andrea Bonarini and
               Kazuo Yoshida},
  title     = {Progress in Learning 3 vs. 2 Keepaway},
  booktitle = {RoboCup 2003: Robot Soccer World Cup {VII}},
  series    = {Lecture Notes in Computer Science},
  volume    = {3020},
  pages     = {694--702},
  publisher = {Springer},
  year      = {2003},
  url       = {https://doi.org/10.1007/978-3-540-25940-4_68},
  doi       = {10.1007/978-3-540-25940-4_68},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/KuhlmannS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% "Nash" is a proper name: capitalised and braced so that no style lowercases it.
@inproceedings{DBLP:conf/sigecom/LittmanS03,
  author    = {Michael L. Littman and
               Peter Stone},
  editor    = {Daniel A. Menasc{\'{e}} and
               Noam Nisan},
  title     = {A polynomial-time {Nash} equilibrium algorithm for repeated games},
  booktitle = {Proceedings 4th {ACM} Conference on Electronic Commerce (EC-2003),
               San Diego, California, USA, June 9-12, 2003},
  pages     = {48--54},
  publisher = {{ACM}},
  year      = {2003},
  url       = {https://doi.org/10.1145/779928.779935},
  doi       = {10.1145/779928.779935},
  timestamp = {Tue, 27 Nov 2018 11:56:48 +0100},
  biburl    = {https://dblp.org/rec/conf/sigecom/LittmanS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/smc/KuhlmannS03,
  author    = {Gregory Kuhlmann and
               Peter Stone},
  title     = {Progress in learning 3 vs. 2 keepaway},
  booktitle = {Proceedings of the {IEEE} International Conference on Systems, Man
               {\&} Cybernetics: Washington, D.C., USA, 5-8 October 2003},
  pages     = {52--59},
  publisher = {{IEEE}},
  year      = {2003},
  url       = {https://doi.org/10.1109/ICSMC.2003.1243791},
  doi       = {10.1109/ICSMC.2003.1243791},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/smc/KuhlmannS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% "RoboCup-2001" is braced in the title so that sentence-casing styles keep its capitals.
@article{DBLP:journals/aim/VelosoBSKYEAJSMKCHHC02,
  author    = {Manuela M. Veloso and
               Tucker R. Balch and
               Peter Stone and
               Hiroaki Kitano and
               Fuminori Yamasaki and
               Ken Endo and
               Minoru Asada and
               Mansour Jamzad and
               Sayyed Bashir Sadjad and
               Vahab S. Mirrokni and
               Moslem Kazemi and
               Hamid Reza Chitsaz and
               Abbas Heydarnoori and
               Mohammad Taghi Hajiaghayi and
               Ehsan Chiniforooshan},
  title     = {{RoboCup-2001}: The Fifth Robotic Soccer World Championships},
  journal   = {{AI} Mag.},
  volume    = {23},
  number    = {1},
  pages     = {55--68},
  year      = {2002},
  url       = {https://doi.org/10.1609/aimag.v23i1.1609},
  doi       = {10.1609/AIMAG.V23I1.1609},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/VelosoBSKYEAJSMKCHHC02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/aim/KarlgrenKGFTSGSBFSHCBGSDL02,
  author    = {Jussi Karlgren and
               Pentti Kanerva and
               Bj{\"{o}}rn Gamb{\"{a}}ck and
               Kenneth D. Forbus and
               Kagan Tumer and
               Peter Stone and
               Kai Goebel and
               Gaurav S. Sukhatme and
               Tucker R. Balch and
               Bernd Fischer and
               Doug Smith and
               Sanda M. Harabagiu and
               Vinay K. Chaudri and
               Mike Barley and
               Hans W. Guesgen and
               Thomas F. Stahovich and
               Randall Davis and
               James A. Landay},
  title     = {The 2002 {AAAI} Spring Symposium Series},
  journal   = {{AI} Mag.},
  volume    = {23},
  number    = {4},
  pages     = {101--106},
  year      = {2002},
  url       = {https://doi.org/10.1609/aimag.v23i4.1675},
  doi       = {10.1609/AIMAG.V23I4.1675},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/KarlgrenKGFTSGSBFSHCBGSDL02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% The event name "Trading Agent Competition" is braced so that sentence-casing styles
% keep its capitals.
@inproceedings{DBLP:conf/aaai/WellmanGSW02,
  author    = {Michael P. Wellman and
               Amy Greenwald and
               Peter Stone and
               Peter R. Wurman},
  editor    = {Rina Dechter and
               Michael J. Kearns and
               Richard S. Sutton},
  title     = {The 2001 {Trading Agent Competition}},
  booktitle = {Proceedings of the Eighteenth National Conference on Artificial Intelligence
               and Fourteenth Conference on Innovative Applications of Artificial
               Intelligence, July 28 - August 1, 2002, Edmonton, Alberta, Canada},
  pages     = {935--942},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2002},
  url       = {http://www.aaai.org/Library/AAAI/2002/aaai02-138.php},
  timestamp = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/WellmanGSW02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% The agent name "ATTac-2001" is braced so that sentence-casing styles keep its capitals.
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/amec/StoneSCLM02,
  author    = {Peter Stone and
               Robert E. Schapire and
               J{\'{a}}nos A. Csirik and
               Michael L. Littman and
               David A. McAllester},
  editor    = {Julian A. Padget and
               Onn Shehory and
               David C. Parkes and
               Norman M. Sadeh and
               William E. Walsh},
  title     = {{ATTac-2001}: {A} Learning, Autonomous Bidding Agent},
  booktitle = {Agent-Mediated Electronic Commerce IV, Designing Mechanisms and Systems,
               {AAMAS} 2002 Workshop on Agent Mediated Electronic Commerce, Bologna,
               Italy, July 16, 2002, Revised Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {2531},
  pages     = {143--160},
  publisher = {Springer},
  year      = {2002},
  url       = {https://doi.org/10.1007/3-540-36378-5_9},
  doi       = {10.1007/3-540-36378-5_9},
  timestamp = {Tue, 14 May 2019 10:00:39 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/StoneSCLM02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% doi/url store the raw identifier (unescaped "_"); this assumes a style that typesets
% them verbatim (\url/\doi or biblatex).
@inproceedings{DBLP:conf/amec/ReitsmaSCL02,
  author    = {Paul S. A. Reitsma and
               Peter Stone and
               J{\'{a}}nos A. Csirik and
               Michael L. Littman},
  editor    = {Julian A. Padget and
               Onn Shehory and
               David C. Parkes and
               Norman M. Sadeh and
               William E. Walsh},
  title     = {Self-Enforcing Strategic Demand Reduction},
  booktitle = {Agent-Mediated Electronic Commerce IV, Designing Mechanisms and Systems,
               {AAMAS} 2002 Workshop on Agent Mediated Electronic Commerce, Bologna,
               Italy, July 16, 2002, Revised Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {2531},
  pages     = {289--306},
  publisher = {Springer},
  year      = {2002},
  url       = {https://doi.org/10.1007/3-540-36378-5_18},
  doi       = {10.1007/3-540-36378-5_18},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/amec/ReitsmaSCL02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/atal/ReitsmaSCL02,
  author    = {Paul S. A. Reitsma and
               Peter Stone and
               J{\'{a}}nos A. Csirik and
               Michael L. Littman},
  title     = {Randomized strategic demand reduction: getting more by asking for less},
  booktitle = {The First International Joint Conference on Autonomous Agents {\&}
               Multiagent Systems, {AAMAS} 2002, July 15-19, 2002, Bologna, Italy,
               Proceedings},
  pages     = {162--163},
  publisher = {{ACM}},
  year      = {2002},
  url       = {https://doi.org/10.1145/544741.544778},
  doi       = {10.1145/544741.544778},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/ReitsmaSCL02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/SchapireSMLC02,
  author    = {Robert E. Schapire and
               Peter Stone and
               David A. McAllester and
               Michael L. Littman and
               J{\'{a}}nos A. Csirik},
  editor    = {Claude Sammut and
               Achim G. Hoffmann},
  title     = {Modeling Auction Price Uncertainty Using Boosting-based Conditional
               Density Estimation},
  booktitle = {Machine Learning, Proceedings of the Nineteenth International Conference
               {(ICML} 2002), University of New South Wales, Sydney, Australia, July
               8-12, 2002},
  pages     = {546--553},
  publisher = {Morgan Kaufmann},
  year      = {2002},
  timestamp = {Tue, 16 Mar 2004 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/SchapireSMLC02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Paper in the RoboCup 2002 volume (LNCS 2752).
% RoboCup is braced in the title so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/robocup/Stone02,
  author    = {Peter Stone},
  editor    = {Gal A. Kaminka and Pedro U. Lima and Ra{\'{u}}l Rojas},
  title     = {Multiagent Competitions and Research: Lessons from {RoboCup} and {TAC}},
  booktitle = {RoboCup 2002: Robot Soccer World Cup {VI}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2752},
  pages     = {224--237},
  publisher = {Springer},
  year      = {2002},
  url       = {https://doi.org/10.1007/978-3-540-45135-8\_17},
  doi       = {10.1007/978-3-540-45135-8\_17},
  timestamp = {Mon, 23 Nov 2020 14:36:01 +0100},
  biburl    = {https://dblp.org/rec/conf/robocup/Stone02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, AI Mag. 22(1), 2001.
% RoboCup-2000 is braced so sentence-casing styles do not turn it into "Robocup-2000".
@article{DBLP:journals/aim/Stone01,
  author    = {Peter Stone},
  title     = {{RoboCup-2000}: The Fourth Robotic Soccer World Championships},
  journal   = {{AI} Mag.},
  volume    = {22},
  number    = {1},
  pages     = {11--38},
  year      = {2001},
  url       = {https://doi.org/10.1609/aimag.v22i1.1541},
  doi       = {10.1609/AIMAG.V22I1.1541},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/Stone01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE Internet Comput. 5(2), 2001.
@article{DBLP:journals/internet/GreenwaldS01,
  author    = {Amy Greenwald and Peter Stone},
  title     = {Autonomous Bidding Agents in the Trading Agent Competition},
  journal   = {{IEEE} Internet Comput.},
  volume    = {5},
  number    = {2},
  pages     = {52--60},
  year      = {2001},
  url       = {https://doi.org/10.1109/4236.914648},
  doi       = {10.1109/4236.914648},
  timestamp = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/internet/GreenwaldS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. Artif. Intell. Res. 15, 2001.
% ATTac-2000 is braced so sentence-casing styles do not render it as "Attac-2000".
@article{DBLP:journals/jair/StoneLSK01,
  author    = {Peter Stone and Michael L. Littman and Satinder Singh and Michael J. Kearns},
  title     = {{ATTac-2000}: An Adaptive Autonomous Bidding Agent},
  journal   = {J. Artif. Intell. Res.},
  volume    = {15},
  pages     = {189--206},
  year      = {2001},
  url       = {https://doi.org/10.1613/jair.865},
  doi       = {10.1613/JAIR.865},
  timestamp = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jair/StoneLSK01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AGENTS 2001 (ACM).
% ATTac-2000 is braced so sentence-casing styles do not render it as "Attac-2000".
@inproceedings{DBLP:conf/agents/StoneLSK01,
  author    = {Peter Stone and Michael L. Littman and Satinder Singh and Michael J. Kearns},
  editor    = {Elisabeth Andr{\'{e}} and Sandip Sen and Claude Frasson and J{\"{o}}rg P. M{\"{u}}ller},
  title     = {{ATTac-2000}: an adaptive autonomous bidding agent},
  booktitle = {Proceedings of the Fifth International Conference on Autonomous Agents, {AGENTS} 2001, Montreal, Canada, May 28 - June 1, 2001},
  pages     = {238--245},
  publisher = {{ACM}},
  year      = {2001},
  url       = {https://doi.org/10.1145/375735.376301},
  doi       = {10.1145/375735.376301},
  timestamp = {Sat, 30 Sep 2023 09:33:47 +0200},
  biburl    = {https://dblp.org/rec/conf/agents/StoneLSK01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AGENTS 2001 (ACM).
@inproceedings{DBLP:conf/agents/StoneM01,
  author    = {Peter Stone and David A. McAllester},
  editor    = {Elisabeth Andr{\'{e}} and Sandip Sen and Claude Frasson and J{\"{o}}rg P. M{\"{u}}ller},
  title     = {An architecture for action selection in robotic soccer},
  booktitle = {Proceedings of the Fifth International Conference on Autonomous Agents, {AGENTS} 2001, Montreal, Canada, May 28 - June 1, 2001},
  pages     = {316--323},
  publisher = {{ACM}},
  year      = {2001},
  url       = {https://doi.org/10.1145/375735.376320},
  doi       = {10.1145/375735.376320},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/agents/StoneM01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AGENTS 2001 (ACM).
% First author is written in "Last, Jr., First" form; as "Charles Lee Isbell Jr." BibTeX would take "Jr." as the last name.
@inproceedings{DBLP:conf/agents/IsbellSKSS01,
  author    = {Isbell, Jr., Charles Lee and Christian R. Shelton and Michael J. Kearns and Satinder Singh and Peter Stone},
  editor    = {Elisabeth Andr{\'{e}} and Sandip Sen and Claude Frasson and J{\"{o}}rg P. M{\"{u}}ller},
  title     = {A social reinforcement learning agent},
  booktitle = {Proceedings of the Fifth International Conference on Autonomous Agents, {AGENTS} 2001, Montreal, Canada, May 28 - June 1, 2001},
  pages     = {377--384},
  publisher = {{ACM}},
  year      = {2001},
  url       = {https://doi.org/10.1145/375735.376334},
  doi       = {10.1145/375735.376334},
  timestamp = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/agents/IsbellSKSS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, ATAL 2001 (LNCS 2333).
@inproceedings{DBLP:conf/atal/LittmanS01,
  author    = {Michael L. Littman and Peter Stone},
  editor    = {John{-}Jules Ch. Meyer and Milind Tambe},
  title     = {Implicit Negotiation in Repeated Games},
  booktitle = {Intelligent Agents VIII, 8th International Workshop, {ATAL} 2001 Seattle, WA, USA, August 1-3, 2001, Revised Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {2333},
  pages     = {393--404},
  publisher = {Springer},
  year      = {2001},
  url       = {https://doi.org/10.1007/3-540-45448-9\_29},
  doi       = {10.1007/3-540-45448-9\_29},
  timestamp = {Tue, 14 May 2019 10:00:54 +0200},
  biburl    = {https://dblp.org/rec/conf/atal/LittmanS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICML 2001; the record carries no url/doi field.
% RoboCup is braced in the title so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/icml/StoneS01,
  author    = {Peter Stone and Richard S. Sutton},
  editor    = {Carla E. Brodley and Andrea Pohoreckyj Danyluk},
  title     = {Scaling Reinforcement Learning toward {RoboCup} Soccer},
  booktitle = {Proceedings of the Eighteenth International Conference on Machine Learning {(ICML} 2001), Williams College, Williamstown, MA, USA, June 28 - July 1, 2001},
  pages     = {537--544},
  publisher = {Morgan Kaufmann},
  year      = {2001},
  timestamp = {Wed, 27 Nov 2002 10:53:35 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/StoneS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, NIPS 2001 (MIT Press).
% First author is written in "Last, Jr., First" form; as "Charles Lee Isbell Jr." BibTeX would take "Jr." as the last name.
@inproceedings{DBLP:conf/nips/IsbellSKSS01,
  author    = {Isbell, Jr., Charles Lee and Christian R. Shelton and Michael J. Kearns and Satinder Singh and Peter Stone},
  editor    = {Thomas G. Dietterich and Suzanna Becker and Zoubin Ghahramani},
  title     = {Cobot: {A} Social Reinforcement Learning Agent},
  booktitle = {Advances in Neural Information Processing Systems 14 [Neural Information Processing Systems: Natural and Synthetic, {NIPS} 2001, December 3-8, 2001, Vancouver, British Columbia, Canada]},
  pages     = {1393--1400},
  publisher = {{MIT} Press},
  year      = {2001},
  url       = {https://proceedings.neurips.cc/paper/2001/hash/92bbd31f8e0e43a7da8a6295b251725f-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/IsbellSKSS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Paper in the RoboCup 2001 volume (LNCS 2377).
@inproceedings{DBLP:conf/robocup/StoneS01,
  author    = {Peter Stone and Richard S. Sutton},
  editor    = {Andreas Birk and Silvia Coradeschi and Satoshi Tadokoro},
  title     = {Keepaway Soccer: {A} Machine Learning Testbed},
  booktitle = {RoboCup 2001: Robot Soccer World Cup {V}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2377},
  pages     = {214--223},
  publisher = {Springer},
  year      = {2001},
  url       = {https://doi.org/10.1007/3-540-45603-1\_22},
  doi       = {10.1007/3-540-45603-1\_22},
  timestamp = {Tue, 14 May 2019 10:00:53 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Paper in the RoboCup 2001 volume (LNCS 2377).
% ATTUnited-2001 is braced so sentence-casing styles do not render it as "Attunited-2001".
@inproceedings{DBLP:conf/robocup/Stone01,
  author    = {Peter Stone},
  editor    = {Andreas Birk and Silvia Coradeschi and Satoshi Tadokoro},
  title     = {{ATTUnited-2001}: Using Heterogeneous Players},
  booktitle = {RoboCup 2001: Robot Soccer World Cup {V}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2377},
  pages     = {495--498},
  publisher = {Springer},
  year      = {2001},
  url       = {https://doi.org/10.1007/3-540-45603-1\_67},
  doi       = {10.1007/3-540-45603-1\_67},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/Stone01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, WELCOM 2001 (LNCS 2232).
% Title: removed the stray space before the colon and braced FAucS to keep its mixed-case spelling.
@inproceedings{DBLP:conf/welcom/CsirikLSS01,
  author    = {J{\'{a}}nos A. Csirik and Michael L. Littman and Satinder Singh and Peter Stone},
  editor    = {Ludger Fiege and Gero M{\"{u}}hl and Uwe G. Wilhelm},
  title     = {{FAucS}: An {FCC} Spectrum Auction Simulator for Autonomous Bidding Agents},
  booktitle = {Electronic Commerce, Second International Workshop, {WELCOM} 2001 Heidelberg, Germany, November 16-17, 2001, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {2232},
  pages     = {139--151},
  publisher = {Springer},
  year      = {2001},
  url       = {https://doi.org/10.1007/3-540-45598-1\_14},
  doi       = {10.1007/3-540-45598-1\_14},
  timestamp = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/welcom/CsirikLSS01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Edited proceedings volume for RoboCup 2000 (LNCS 2019).
@proceedings{DBLP:conf/robocup/2000,
  editor    = {Peter Stone and Tucker R. Balch and Gerhard K. Kraetzschmar},
  title     = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2019},
  publisher = {Springer},
  year      = {2001},
  url       = {https://doi.org/10.1007/3-540-45324-5},
  doi       = {10.1007/3-540-45324-5},
  isbn      = {3-540-42185-8},
  timestamp = {Tue, 14 May 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/2000.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Book, MIT Press, 2000.
@book{DBLP:books/daglib/0015985,
  author    = {Peter Stone},
  title     = {Layered learning in multiagent systems - a winning approach to robotic soccer},
  series    = {Intelligent robotics and autonomous agents},
  publisher = {{MIT} Press},
  year      = {2000},
  isbn      = {978-0-262-19438-9},
  timestamp = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/books/daglib/0015985.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, AI Mag. 21(1), 2000.
@article{DBLP:journals/aim/StoneVR00,
  author    = {Peter Stone and Manuela M. Veloso and Patrick Riley},
  title     = {{CMUNITED-98} Simulator Team},
  journal   = {{AI} Mag.},
  volume    = {21},
  number    = {1},
  pages     = {20--28},
  year      = {2000},
  url       = {https://doi.org/10.1609/aimag.v21i1.1491},
  doi       = {10.1609/AIMAG.V21I1.1491},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/StoneVR00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, AI Mag. 21(1), 2000.
@article{DBLP:journals/aim/VelosoBAHS00,
  author    = {Manuela M. Veloso and Michael H. Bowling and Sorin Achim and Kwun Han and Peter Stone},
  title     = {{CMUNITED-98:} RoboCup-98 Small-Robot World Champion Team},
  journal   = {{AI} Mag.},
  volume    = {21},
  number    = {1},
  pages     = {29--36},
  year      = {2000},
  url       = {https://doi.org/10.1609/aimag.v21i1.1492},
  doi       = {10.1609/AIMAG.V21I1.1492},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/VelosoBAHS00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, AI Mag. 21(3), 2000.
% RoboCup-99 is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/aim/CoradeschiKSBKA00,
  author    = {Silvia Coradeschi and Lars Karlsson and Peter Stone and Tucker R. Balch and Gerhard K. Kraetzschmar and Minoru Asada},
  title     = {Overview of {RoboCup-99}},
  journal   = {{AI} Mag.},
  volume    = {21},
  number    = {3},
  pages     = {11--18},
  year      = {2000},
  url       = {https://doi.org/10.1609/aimag.v21i3.1516},
  doi       = {10.1609/AIMAG.V21I3.1516},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/CoradeschiKSBKA00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, AI Mag. 21(3), 2000.
% CMUnited-99 is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/aim/StoneRV00,
  author    = {Peter Stone and Patrick Riley and Manuela M. Veloso},
  title     = {The {CMUnited-99} Champion Simulator Team},
  journal   = {{AI} Mag.},
  volume    = {21},
  number    = {3},
  pages     = {33--40},
  year      = {2000},
  url       = {https://doi.org/10.1609/aimag.v21i3.1520},
  doi       = {10.1609/AIMAG.V21I3.1520},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/StoneRV00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Auton. Robots 8(3), 2000.
@article{DBLP:journals/arobots/StoneV00,
  author    = {Peter Stone and Manuela M. Veloso},
  title     = {Multiagent Systems: {A} Survey from a Machine Learning Perspective},
  journal   = {Auton. Robots},
  volume    = {8},
  number    = {3},
  pages     = {345--383},
  year      = {2000},
  url       = {https://doi.org/10.1023/A:1008942012299},
  doi       = {10.1023/A:1008942012299},
  timestamp = {Thu, 18 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/arobots/StoneV00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI/IAAI 2000 proceedings.
% First author uses "Last, Jr., First" form so "Jr." is not parsed as the last name.
% The duplicated "on on" in the booktitle is removed; LambdaMOO is braced to keep its capitalization.
@inproceedings{DBLP:conf/aaai/IsbellKKSS00,
  author    = {Isbell, Jr., Charles Lee and Michael J. Kearns and David P. Kormann and Satinder Singh and Peter Stone},
  editor    = {Henry A. Kautz and Bruce W. Porter},
  title     = {Cobot in {LambdaMOO}: {A} Social Statistics Agent},
  booktitle = {Proceedings of the Seventeenth National Conference on Artificial Intelligence and Twelfth Conference on Innovative Applications of Artificial Intelligence, July 30 - August 3, 2000, Austin, Texas, {USA}},
  pages     = {36--41},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2000},
  url       = {http://www.aaai.org/Library/AAAI/2000/aaai00-006.php},
  timestamp = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/IsbellKKSS00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI/IAAI 2000 proceedings.
% The duplicated "on on" in the booktitle is removed.
@inproceedings{DBLP:conf/aaai/StoneRV00,
  author    = {Peter Stone and Patrick Riley and Manuela M. Veloso},
  editor    = {Henry A. Kautz and Bruce W. Porter},
  title     = {Defining and Using Ideal Teammate and Opponent Agent Models},
  booktitle = {Proceedings of the Seventeenth National Conference on Artificial Intelligence and Twelfth Conference on Innovative Applications of Artificial Intelligence, July 30 - August 3, 2000, Austin, Texas, {USA}},
  pages     = {1040--1045},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {2000},
  url       = {http://www.aaai.org/Library/IAAI/2000/iaai00-016.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/StoneRV00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, Infrastructure for Multi-Agent Systems 2000 (LNCS 1887).
% RoboCup and CMUnited are braced so sentence-casing styles keep their capitalization.
@inproceedings{DBLP:conf/agents/NodaS00,
  author    = {Itsuki Noda and Peter Stone},
  editor    = {Thomas Wagner and Omer F. Rana},
  title     = {The {RoboCup} Soccer Server and {CMUnited}: Implemented Infrastructure for {MAS} Research},
  booktitle = {Infrastructure for Agents, Multi-Agent Systems, and Scalable Multi-Agent Systems, International Workshop on Infrastructure for Multi-Agent Systems, Barcelona, Spain, June 3-7, 2000, Revised Papers},
  series    = {Lecture Notes in Computer Science},
  volume    = {1887},
  pages     = {94--101},
  publisher = {Springer},
  year      = {2000},
  url       = {https://doi.org/10.1007/3-540-47772-1\_10},
  doi       = {10.1007/3-540-47772-1\_10},
  timestamp = {Tue, 14 May 2019 10:00:38 +0200},
  biburl    = {https://dblp.org/rec/conf/agents/NodaS00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AGENTS 2000 (ACM).
@inproceedings{DBLP:conf/agents/StoneRV00,
  author    = {Peter Stone and Patrick Riley and Manuela M. Veloso},
  editor    = {Carles Sierra and Maria L. Gini and Jeffrey S. Rosenschein},
  title     = {Layered disclosure: why is the agent doing what it's doing?},
  booktitle = {Proceedings of the Fourth International Conference on Autonomous Agents, {AGENTS} 2000, Barcelona, Catalonia, Spain, June 3-7, 2000},
  pages     = {225--226},
  publisher = {{ACM}},
  year      = {2000},
  url       = {https://doi.org/10.1145/336595.337387},
  doi       = {10.1145/336595.337387},
  timestamp = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/agents/StoneRV00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, ATAL 2000 (LNCS 1986).
@inproceedings{DBLP:conf/atal/RileySV00,
  author    = {Patrick Riley and Peter Stone and Manuela M. Veloso},
  editor    = {Cristiano Castelfranchi and Yves Lesp{\'{e}}rance},
  title     = {Layered Disclosure: Revealing Agents' Internals},
  booktitle = {Intelligent Agents {VII.} Agent Theories Architectures and Languages, 7th International Workshop, {ATAL} 2000, Boston, MA, USA, July 7-9, 2000, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {1986},
  pages     = {61--72},
  publisher = {Springer},
  year      = {2000},
  url       = {https://doi.org/10.1007/3-540-44631-1\_5},
  doi       = {10.1007/3-540-44631-1\_5},
  timestamp = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/RileySV00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ECML 2000 (LNCS 1810).
% First editor is written in "Last, First" form; in "First von Last" order BibTeX would read "de" as a
% von particle and take only the final word as the last name.
% NOTE(review): assumes the compound family name is "Lopez de Mantaras" -- confirm.
@inproceedings{DBLP:conf/ecml/StoneV00,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {L{\'{o}}pez de M{\'{a}}ntaras, Ram{\'{o}}n and Enric Plaza},
  title     = {Layered Learning},
  booktitle = {Machine Learning: {ECML} 2000, 11th European Conference on Machine Learning, Barcelona, Catalonia, Spain, May 31 - June 2, 2000, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {1810},
  pages     = {369--381},
  publisher = {Springer},
  year      = {2000},
  url       = {https://doi.org/10.1007/3-540-45164-1\_38},
  doi       = {10.1007/3-540-45164-1\_38},
  timestamp = {Tue, 14 May 2019 10:00:54 +0200},
  biburl    = {https://dblp.org/rec/conf/ecml/StoneV00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICMAS 2000 (IEEE Computer Society).
@inproceedings{DBLP:conf/icmas/StoneRV00,
  author    = {Peter Stone and Patrick Riley and Manuela M. Veloso},
  title     = {Defining and Using Ideal Teammate and Opponent Agent Models: {A} Case Study in Robotic Soccer},
  booktitle = {4th International Conference on Multi-Agent Systems, {ICMAS} 2000, Boston, MA, USA, July 10-12, 2000},
  pages     = {441--442},
  publisher = {{IEEE} Computer Society},
  year      = {2000},
  url       = {https://doi.org/10.1109/ICMAS.2000.858515},
  doi       = {10.1109/ICMAS.2000.858515},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icmas/StoneRV00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ICML 2000; the record carries no url/doi field.
@inproceedings{DBLP:conf/icml/Stone00,
  author    = {Peter Stone},
  editor    = {Pat Langley},
  title     = {{TPOT-RL} Applied to Network Routing},
  booktitle = {Proceedings of the Seventeenth International Conference on Machine Learning {(ICML} 2000), Stanford University, Stanford, CA, USA, June 29 - July 2, 2000},
  pages     = {935--942},
  publisher = {Morgan Kaufmann},
  year      = {2000},
  timestamp = {Sun, 21 Feb 2010 20:54:50 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/Stone00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, ISER 2000 (Lecture Notes in Control and Information Sciences 271).
% RoboCup is braced in the title so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/iser/AsadaBPFNTDSVBKT00,
  author    = {Minoru Asada and Andreas Birk and Enrico Pagello and Masahiro Fujita and Itsuki Noda and Satoshi Tadokoro and Dominique Duhaut and Peter Stone and Manuela M. Veloso and Tucker R. Balch and Hiroaki Kitano and Brian Thomas},
  editor    = {Daniela Rus and Sanjiv Singh},
  title     = {Progress in {RoboCup} Soccer Research in 2000},
  booktitle = {Experimental Robotics {VII} {[ISER} 2000, Waikiki, Hawaii, USA, December 11-13, 2000]},
  series    = {Lecture Notes in Control and Information Sciences},
  volume    = {271},
  pages     = {363--372},
  publisher = {Springer},
  year      = {2000},
  url       = {https://doi.org/10.1007/3-540-45118-8\_37},
  doi       = {10.1007/3-540-45118-8\_37},
  timestamp = {Fri, 02 Jun 2017 12:01:41 +0200},
  biburl    = {https://dblp.org/rec/conf/iser/AsadaBPFNTDSVBKT00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Paper in the RoboCup 2000 volume (LNCS 2019).
% RoboCup-2000 is braced in the title so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/StoneABFKLSTW00,
  author    = {Peter Stone and Minoru Asada and Tucker R. Balch and Masahiro Fujita and Gerhard K. Kraetzschmar and Henrik Hautop Lund and Paul Scerri and Satoshi Tadokoro and Gordon F. Wyeth},
  editor    = {Peter Stone and Tucker R. Balch and Gerhard K. Kraetzschmar},
  title     = {Overview of {RoboCup-2000}},
  booktitle = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2019},
  pages     = {1--28},
  publisher = {Springer},
  year      = {2000},
  url       = {https://doi.org/10.1007/3-540-45324-5\_1},
  doi       = {10.1007/3-540-45324-5\_1},
  timestamp = {Mon, 23 Nov 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneABFKLSTW00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Paper in the RoboCup 2000 volume (LNCS 2019).
@inproceedings{DBLP:conf/robocup/StoneSS00,
  author    = {Peter Stone and Richard S. Sutton and Satinder Singh},
  editor    = {Peter Stone and Tucker R. Balch and Gerhard K. Kraetzschmar},
  title     = {Reinforcement Learning for 3 vs. 2 Keepaway},
  booktitle = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2019},
  pages     = {249--258},
  publisher = {Springer},
  year      = {2000},
  url       = {https://doi.org/10.1007/3-540-45324-5\_23},
  doi       = {10.1007/3-540-45324-5\_23},
  timestamp = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneSS00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Paper in the RoboCup 2000 volume (LNCS 2019).
% CMUnited-99 is braced in the title so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/McAllesterS00,
  author    = {David A. McAllester and Peter Stone},
  editor    = {Peter Stone and Tucker R. Balch and Gerhard K. Kraetzschmar},
  title     = {Keeping the Ball from {CMUnited-99}},
  booktitle = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2019},
  pages     = {333--338},
  publisher = {Springer},
  year      = {2000},
  url       = {https://doi.org/10.1007/3-540-45324-5\_35},
  doi       = {10.1007/3-540-45324-5\_35},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/McAllesterS00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Paper in the RoboCup 2000 volume (LNCS 2019).
% ATT-CMUnited-2000 and RoboCup-2000 are braced so sentence-casing styles keep their capitalization.
@inproceedings{DBLP:conf/robocup/RileySMV00,
  author    = {Patrick Riley and Peter Stone and David A. McAllester and Manuela M. Veloso},
  editor    = {Peter Stone and Tucker R. Balch and Gerhard K. Kraetzschmar},
  title     = {{ATT-CMUnited-2000}: Third Place Finisher in the {RoboCup-2000} Simulator League},
  booktitle = {RoboCup 2000: Robot Soccer World Cup {IV}},
  series    = {Lecture Notes in Computer Science},
  volume    = {2019},
  pages     = {489--492},
  publisher = {Springer},
  year      = {2000},
  url       = {https://doi.org/10.1007/3-540-45324-5\_68},
  doi       = {10.1007/3-540-45324-5\_68},
  timestamp = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/robocup/RileySMV00.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Artif. Intell. 110(2), 1999.
@article{DBLP:journals/ai/StoneV99,
  author    = {Peter Stone and Manuela M. Veloso},
  title     = {Task Decomposition, Dynamic Role Assignment, and Low-Bandwidth Communication for Real-Time Strategic Teamwork},
  journal   = {Artif. Intell.},
  volume    = {110},
  number    = {2},
  pages     = {241--273},
  year      = {1999},
  url       = {https://doi.org/10.1016/S0004-3702(99)00025-9},
  doi       = {10.1016/S0004-3702(99)00025-9},
  timestamp = {Sat, 27 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ai/StoneV99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Robotics Auton. Syst. 29(2-3), 1999.
% CMUnited-97 is braced in the title so sentence-casing styles do not lowercase it.
@article{DBLP:journals/ras/VelosoSH99,
  author    = {Manuela M. Veloso and Peter Stone and Kwun Han},
  title     = {The {CMUnited-97} robotic soccer team: Perception and multi-agent control},
  journal   = {Robotics Auton. Syst.},
  volume    = {29},
  number    = {2-3},
  pages     = {133--143},
  year      = {1999},
  url       = {https://doi.org/10.1016/S0921-8890(99)00048-2},
  doi       = {10.1016/S0921-8890(99)00048-2},
  timestamp = {Mon, 24 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ras/VelosoSH99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI/IAAI 1999 proceedings.
% CMUnited-98 is braced so sentence-casing styles do not render it as "Cmunited-98".
@inproceedings{DBLP:conf/aaai/VelosoBAHS99,
  author    = {Manuela M. Veloso and Michael H. Bowling and Sorin Achim and Kwun Han and Peter Stone},
  editor    = {Jim Hendler and Devika Subramanian},
  title     = {{CMUnited-98}: {A} Team of Robotic Soccer Agents},
  booktitle = {Proceedings of the Sixteenth National Conference on Artificial Intelligence and Eleventh Conference on Innovative Applications of Artificial Intelligence, July 18-22, 1999, Orlando, Florida, {USA}},
  pages     = {891--896},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {1999},
  url       = {http://www.aaai.org/Library/IAAI/1999/iaai99-126.php},
  timestamp = {Tue, 05 Sep 2023 09:10:47 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/VelosoBAHS99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AGENTS 1999 (ACM).
@inproceedings{DBLP:conf/agents/StoneV99,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {Oren Etzioni and J{\"{o}}rg P. M{\"{u}}ller and Jeffrey M. Bradshaw},
  title     = {Team-Partitioned, Opaque-Transition Reinforcement Learning},
  booktitle = {Proceedings of the Third Annual Conference on Autonomous Agents, {AGENTS} 1999, Seattle, WA, USA, May 1-5, 1999},
  pages     = {206--212},
  publisher = {{ACM}},
  year      = {1999},
  url       = {https://doi.org/10.1145/301136.301195},
  doi       = {10.1145/301136.301195},
  timestamp = {Tue, 06 Nov 2018 11:07:01 +0100},
  biburl    = {https://dblp.org/rec/conf/agents/StoneV99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Paper in the RoboCup-99 volume (LNCS 1856).
% RoboCup-99 is braced in the title so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/VelosoKPKSBACKF99,
  author    = {Manuela M. Veloso and Hiroaki Kitano and Enrico Pagello and Gerhard K. Kraetzschmar and Peter Stone and Tucker R. Balch and Minoru Asada and Silvia Coradeschi and Lars Karlsson and Masahiro Fujita},
  editor    = {Manuela M. Veloso and Enrico Pagello and Hiroaki Kitano},
  title     = {Overview of {RoboCup-99}},
  booktitle = {RoboCup-99: Robot Soccer World Cup {III}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1856},
  pages     = {1--34},
  publisher = {Springer},
  year      = {1999},
  url       = {https://doi.org/10.1007/3-540-45327-X\_1},
  doi       = {10.1007/3-540-45327-X\_1},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/VelosoKPKSBACKF99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Paper in the RoboCup-99 volume (LNCS 1856).
% CMUnited-99 is braced in the title so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/StoneRV99,
  author    = {Peter Stone and Patrick Riley and Manuela M. Veloso},
  editor    = {Manuela M. Veloso and Enrico Pagello and Hiroaki Kitano},
  title     = {The {CMUnited-99} Champion Simulator Team},
  booktitle = {RoboCup-99: Robot Soccer World Cup {III}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1856},
  pages     = {35--48},
  publisher = {Springer},
  year      = {1999},
  url       = {https://doi.org/10.1007/3-540-45327-X\_2},
  doi       = {10.1007/3-540-45327-X\_2},
  timestamp = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneRV99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Paper in the RoboCup-99 volume (LNCS 1856).
% RoboCup is braced in the title so sentence-casing styles keep its capitalization.
@inproceedings{DBLP:conf/robocup/StoneV99,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {Manuela M. Veloso and Enrico Pagello and Hiroaki Kitano},
  title     = {Layered Learning and Flexible Teamwork in {RoboCup} Simulation Agents},
  booktitle = {RoboCup-99: Robot Soccer World Cup {III}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1856},
  pages     = {495--508},
  publisher = {Springer},
  year      = {1999},
  url       = {https://doi.org/10.1007/3-540-45327-X\_42},
  doi       = {10.1007/3-540-45327-X\_42},
  timestamp = {Wed, 24 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneV99.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Appl. Artif. Intell. 12(2-3), 1998.
% "Robocup" is braced (spelling kept as recorded) so sentence-casing styles do not lowercase it.
@article{DBLP:journals/aai/StoneV98,
  author    = {Peter Stone and Manuela M. Veloso},
  title     = {Layered Approach to Learning Client Behaviors in the {Robocup} Soccer Server},
  journal   = {Appl. Artif. Intell.},
  volume    = {12},
  number    = {2-3},
  pages     = {165--188},
  year      = {1998},
  url       = {https://doi.org/10.1080/088395198117811},
  doi       = {10.1080/088395198117811},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aai/StoneV98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Appl. Artif. Intell. 12(2-3), 1998.
% "Robocup" is braced (spelling kept as recorded) so sentence-casing styles do not lowercase it.
@article{DBLP:journals/aai/AsadaSKWKDDVAS98,
  author    = {Minoru Asada and Peter Stone and Hiroaki Kitano and Barry Brian Werger and Yasuo Kuniyoshi and Alexis Drogoul and Dominique Duhaut and Manuela M. Veloso and Hajime Asama and Sho'ji Suzuki},
  title     = {The {Robocup} Physical Agent Challenge: Phase {I}},
  journal   = {Appl. Artif. Intell.},
  volume    = {12},
  number    = {2-3},
  pages     = {251--263},
  year      = {1998},
  url       = {https://doi.org/10.1080/088395198117857},
  doi       = {10.1080/088395198117857},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aai/AsadaSKWKDDVAS98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, AI Mag. 19(3), 1998.
@article{DBLP:journals/aim/VelosoSH98,
  author    = {Manuela M. Veloso and Peter Stone and Kwun Han},
  title     = {{CMUNITED-97:} RoboCup-97 Small-Robot World Champion Team},
  journal   = {{AI} Mag.},
  volume    = {19},
  number    = {3},
  pages     = {61--69},
  year      = {1998},
  url       = {https://doi.org/10.1609/aimag.v19i3.1394},
  doi       = {10.1609/AIMAG.V19I3.1394},
  timestamp = {Tue, 25 Aug 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/aim/VelosoSH98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Adv. Robotics 13(8); year recorded as 1998.
% CMUnited-98 is braced in the title so sentence-casing styles do not lowercase it.
@article{DBLP:journals/ar/VelosoBS98,
  author    = {Manuela M. Veloso and Michael H. Bowling and Peter Stone},
  title     = {The {CMUnited-98} champion small-robot team},
  journal   = {Adv. Robotics},
  volume    = {13},
  number    = {8},
  pages     = {753--766},
  year      = {1998},
  url       = {https://doi.org/10.1163/156855300X00089},
  doi       = {10.1163/156855300X00089},
  timestamp = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ar/VelosoBS98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, XRDS 4(3), 1998.
% CMUnited is braced so sentence-casing styles do not render it as "Cmunited".
@article{DBLP:journals/crossroads/VelosoSHA98,
  author    = {Manuela Veloso and Peter Stone and Kwun Han and Sorin Achim},
  title     = {{CMUnited}: a team of robotics soccer agents collaborating in an adversarial environment},
  journal   = {{XRDS}},
  volume    = {4},
  number    = {3},
  pages     = {11--17},
  year      = {1998},
  url       = {https://doi.org/10.1145/332084.332089},
  doi       = {10.1145/332084.332089},
  timestamp = {Wed, 04 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/crossroads/VelosoSHA98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Int. J. Hum. Comput. Stud. 48(1), 1998.
@article{DBLP:journals/ijmms/StoneV98,
  author    = {Peter Stone and Manuela M. Veloso},
  title     = {Towards collaborative and adversarial learning: a case study in robotic soccer},
  journal   = {Int. J. Hum. Comput. Stud.},
  volume    = {48},
  number    = {1},
  pages     = {83--104},
  year      = {1998},
  url       = {https://doi.org/10.1006/ijhc.1997.0162},
  doi       = {10.1006/IJHC.1997.0162},
  timestamp = {Fri, 21 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ijmms/StoneV98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AGENTS 1998 (ACM).
% Spelling corrected: "Socccer" to "Soccer" in the title, "Minnepolis" to "Minneapolis" in the booktitle.
% CMUnited-97 is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/agents/VelosoSH98,
  author    = {Manuela M. Veloso and Peter Stone and Kwun Han},
  editor    = {Katia P. Sycara and Michael J. Wooldridge},
  title     = {The {CMUnited-97} Robotic Soccer Team: Perception and Multiagent Control},
  booktitle = {Proceedings of the Second International Conference on Autonomous Agents, {AGENTS} 1998, St. Paul, Minneapolis, USA, May 9-13, 1998},
  pages     = {78--85},
  publisher = {{ACM}},
  year      = {1998},
  url       = {https://doi.org/10.1145/280765.280778},
  doi       = {10.1145/280765.280778},
  timestamp = {Fri, 26 Apr 2019 14:26:42 +0200},
  biburl    = {https://dblp.org/rec/conf/agents/VelosoSH98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AGENTS 1998 (ACM).
% Spelling corrected in the booktitle: "Minnepolis" to "Minneapolis".
@inproceedings{DBLP:conf/agents/StoneV98,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {Katia P. Sycara and Michael J. Wooldridge},
  title     = {Using Decision Tree Confidence Factors for Multi-Agent Control},
  booktitle = {Proceedings of the Second International Conference on Autonomous Agents, {AGENTS} 1998, St. Paul, Minneapolis, USA, May 9-13, 1998},
  pages     = {86--91},
  publisher = {{ACM}},
  year      = {1998},
  url       = {https://doi.org/10.1145/280765.280780},
  doi       = {10.1145/280765.280780},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/agents/StoneV98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, ATAL '98 (LNCS 1555).
@inproceedings{DBLP:conf/atal/StoneV98,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {J{\"{o}}rg P. M{\"{u}}ller and Munindar P. Singh and Anand S. Rao},
  title     = {Task Decomposition and Dynamic Role Assignment for Real-Time Strategic Teamwork},
  booktitle = {Intelligent Agents V, Agent Theories, Architectures, and Languages, 5th International Workshop, {ATAL} '98, Paris, France, July 4-7, 1998, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {1555},
  pages     = {293--308},
  publisher = {Springer},
  year      = {1998},
  url       = {https://doi.org/10.1007/3-540-49057-4\_19},
  doi       = {10.1007/3-540-49057-4\_19},
  timestamp = {Tue, 29 Dec 2020 18:27:45 +0100},
  biburl    = {https://dblp.org/rec/conf/atal/StoneV98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper, CRW'98 (LNCS 1456).
@inproceedings{DBLP:conf/crw/StoneV98,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {Alexis Drogoul and Milind Tambe and Toshio Fukuda},
  title     = {Communication in Domains with Unreliable, Single-Channel, Low-Bandwidth Communication},
  booktitle = {Collective Robotics, First International Workshop, CRW'98, Paris, France, July 4-5, 1998, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {1456},
  pages     = {85--97},
  publisher = {Springer},
  year      = {1998},
  url       = {https://doi.org/10.1007/BFb0033376},
  doi       = {10.1007/BFB0033376},
  timestamp = {Tue, 14 May 2019 10:00:55 +0200},
  biburl    = {https://dblp.org/rec/conf/crw/StoneV98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Veloso and Stone, ICMAS 1998 conference paper.
@inproceedings{DBLP:conf/icmas/VelosoS98,
  author    = {Manuela M. Veloso and Peter Stone},
  editor    = {Yves Demazeau},
  title     = {Individual and Collaborative Behaviors in a Team of Robotic Soccer Agents},
  booktitle = {Proceedings of the Third International Conference on Multiagent Systems, {ICMAS} 1998, Paris, France, July 3-7, 1998},
  pages     = {309--316},
  publisher = {{IEEE} Computer Society},
  year      = {1998},
  url       = {https://doi.org/10.1109/ICMAS.1998.699074},
  doi       = {10.1109/ICMAS.1998.699074},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icmas/VelosoS98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone, Veloso and Riley, chapter in the RoboCup-98 volume (LNCS 1604).
% The team name in the title is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/StoneVR98,
  author    = {Peter Stone and Manuela M. Veloso and Patrick Riley},
  editor    = {Minoru Asada and Hiroaki Kitano},
  title     = {The {CMUnited-98} Champion Simulator Team},
  booktitle = {RoboCup-98: Robot Soccer World Cup {II}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1604},
  pages     = {61--76},
  publisher = {Springer},
  year      = {1998},
  url       = {https://doi.org/10.1007/3-540-48422-1\_5},
  doi       = {10.1007/3-540-48422-1\_5},
  timestamp = {Thu, 21 Nov 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneVR98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Veloso, Bowling, Achim, Han and Stone, chapter in the RoboCup-98 volume (LNCS 1604).
% The team name in the title is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/VelosoBAHS98,
  author    = {Manuela M. Veloso and Michael H. Bowling and Sorin Achim and Kwun Han and Peter Stone},
  editor    = {Minoru Asada and Hiroaki Kitano},
  title     = {The {CMUnited-98} Small-Robot Team},
  booktitle = {RoboCup-98: Robot Soccer World Cup {II}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1604},
  pages     = {77--92},
  publisher = {Springer},
  year      = {1998},
  url       = {https://doi.org/10.1007/3-540-48422-1\_6},
  doi       = {10.1007/3-540-48422-1\_6},
  timestamp = {Wed, 24 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/VelosoBAHS98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone and Veloso, chapter in the RoboCup-98 volume (LNCS 1604).
@inproceedings{DBLP:conf/robocup/StoneV98,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {Minoru Asada and Hiroaki Kitano},
  title     = {Team-Partitioned, Opaque-Transition Reinforced Learning},
  booktitle = {RoboCup-98: Robot Soccer World Cup {II}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1604},
  pages     = {261--272},
  publisher = {Springer},
  year      = {1998},
  url       = {https://doi.org/10.1007/3-540-48422-1\_21},
  doi       = {10.1007/3-540-48422-1\_21},
  timestamp = {Wed, 24 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneV98.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone, journal article in Comput. Law Secur. Rev. 13(1), 1997.
% The proper noun in the title is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/clsr/Stone97,
  author    = {Peter Stone},
  title     = {Lessons from {America}: Filtration of functionality from software copyright},
  journal   = {Comput. Law Secur. Rev.},
  volume    = {13},
  number    = {1},
  pages     = {15--21},
  year      = {1997},
  url       = {https://doi.org/10.1016/S0267-3649(97)81187-9},
  doi       = {10.1016/S0267-3649(97)81187-9},
  timestamp = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/clsr/Stone97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone, AAAI 97 proceedings entry (single page, 819); no DOI field, only a URL.
@inproceedings{DBLP:conf/aaai/Stone97,
  author    = {Peter Stone},
  editor    = {Benjamin Kuipers and Bonnie L. Webber},
  title     = {Layered Learning in Multiagent Systems},
  booktitle = {Proceedings of the Fourteenth National Conference on Artificial Intelligence and Ninth Innovative Applications of Artificial Intelligence Conference, {AAAI} 97, {IAAI} 97, July 27-31, 1997, Providence, Rhode Island, {USA}},
  pages     = {819},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {1997},
  url       = {http://www.aaai.org/Library/AAAI/1997/aaai97-150.php},
  timestamp = {Tue, 05 Sep 2023 08:53:09 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/Stone97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Veloso, Stone and Achim, AGENTS 1997 conference paper.
@inproceedings{DBLP:conf/agents/VelosoSA97,
  author    = {Manuela M. Veloso and Peter Stone and Sorin Achim},
  editor    = {W. Lewis Johnson},
  title     = {A Layered Approach for an Autonomous Robotic Soccer System},
  booktitle = {Proceedings of the First International Conference on Autonomous Agents, {AGENTS} 1997, Marina del Rey, California, USA, February 5-8, 1997},
  pages     = {530--531},
  publisher = {{ACM}},
  year      = {1997},
  url       = {https://doi.org/10.1145/267658.267818},
  doi       = {10.1145/267658.267818},
  timestamp = {Tue, 06 Nov 2018 11:07:02 +0100},
  biburl    = {https://dblp.org/rec/conf/agents/VelosoSA97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Kitano et al., IJCAI 97 conference paper; no DOI field, only a URL.
% The mixed-case name in the title is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/ijcai/KitanoTSVCOMNA97,
  author    = {Hiroaki Kitano and Milind Tambe and Peter Stone and Manuela M. Veloso and Silvia Coradeschi and Eiichi Osawa and Hitoshi Matsubara and Itsuki Noda and Minoru Asada},
  title     = {The {RoboCup} Synthetic Agent Challenge 97},
  booktitle = {Proceedings of the Fifteenth International Joint Conference on Artificial Intelligence, {IJCAI} 97, Nagoya, Japan, August 23-29, 1997, 2 Volumes},
  pages     = {24--30},
  publisher = {Morgan Kaufmann},
  year      = {1997},
  url       = {http://ijcai.org/Proceedings/97-1/Papers/004.pdf},
  timestamp = {Tue, 20 Aug 2019 16:17:27 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/KitanoTSVCOMNA97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Asada et al., chapter in the RoboCup-97 volume (LNCS 1395).
% The mixed-case name in the title is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/AsadaSKDDVAS97,
  author    = {Minoru Asada and Peter Stone and Hiroaki Kitano and Alexis Drogoul and Dominique Duhaut and Manuela M. Veloso and Hajime Asama and Sho'ji Suzuki},
  editor    = {Hiroaki Kitano},
  title     = {The {RoboCup} Physical Agent Challenge: Goals and Protocols for Phase 1},
  booktitle = {RoboCup-97: Robot Soccer World Cup {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1395},
  pages     = {42--61},
  publisher = {Springer},
  year      = {1997},
  url       = {https://doi.org/10.1007/3-540-64473-3\_48},
  doi       = {10.1007/3-540-64473-3\_48},
  timestamp = {Tue, 14 May 2019 10:00:53 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/AsadaSKDDVAS97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Kitano et al., chapter in the RoboCup-97 volume (LNCS 1395).
% The mixed-case name in the title is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/KitanoTSVCOMNA97,
  author    = {Hiroaki Kitano and Milind Tambe and Peter Stone and Manuela M. Veloso and Silvia Coradeschi and Eiichi Osawa and Hitoshi Matsubara and Itsuki Noda and Minoru Asada},
  editor    = {Hiroaki Kitano},
  title     = {The {RoboCup} Synthetic Agent Challenge 97},
  booktitle = {RoboCup-97: Robot Soccer World Cup {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1395},
  pages     = {62--73},
  publisher = {Springer},
  year      = {1997},
  url       = {https://doi.org/10.1007/3-540-64473-3\_49},
  doi       = {10.1007/3-540-64473-3\_49},
  timestamp = {Tue, 23 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/KitanoTSVCOMNA97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone and Veloso, chapter in the RoboCup-97 volume (LNCS 1395).
@inproceedings{DBLP:conf/robocup/StoneV97,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {Hiroaki Kitano},
  title     = {Using Decision Tree Confidence Factors for Multiagent Control},
  booktitle = {RoboCup-97: Robot Soccer World Cup {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1395},
  pages     = {99--111},
  publisher = {Springer},
  year      = {1997},
  url       = {https://doi.org/10.1007/3-540-64473-3\_52},
  doi       = {10.1007/3-540-64473-3\_52},
  timestamp = {Tue, 23 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneV97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Veloso, Stone, Han and Achim, chapter in the RoboCup-97 volume (LNCS 1395).
% The team name in the title is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/VelosoSHA97,
  author    = {Manuela M. Veloso and Peter Stone and Kwun Han and Sorin Achim},
  editor    = {Hiroaki Kitano},
  title     = {The {CMUnited-97} Small Robot Team},
  booktitle = {RoboCup-97: Robot Soccer World Cup {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1395},
  pages     = {242--256},
  publisher = {Springer},
  year      = {1997},
  url       = {https://doi.org/10.1007/3-540-64473-3\_64},
  doi       = {10.1007/3-540-64473-3\_64},
  timestamp = {Tue, 23 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/VelosoSHA97.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone and Veloso, chapter in the RoboCup-97 volume (LNCS 1395).
% The team name in the title is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/robocup/StoneV97a,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {Hiroaki Kitano},
  title     = {The {CMUnited-97} Simulator Team},
  booktitle = {RoboCup-97: Robot Soccer World Cup {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {1395},
  pages     = {389--397},
  publisher = {Springer},
  year      = {1997},
  url       = {https://doi.org/10.1007/3-540-64473-3\_75},
  doi       = {10.1007/3-540-64473-3\_75},
  timestamp = {Tue, 23 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/robocup/StoneV97a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Veloso and Stone, FLECS journal article (J. Artif. Intell. Res., volume 3, 1995).
@article{DBLP:journals/jair/VelosoS95,
  author    = {Manuela M. Veloso and Peter Stone},
  title     = {{FLECS:} Planning with a Flexible Commitment Strategy},
  journal   = {J. Artif. Intell. Res.},
  volume    = {3},
  pages     = {25--52},
  year      = {1995},
  url       = {https://doi.org/10.1613/jair.131},
  doi       = {10.1613/JAIR.131},
  timestamp = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jair/VelosoS95.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone and Veloso, NIPS 8 conference paper (1995); no DOI field, only a URL.
% The conference acronym in booktitle is braced so that styles which recase booktitle keep it upper-case.
@inproceedings{DBLP:conf/nips/StoneV95,
  author    = {Peter Stone and Manuela M. Veloso},
  editor    = {David S. Touretzky and Michael Mozer and Michael E. Hasselmo},
  title     = {Beating a Defender in Robotic Soccer: Memory-Based Learning of a Continuous Function},
  booktitle = {Advances in Neural Information Processing Systems 8, {NIPS}, Denver, CO, USA, November 27-30, 1995},
  pages     = {896--902},
  publisher = {{MIT} Press},
  year      = {1995},
  url       = {http://papers.nips.cc/paper/1089-beating-a-defender-in-robotic-soccer-memory-based-learning-of-a-continuous-function},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/StoneV95.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Veloso and Stone, CoRR/arXiv record of the FLECS paper (eprint cs/9506101).
@article{DBLP:journals/corr/abs-cs-9506101,
  author     = {Manuela M. Veloso and Peter Stone},
  title      = {{FLECS:} Planning with a Flexible Commitment Strategy},
  journal    = {CoRR},
  volume     = {abs/cs/9506101},
  year       = {1995},
  url        = {http://arxiv.org/abs/cs/9506101},
  eprinttype = {arXiv},
  eprint     = {cs/9506101},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-cs-9506101.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Stone, Veloso and Blythe, 1994 AI planning systems conference paper; no DOI field, only a URL.
@inproceedings{DBLP:conf/aips/StoneVB94,
  author    = {Peter Stone and Manuela M. Veloso and Jim Blythe},
  editor    = {Kristian J. Hammond},
  title     = {The Need for Different Domain-independent Heuristics},
  booktitle = {Proceedings of the Second International Conference on Artificial Intelligence Planning Systems, University of Chicago, Chicago, Illinois, USA, June 13-15, 1994},
  pages     = {164--169},
  publisher = {{AAAI}},
  year      = {1994},
  url       = {http://www.aaai.org/Library/AIPS/1994/aips94-028.php},
  timestamp = {Fri, 05 Feb 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/aips/StoneVB94.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Stone, journal article in Comput. Networks ISDN Syst. 19(3-5), 1990.
% The country abbreviation in the title is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/cn/Stone90,
  author    = {Peter Stone},
  title     = {Developing Networked Services for Libraries: The {U. K.} Experience},
  journal   = {Comput. Networks {ISDN} Syst.},
  volume    = {19},
  number    = {3-5},
  pages     = {343--349},
  year      = {1990},
  url       = {https://doi.org/10.1016/0169-7552(90)90098-D},
  doi       = {10.1016/0169-7552(90)90098-D},
  timestamp = {Thu, 14 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/cn/Stone90.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt in for them to become active. All settings here will be stored as cookies with your web browser. For more information, see our F.A.Q.