% default search action
% BibTeX records: Jimmy Ba (exported from the dblp computer science bibliography, https://dblp.org)
% ICLR 2024 paper; an arXiv record with the same title and authors is DBLP:journals/corr/abs-2310-06786.
% The braces around OpenWebMath keep its internal capitals under sentence-casing bibliography styles.
@inproceedings{DBLP:conf/iclr/PasterSAB24,
  author     = {Keiran Paster and Marco Dos Santos and Zhangir Azerbayev and Jimmy Ba},
  title      = {{OpenWebMath}: An Open Dataset of High-Quality Mathematical Web Text},
  booktitle  = {The Twelfth International Conference on Learning Representations, {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=jKHmjlpViu},
  timestamp  = {Wed, 07 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/PasterSAB24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2024 paper; an arXiv record with the same title and authors is DBLP:journals/corr/abs-2309-15817.
% Both occurrences of the acronym LM are braced so sentence-casing styles do not lowercase either one.
@inproceedings{DBLP:conf/iclr/RuanDWPZBDMH24,
  author     = {Yangjun Ruan and Honghua Dong and Andrew Wang and Silviu Pitis and Yongchao Zhou and Jimmy Ba and Yann Dubois and Chris J. Maddison and Tatsunori Hashimoto},
  title      = {Identifying the Risks of {LM} Agents with an {LM}-Emulated Sandbox},
  booktitle  = {The Twelfth International Conference on Learning Representations, {ICLR} 2024, Vienna, Austria, May 7-11, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=GEcwtMk1uA},
  timestamp  = {Mon, 29 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/RuanDWPZBDMH24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2024 paper; the arXiv record DBLP:journals/corr/abs-2403-03218 carries a longer author list for this title.
@inproceedings{DBLP:conf/icml/LiPGYBGLDGMHLJL24,
  author     = {Nathaniel Li and Alexander Pan and Anjali Gopal and Summer Yue and Daniel Berrios and Alice Gatti and Justin D. Li and Ann{-}Kathrin Dombrowski and Shashwat Goel and Gabriel Mukobi and Nathan Helm{-}Burger and Rassin Lababidi and Lennart Justen and Andrew B. Liu and Michael Chen and Isabelle Barrass and Oliver Zhang and Xiaoyuan Zhu and Rishub Tamirisa and Bhrugu Bharathi and Ariel Herbert{-}Voss and Cort B. Breuer and Andy Zou and Mantas Mazeika and Zifan Wang and Palash Oswal and Weiran Lin and Adam A. Hunt and Justin Tienken{-}Harder and Kevin Y. Shih and Kemper Talley and John Guan and Ian Steneker and David Campbell and Brad Jokubaitis and Steven Basart and Stephen Fitz and Ponnurangam Kumaraguru and Kallol Krishna Karmakar and Uday Kiran Tupakula and Vijay Varadharajan and Yan Shoshitaishvili and Jimmy Ba and Kevin M. Esvelt and Alexandr Wang and Dan Hendrycks},
  title      = {The {WMDP} Benchmark: Measuring and Reducing Malicious Use with Unlearning},
  booktitle  = {Forty-first International Conference on Machine Learning, {ICML} 2024, Vienna, Austria, July 21-27, 2024},
  publisher  = {OpenReview.net},
  year       = {2024},
  url        = {https://openreview.net/forum?id=xlr6AUDuJz},
  timestamp  = {Mon, 02 Sep 2024 16:45:29 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LiPGYBGLDGMHLJL24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record of the WMDP paper; the ICML 2024 record is DBLP:conf/icml/LiPGYBGLDGMHLJL24.
% NOTE(review): the author after Palash Oswal is spelled "Weiran Lin" here to agree with the ICML record
% (this record previously read "Liu") -- confirm against the paper's author list.
@article{DBLP:journals/corr/abs-2403-03218,
  author     = {Nathaniel Li and Alexander Pan and Anjali Gopal and Summer Yue and Daniel Berrios and Alice Gatti and Justin D. Li and Ann{-}Kathrin Dombrowski and Shashwat Goel and Long Phan and Gabriel Mukobi and Nathan Helm{-}Burger and Rassin Lababidi and Lennart Justen and Andrew B. Liu and Michael Chen and Isabelle Barrass and Oliver Zhang and Xiaoyuan Zhu and Rishub Tamirisa and Bhrugu Bharathi and Adam Khoja and Zhenqi Zhao and Ariel Herbert{-}Voss and Cort B. Breuer and Andy Zou and Mantas Mazeika and Zifan Wang and Palash Oswal and Weiran Lin and Adam A. Hunt and Justin Tienken{-}Harder and Kevin Y. Shih and Kemper Talley and John Guan and Russell Kaplan and Ian Steneker and David Campbell and Brad Jokubaitis and Alex Levinson and Jean Wang and William Qian and Kallol Krishna Karmakar and Steven Basart and Stephen Fitz and Mindy Levine and Ponnurangam Kumaraguru and Uday Kiran Tupakula and Vijay Varadharajan and Yan Shoshitaishvili and Jimmy Ba and Kevin M. Esvelt and Alexandr Wang and Dan Hendrycks},
  title      = {The {WMDP} Benchmark: Measuring and Reducing Malicious Use With Unlearning},
  journal    = {CoRR},
  volume     = {abs/2403.03218},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.03218},
  doi        = {10.48550/ARXIV.2403.03218},
  eprinttype = {arXiv},
  eprint     = {2403.03218},
  timestamp  = {Tue, 20 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-03218.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the AIED 2023 record with the same title and authors is DBLP:conf/aied/JaipersaudZBPZZ23.
@article{DBLP:journals/corr/abs-2407-21170,
  author     = {Brandon Jaipersaud and Paul Zhang and Jimmy Ba and Andrew Petersen and Lisa Zhang and Michael R. Zhang},
  title      = {Decomposed Prompting to Answer Questions on a Course Discussion Board},
  journal    = {CoRR},
  volume     = {abs/2407.21170},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2407.21170},
  doi        = {10.48550/ARXIV.2407.21170},
  eprinttype = {arXiv},
  eprint     = {2407.21170},
  timestamp  = {Wed, 21 Aug 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2407-21170.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL 2023 paper; the arXiv record DBLP:journals/corr/abs-2305-03937 lists the same authors in a different order.
@inproceedings{DBLP:conf/acl/RazdaibiedinaMK23,
  author     = {Anastasia Razdaibiedina and Yuning Mao and Madian Khabsa and Mike Lewis and Rui Hou and Jimmy Ba and Amjad Almahairi},
  editor     = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title      = {Residual Prompt Tuning: improving prompt tuning with residual reparameterization},
  booktitle  = {Findings of the Association for Computational Linguistics: {ACL} 2023, Toronto, Canada, July 9-14, 2023},
  pages      = {6740--6757},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-acl.421},
  doi        = {10.18653/V1/2023.FINDINGS-ACL.421},
  timestamp  = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/RazdaibiedinaMK23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AIED 2023 paper (CCIS volume 1831); the arXiv record with the same title and authors is DBLP:journals/corr/abs-2407-21170.
@inproceedings{DBLP:conf/aied/JaipersaudZBPZZ23,
  author     = {Brandon Jaipersaud and Paul Zhang and Jimmy Ba and Andrew Petersen and Lisa Zhang and Michael R. Zhang},
  editor     = {Ning Wang and Genaro Rebolledo{-}Mendez and Vania Dimitrova and Noboru Matsuda and Olga C. Santos},
  title      = {Decomposed Prompting to Answer Questions on a Course Discussion Board},
  booktitle  = {Artificial Intelligence in Education. Posters and Late Breaking Results, Workshops and Tutorials, Industry and Innovation Tracks, Practitioners, Doctoral Consortium and Blue Sky - 24th International Conference, {AIED} 2023, Tokyo, Japan, July 3-7, 2023, Proceedings},
  series     = {Communications in Computer and Information Science},
  volume     = {1831},
  pages      = {218--223},
  publisher  = {Springer},
  year       = {2023},
  url        = {https://doi.org/10.1007/978-3-031-36336-8\_33},
  doi        = {10.1007/978-3-031-36336-8\_33},
  timestamp  = {Fri, 04 Aug 2023 15:27:47 +0200},
  biburl     = {https://dblp.org/rec/conf/aied/JaipersaudZBPZZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2023 paper; the arXiv record with the same title is DBLP:journals/corr/abs-2212-03905.
@inproceedings{DBLP:conf/iclr/BaeZRWHBG23,
  author     = {Juhan Bae and Michael R. Zhang and Michael Ruan and Eric Wang and So Hasegawa and Jimmy Ba and Roger Baker Grosse},
  title      = {Multi-Rate {VAE:} Train Once, Get the Full Rate-Distortion Curve},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/forum?id=OJ8aSjCaMNK},
  timestamp  = {Wed, 24 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/BaeZRWHBG23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2023 paper; the arXiv record with the same authors is DBLP:journals/corr/abs-2211-01910.
@inproceedings{DBLP:conf/iclr/ZhouMHPPCB23,
  author     = {Yongchao Zhou and Andrei Ioan Muresanu and Ziwen Han and Keiran Paster and Silviu Pitis and Harris Chan and Jimmy Ba},
  title      = {Large Language Models are Human-Level Prompt Engineers},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/forum?id=92gvk82DE-},
  timestamp  = {Wed, 24 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ZhouMHPPCB23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 paper (PMLR volume 202); the arXiv record with the same title and authors is DBLP:journals/corr/abs-2304-13742.
@inproceedings{DBLP:conf/icml/LiuVGBL23,
  author     = {Zhaoyan Liu and No{\"{e}}l Vouitsis and Satya Krishna Gorti and Jimmy Ba and Gabriel Loaiza{-}Ganem},
  editor     = {Andreas Krause and Emma Brunskill and Kyunghyun Cho and Barbara Engelhardt and Sivan Sabato and Jonathan Scarlett},
  title      = {{TR0N:} Translator Networks for 0-Shot Plug-and-Play Conditional Generation},
  booktitle  = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {22092--22112},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/liu23ak.html},
  timestamp  = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LiuVGBL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ITiCSE 2023 (volume 2) single-page paper.
% The acronym LLMs is braced so sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/iticse/ZhangJB0ZZ23,
  author     = {Paul Zhang and Brandon Jaipersaud and Jimmy Ba and Andrew Petersen and Lisa Zhang and Michael R. Zhang},
  editor     = {Mikko{-}Jussi Laakso and Mattia Monga and Simon and Judithe Sheard},
  title      = {Classifying Course Discussion Board Questions using {LLMs}},
  booktitle  = {Proceedings of the 2023 Conference on Innovation and Technology in Computer Science Education V. 2, ITiCSE 2023, Turku, Finland, July 7-12, 2023},
  pages      = {658},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3587103.3594202},
  doi        = {10.1145/3587103.3594202},
  timestamp  = {Fri, 07 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iticse/ZhangJB0ZZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 paper.
@inproceedings{DBLP:conf/nips/BaESWW23,
  author     = {Jimmy Ba and Murat A. Erdogdu and Taiji Suzuki and Zhichao Wang and Denny Wu},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {Learning in the Presence of Low-dimensional Structure: {A} Spiked Random Matrix Perspective},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/38a1671ab0747b6ffe4d1c6ef117a3a9-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/BaESWW23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 paper; the arXiv record with the same title is DBLP:journals/corr/abs-2305-14387.
% The braces around AlpacaFarm keep its internal capitals under sentence-casing bibliography styles.
@inproceedings{DBLP:conf/nips/DuboisLTZGBGLH23,
  author     = {Yann Dubois and Chen Xuechen Li and Rohan Taori and Tianyi Zhang and Ishaan Gulrajani and Jimmy Ba and Carlos Guestrin and Percy Liang and Tatsunori B. Hashimoto},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {{AlpacaFarm}: {A} Simulation Framework for Methods that Learn from Human Feedback},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/5fc47800ee5b30b8777fdd30abcaaf3b-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/DuboisLTZGBGLH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2023 paper; the arXiv record with the same title and authors is DBLP:journals/corr/abs-2306-00937.
% Minecraft is braced so sentence-casing bibliography styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/nips/LifshitzPCBM23,
  author     = {Shalev Lifshitz and Keiran Paster and Harris Chan and Jimmy Ba and Sheila A. McIlraith},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {{STEVE-1:} {A} Generative Model for Text-to-Behavior in {Minecraft}},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/dd03f856fc7f2efeec8b1c796284561d-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LifshitzPCBM23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record (CoRR abs/2301.04104).
@article{DBLP:journals/corr/abs-2301-04104,
  author     = {Danijar Hafner and Jurgis Pasukonis and Jimmy Ba and Timothy P. Lillicrap},
  title      = {Mastering Diverse Domains through World Models},
  journal    = {CoRR},
  volume     = {abs/2301.04104},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.04104},
  doi        = {10.48550/ARXIV.2301.04104},
  eprinttype = {arXiv},
  eprint     = {2301.04104},
  timestamp  = {Thu, 19 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-04104.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record (CoRR abs/2304.05970).
@article{DBLP:journals/corr/abs-2304-05970,
  author     = {Silviu Pitis and Michael R. Zhang and Andrew Wang and Jimmy Ba},
  title      = {Boosted Prompt Ensembles for Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2304.05970},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.05970},
  doi        = {10.48550/ARXIV.2304.05970},
  eprinttype = {arXiv},
  eprint     = {2304.05970},
  timestamp  = {Wed, 19 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-05970.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the ICML 2023 record with the same title and authors is DBLP:conf/icml/LiuVGBL23.
@article{DBLP:journals/corr/abs-2304-13742,
  author     = {Zhaoyan Liu and No{\"{e}}l Vouitsis and Satya Krishna Gorti and Jimmy Ba and Gabriel Loaiza{-}Ganem},
  title      = {{TR0N:} Translator Networks for 0-Shot Plug-and-Play Conditional Generation},
  journal    = {CoRR},
  volume     = {abs/2304.13742},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2304.13742},
  doi        = {10.48550/ARXIV.2304.13742},
  eprinttype = {arXiv},
  eprint     = {2304.13742},
  timestamp  = {Wed, 03 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2304-13742.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the Findings of ACL 2023 record DBLP:conf/acl/RazdaibiedinaMK23 lists the same authors in a different order.
@article{DBLP:journals/corr/abs-2305-03937,
  author     = {Anastasia Razdaibiedina and Yuning Mao and Rui Hou and Madian Khabsa and Mike Lewis and Jimmy Ba and Amjad Almahairi},
  title      = {Residual Prompt Tuning: Improving Prompt Tuning with Residual Reparameterization},
  journal    = {CoRR},
  volume     = {abs/2305.03937},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.03937},
  doi        = {10.48550/ARXIV.2305.03937},
  eprinttype = {arXiv},
  eprint     = {2305.03937},
  timestamp  = {Thu, 11 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-03937.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record (CoRR abs/2305.12031).
% The model name Clinical Camel is braced so sentence-casing bibliography styles do not lowercase "Camel".
@article{DBLP:journals/corr/abs-2305-12031,
  author     = {Augustin Toma and Patrick R. Lawler and Jimmy Ba and Rahul G. Krishnan and Barry B. Rubin and Bo Wang},
  title      = {{Clinical Camel}: An Open-Source Expert-Level Medical Language Model with Dialogue-Based Knowledge Encoding},
  journal    = {CoRR},
  volume     = {abs/2305.12031},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.12031},
  doi        = {10.48550/ARXIV.2305.12031},
  eprinttype = {arXiv},
  eprint     = {2305.12031},
  timestamp  = {Fri, 26 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-12031.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the NeurIPS 2023 record with the same title is DBLP:conf/nips/DuboisLTZGBGLH23.
% The braces around AlpacaFarm keep its internal capitals under sentence-casing bibliography styles.
@article{DBLP:journals/corr/abs-2305-14387,
  author     = {Yann Dubois and Xuechen Li and Rohan Taori and Tianyi Zhang and Ishaan Gulrajani and Jimmy Ba and Carlos Guestrin and Percy Liang and Tatsunori B. Hashimoto},
  title      = {{AlpacaFarm}: {A} Simulation Framework for Methods that Learn from Human Feedback},
  journal    = {CoRR},
  volume     = {abs/2305.14387},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.14387},
  doi        = {10.48550/ARXIV.2305.14387},
  eprinttype = {arXiv},
  eprint     = {2305.14387},
  timestamp  = {Tue, 06 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-14387.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record (CoRR abs/2305.15316).
@article{DBLP:journals/corr/abs-2305-15316,
  author     = {Yongchao Zhou and Hshmat Sahak and Jimmy Ba},
  title      = {Training on Thin Air: Improve Image Classification with Generated Data},
  journal    = {CoRR},
  volume     = {abs/2305.15316},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.15316},
  doi        = {10.48550/ARXIV.2305.15316},
  eprinttype = {arXiv},
  eprint     = {2305.15316},
  timestamp  = {Tue, 06 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-15316.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the NeurIPS 2023 record with the same title and authors is DBLP:conf/nips/LifshitzPCBM23.
% Minecraft is braced so sentence-casing bibliography styles keep the proper noun capitalised.
@article{DBLP:journals/corr/abs-2306-00937,
  author     = {Shalev Lifshitz and Keiran Paster and Harris Chan and Jimmy Ba and Sheila A. McIlraith},
  title      = {{STEVE-1:} {A} Generative Model for Text-to-Behavior in {Minecraft}},
  journal    = {CoRR},
  volume     = {abs/2306.00937},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.00937},
  doi        = {10.48550/ARXIV.2306.00937},
  eprinttype = {arXiv},
  eprint     = {2306.00937},
  timestamp  = {Mon, 12 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-00937.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the ICLR 2024 record with the same title and authors is DBLP:conf/iclr/RuanDWPZBDMH24.
% Both occurrences of the acronym LM are braced so sentence-casing styles do not lowercase either one.
@article{DBLP:journals/corr/abs-2309-15817,
  author     = {Yangjun Ruan and Honghua Dong and Andrew Wang and Silviu Pitis and Yongchao Zhou and Jimmy Ba and Yann Dubois and Chris J. Maddison and Tatsunori Hashimoto},
  title      = {Identifying the Risks of {LM} Agents with an {LM}-Emulated Sandbox},
  journal    = {CoRR},
  volume     = {abs/2309.15817},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.15817},
  doi        = {10.48550/ARXIV.2309.15817},
  eprinttype = {arXiv},
  eprint     = {2309.15817},
  timestamp  = {Tue, 17 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-15817.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the ICLR 2024 record with the same title and authors is DBLP:conf/iclr/PasterSAB24.
% The braces around OpenWebMath keep its internal capitals under sentence-casing bibliography styles.
@article{DBLP:journals/corr/abs-2310-06786,
  author     = {Keiran Paster and Marco Dos Santos and Zhangir Azerbayev and Jimmy Ba},
  title      = {{OpenWebMath}: An Open Dataset of High-Quality Mathematical Web Text},
  journal    = {CoRR},
  volume     = {abs/2310.06786},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.06786},
  doi        = {10.48550/ARXIV.2310.06786},
  eprinttype = {arXiv},
  eprint     = {2310.06786},
  timestamp  = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-06786.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record (CoRR abs/2312.04528).
@article{DBLP:journals/corr/abs-2312-04528,
  author     = {Michael R. Zhang and Nishkrit Desai and Juhan Bae and Jonathan Lorraine and Jimmy Ba},
  title      = {Using Large Language Models for Hyperparameter Optimization},
  journal    = {CoRR},
  volume     = {abs/2312.04528},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2312.04528},
  doi        = {10.48550/ARXIV.2312.04528},
  eprinttype = {arXiv},
  eprint     = {2312.04528},
  timestamp  = {Tue, 02 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2312-04528.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2022 paper.
@inproceedings{DBLP:conf/iclr/BaEGSSWZ22,
  author     = {Jimmy Ba and Murat A. Erdogdu and Marzyeh Ghassemi and Shengyang Sun and Taiji Suzuki and Denny Wu and Tianzong Zhang},
  title      = {Understanding the Variance Collapse of {SVGD} in High Dimensions},
  booktitle  = {The Tenth International Conference on Learning Representations, {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher  = {OpenReview.net},
  year       = {2022},
  url        = {https://openreview.net/forum?id=Qycd9j5Qp9J},
  timestamp  = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/BaEGSSWZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper; the arXiv record with the same title and authors is DBLP:journals/corr/abs-2205-01445.
@inproceedings{DBLP:conf/nips/BaESWWY22,
  author     = {Jimmy Ba and Murat A. Erdogdu and Taiji Suzuki and Zhichao Wang and Denny Wu and Greg Yang},
  editor     = {Sanmi Koyejo and S. Mohamed and A. Agarwal and Danielle Belgrave and K. Cho and A. Oh},
  title      = {High-dimensional Asymptotics of Feature Learning: How One Gradient Step Improves the Representation},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/f7e7fabd73b3df96c54a320862afcb78-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/BaESWWY22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper; the arXiv record DBLP:journals/corr/abs-2205-15967 has the same authors and a shorter title.
% The method names Decision Transformers and RvS are braced so sentence-casing styles do not lowercase them.
@inproceedings{DBLP:conf/nips/PasterMB22,
  author     = {Keiran Paster and Sheila A. McIlraith and Jimmy Ba},
  editor     = {Sanmi Koyejo and S. Mohamed and A. Agarwal and Danielle Belgrave and K. Cho and A. Oh},
  title      = {You Can't Count on Luck: Why {Decision Transformers} and {RvS} Fail in Stochastic Environments},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/fe90657b12193c7b52a3418bdc351807-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/PasterMB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 paper; the arXiv record with the same title and authors is DBLP:journals/corr/abs-2206-00719.
@inproceedings{DBLP:conf/nips/ZhouNB22,
  author     = {Yongchao Zhou and Ehsan Nezhadarya and Jimmy Ba},
  editor     = {Sanmi Koyejo and S. Mohamed and A. Agarwal and Danielle Belgrave and K. Cho and A. Oh},
  title      = {Dataset Distillation using Neural Feature Regression},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/3fe2a777282299ecb4f9e7ebb531f0ab-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/ZhouNB22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the NeurIPS 2022 record with the same title and authors is DBLP:conf/nips/BaESWWY22.
@article{DBLP:journals/corr/abs-2205-01445,
  author     = {Jimmy Ba and Murat A. Erdogdu and Taiji Suzuki and Zhichao Wang and Denny Wu and Greg Yang},
  title      = {High-dimensional Asymptotics of Feature Learning: How One Gradient Step Improves the Representation},
  journal    = {CoRR},
  volume     = {abs/2205.01445},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.01445},
  doi        = {10.48550/ARXIV.2205.01445},
  eprinttype = {arXiv},
  eprint     = {2205.01445},
  timestamp  = {Thu, 05 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-01445.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the NeurIPS 2022 record DBLP:conf/nips/PasterMB22 has the same authors and a longer title.
% The method name Decision Transformers is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2205-15967,
  author     = {Keiran Paster and Sheila A. McIlraith and Jimmy Ba},
  title      = {You Can't Count on Luck: Why {Decision Transformers} Fail in Stochastic Environments},
  journal    = {CoRR},
  volume     = {abs/2205.15967},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.15967},
  doi        = {10.48550/ARXIV.2205.15967},
  eprinttype = {arXiv},
  eprint     = {2205.15967},
  timestamp  = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-15967.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the NeurIPS 2022 record with the same title and authors is DBLP:conf/nips/ZhouNB22.
@article{DBLP:journals/corr/abs-2206-00719,
  author     = {Yongchao Zhou and Ehsan Nezhadarya and Jimmy Ba},
  title      = {Dataset Distillation using Neural Feature Regression},
  journal    = {CoRR},
  volume     = {abs/2206.00719},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.00719},
  doi        = {10.48550/ARXIV.2206.00719},
  eprinttype = {arXiv},
  eprint     = {2206.00719},
  timestamp  = {Mon, 13 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-00719.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record (CoRR abs/2209.13569).
@article{DBLP:journals/corr/abs-2209-13569,
  author     = {Siddhartha Rao Kamalakara and Acyr Locatelli and Bharat Venkitesh and Jimmy Ba and Yarin Gal and Aidan N. Gomez},
  title      = {Exploring Low Rank Training of Deep Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2209.13569},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.13569},
  doi        = {10.48550/ARXIV.2209.13569},
  eprinttype = {arXiv},
  eprint     = {2209.13569},
  timestamp  = {Thu, 06 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-13569.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the ICLR 2023 record with the same authors is DBLP:conf/iclr/ZhouMHPPCB23.
@article{DBLP:journals/corr/abs-2211-01910,
  author     = {Yongchao Zhou and Andrei Ioan Muresanu and Ziwen Han and Keiran Paster and Silviu Pitis and Harris Chan and Jimmy Ba},
  title      = {Large Language Models Are Human-Level Prompt Engineers},
  journal    = {CoRR},
  volume     = {abs/2211.01910},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.01910},
  doi        = {10.48550/ARXIV.2211.01910},
  eprinttype = {arXiv},
  eprint     = {2211.01910},
  timestamp  = {Fri, 04 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-01910.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the ICLR 2023 record with the same title is DBLP:conf/iclr/BaeZRWHBG23.
@article{DBLP:journals/corr/abs-2212-03905,
  author     = {Juhan Bae and Michael R. Zhang and Michael Ruan and Eric Wang and So Hasegawa and Jimmy Ba and Roger B. Grosse},
  title      = {Multi-Rate {VAE:} Train Once, Get the Full Rate-Distortion Curve},
  journal    = {CoRR},
  volume     = {abs/2212.03905},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.03905},
  doi        = {10.48550/ARXIV.2212.03905},
  eprinttype = {arXiv},
  eprint     = {2212.03905},
  timestamp  = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-03905.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper.
@inproceedings{DBLP:conf/iclr/AmariBGLNSWX21,
  author     = {Shun{-}ichi Amari and Jimmy Ba and Roger Baker Grosse and Xuechen Li and Atsushi Nitanda and Taiji Suzuki and Denny Wu and Ji Xu},
  title      = {When does preconditioning help or hurt generalization?},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=S724o4\_WB3},
  timestamp  = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/AmariBGLNSWX21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper.
% Atari is braced so sentence-casing bibliography styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/iclr/HafnerL0B21,
  author     = {Danijar Hafner and Timothy P. Lillicrap and Mohammad Norouzi and Jimmy Ba},
  title      = {Mastering {Atari} with Discrete World Models},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=0oabwyZbOu},
  timestamp  = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/HafnerL0B21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper.
@inproceedings{DBLP:conf/iclr/PasterMB21,
  author     = {Keiran Paster and Sheila A. McIlraith and Jimmy Ba},
  title      = {Planning from Pixels using Inverse Dynamics Models},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=V6BjBgku7Ro},
  timestamp  = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/PasterMB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper.
@inproceedings{DBLP:conf/iclr/WuJBG21,
  author     = {Yuhuai Wu and Albert Q. Jiang and Jimmy Ba and Roger Baker Grosse},
  title      = {{INT:} An Inequality Benchmark for Evaluating Generalization in Theorem Proving},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=O6LPudowNQm},
  timestamp  = {Mon, 30 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WuJBG21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper (PMLR volume 139).
@inproceedings{DBLP:conf/icml/JiaNWB21,
  author     = {Sheng Jia and Ehsan Nezhadarya and Yuhuai Wu and Jimmy Ba},
  editor     = {Marina Meila and Tong Zhang},
  title      = {Efficient Statistical Tests: {A} Neural Tangent Kernel Approach},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {4893--4903},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/jia21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/JiaNWB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper (PMLR volume 139); the arXiv record with the same title and authors is DBLP:journals/corr/abs-2101-06223.
@inproceedings{DBLP:conf/icml/WuRLBGS21,
  author     = {Yuhuai Wu and Markus N. Rabe and Wenda Li and Jimmy Ba and Roger B. Grosse and Christian Szegedy},
  editor     = {Marina Meila and Tong Zhang},
  title      = {{LIME:} Learning Inductive Bias for Primitives of Mathematical Reasoning},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {11251--11262},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/wu21c.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/WuRLBGS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper; the arXiv record with the same title and authors is DBLP:journals/corr/abs-2110-14248.
% The acronym MDPs is braced so sentence-casing bibliography styles do not lowercase it.
@inproceedings{DBLP:conf/nips/HanZCPZB21,
  author     = {Beining Han and Chongyi Zheng and Harris Chan and Keiran Paster and Michael R. Zhang and Jimmy Ba},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Learning Domain Invariant Representations in Goal-conditioned Block {MDPs}},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {764--776},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/06d172404821f7d01060cc9629171b2e-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/HanZCPZB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper.
@inproceedings{DBLP:conf/nips/LiZXDB21,
  author     = {Jingling Li and Mozhi Zhang and Keyulu Xu and John Dickerson and Jimmy Ba},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {How does a Neural Network's Architecture Impact its Robustness to Noisy Labels?},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {9788--9803},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/51311013e51adebc3c34d2cc591fefee-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/LiZXDB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper; the arXiv record with the same title and authors is DBLP:journals/corr/abs-2102-09532.
@inproceedings{DBLP:conf/nips/SaxenaBH21,
  author     = {Vaibhav Saxena and Jimmy Ba and Danijar Hafner},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Clockwork Variational Autoencoders},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {29246--29257},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/f490d0af974fedf90cb0f1edce8e3dd5-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/SaxenaBH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the ICML 2021 record with the same title and authors is DBLP:conf/icml/WuRLBGS21.
@article{DBLP:journals/corr/abs-2101-06223,
  author     = {Yuhuai Wu and Markus N. Rabe and Wenda Li and Jimmy Ba and Roger B. Grosse and Christian Szegedy},
  title      = {{LIME:} Learning Inductive Bias for Primitives of Mathematical Reasoning},
  journal    = {CoRR},
  volume     = {abs/2101.06223},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.06223},
  eprinttype = {arXiv},
  eprint     = {2101.06223},
  timestamp  = {Fri, 22 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-06223.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2102.09532); shares title and authors with DBLP:conf/nips/SaxenaBH21.
@article{DBLP:journals/corr/abs-2102-09532,
  author     = {Vaibhav Saxena and Jimmy Ba and Danijar Hafner},
  title      = {Clockwork Variational Autoencoders},
  journal    = {CoRR},
  volume     = {abs/2102.09532},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.09532},
  eprinttype = {arXiv},
  eprint     = {2102.09532},
  timestamp  = {Wed, 24 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-09532.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.14248), 2021.
% The acronym MDPs is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2110-14248,
  author     = {Beining Han and Chongyi Zheng and Harris Chan and Keiran Paster and Michael R. Zhang and Jimmy Ba},
  title      = {Learning Domain Invariant Representations in Goal-conditioned Block {MDPs}},
  journal    = {CoRR},
  volume     = {abs/2110.14248},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.14248},
  eprinttype = {arXiv},
  eprint     = {2110.14248},
  timestamp  = {Fri, 29 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-14248.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2020 conference paper, PMLR volume 108, pages 3621--3631.
@inproceedings{DBLP:conf/aistats/WenLGZCB20,
  author     = {Yeming Wen and Kevin Luk and Maxime Gazeau and Guodong Zhang and Harris Chan and Jimmy Ba},
  editor     = {Silvia Chiappa and Roberto Calandra},
  title      = {An Empirical Study of Stochastic Gradient Descent with Structured Covariance Noise},
  booktitle  = {The 23rd International Conference on Artificial Intelligence and Statistics, {AISTATS} 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]},
  series     = {Proceedings of Machine Learning Research},
  volume     = {108},
  pages      = {3621--3631},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v108/wen20a.html},
  timestamp  = {Mon, 29 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/WenLGZCB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper (OpenReview).
@inproceedings{DBLP:conf/iclr/BaESWZ20,
  author     = {Jimmy Ba and Murat A. Erdogdu and Taiji Suzuki and Denny Wu and Tianzong Zhang},
  title      = {Generalization of Two-layer Neural Networks: An Asymptotic Viewpoint},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=H1gBsgBYwH},
  timestamp  = {Thu, 07 May 2020 17:11:47 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/BaESWZ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-1912-01603.
@inproceedings{DBLP:conf/iclr/HafnerLB020,
  author     = {Danijar Hafner and Timothy P. Lillicrap and Jimmy Ba and Mohammad Norouzi},
  title      = {Dream to Control: Learning Behaviors by Latent Imagination},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=S1lOTC4tDS},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/HafnerLB020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-2002-05825.
@inproceedings{DBLP:conf/iclr/PitisCJB20,
  author     = {Silviu Pitis and Harris Chan and Kiarash Jamali and Jimmy Ba},
  title      = {An Inductive Bias for Distances: Neural Nets that Respect the Triangle Inequality},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=HJeiDpVFPr},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/PitisCJB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-1906-08649.
@inproceedings{DBLP:conf/iclr/WangB20,
  author     = {Tingwu Wang and Jimmy Ba},
  title      = {Exploring Model-based Planning with Policy Networks},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=H1exf64KwH},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WangB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-1910-07512.
% The underscore in the url is stored unescaped: url-aware styles and biblatex/Biber
% treat the url field verbatim, so a backslash there would end up in the link.
@inproceedings{DBLP:conf/iclr/WangZB20,
  author     = {Yuanhao Wang and Guodong Zhang and Jimmy Ba},
  title      = {On Solving Minimax Optimization Locally: {A} Follow-the-Ridge Approach},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=Hkx7_1rKwS},
  timestamp  = {Fri, 12 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WangZB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper.
% BatchEnsemble is brace-protected so sentence-casing styles keep its internal capital.
@inproceedings{DBLP:conf/iclr/WenTB20,
  author     = {Yeming Wen and Dustin Tran and Jimmy Ba},
  title      = {{BatchEnsemble}: an Alternative Approach to Efficient Ensemble and Lifelong Learning},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=Sklf1yrYDr},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WenTB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 conference paper, PMLR volume 119, pages 4475--4483.
@inproceedings{DBLP:conf/icml/HuangPBV20,
  author     = {Xiao Shi Huang and Felipe P{\'{e}}rez and Jimmy Ba and Maksims Volkovs},
  title      = {Improving Transformer Optimization Through Better Initialization},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {4475--4483},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/huang20f.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/HuangPBV20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-2007-02832.
@inproceedings{DBLP:conf/icml/PitisCZSB20,
  author     = {Silviu Pitis and Harris Chan and Stephen Zhao and Bradly C. Stadie and Jimmy Ba},
  title      = {Maximum Entropy Gain Exploration for Long Horizon Multi-goal Reinforcement Learning},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {7750--7761},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/pitis20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/PitisCZSB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% UAI 2020 conference paper, PMLR volume 124, pages 111--120.
@inproceedings{DBLP:conf/uai/StadieZB20,
  author     = {Bradly C. Stadie and Lunjun Zhang and Jimmy Ba},
  editor     = {Ryan P. Adams and Vibhav Gogate},
  title      = {Learning Intrinsic Rewards as a Bi-Level Optimization Problem},
  booktitle  = {Proceedings of the Thirty-Sixth Conference on Uncertainty in Artificial Intelligence, {UAI} 2020, virtual online, August 3-6, 2020},
  series     = {Proceedings of Machine Learning Research},
  volume     = {124},
  pages      = {111--120},
  publisher  = {{AUAI} Press},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v124/stadie20a.html},
  timestamp  = {Tue, 07 May 2024 20:09:01 +0200},
  biburl     = {https://dblp.org/rec/conf/uai/StadieZB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2002.05825); shares title and authors with DBLP:conf/iclr/PitisCJB20.
@article{DBLP:journals/corr/abs-2002-05825,
  author     = {Silviu Pitis and Harris Chan and Kiarash Jamali and Jimmy Ba},
  title      = {An Inductive Bias for Distances: Neural Nets that Respect the Triangle Inequality},
  journal    = {CoRR},
  volume     = {abs/2002.05825},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.05825},
  eprinttype = {arXiv},
  eprint     = {2002.05825},
  timestamp  = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-05825.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2002.06715), 2020.
% BatchEnsemble is brace-protected so sentence-casing styles keep its internal capital.
@article{DBLP:journals/corr/abs-2002-06715,
  author     = {Yeming Wen and Dustin Tran and Jimmy Ba},
  title      = {{BatchEnsemble}: An Alternative Approach to Efficient Ensemble and Lifelong Learning},
  journal    = {CoRR},
  volume     = {abs/2002.06715},
  year       = {2020},
  url        = {https://arxiv.org/abs/2002.06715},
  eprinttype = {arXiv},
  eprint     = {2002.06715},
  timestamp  = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2002-06715.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2006.10732), 2020.
@article{DBLP:journals/corr/abs-2006-10732,
  author     = {Shun{-}ichi Amari and Jimmy Ba and Roger B. Grosse and Xuechen Li and Atsushi Nitanda and Taiji Suzuki and Denny Wu and Ji Xu},
  title      = {When Does Preconditioning Help or Hurt Generalization?},
  journal    = {CoRR},
  volume     = {abs/2006.10732},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.10732},
  eprinttype = {arXiv},
  eprint     = {2006.10732},
  timestamp  = {Wed, 24 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-10732.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2007.02832); shares title and authors with DBLP:conf/icml/PitisCZSB20.
@article{DBLP:journals/corr/abs-2007-02832,
  author     = {Silviu Pitis and Harris Chan and Stephen Zhao and Bradly C. Stadie and Jimmy Ba},
  title      = {Maximum Entropy Gain Exploration for Long Horizon Multi-goal Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2007.02832},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.02832},
  eprinttype = {arXiv},
  eprint     = {2007.02832},
  timestamp  = {Wed, 02 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-02832.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2007.02924), 2020.
@article{DBLP:journals/corr/abs-2007-02924,
  author     = {Yuhuai Wu and Albert Q. Jiang and Jimmy Ba and Roger B. Grosse},
  title      = {{INT:} An Inequality Benchmark for Evaluating Generalization in Theorem Proving},
  journal    = {CoRR},
  volume     = {abs/2007.02924},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.02924},
  eprinttype = {arXiv},
  eprint     = {2007.02924},
  timestamp  = {Mon, 30 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-02924.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2007.04212), 2020.
@article{DBLP:journals/corr/abs-2007-04212,
  author     = {Yuhuai Wu and Honghua Dong and Roger B. Grosse and Jimmy Ba},
  title      = {The Scattering Compositional Learner: Discovering Objects, Attributes, Relationships in Analogical Reasoning},
  journal    = {CoRR},
  volume     = {abs/2007.04212},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.04212},
  eprinttype = {arXiv},
  eprint     = {2007.04212},
  timestamp  = {Mon, 20 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-04212.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2007.04532), 2020.
@article{DBLP:journals/corr/abs-2007-04532,
  author     = {Fartash Faghri and David Duvenaud and David J. Fleet and Jimmy Ba},
  title      = {A Study of Gradient Variance in Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2007.04532},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.04532},
  eprinttype = {arXiv},
  eprint     = {2007.04532},
  timestamp  = {Mon, 20 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-04532.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2009.01791), 2020.
@article{DBLP:journals/corr/abs-2009-01791,
  author     = {Danijar Hafner and Pedro A. Ortega and Jimmy Ba and Thomas Parr and Karl J. Friston and Nicolas Heess},
  title      = {Action and Perception as Divergence Minimization},
  journal    = {CoRR},
  volume     = {abs/2009.01791},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.01791},
  eprinttype = {arXiv},
  eprint     = {2009.01791},
  timestamp  = {Wed, 16 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-01791.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2010.02193), 2020.
% The proper noun Atari is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-2010-02193,
  author     = {Danijar Hafner and Timothy P. Lillicrap and Mohammad Norouzi and Jimmy Ba},
  title      = {Mastering {Atari} with Discrete World Models},
  journal    = {CoRR},
  volume     = {abs/2010.02193},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.02193},
  eprinttype = {arXiv},
  eprint     = {2010.02193},
  timestamp  = {Mon, 12 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-02193.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2012.02419), 2020.
@article{DBLP:journals/corr/abs-2012-02419,
  author     = {Keiran Paster and Sheila A. McIlraith and Jimmy Ba},
  title      = {Planning from Pixels using Inverse Dynamics Models},
  journal    = {CoRR},
  volume     = {abs/2012.02419},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.02419},
  eprinttype = {arXiv},
  eprint     = {2012.02419},
  timestamp  = {Wed, 09 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-02419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2012.11538), 2020.
@article{DBLP:journals/corr/abs-2012-11538,
  author     = {Brendon Matusch and Jimmy Ba and Danijar Hafner},
  title      = {Evaluating Agents without Rewards},
  journal    = {CoRR},
  volume     = {abs/2012.11538},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.11538},
  eprinttype = {arXiv},
  eprint     = {2012.11538},
  timestamp  = {Mon, 04 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-11538.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2012.12896), 2020.
@article{DBLP:journals/corr/abs-2012-12896,
  author     = {Jingling Li and Mozhi Zhang and Keyulu Xu and John P. Dickerson and Jimmy Ba},
  title      = {Noisy Labels Can Induce Good Representations},
  journal    = {CoRR},
  volume     = {abs/2012.12896},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.12896},
  eprinttype = {arXiv},
  eprint     = {2012.12896},
  timestamp  = {Tue, 05 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-12896.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2019 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-1902-07257.
@inproceedings{DBLP:conf/iclr/JiaKB19,
  author     = {Sheng Jia and Jamie Kiros and Jimmy Ba},
  title      = {{DOM-Q-NET:} Grounded {RL} on Structured Language},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=HJgd1nAqFX},
  timestamp  = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/JiaKB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2019 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-1906-05370.
@inproceedings{DBLP:conf/iclr/WangZFB19,
  author     = {Tingwu Wang and Yuhao Zhou and Sanja Fidler and Jimmy Ba},
  title      = {Neural Graph Evolution: Towards Efficient Automatic Robot Design},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=BkgWHnR5tm},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WangZFB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper; shares its title with the CoRR record DBLP:journals/corr/abs-1907-08610.
@inproceedings{DBLP:conf/nips/ZhangLBH19,
  author     = {Michael R. Zhang and James Lucas and Jimmy Ba and Geoffrey E. Hinton},
  editor     = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title      = {Lookahead Optimizer: k steps forward, 1 step back},
  booktitle  = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages      = {9593--9604},
  year       = {2019},
  url        = {https://proceedings.neurips.cc/paper/2019/hash/90fd4f88f588ae64038134f1eeaa023f-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/ZhangLBH19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-1905-13177.
@inproceedings{DBLP:conf/nips/LiuKBKS19,
  author     = {Jenny Liu and Aviral Kumar and Jimmy Ba and Jamie Kiros and Kevin Swersky},
  editor     = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title      = {Graph Normalizing Flows},
  booktitle  = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages      = {13556--13566},
  year       = {2019},
  url        = {https://proceedings.neurips.cc/paper/2019/hash/1e44fdf9c44d7328fecc02d677ed704d-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LiuKBKS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1902.04546), 2019.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1902-04546,
  author     = {Harris Chan and Yuhuai Wu and Jamie Kiros and Sanja Fidler and Jimmy Ba},
  title      = {{ACTRCE:} Augmenting Experience via Teacher's Advice For Multi-Goal Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1902.04546},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.04546},
  eprinttype = {arXiv},
  eprint     = {1902.04546},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-04546.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1902.07257); shares title and authors with DBLP:conf/iclr/JiaKB19.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1902-07257,
  author     = {Sheng Jia and Jamie Kiros and Jimmy Ba},
  title      = {{DOM-Q-NET:} Grounded {RL} on Structured Language},
  journal    = {CoRR},
  volume     = {abs/1902.07257},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.07257},
  eprinttype = {arXiv},
  eprint     = {1902.07257},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-07257.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1902.08234), 2019.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1902-08234,
  author     = {Yeming Wen and Kevin Luk and Maxime Gazeau and Guodong Zhang and Harris Chan and Jimmy Ba},
  title      = {Interplay Between Optimization and Generalization of Stochastic Gradient Descent with Covariance Noise},
  journal    = {CoRR},
  volume     = {abs/1902.08234},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.08234},
  eprinttype = {arXiv},
  eprint     = {1902.08234},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-08234.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1905.13177); shares title and authors with DBLP:conf/nips/LiuKBKS19.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1905-13177,
  author     = {Jenny Liu and Aviral Kumar and Jimmy Ba and Jamie Kiros and Kevin Swersky},
  title      = {Graph Normalizing Flows},
  journal    = {CoRR},
  volume     = {abs/1905.13177},
  year       = {2019},
  url        = {https://arxiv.org/abs/1905.13177},
  eprinttype = {arXiv},
  eprint     = {1905.13177},
  timestamp  = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-13177.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1906.05370); shares title and authors with DBLP:conf/iclr/WangZFB19.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1906-05370,
  author     = {Tingwu Wang and Yuhao Zhou and Sanja Fidler and Jimmy Ba},
  title      = {Neural Graph Evolution: Towards Efficient Automatic Robot Design},
  journal    = {CoRR},
  volume     = {abs/1906.05370},
  year       = {2019},
  url        = {https://arxiv.org/abs/1906.05370},
  eprinttype = {arXiv},
  eprint     = {1906.05370},
  timestamp  = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-05370.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1906.08649); shares title and authors with DBLP:conf/iclr/WangB20.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1906-08649,
  author     = {Tingwu Wang and Jimmy Ba},
  title      = {Exploring Model-based Planning with Policy Networks},
  journal    = {CoRR},
  volume     = {abs/1906.08649},
  year       = {2019},
  url        = {https://arxiv.org/abs/1906.08649},
  eprinttype = {arXiv},
  eprint     = {1906.08649},
  timestamp  = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-08649.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1907.02057), 2019.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1907-02057,
  author     = {Tingwu Wang and Xuchan Bao and Ignasi Clavera and Jerrick Hoang and Yeming Wen and Eric D. Langlois and Shunshi Zhang and Guodong Zhang and Pieter Abbeel and Jimmy Ba},
  title      = {Benchmarking Model-Based Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1907.02057},
  year       = {2019},
  url        = {https://arxiv.org/abs/1907.02057},
  eprinttype = {arXiv},
  eprint     = {1907.02057},
  timestamp  = {Fri, 20 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-02057.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1907.08610); shares its title with DBLP:conf/nips/ZhangLBH19.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1907-08610,
  author     = {Michael R. Zhang and James Lucas and Geoffrey E. Hinton and Jimmy Ba},
  title      = {Lookahead Optimizer: k steps forward, 1 step back},
  journal    = {CoRR},
  volume     = {abs/1907.08610},
  year       = {2019},
  url        = {https://arxiv.org/abs/1907.08610},
  eprinttype = {arXiv},
  eprint     = {1907.08610},
  timestamp  = {Tue, 23 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-08610.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1910.07512); shares title and authors with DBLP:conf/iclr/WangZB20.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1910-07512,
  author     = {Yuanhao Wang and Guodong Zhang and Jimmy Ba},
  title      = {On Solving Minimax Optimization Locally: {A} Follow-the-Ridge Approach},
  journal    = {CoRR},
  volume     = {abs/1910.07512},
  year       = {2019},
  url        = {https://arxiv.org/abs/1910.07512},
  eprinttype = {arXiv},
  eprint     = {1910.07512},
  timestamp  = {Fri, 12 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-07512.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1912.01603); shares title and authors with DBLP:conf/iclr/HafnerLB020.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1912-01603,
  author     = {Danijar Hafner and Timothy P. Lillicrap and Jimmy Ba and Mohammad Norouzi},
  title      = {Dream to Control: Learning Behaviors by Latent Imagination},
  journal    = {CoRR},
  volume     = {abs/1912.01603},
  year       = {2019},
  url        = {https://arxiv.org/abs/1912.01603},
  eprinttype = {arXiv},
  eprint     = {1912.01603},
  timestamp  = {Tue, 07 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-01603.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper (OpenReview).
@inproceedings{DBLP:conf/iclr/MartensBJ18,
  author     = {James Martens and Jimmy Ba and Matt Johnson},
  title      = {Kronecker-factored Curvature Approximations for Recurrent Neural Networks},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=HyMTkQZAb},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/MartensBJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper (OpenReview).
% NerveNet is brace-protected so sentence-casing styles keep its internal capital.
@inproceedings{DBLP:conf/iclr/WangLBF18,
  author     = {Tingwu Wang and Renjie Liao and Jimmy Ba and Sanja Fidler},
  title      = {{NerveNet}: Learning Structured Policy with Graph Neural Networks},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=S1sqHMZCb},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WangLBF18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-1803-04386.
@inproceedings{DBLP:conf/iclr/WenVBTG18,
  author     = {Yeming Wen and Paul Vicol and Jimmy Ba and Dustin Tran and Roger B. Grosse},
  title      = {Flipout: Efficient Pseudo-Independent Weight Perturbations on Mini-Batches},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=rJNpifWAb},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WenVBTG18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 conference paper, pages 7091--7101.
% The acronym GANs is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/nips/SanjabiBRL18,
  author     = {Maziar Sanjabi and Jimmy Ba and Meisam Razaviyayn and Jason D. Lee},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {On the Convergence and Robustness of Training {GANs} with Regularized Optimal Transport},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {7091--7101},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/5a9d8bf5b7a4b35f3110dde8673bdda2-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/SanjabiBRL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/abs-1810-10999.
@inproceedings{DBLP:conf/nips/MacKayVBG18,
  author     = {Matthew MacKay and Paul Vicol and Jimmy Ba and Roger B. Grosse},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {Reversible Recurrent Neural Networks},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {9043--9054},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/4ff6fa96179cdc2838e8d8ce64cd10a7-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/MacKayVBG18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1802.08249), 2018.
% Wasserstein and GANs are brace-protected so sentence-casing styles keep their capitals;
% the url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1802-08249,
  author     = {Maziar Sanjabi and Jimmy Ba and Meisam Razaviyayn and Jason D. Lee},
  title      = {Solving Approximate {Wasserstein} {GANs} to Stationarity},
  journal    = {CoRR},
  volume     = {abs/1802.08249},
  year       = {2018},
  url        = {https://arxiv.org/abs/1802.08249},
  eprinttype = {arXiv},
  eprint     = {1802.08249},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1802-08249.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1803.04386); shares title and authors with DBLP:conf/iclr/WenVBTG18.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1803-04386,
  author     = {Yeming Wen and Paul Vicol and Jimmy Ba and Dustin Tran and Roger B. Grosse},
  title      = {Flipout: Efficient Pseudo-Independent Weight Perturbations on Mini-Batches},
  journal    = {CoRR},
  volume     = {abs/1803.04386},
  year       = {2018},
  url        = {https://arxiv.org/abs/1803.04386},
  eprinttype = {arXiv},
  eprint     = {1803.04386},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1803-04386.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1810.10999); shares title and authors with DBLP:conf/nips/MacKayVBG18.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1810-10999,
  author     = {Matthew MacKay and Paul Vicol and Jimmy Ba and Roger B. Grosse},
  title      = {Reversible Recurrent Neural Networks},
  journal    = {CoRR},
  volume     = {abs/1810.10999},
  year       = {2018},
  url        = {https://arxiv.org/abs/1810.10999},
  eprinttype = {arXiv},
  eprint     = {1810.10999},
  timestamp  = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-10999.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 conference-track paper (OpenReview).
% The proper noun Kronecker is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/iclr/BaGM17,
  author     = {Jimmy Ba and Roger B. Grosse and James Martens},
  title      = {Distributed Second-Order Optimization using {Kronecker}-Factored Approximations},
  booktitle  = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2017},
  url        = {https://openreview.net/forum?id=SkkTMpjex},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/BaGM17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2017 conference paper; shares its title with the CoRR record DBLP:journals/corr/abs-1708-05144.
% The proper noun Kronecker is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/nips/WuMGLB17,
  author     = {Yuhuai Wu and Elman Mansimov and Roger B. Grosse and Shun Liao and Jimmy Ba},
  editor     = {Isabelle Guyon and Ulrike von Luxburg and Samy Bengio and Hanna M. Wallach and Rob Fergus and S. V. N. Vishwanathan and Roman Garnett},
  title      = {Scalable trust-region method for deep reinforcement learning using {Kronecker}-factored approximation},
  booktitle  = {Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4-9, 2017, Long Beach, CA, {USA}},
  pages      = {5279--5288},
  year       = {2017},
  url        = {https://proceedings.neurips.cc/paper/2017/hash/361440528766bbaaaa1901845cf4152b-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/WuMGLB17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1708.05144); shares its title with DBLP:conf/nips/WuMGLB17.
% Kronecker is brace-protected so sentence-casing styles keep its capital;
% the url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/abs-1708-05144,
  author     = {Yuhuai Wu and Elman Mansimov and Shun Liao and Roger B. Grosse and Jimmy Ba},
  title      = {Scalable trust-region method for deep reinforcement learning using {Kronecker}-factored approximation},
  journal    = {CoRR},
  volume     = {abs/1708.05144},
  year       = {2017},
  url        = {https://arxiv.org/abs/1708.05144},
  eprinttype = {arXiv},
  eprint     = {1708.05144},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1708-05144.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Bioinformatics 32(12), 2016.
% The journal name is stored in full so the bibliography style decides on abbreviation.
% NOTE(review): pages carry the "i" prefix of the journal's supplement pagination
% (i52--i59); confirm against the publisher page for the DOI below.
@article{DBLP:journals/bioinformatics/KrausBF16,
  author     = {Oren Z. Kraus and Lei Jimmy Ba and Brendan J. Frey},
  title      = {Classifying and segmenting microscopy images with deep multiple instance learning},
  journal    = {Bioinformatics},
  volume     = {32},
  number     = {12},
  pages      = {i52--i59},
  year       = {2016},
  url        = {https://doi.org/10.1093/bioinformatics/btw252},
  doi        = {10.1093/BIOINFORMATICS/BTW252},
  timestamp  = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/bioinformatics/KrausBF16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2016 conference paper; shares title and authors with the CoRR record DBLP:journals/corr/BaHMLI16.
@inproceedings{DBLP:conf/nips/BaHMLI16,
  author     = {Jimmy Ba and Geoffrey E. Hinton and Volodymyr Mnih and Joel Z. Leibo and Catalin Ionescu},
  editor     = {Daniel D. Lee and Masashi Sugiyama and Ulrike von Luxburg and Isabelle Guyon and Roman Garnett},
  title      = {Using Fast Weights to Attend to the Recent Past},
  booktitle  = {Advances in Neural Information Processing Systems 29: Annual Conference on Neural Information Processing Systems 2016, December 5-10, 2016, Barcelona, Spain},
  pages      = {4331--4339},
  year       = {2016},
  url        = {https://proceedings.neurips.cc/paper/2016/hash/9f44e956e3a2b7b5598c625fcc802c36-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/BaHMLI16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2016 conference-track paper whose url points at the arXiv abstract page.
% The url uses https, matching the newer arXiv links in this file.
@inproceedings{DBLP:journals/corr/MansimovPBS15,
  author     = {Elman Mansimov and Emilio Parisotto and Lei Jimmy Ba and Ruslan Salakhutdinov},
  editor     = {Yoshua Bengio and Yann LeCun},
  title      = {Generating Images from Captions with Attention},
  booktitle  = {4th International Conference on Learning Representations, {ICLR} 2016, San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year       = {2016},
  url        = {https://arxiv.org/abs/1511.02793},
  timestamp  = {Wed, 17 Jul 2019 10:40:54 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/MansimovPBS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2016 conference-track paper whose url points at the arXiv abstract page.
% Actor-Mimic is brace-protected so sentence-casing styles keep both capitals;
% the url uses https, matching the newer arXiv links in this file.
@inproceedings{DBLP:journals/corr/ParisottoBS15,
  author     = {Emilio Parisotto and Lei Jimmy Ba and Ruslan Salakhutdinov},
  editor     = {Yoshua Bengio and Yann LeCun},
  title      = {{Actor-Mimic}: Deep Multitask and Transfer Reinforcement Learning},
  booktitle  = {4th International Conference on Learning Representations, {ICLR} 2016, San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year       = {2016},
  url        = {https://arxiv.org/abs/1511.06342},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ParisottoBS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1607.06450), 2016.
% The url uses https, matching the newer arXiv links in this file.
@article{DBLP:journals/corr/BaKH16,
  author     = {Lei Jimmy Ba and Jamie Ryan Kiros and Geoffrey E. Hinton},
  title      = {Layer Normalization},
  journal    = {CoRR},
  volume     = {abs/1607.06450},
  year       = {2016},
  url        = {https://arxiv.org/abs/1607.06450},
  eprinttype = {arXiv},
  eprint     = {1607.06450},
  timestamp  = {Tue, 23 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BaKH16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record. A conference record with the same title and authors
% is kept under the key DBLP:conf/nips/BaHMLI16.
@article{DBLP:journals/corr/BaHMLI16,
  author     = {Jimmy Ba and
                Geoffrey E. Hinton and
                Volodymyr Mnih and
                Joel Z. Leibo and
                Catalin Ionescu},
  title      = {Using Fast Weights to Attend to the Recent Past},
  journal    = {CoRR},
  volume     = {abs/1610.06258},
  year       = {2016},
  url        = {http://arxiv.org/abs/1610.06258},
  eprinttype = {arXiv},
  eprint     = {1610.06258},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BaHMLI16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IEEE GEM 2015 record. The quoted instrument name in the title uses TeX
% opening/closing quotes and is brace-protected so that styles which
% sentence-case titles keep its mixed capitalisation.
@inproceedings{DBLP:conf/gamesem/MannJRHB15,
  author    = {Steve Mann and
               Ryan E. Janzen and
               Valmiki Rampersad and
               Jason Huang and
               Lei Jimmy Ba},
  editor    = {Elena G. Bertozzi and
               Bill Kapralos and
               Nahum D. Gershon and
               Jim R. Parker},
  title     = {{``SQUEAKeys''}: {A} friction idiophone, for physical interaction with mobile devices},
  booktitle = {2015 {IEEE} Games Entertainment Media Conference, {GEM} 2015, Toronto, ON, Canada, October 14-16, 2015},
  pages     = {1--4},
  publisher = {{IEEE}},
  year      = {2015},
  url       = {https://doi.org/10.1109/GEM.2015.7377235},
  doi       = {10.1109/GEM.2015.7377235},
  timestamp = {Mon, 18 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/gamesem/MannJRHB15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference (ICCV 2015) record. A CoRR record with the same authors'
% surnames and a title differing only in the casing of "using" is kept
% under the key DBLP:journals/corr/BaSFS15.
@inproceedings{DBLP:conf/iccv/BaSFS15,
  author    = {Lei Jimmy Ba and
               Kevin Swersky and
               Sanja Fidler and
               Ruslan Salakhutdinov},
  title     = {Predicting Deep Zero-Shot Convolutional Neural Networks Using Textual Descriptions},
  booktitle = {2015 {IEEE} International Conference on Computer Vision, {ICCV} 2015, Santiago, Chile, December 7-13, 2015},
  pages     = {4247--4255},
  publisher = {{IEEE} Computer Society},
  year      = {2015},
  url       = {https://doi.org/10.1109/ICCV.2015.483},
  doi       = {10.1109/ICCV.2015.483},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iccv/BaSFS15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference (ICML 2015) record. A CoRR record with the same title and
% authors is kept under the key DBLP:journals/corr/XuBKCCSZB15.
@inproceedings{DBLP:conf/icml/XuBKCCSZB15,
  author    = {Kelvin Xu and
               Jimmy Ba and
               Ryan Kiros and
               Kyunghyun Cho and
               Aaron C. Courville and
               Ruslan Salakhutdinov and
               Richard S. Zemel and
               Yoshua Bengio},
  editor    = {Francis R. Bach and
               David M. Blei},
  title     = {Show, Attend and Tell: Neural Image Caption Generation with Visual Attention},
  booktitle = {Proceedings of the 32nd International Conference on Machine Learning, {ICML} 2015, Lille, France, 6-11 July 2015},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {37},
  pages     = {2048--2057},
  publisher = {JMLR.org},
  year      = {2015},
  url       = {http://proceedings.mlr.press/v37/xuc15.html},
  timestamp = {Wed, 29 May 2019 08:41:45 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/XuBKCCSZB15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference (NIPS 2015) record. A CoRR record with the same title is kept
% under the key DBLP:journals/corr/BaGSF15; its author order differs.
@inproceedings{DBLP:conf/nips/BaSGF15,
  author    = {Jimmy Ba and
               Ruslan Salakhutdinov and
               Roger B. Grosse and
               Brendan J. Frey},
  editor    = {Corinna Cortes and
               Neil D. Lawrence and
               Daniel D. Lee and
               Masashi Sugiyama and
               Roman Garnett},
  title     = {Learning Wake-Sleep Recurrent Attention Models},
  booktitle = {Advances in Neural Information Processing Systems 28: Annual Conference on Neural Information Processing Systems 2015, December 7-12, 2015, Montreal, Quebec, Canada},
  pages     = {2593--2601},
  year      = {2015},
  url       = {https://proceedings.neurips.cc/paper/2015/hash/db1915052d15f7815c8b88e879465a1e-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/BaSGF15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2015 conference-track record whose only locator is an arXiv page.
% eprinttype/eprint repeat the identifier already present in url, so that
% arXiv-aware styles can print it, as the CoRR records in this file do.
@inproceedings{DBLP:journals/corr/BaMK14,
  author     = {Jimmy Ba and
                Volodymyr Mnih and
                Koray Kavukcuoglu},
  editor     = {Yoshua Bengio and
                Yann LeCun},
  title      = {Multiple Object Recognition with Visual Attention},
  booktitle  = {3rd International Conference on Learning Representations, {ICLR} 2015, San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year       = {2015},
  url        = {http://arxiv.org/abs/1412.7755},
  eprinttype = {arXiv},
  eprint     = {1412.7755},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BaMK14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2015 conference-track record whose only locator is an arXiv page.
% eprinttype/eprint repeat the identifier already present in url, so that
% arXiv-aware styles can print it, as the CoRR records in this file do.
@inproceedings{DBLP:journals/corr/KingmaB14,
  author     = {Diederik P. Kingma and
                Jimmy Ba},
  editor     = {Yoshua Bengio and
                Yann LeCun},
  title      = {Adam: {A} Method for Stochastic Optimization},
  booktitle  = {3rd International Conference on Learning Representations, {ICLR} 2015, San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year       = {2015},
  url        = {http://arxiv.org/abs/1412.6980},
  eprinttype = {arXiv},
  eprint     = {1412.6980},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/KingmaB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record. A conference record with the same title and authors
% is kept under the key DBLP:conf/icml/XuBKCCSZB15.
@article{DBLP:journals/corr/XuBKCCSZB15,
  author     = {Kelvin Xu and
                Jimmy Ba and
                Ryan Kiros and
                Kyunghyun Cho and
                Aaron C. Courville and
                Ruslan Salakhutdinov and
                Richard S. Zemel and
                Yoshua Bengio},
  title      = {Show, Attend and Tell: Neural Image Caption Generation with Visual Attention},
  journal    = {CoRR},
  volume     = {abs/1502.03044},
  year       = {2015},
  url        = {http://arxiv.org/abs/1502.03044},
  eprinttype = {arXiv},
  eprint     = {1502.03044},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/XuBKCCSZB15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record. A conference record with a title differing only in
% the casing of "Using" is kept under the key DBLP:conf/iccv/BaSFS15.
@article{DBLP:journals/corr/BaSFS15,
  author     = {Jimmy Ba and
                Kevin Swersky and
                Sanja Fidler and
                Ruslan Salakhutdinov},
  title      = {Predicting Deep Zero-Shot Convolutional Neural Networks using Textual Descriptions},
  journal    = {CoRR},
  volume     = {abs/1506.00511},
  year       = {2015},
  url        = {http://arxiv.org/abs/1506.00511},
  eprinttype = {arXiv},
  eprint     = {1506.00511},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BaSFS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record. A conference record with the same title is kept
% under the key DBLP:conf/nips/BaSGF15; its author order differs.
@article{DBLP:journals/corr/BaGSF15,
  author     = {Jimmy Ba and
                Roger B. Grosse and
                Ruslan Salakhutdinov and
                Brendan J. Frey},
  title      = {Learning Wake-Sleep Recurrent Attention Models},
  journal    = {CoRR},
  volume     = {abs/1509.06812},
  year       = {2015},
  url        = {http://arxiv.org/abs/1509.06812},
  eprinttype = {arXiv},
  eprint     = {1509.06812},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BaGSF15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record; the arXiv identifier is carried in volume, url and eprint.
@article{DBLP:journals/corr/KrausBF15,
  author     = {Oren Z. Kraus and
                Lei Jimmy Ba and
                Brendan J. Frey},
  title      = {Classifying and Segmenting Microscopy Images Using Convolutional Multiple Instance Learning},
  journal    = {CoRR},
  volume     = {abs/1511.05286},
  year       = {2015},
  url        = {http://arxiv.org/abs/1511.05286},
  eprinttype = {arXiv},
  eprint     = {1511.05286},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/KrausBF15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference (NIPS 2014) record. A CoRR record with the same title is kept
% under the key DBLP:journals/corr/BaC13. The booktitle date now carries
% the comma before the year, matching the other NIPS booktitles in this file.
@inproceedings{DBLP:conf/nips/BaC14,
  author    = {Jimmy Ba and
               Rich Caruana},
  editor    = {Zoubin Ghahramani and
               Max Welling and
               Corinna Cortes and
               Neil D. Lawrence and
               Kilian Q. Weinberger},
  title     = {Do Deep Nets Really Need to be Deep?},
  booktitle = {Advances in Neural Information Processing Systems 27: Annual Conference on Neural Information Processing Systems 2014, December 8-13, 2014, Montreal, Quebec, Canada},
  pages     = {2654--2662},
  year      = {2014},
  url       = {https://proceedings.neurips.cc/paper/2014/hash/ea8fcd92d59581717e06eb187f10666d-Abstract.html},
  timestamp = {Fri, 10 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/BaC14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference (NIPS 2013) record; no DOI or eprint field, only the
% proceedings url.
@inproceedings{DBLP:conf/nips/BaF13,
  author    = {Lei Jimmy Ba and
               Brendan J. Frey},
  editor    = {Christopher J. C. Burges and
               L{\'{e}}on Bottou and
               Zoubin Ghahramani and
               Kilian Q. Weinberger},
  title     = {Adaptive dropout for training deep neural networks},
  booktitle = {Advances in Neural Information Processing Systems 26: 27th Annual Conference on Neural Information Processing Systems 2013. Proceedings of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages     = {3084--3092},
  year      = {2013},
  url       = {https://proceedings.neurips.cc/paper/2013/hash/7b5b23f4aadf9513306bcd59afb6e4c9-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/BaF13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record. A conference record with the same title is kept
% under the key DBLP:conf/nips/BaC14.
@article{DBLP:journals/corr/BaC13,
  author     = {Lei Jimmy Ba and
                Rich Caruana},
  title      = {Do Deep Nets Really Need to be Deep?},
  journal    = {CoRR},
  volume     = {abs/1312.6184},
  year       = {2013},
  url        = {http://arxiv.org/abs/1312.6184},
  eprinttype = {arXiv},
  eprint     = {1312.6184},
  timestamp  = {Fri, 10 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/BaC13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference (TEI 2011) record published by ACM; the DOI is given both as
% a bare doi field and as a resolver url.
@inproceedings{DBLP:conf/tei/MannJHKBC11,
  author    = {Steve Mann and
               Ryan E. Janzen and
               Jason Huang and
               Matthew B. Kelly and
               Lei Jimmy Ba and
               Alexander Chen},
  editor    = {Mark D. Gross and
               Nuno Jardim Nunes and
               Ellen Yi{-}Luen Do and
               Stephen A. Brewster and
               Ian Oakley},
  title     = {User-interfaces based on the water-hammer effect: water-hammer piano as an interactive percussion surface},
  booktitle = {Proceedings of the 5th International Conference on Tangible and Embedded Interaction 2011, Funchal, Madeira, Portugal, January 22-26, 2011},
  pages     = {1--8},
  publisher = {{ACM}},
  year      = {2011},
  url       = {https://doi.org/10.1145/1935701.1935703},
  doi       = {10.1145/1935701.1935703},
  timestamp = {Mon, 18 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/tei/MannJHKBC11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt-in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.