BibTeX records: Quoc V. Le

download as .bib file

@article{DBLP:journals/nature/TrinhWLHL24,
  author       = {Trieu H. Trinh and
                  Yuhuai Wu and
                  Quoc V. Le and
                  He He and
                  Thang Luong},
  title        = {Solving olympiad geometry without human demonstrations},
  journal      = {Nature},
  volume       = {625},
  number       = {7995},
  pages        = {476--482},
  year         = {2024},
  url          = {https://doi.org/10.1038/s41586-023-06747-5},
  doi          = {10.1038/S41586-023-06747-5},
  timestamp    = {Fri, 08 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nature/TrinhWLHL24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2402-03620,
  author       = {Pei Zhou and
                  Jay Pujara and
                  Xiang Ren and
                  Xinyun Chen and
                  Heng{-}Tze Cheng and
                  Quoc V. Le and
                  Ed H. Chi and
                  Denny Zhou and
                  Swaroop Mishra and
                  Huaixiu Steven Zheng},
  title        = {{Self-Discover}: Large Language Models Self-Compose Reasoning Structures},
  journal      = {CoRR},
  volume       = {abs/2402.03620},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.03620},
  doi          = {10.48550/ARXIV.2402.03620},
  eprinttype   = {arXiv},
  eprint       = {2402.03620},
  timestamp    = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-03620.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijon/PhamDGKLYYCLWTL23,
  author       = {Pham, Hieu and
                  Dai, Zihang and
                  Ghiasi, Golnaz and
                  Kawaguchi, Kenji and
                  Liu, Hanxiao and
                  Yu, Adams Wei and
                  Yu, Jiahui and
                  Chen, Yi{-}Ting and
                  Luong, Minh{-}Thang and
                  Wu, Yonghui and
                  Tan, Mingxing and
                  Le, Quoc V.},
  title        = {Combined scaling for zero-shot transfer learning},
  journal      = {Neurocomputing},
  volume       = {555},
  pages        = {126658},
  year         = {2023},
  url          = {https://doi.org/10.1016/j.neucom.2023.126658},
  doi          = {10.1016/J.NEUCOM.2023.126658},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ijon/PhamDGKLYYCLWTL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SuzgunSSGTCCLCZ23,
  author       = {Mirac Suzgun and
                  Nathan Scales and
                  Nathanael Sch{\"{a}}rli and
                  Sebastian Gehrmann and
                  Yi Tay and
                  Hyung Won Chung and
                  Aakanksha Chowdhery and
                  Quoc V. Le and
                  Ed H. Chi and
                  Denny Zhou and
                  Jason Wei},
  editor       = {Anna Rogers and
                  Jordan L. Boyd{-}Graber and
                  Naoaki Okazaki},
  title        = {Challenging {BIG-Bench} Tasks and Whether Chain-of-Thought Can Solve
                  Them},
  booktitle    = {Findings of the Association for Computational Linguistics: {ACL} 2023,
                  Toronto, Canada, July 9-14, 2023},
  pages        = {13003--13051},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.findings-acl.824},
  doi          = {10.18653/V1/2023.FINDINGS-ACL.824},
  timestamp    = {Mon, 29 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/SuzgunSSGTCCLCZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/asplos/LiACCGHLLLLLLNP23,
  author       = {Sheng Li and
                  Garrett Andersen and
                  Tao Chen and
                  Liqun Cheng and
                  Julian Grady and
                  Da Huang and
                  Quoc V. Le and
                  Andrew Li and
                  Xin Li and
                  Yang Li and
                  Chen Liang and
                  Yifeng Lu and
                  Yun Ni and
                  Ruoming Pang and
                  Mingxing Tan and
                  Martin Wicke and
                  Gang Wu and
                  Shengqi Zhu and
                  Parthasarathy Ranganathan and
                  Norman P. Jouppi},
  editor       = {Aamodt, Tor M. and
                  Enright Jerger, Natalie D. and
                  Swift, Michael M.},
  title        = {Hyperscale Hardware Optimized Neural Architecture Search},
  booktitle    = {Proceedings of the 28th {ACM} International Conference on Architectural
                  Support for Programming Languages and Operating Systems, Volume 3,
                  {ASPLOS} 2023, Vancouver, BC, Canada, March 25-29, 2023},
  pages        = {343--358},
  publisher    = {{ACM}},
  year         = {2023},
  url          = {https://doi.org/10.1145/3582016.3582049},
  doi          = {10.1145/3582016.3582049},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/asplos/LiACCGHLLLLLLNP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/WeiHLCHTCLZ0L23,
  author       = {Wei, Jerry W. and
                  Hou, Le and
                  Lampinen, Andrew K. and
                  Chen, Xiangning and
                  Huang, Da and
                  Tay, Yi and
                  Chen, Xinyun and
                  Lu, Yifeng and
                  Zhou, Denny and
                  Ma, Tengyu and
                  Le, Quoc V.},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Symbol tuning improves in-context learning in language models},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {968--979},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://aclanthology.org/2023.emnlp-main.61},
  timestamp    = {Wed, 13 Dec 2023 17:20:20 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/WeiHLCHTCLZ0L23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/TayWC0SSGZRCZMP23,
  author       = {Tay, Yi and
                  Wei, Jason and
                  Chung, Hyung Won and
                  Tran, Vinh Q. and
                  So, David R. and
                  Shakeri, Siamak and
                  Garcia, Xavier and
                  Zheng, Huaixiu Steven and
                  Rao, Jinfeng and
                  Chowdhery, Aakanksha and
                  Zhou, Denny and
                  Metzler, Donald and
                  Petrov, Slav and
                  Houlsby, Neil and
                  Le, Quoc V. and
                  Dehghani, Mostafa},
  editor       = {Bouamor, Houda and
                  Pino, Juan and
                  Bali, Kalika},
  title        = {Transcending Scaling Laws with 0.1{\%} Extra Compute},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {1471--1486},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://aclanthology.org/2023.emnlp-main.91},
  timestamp    = {Thu, 14 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/TayWC0SSGZRCZMP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/WeiKTL23,
  author       = {Jason Wei and
                  Najoung Kim and
                  Yi Tay and
                  Quoc V. Le},
  editor       = {Houda Bouamor and
                  Juan Pino and
                  Kalika Bali},
  title        = {Inverse Scaling Can Become {U}-Shaped},
  booktitle    = {Proceedings of the 2023 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages        = {15580--15591},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://aclanthology.org/2023.emnlp-main.963},
  timestamp    = {Thu, 14 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/WeiKTL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/0002WSLCNCZ23,
  author       = {Wang, Xuezhi and
                  Wei, Jason and
                  Schuurmans, Dale and
                  Le, Quoc V. and
                  Chi, Ed H. and
                  Narang, Sharan and
                  Chowdhery, Aakanksha and
                  Zhou, Denny},
  title        = {Self-Consistency Improves Chain of Thought Reasoning in Language Models},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=1PL1NIMMrw},
  timestamp    = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/0002WSLCNCZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ZhouSHWS0SCBLC23,
  author       = {Zhou, Denny and
                  Sch{\"{a}}rli, Nathanael and
                  Hou, Le and
                  Wei, Jason and
                  Scales, Nathan and
                  Wang, Xuezhi and
                  Schuurmans, Dale and
                  Cui, Claire and
                  Bousquet, Olivier and
                  Le, Quoc V. and
                  Chi, Ed H.},
  title        = {Least-to-Most Prompting Enables Complex Reasoning in Large Language
                  Models},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=WZH7099tgfM},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhouSHWS0SCBLC23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LongpreHVWCTZLZ23,
  author       = {Shayne Longpre and
                  Le Hou and
                  Tu Vu and
                  Albert Webson and
                  Hyung Won Chung and
                  Yi Tay and
                  Denny Zhou and
                  Quoc V. Le and
                  Barret Zoph and
                  Jason Wei and
                  Adam Roberts},
  editor       = {Andreas Krause and
                  Emma Brunskill and
                  Kyunghyun Cho and
                  Barbara Engelhardt and
                  Sivan Sabato and
                  Jonathan Scarlett},
  title        = {The {Flan} Collection: Designing Data and Methods for Effective Instruction
                  Tuning},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {22631--22648},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/longpre23a.html},
  timestamp    = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LongpreHVWCTZLZ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ZhouDHPLHSSDLCL23,
  author       = {Zhou, Yanqi and
                  Du, Nan and
                  Huang, Yanping and
                  Peng, Daiyi and
                  Lan, Chang and
                  Huang, Da and
                  Shakeri, Siamak and
                  So, David R. and
                  Dai, Andrew M. and
                  Lu, Yifeng and
                  Chen, Zhifeng and
                  Le, Quoc V. and
                  Cui, Claire and
                  Laudon, James and
                  Dean, Jeff},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Brainformers: Trading Simplicity for Efficiency},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {42531--42542},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/zhou23c.html},
  timestamp    = {Fri, 01 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/ZhouDHPLHSSDLCL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChenLHRW0DLHLL23,
  author       = {Xiangning Chen and
                  Chen Liang and
                  Da Huang and
                  Esteban Real and
                  Kaiyuan Wang and
                  Hieu Pham and
                  Xuanyi Dong and
                  Thang Luong and
                  Cho{-}Jui Hsieh and
                  Yifeng Lu and
                  Quoc V. Le},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {Symbolic Discovery of Optimization Algorithms},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, {NeurIPS} 2023, New Orleans,
                  {LA}, {USA}, December 10 - 16, 2023},
  year         = {2023},
  url          = {https://papers.nips.cc/paper_files/paper/2023/hash/9a39b4925e35cf447ccba8757137d84f-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ChenLHRW0DLHLL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/Xie0DDLLLL0Y23,
  author       = {Sang Michael Xie and
                  Hieu Pham and
                  Xuanyi Dong and
                  Nan Du and
                  Hanxiao Liu and
                  Yifeng Lu and
                  Percy Liang and
                  Quoc V. Le and
                  Tengyu Ma and
                  Adams Wei Yu},
  editor       = {Alice Oh and
                  Tristan Naumann and
                  Amir Globerson and
                  Kate Saenko and
                  Moritz Hardt and
                  Sergey Levine},
  title        = {{DoReMi}: Optimizing Data Mixtures Speeds Up Language Model Pretraining},
  booktitle    = {Advances in Neural Information Processing Systems 36: Annual Conference
                  on Neural Information Processing Systems 2023, {NeurIPS} 2023, New Orleans,
                  {LA}, {USA}, December 10 - 16, 2023},
  year         = {2023},
  url          = {https://papers.nips.cc/paper_files/paper/2023/hash/dcba6be91359358c2355cd920da3fcbd-Abstract-Conference.html},
  timestamp    = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/Xie0DDLLLL0Y23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2301-13688,
  author       = {Shayne Longpre and
                  Le Hou and
                  Tu Vu and
                  Albert Webson and
                  Hyung Won Chung and
                  Yi Tay and
                  Denny Zhou and
                  Quoc V. Le and
                  Barret Zoph and
                  Jason Wei and
                  Adam Roberts},
  title        = {The {Flan} Collection: Designing Data and Methods for Effective Instruction
                  Tuning},
  journal      = {CoRR},
  volume       = {abs/2301.13688},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2301.13688},
  doi          = {10.48550/ARXIV.2301.13688},
  eprinttype   = {arXiv},
  eprint       = {2301.13688},
  timestamp    = {Thu, 02 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2301-13688.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2302-01918,
  author       = {Daiyi Peng and
                  Xuanyi Dong and
                  Esteban Real and
                  Yifeng Lu and
                  Quoc V. Le},
  title        = {{PyGlove}: Efficiently Exchanging {ML} Ideas as Code},
  journal      = {CoRR},
  volume       = {abs/2302.01918},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.01918},
  doi          = {10.48550/ARXIV.2302.01918},
  eprinttype   = {arXiv},
  eprint       = {2302.01918},
  timestamp    = {Fri, 10 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-01918.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2302-03917,
  author       = {Qingqing Huang and
                  Daniel S. Park and
                  Tao Wang and
                  Timo I. Denk and
                  Andy Ly and
                  Nanxin Chen and
                  Zhengdong Zhang and
                  Zhishuai Zhang and
                  Jiahui Yu and
                  Christian Havn{\o} Frank and
                  Jesse H. Engel and
                  Quoc V. Le and
                  William Chan and
                  Wei Han},
  title        = {{Noise2Music}: Text-conditioned Music Generation with Diffusion Models},
  journal      = {CoRR},
  volume       = {abs/2302.03917},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.03917},
  doi          = {10.48550/ARXIV.2302.03917},
  eprinttype   = {arXiv},
  eprint       = {2302.03917},
  timestamp    = {Fri, 10 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-03917.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2302-05433,
  author       = {Ryan Gillard and
                  Stephen Jonany and
                  Yingjie Miao and
                  Michael Munn and
                  Connal de Souza and
                  Jonathan Dungay and
                  Chen Liang and
                  David R. So and
                  Quoc V. Le and
                  Esteban Real},
  title        = {Unified Functional Hashing in Automatic Machine Learning},
  journal      = {CoRR},
  volume       = {abs/2302.05433},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.05433},
  doi          = {10.48550/ARXIV.2302.05433},
  eprinttype   = {arXiv},
  eprint       = {2302.05433},
  timestamp    = {Mon, 13 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-05433.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2302-06675,
  author       = {Xiangning Chen and
                  Chen Liang and
                  Da Huang and
                  Esteban Real and
                  Kaiyuan Wang and
                  Yao Liu and
                  Hieu Pham and
                  Xuanyi Dong and
                  Thang Luong and
                  Cho{-}Jui Hsieh and
                  Yifeng Lu and
                  Quoc V. Le},
  title        = {Symbolic Discovery of Optimization Algorithms},
  journal      = {CoRR},
  volume       = {abs/2302.06675},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.06675},
  doi          = {10.48550/ARXIV.2302.06675},
  eprinttype   = {arXiv},
  eprint       = {2302.06675},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-06675.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-08298,
  author       = {Jerry W. Wei and
                  Le Hou and
                  Andrew K. Lampinen and
                  Xiangning Chen and
                  Da Huang and
                  Yi Tay and
                  Xinyun Chen and
                  Yifeng Lu and
                  Denny Zhou and
                  Tengyu Ma and
                  Quoc V. Le},
  title        = {Symbol tuning improves in-context learning in language models},
  journal      = {CoRR},
  volume       = {abs/2305.08298},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.08298},
  doi          = {10.48550/ARXIV.2305.08298},
  eprinttype   = {arXiv},
  eprint       = {2305.08298},
  timestamp    = {Thu, 01 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-08298.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-10429,
  author       = {Sang Michael Xie and
                  Hieu Pham and
                  Xuanyi Dong and
                  Nan Du and
                  Hanxiao Liu and
                  Yifeng Lu and
                  Percy Liang and
                  Quoc V. Le and
                  Tengyu Ma and
                  Adams Wei Yu},
  title        = {{DoReMi}: Optimizing Data Mixtures Speeds Up Language Model Pretraining},
  journal      = {CoRR},
  volume       = {abs/2305.10429},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.10429},
  doi          = {10.48550/ARXIV.2305.10429},
  eprinttype   = {arXiv},
  eprint       = {2305.10429},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-10429.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-00008,
  author       = {Yanqi Zhou and
                  Nan Du and
                  Yanping Huang and
                  Daiyi Peng and
                  Chang Lan and
                  Da Huang and
                  Siamak Shakeri and
                  David R. So and
                  Andrew M. Dai and
                  Yifeng Lu and
                  Zhifeng Chen and
                  Quoc V. Le and
                  Claire Cui and
                  James Laudon and
                  Jeff Dean},
  title        = {Brainformers: Trading Simplicity for Efficiency},
  journal      = {CoRR},
  volume       = {abs/2306.00008},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2306.00008},
  doi          = {10.48550/ARXIV.2306.00008},
  eprinttype   = {arXiv},
  eprint       = {2306.00008},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2306-00008.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2308-03290,
  author       = {Jordan Dotzel and
                  Gang Wu and
                  Andrew Li and
                  Muhammad Umar and
                  Yun Ni and
                  Mohamed S. Abdelfattah and
                  Zhiru Zhang and
                  Liqun Cheng and
                  Martin G. Dixon and
                  Norman P. Jouppi and
                  Quoc V. Le and
                  Sheng Li},
  title        = {{FLIQS}: One-Shot Mixed-Precision Floating-Point and Integer Quantization
                  Search},
  journal      = {CoRR},
  volume       = {abs/2308.03290},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.03290},
  doi          = {10.48550/ARXIV.2308.03290},
  eprinttype   = {arXiv},
  eprint       = {2308.03290},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-03290.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2308-03958,
  author       = {Jerry W. Wei and
                  Da Huang and
                  Yifeng Lu and
                  Denny Zhou and
                  Quoc V. Le},
  title        = {Simple synthetic data reduces sycophancy in large language models},
  journal      = {CoRR},
  volume       = {abs/2308.03958},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2308.03958},
  doi          = {10.48550/ARXIV.2308.03958},
  eprinttype   = {arXiv},
  eprint       = {2308.03958},
  timestamp    = {Tue, 22 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2308-03958.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-03409,
  author       = {Chengrun Yang and
                  Xuezhi Wang and
                  Yifeng Lu and
                  Hanxiao Liu and
                  Quoc V. Le and
                  Denny Zhou and
                  Xinyun Chen},
  title        = {Large Language Models as Optimizers},
  journal      = {CoRR},
  volume       = {abs/2309.03409},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2309.03409},
  doi          = {10.48550/ARXIV.2309.03409},
  eprinttype   = {arXiv},
  eprint       = {2309.03409},
  timestamp    = {Tue, 12 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2309-03409.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-03214,
  author       = {Tu Vu and
                  Mohit Iyyer and
                  Xuezhi Wang and
                  Noah Constant and
                  Jerry W. Wei and
                  Jason Wei and
                  Chris Tar and
                  Yun{-}Hsuan Sung and
                  Denny Zhou and
                  Quoc V. Le and
                  Thang Luong},
  title        = {{FreshLLMs}: Refreshing Large Language Models with Search Engine Augmentation},
  journal      = {CoRR},
  volume       = {abs/2310.03214},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.03214},
  doi          = {10.48550/ARXIV.2310.03214},
  eprinttype   = {arXiv},
  eprint       = {2310.03214},
  timestamp    = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-03214.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-06117,
  author       = {Huaixiu Steven Zheng and
                  Swaroop Mishra and
                  Xinyun Chen and
                  Heng{-}Tze Cheng and
                  Ed H. Chi and
                  Quoc V. Le and
                  Denny Zhou},
  title        = {Take a Step Back: Evoking Reasoning via Abstraction in Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2310.06117},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.06117},
  doi          = {10.48550/ARXIV.2310.06117},
  eprinttype   = {arXiv},
  eprint       = {2310.06117},
  timestamp    = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-06117.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2312-00763,
  author       = {Xiao Ma and
                  Swaroop Mishra and
                  Ariel Liu and
                  Sophie Su and
                  Jilin Chen and
                  Chinmay Kulkarni and
                  Heng{-}Tze Cheng and
                  Quoc V. Le and
                  Ed H. Chi},
  title        = {Beyond {ChatBots}: {ExploreLLM} for Structured Thoughts and Personalized
                  Model Responses},
  journal      = {CoRR},
  volume       = {abs/2312.00763},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.00763},
  doi          = {10.48550/ARXIV.2312.00763},
  eprinttype   = {arXiv},
  eprint       = {2312.00763},
  timestamp    = {Mon, 11 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-00763.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2312-08472,
  author       = {Esteban Real and
                  Yao Chen and
                  Mirko Rossini and
                  Connal de Souza and
                  Manav Garg and
                  Akhil Verghese and
                  Moritz Firsching and
                  Quoc V. Le and
                  Ekin Dogus Cubuk and
                  David H. Park},
  title        = {{AutoNumerics-Zero}: Automated Discovery of State-of-the-Art Mathematical
                  Functions},
  journal      = {CoRR},
  volume       = {abs/2312.08472},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.08472},
  doi          = {10.48550/ARXIV.2312.08472},
  eprinttype   = {arXiv},
  eprint       = {2312.08472},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-08472.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/computer/PattersonGHLLMR22,
  author       = {Patterson, David A. and
                  Gonzalez, Joseph and
                  H{\"{o}}lzle, Urs and
                  Le, Quoc V. and
                  Liang, Chen and
                  Munguia, Lluis{-}Miquel and
                  Rothchild, Daniel and
                  So, David R. and
                  Texier, Maud and
                  Dean, Jeff},
  title        = {The Carbon Footprint of Machine Learning Training Will Plateau, Then
                  Shrink},
  journal      = {Computer},
  volume       = {55},
  number       = {7},
  pages        = {18--28},
  year         = {2022},
  url          = {https://doi.org/10.1109/MC.2022.3148714},
  doi          = {10.1109/MC.2022.3148714},
  timestamp    = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/computer/PattersonGHLLMR22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jstsp/ZhangPHQGSJXHWZ22,
  author       = {Yu Zhang and
                  Daniel S. Park and
                  Wei Han and
                  James Qin and
                  Anmol Gulati and
                  Joel Shor and
                  Aren Jansen and
                  Yuanzhong Xu and
                  Yanping Huang and
                  Shibo Wang and
                  Zongwei Zhou and
                  Bo Li and
                  Min Ma and
                  William Chan and
                  Jiahui Yu and
                  Yongqiang Wang and
                  Liangliang Cao and
                  Khe Chai Sim and
                  Bhuvana Ramabhadran and
                  Tara N. Sainath and
                  Fran{\c{c}}oise Beaufays and
                  Zhifeng Chen and
                  Quoc V. Le and
                  Chung{-}Cheng Chiu and
                  Ruoming Pang and
                  Yonghui Wu},
  title        = {{BigSSL}: Exploring the Frontier of Large-Scale Semi-Supervised Learning
                  for Automatic Speech Recognition},
  journal      = {{IEEE} Journal of Selected Topics in Signal Processing},
  volume       = {16},
  number       = {6},
  pages        = {1519--1532},
  year         = {2022},
  url          = {https://doi.org/10.1109/JSTSP.2022.3182537},
  doi          = {10.1109/JSTSP.2022.3182537},
  timestamp    = {Sun, 13 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jstsp/ZhangPHQGSJXHWZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ASPLOS 2022 paper. Names are written in "Last, First" form, which BibTeX
% parses into the same first/last parts as the "First Last" form.
@inproceedings{DBLP:conf/asplos/ZhangHSPLGM22,
  author       = {Zhang, Dan and
                  Huda, Safeen and
                  Songhori, Ebrahim M. and
                  Prabhu, Kartik and
                  Le, Quoc V. and
                  Goldie, Anna and
                  Mirhoseini, Azalia},
  editor       = {Falsafi, Babak and
                  Ferdman, Michael and
                  Lu, Shan and
                  Wenisch, Thomas F.},
  title        = {A full-stack search technique for domain optimized deep learning accelerators},
  booktitle    = {{ASPLOS} '22: 27th {ACM} International Conference on Architectural
                  Support for Programming Languages and Operating Systems, Lausanne,
                  Switzerland, 28 February 2022 - 4 March 2022},
  pages        = {27--42},
  publisher    = {{ACM}},
  year         = {2022},
  url          = {https://doi.org/10.1145/3503222.3507767},
  doi          = {10.1145/3503222.3507767},
  timestamp    = {Fri, 23 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/asplos/ZhangHSPLGM22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% DeepFusion, CVPR 2022 paper; an arXiv record with the same title is
% DBLP:journals/corr/abs-2203-08195 in this file.
% "DeepFusion" and "3D" are brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/cvpr/LiYMCNPSLZLYT22,
  author       = {Yingwei Li and
                  Adams Wei Yu and
                  Tianjian Meng and
                  Benjamin Caine and
                  Jiquan Ngiam and
                  Daiyi Peng and
                  Junyang Shen and
                  Yifeng Lu and
                  Denny Zhou and
                  Quoc V. Le and
                  Alan L. Yuille and
                  Mingxing Tan},
  title        = {{DeepFusion}: Lidar-Camera Deep Fusion for Multi-Modal {3D} Object Detection},
  booktitle    = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2022, New Orleans, LA, USA, June 18-24, 2022},
  pages        = {17161--17170},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/CVPR52688.2022.01667},
  doi          = {10.1109/CVPR52688.2022.01667},
  timestamp    = {Wed, 05 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/LiYMCNPSLZLYT22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2022 paper (OpenReview URL; this record carries no DOI or page range).
% Names are written in "Last, First" form; the parsed name parts are unchanged.
@inproceedings{DBLP:conf/iclr/WeiBZGYLDDL22,
  author       = {Wei, Jason and
                  Bosma, Maarten and
                  Zhao, Vincent Y. and
                  Guu, Kelvin and
                  Yu, Adams Wei and
                  Lester, Brian and
                  Du, Nan and
                  Dai, Andrew M. and
                  Le, Quoc V.},
  title        = {Finetuned Language Models are Zero-Shot Learners},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=gEZrGCozdqR},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/WeiBZGYLDDL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% GLaM, ICML 2022 paper (PMLR volume 162).
% The model name is brace-protected so sentence-casing styles do not print "Glam".
@inproceedings{DBLP:conf/icml/DuHDTLXKZYFZFBZ22,
  author       = {Nan Du and
                  Yanping Huang and
                  Andrew M. Dai and
                  Simon Tong and
                  Dmitry Lepikhin and
                  Yuanzhong Xu and
                  Maxim Krikun and
                  Yanqi Zhou and
                  Adams Wei Yu and
                  Orhan Firat and
                  Barret Zoph and
                  Liam Fedus and
                  Maarten P. Bosma and
                  Zongwei Zhou and
                  Tao Wang and
                  Yu Emma Wang and
                  Kellie Webster and
                  Marie Pellat and
                  Kevin Robinson and
                  Kathleen S. Meier{-}Hellstern and
                  Toju Duke and
                  Lucas Dixon and
                  Kun Zhang and
                  Quoc V. Le and
                  Yonghui Wu and
                  Zhifeng Chen and
                  Claire Cui},
  editor       = {Kamalika Chaudhuri and
                  Stefanie Jegelka and
                  Le Song and
                  Csaba Szepesv{\'{a}}ri and
                  Gang Niu and
                  Sivan Sabato},
  title        = {{GLaM}: Efficient Scaling of Language Models with Mixture-of-Experts},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022, 17-23 July
                  2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {5547--5569},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/du22c.html},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/DuHDTLXKZYFZFBZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2022 paper (PMLR volume 162); an arXiv record with the same title is
% DBLP:journals/corr/abs-2202-10447 in this file.
% Names are written in "Last, First" form; the parsed name parts are unchanged.
@inproceedings{DBLP:conf/icml/HuaDLL22,
  author       = {Hua, Weizhe and
                  Dai, Zihang and
                  Liu, Hanxiao and
                  Le, Quoc V.},
  editor       = {Chaudhuri, Kamalika and
                  Jegelka, Stefanie and
                  Song, Le and
                  Szepesv{\'{a}}ri, Csaba and
                  Niu, Gang and
                  Sabato, Sivan},
  title        = {Transformer Quality in Linear Time},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022, 17-23 July
                  2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {9099--9117},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/hua22a.html},
  timestamp    = {Tue, 12 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/HuaDLL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Chain-of-Thought prompting, NeurIPS 2022 paper; the arXiv record is
% DBLP:journals/corr/abs-2201-11903 in this file.
% Editor given names are spelled out (styles abbreviate them when required) and
% the NeurIPS acronym is braced like the other venue acronyms in this file.
@inproceedings{DBLP:conf/nips/Wei0SBIXCLZ22,
  author       = {Jason Wei and
                  Xuezhi Wang and
                  Dale Schuurmans and
                  Maarten Bosma and
                  Brian Ichter and
                  Fei Xia and
                  Ed H. Chi and
                  Quoc V. Le and
                  Denny Zhou},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Chain-of-Thought Prompting Elicits Reasoning in Large Language Models},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, {NeurIPS} 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/9d5609613524ecf4f15af0f7b31abca4-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/Wei0SBIXCLZ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% TabNAS, NeurIPS 2022 paper. DBLP:journals/corr/abs-2204-07615 in this file has
% the same author list under a different title (presumably its preprint -- confirm).
% "TabNAS" is brace-protected against sentence-casing styles, editor given names are
% spelled out, and the NeurIPS acronym is braced like other venue acronyms.
@inproceedings{DBLP:conf/nips/YangBLKULLH22,
  author       = {Chengrun Yang and
                  Gabriel Bender and
                  Hanxiao Liu and
                  Pieter{-}Jan Kindermans and
                  Madeleine Udell and
                  Yifeng Lu and
                  Quoc V. Le and
                  Da Huang},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {{TabNAS}: Rejection Sampling for Neural Architecture Search on Tabular
                  Datasets},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, {NeurIPS} 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/4e392aa9bc70ed731d3c9c32810f92fb-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YangBLKULLH22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Expert Choice routing, NeurIPS 2022 paper; an arXiv record with the same title
% is DBLP:journals/corr/abs-2202-09368 in this file.
% Editor given names are spelled out and the NeurIPS acronym is braced like the
% other venue acronyms in this file.
@inproceedings{DBLP:conf/nips/ZhouLLDHZDCLL22,
  author       = {Yanqi Zhou and
                  Tao Lei and
                  Hanxiao Liu and
                  Nan Du and
                  Yanping Huang and
                  Vincent Y. Zhao and
                  Andrew M. Dai and
                  Zhifeng Chen and
                  Quoc V. Le and
                  James Laudon},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Mixture-of-Experts with Expert Choice Routing},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, {NeurIPS} 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/2f00ecd787b432c1d36f3de9800728eb-Abstract-Conference.html},
  timestamp    = {Tue, 27 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ZhouLLDHZDCLL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% G-Augment, IEEE SLT 2022 workshop paper; an arXiv record with the same title is
% DBLP:journals/corr/abs-2210-10879 in this file.
% The method name is brace-protected so sentence-casing styles do not print "G-augment".
@inproceedings{DBLP:conf/slt/WangCRCWRMLP22,
  author       = {Gary Wang and
                  Ekin D. Cubuk and
                  Andrew Rosenberg and
                  Shuyang Cheng and
                  Ron J. Weiss and
                  Bhuvana Ramabhadran and
                  Pedro J. Moreno and
                  Quoc V. Le and
                  Daniel S. Park},
  title        = {{G-Augment}: Searching for the Meta-Structure of Data Augmentation Policies
                  for {ASR}},
  booktitle    = {{IEEE} Spoken Language Technology Workshop, {SLT} 2022, Doha, Qatar,
                  January 9-12, 2023},
  pages        = {23--30},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/SLT54892.2023.10022748},
  doi          = {10.1109/SLT54892.2023.10022748},
  timestamp    = {Mon, 06 Feb 2023 22:19:30 +0100},
  biburl       = {https://dblp.org/rec/conf/slt/WangCRCWRMLP22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% LaMDA, arXiv preprint 2201.08239.
% - "LaMDA" is brace-protected against sentence-casing styles.
% - The compound surname "Aguera y Arcas" is given in braced "Last, First" form;
%   unbraced, BibTeX reads the lowercase "y" as a von particle and "Arcas" as the surname.
% - "Quoc V. Le" is spelled as in the other entries of this file.
% - doi added in the same 10.48550/ARXIV.<id> form the sibling arXiv entries use.
@article{DBLP:journals/corr/abs-2201-08239,
  author       = {Romal Thoppilan and
                  Daniel De Freitas and
                  Jamie Hall and
                  Noam Shazeer and
                  Apoorv Kulshreshtha and
                  Heng{-}Tze Cheng and
                  Alicia Jin and
                  Taylor Bos and
                  Leslie Baker and
                  Yu Du and
                  YaGuang Li and
                  Hongrae Lee and
                  Huaixiu Steven Zheng and
                  Amin Ghafouri and
                  Marcelo Menegali and
                  Yanping Huang and
                  Maxim Krikun and
                  Dmitry Lepikhin and
                  James Qin and
                  Dehao Chen and
                  Yuanzhong Xu and
                  Zhifeng Chen and
                  Adam Roberts and
                  Maarten Bosma and
                  Yanqi Zhou and
                  Chung{-}Ching Chang and
                  Igor Krivokon and
                  Will Rusch and
                  Marc Pickett and
                  Kathleen S. Meier{-}Hellstern and
                  Meredith Ringel Morris and
                  Tulsee Doshi and
                  Renelito Delos Santos and
                  Toju Duke and
                  Johnny Soraker and
                  Ben Zevenbergen and
                  Vinodkumar Prabhakaran and
                  Mark Diaz and
                  Ben Hutchinson and
                  Kristen Olson and
                  Alejandra Molina and
                  Erin Hoffman{-}John and
                  Josh Lee and
                  Lora Aroyo and
                  Ravi Rajakumar and
                  Alena Butryna and
                  Matthew Lamm and
                  Viktoriya Kuzmina and
                  Joe Fenton and
                  Aaron Cohen and
                  Rachel Bernstein and
                  Ray Kurzweil and
                  {Ag{\"{u}}era y Arcas}, Blaise and
                  Claire Cui and
                  Marian Croak and
                  Ed H. Chi and
                  Quoc V. Le},
  title        = {{LaMDA}: Language Models for Dialog Applications},
  journal      = {CoRR},
  volume       = {abs/2201.08239},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.08239},
  doi          = {10.48550/ARXIV.2201.08239},
  eprinttype   = {arXiv},
  eprint       = {2201.08239},
  timestamp    = {Fri, 16 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-08239.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Chain-of-Thought prompting, arXiv preprint 2201.11903; the NeurIPS 2022 record is
% DBLP:conf/nips/Wei0SBIXCLZ22 in this file.
% "Quoc V. Le" is spelled as in the other entries; doi added in the same
% 10.48550/ARXIV.<id> form the sibling arXiv entries use.
@article{DBLP:journals/corr/abs-2201-11903,
  author       = {Jason Wei and
                  Xuezhi Wang and
                  Dale Schuurmans and
                  Maarten Bosma and
                  Ed H. Chi and
                  Quoc V. Le and
                  Denny Zhou},
  title        = {Chain of Thought Prompting Elicits Reasoning in Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2201.11903},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.11903},
  doi          = {10.48550/ARXIV.2201.11903},
  eprinttype   = {arXiv},
  eprint       = {2201.11903},
  timestamp    = {Fri, 22 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-11903.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Expert Choice routing, arXiv preprint 2202.09368; the NeurIPS 2022 record with the
% same title is DBLP:conf/nips/ZhouLLDHZDCLL22 in this file.
% "Quoc V. Le" is spelled as in that record; doi added in the same
% 10.48550/ARXIV.<id> form the sibling arXiv entries use.
@article{DBLP:journals/corr/abs-2202-09368,
  author       = {Yanqi Zhou and
                  Tao Lei and
                  Hanxiao Liu and
                  Nan Du and
                  Yanping Huang and
                  Vincent Y. Zhao and
                  Andrew M. Dai and
                  Zhifeng Chen and
                  Quoc V. Le and
                  James Laudon},
  title        = {Mixture-of-Experts with Expert Choice Routing},
  journal      = {CoRR},
  volume       = {abs/2202.09368},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.09368},
  doi          = {10.48550/ARXIV.2202.09368},
  eprinttype   = {arXiv},
  eprint       = {2202.09368},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-09368.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.10447; the ICML 2022 record with the same title is
% DBLP:conf/icml/HuaDLL22 in this file.
% doi added in the same 10.48550/ARXIV.<id> form the sibling arXiv entries use.
@article{DBLP:journals/corr/abs-2202-10447,
  author       = {Weizhe Hua and
                  Zihang Dai and
                  Hanxiao Liu and
                  Quoc V. Le},
  title        = {Transformer Quality in Linear Time},
  journal      = {CoRR},
  volume       = {abs/2202.10447},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.10447},
  doi          = {10.48550/ARXIV.2202.10447},
  eprinttype   = {arXiv},
  eprint       = {2202.10447},
  timestamp    = {Wed, 02 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-10447.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% DeepFusion, arXiv preprint 2203.08195; the CVPR 2022 record with the same title is
% DBLP:conf/cvpr/LiYMCNPSLZLYT22 in this file (this record additionally lists Bo Wu).
% "DeepFusion" and "3D" are brace-protected against sentence-casing styles.
@article{DBLP:journals/corr/abs-2203-08195,
  author       = {Yingwei Li and
                  Adams Wei Yu and
                  Tianjian Meng and
                  Benjamin Caine and
                  Jiquan Ngiam and
                  Daiyi Peng and
                  Junyang Shen and
                  Bo Wu and
                  Yifeng Lu and
                  Denny Zhou and
                  Quoc V. Le and
                  Alan L. Yuille and
                  Mingxing Tan},
  title        = {{DeepFusion}: Lidar-Camera Deep Fusion for Multi-Modal {3D} Object Detection},
  journal      = {CoRR},
  volume       = {abs/2203.08195},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.08195},
  doi          = {10.48550/ARXIV.2203.08195},
  eprinttype   = {arXiv},
  eprint       = {2203.08195},
  timestamp    = {Mon, 28 Mar 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-08195.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Self-Consistency, arXiv preprint 2203.11171.
@article{DBLP:journals/corr/abs-2203-11171,
  author       = {Xuezhi Wang and
                  Jason Wei and
                  Dale Schuurmans and
                  Quoc V. Le and
                  Ed H. Chi and
                  Denny Zhou},
  title        = {Self-Consistency Improves Chain of Thought Reasoning in Language Models},
  journal      = {CoRR},
  volume       = {abs/2203.11171},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.11171},
  doi          = {10.48550/ARXIV.2203.11171},
  eprinttype   = {arXiv},
  eprint       = {2203.11171},
  timestamp    = {Fri, 22 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-11171.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Multi-scale feature fusion for semantic segmentation, arXiv preprint 2203.12683.
@article{DBLP:journals/corr/abs-2203-12683,
  author       = {Tianjian Meng and
                  Golnaz Ghiasi and
                  Reza Mahjourian and
                  Quoc V. Le and
                  Mingxing Tan},
  title        = {Revisiting Multi-Scale Feature Fusion for Semantic Segmentation},
  journal      = {CoRR},
  volume       = {abs/2203.12683},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.12683},
  doi          = {10.48550/ARXIV.2203.12683},
  eprinttype   = {arXiv},
  eprint       = {2203.12683},
  timestamp    = {Tue, 29 Mar 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-12683.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Carbon footprint of ML training, arXiv preprint 2204.05149.
@article{DBLP:journals/corr/abs-2204-05149,
  author       = {David A. Patterson and
                  Joseph Gonzalez and
                  Urs H{\"{o}}lzle and
                  Quoc V. Le and
                  Chen Liang and
                  Lluis{-}Miquel Munguia and
                  Daniel Rothchild and
                  David R. So and
                  Maud Texier and
                  Jeff Dean},
  title        = {The Carbon Footprint of Machine Learning Training Will Plateau, Then
                  Shrink},
  journal      = {CoRR},
  volume       = {abs/2204.05149},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.05149},
  doi          = {10.48550/ARXIV.2204.05149},
  eprinttype   = {arXiv},
  eprint       = {2204.05149},
  timestamp    = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-05149.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.07615. Same author list as DBLP:conf/nips/YangBLKULLH22
% (TabNAS) in this file; presumably its preprint under an earlier title -- confirm.
@article{DBLP:journals/corr/abs-2204-07615,
  author       = {Chengrun Yang and
                  Gabriel Bender and
                  Hanxiao Liu and
                  Pieter{-}Jan Kindermans and
                  Madeleine Udell and
                  Yifeng Lu and
                  Quoc V. Le and
                  Da Huang},
  title        = {Resource-Constrained Neural Architecture Search on Tabular Datasets},
  journal      = {CoRR},
  volume       = {abs/2204.07615},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2204.07615},
  doi          = {10.48550/ARXIV.2204.07615},
  eprinttype   = {arXiv},
  eprint       = {2204.07615},
  timestamp    = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2204-07615.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Least-to-Most prompting, arXiv preprint 2205.10625.
% "Quoc V. Le" is spelled as in the other entries of this file so the author is
% not treated as two different people by sorting or grouping styles.
@article{DBLP:journals/corr/abs-2205-10625,
  author       = {Denny Zhou and
                  Nathanael Sch{\"{a}}rli and
                  Le Hou and
                  Jason Wei and
                  Nathan Scales and
                  Xuezhi Wang and
                  Dale Schuurmans and
                  Olivier Bousquet and
                  Quoc V. Le and
                  Ed H. Chi},
  title        = {Least-to-Most Prompting Enables Complex Reasoning in Large Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2205.10625},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.10625},
  doi          = {10.48550/ARXIV.2205.10625},
  eprinttype   = {arXiv},
  eprint       = {2205.10625},
  timestamp    = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-10625.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Rationale-augmented ensembles, arXiv preprint 2207.00747.
@article{DBLP:journals/corr/abs-2207-00747,
  author       = {Xuezhi Wang and
                  Jason Wei and
                  Dale Schuurmans and
                  Quoc V. Le and
                  Ed H. Chi and
                  Denny Zhou},
  title        = {Rationale-Augmented Ensembles in Language Models},
  journal      = {CoRR},
  volume       = {abs/2207.00747},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.00747},
  doi          = {10.48550/ARXIV.2207.00747},
  eprinttype   = {arXiv},
  eprint       = {2207.00747},
  timestamp    = {Wed, 06 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-00747.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% BIG-Bench Hard tasks, arXiv preprint 2210.09261.
% The benchmark name is brace-protected so sentence-casing styles do not print "big-bench".
@article{DBLP:journals/corr/abs-2210-09261,
  author       = {Mirac Suzgun and
                  Nathan Scales and
                  Nathanael Sch{\"{a}}rli and
                  Sebastian Gehrmann and
                  Yi Tay and
                  Hyung Won Chung and
                  Aakanksha Chowdhery and
                  Quoc V. Le and
                  Ed H. Chi and
                  Denny Zhou and
                  Jason Wei},
  title        = {Challenging {BIG-Bench} Tasks and Whether Chain-of-Thought Can Solve
                  Them},
  journal      = {CoRR},
  volume       = {abs/2210.09261},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.09261},
  doi          = {10.48550/ARXIV.2210.09261},
  eprinttype   = {arXiv},
  eprint       = {2210.09261},
  timestamp    = {Wed, 19 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-09261.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% G-Augment, arXiv preprint 2210.10879; the IEEE SLT 2022 record with the same
% title is DBLP:conf/slt/WangCRCWRMLP22 in this file.
% The method name is brace-protected so sentence-casing styles do not print "G-augment".
@article{DBLP:journals/corr/abs-2210-10879,
  author       = {Gary Wang and
                  Ekin D. Cubuk and
                  Andrew Rosenberg and
                  Shuyang Cheng and
                  Ron J. Weiss and
                  Bhuvana Ramabhadran and
                  Pedro J. Moreno and
                  Quoc V. Le and
                  Daniel S. Park},
  title        = {{G-Augment}: Searching for the Meta-Structure of Data Augmentation Policies
                  for {ASR}},
  journal      = {CoRR},
  volume       = {abs/2210.10879},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.10879},
  doi          = {10.48550/ARXIV.2210.10879},
  eprinttype   = {arXiv},
  eprint       = {2210.10879},
  timestamp    = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-10879.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Transcending scaling laws, arXiv preprint 2210.11399.
@article{DBLP:journals/corr/abs-2210-11399,
  author       = {Yi Tay and
                  Jason Wei and
                  Hyung Won Chung and
                  Vinh Q. Tran and
                  David R. So and
                  Siamak Shakeri and
                  Xavier Garcia and
                  Huaixiu Steven Zheng and
                  Jinfeng Rao and
                  Aakanksha Chowdhery and
                  Denny Zhou and
                  Donald Metzler and
                  Slav Petrov and
                  Neil Houlsby and
                  Quoc V. Le and
                  Mostafa Dehghani},
  title        = {Transcending Scaling Laws with 0.1{\%} Extra Compute},
  journal      = {CoRR},
  volume       = {abs/2210.11399},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.11399},
  doi          = {10.48550/ARXIV.2210.11399},
  eprinttype   = {arXiv},
  eprint       = {2210.11399},
  timestamp    = {Tue, 25 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-11399.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Scaling instruction-finetuned language models, arXiv preprint 2210.11416.
% "Adams Wei Yu" is spelled as in the other entries of this file so the author is
% not treated as two different people by sorting or grouping styles.
@article{DBLP:journals/corr/abs-2210-11416,
  author       = {Hyung Won Chung and
                  Le Hou and
                  Shayne Longpre and
                  Barret Zoph and
                  Yi Tay and
                  William Fedus and
                  Eric Li and
                  Xuezhi Wang and
                  Mostafa Dehghani and
                  Siddhartha Brahma and
                  Albert Webson and
                  Shixiang Shane Gu and
                  Zhuyun Dai and
                  Mirac Suzgun and
                  Xinyun Chen and
                  Aakanksha Chowdhery and
                  Sharan Narang and
                  Gaurav Mishra and
                  Adams Wei Yu and
                  Vincent Y. Zhao and
                  Yanping Huang and
                  Andrew M. Dai and
                  Hongkun Yu and
                  Slav Petrov and
                  Ed H. Chi and
                  Jeff Dean and
                  Jacob Devlin and
                  Adam Roberts and
                  Denny Zhou and
                  Quoc V. Le and
                  Jason Wei},
  title        = {Scaling Instruction-Finetuned Language Models},
  journal      = {CoRR},
  volume       = {abs/2210.11416},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.11416},
  doi          = {10.48550/ARXIV.2210.11416},
  eprinttype   = {arXiv},
  eprint       = {2210.11416},
  timestamp    = {Mon, 04 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-11416.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Inverse scaling, arXiv preprint 2211.02011.
% "U-shaped" is brace-protected so sentence-casing styles do not print "u-shaped".
@article{DBLP:journals/corr/abs-2211-02011,
  author       = {Jason Wei and
                  Yi Tay and
                  Quoc V. Le},
  title        = {Inverse scaling can become {U-shaped}},
  journal      = {CoRR},
  volume       = {abs/2211.02011},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.02011},
  doi          = {10.48550/ARXIV.2211.02011},
  eprinttype   = {arXiv},
  eprint       = {2211.02011},
  timestamp    = {Fri, 04 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-02011.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (Nat. 594(7862), 2021) on graph placement for chip design.
% Names are written in "Last, First" form; the parsed name parts are unchanged.
@article{DBLP:journals/nature/MirhoseiniGYJSW21,
  author       = {Mirhoseini, Azalia and
                  Goldie, Anna and
                  Yazgan, Mustafa and
                  Jiang, Joe Wenjie and
                  Songhori, Ebrahim M. and
                  Wang, Shen and
                  Lee, Young{-}Joon and
                  Johnson, Eric and
                  Pathak, Omkar and
                  Nazi, Azade and
                  Pak, Jiwoo and
                  Tong, Andy and
                  Srinivasa, Kavya and
                  Hang, William and
                  Tuncer, Emre and
                  Le, Quoc V. and
                  Laudon, James and
                  Ho, Richard and
                  Carpenter, Roger and
                  Dean, Jeff},
  title        = {A graph placement methodology for fast chip design},
  journal      = {Nat.},
  volume       = {594},
  number       = {7862},
  pages        = {207--212},
  year         = {2021},
  url          = {https://doi.org/10.1038/s41586-021-03544-w},
  doi          = {10.1038/S41586-021-03544-W},
  timestamp    = {Mon, 05 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nature/MirhoseiniGYJSW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AutoDropout, AAAI 2021 paper.
% The method name is brace-protected so sentence-casing styles do not print "Autodropout".
@inproceedings{DBLP:conf/aaai/PhamL21,
  author       = {Hieu Pham and
                  Quoc V. Le},
  title        = {{AutoDropout}: Learning Dropout Patterns to Regularize Deep Networks},
  booktitle    = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2021, Thirty-Third Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9,
                  2021},
  pages        = {9351--9359},
  publisher    = {{AAAI} Press},
  year         = {2021},
  url          = {https://doi.org/10.1609/aaai.v35i11.17127},
  doi          = {10.1609/AAAI.V35I11.17127},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaai/PhamL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2021 paper on copy-paste augmentation; url points at the CVF open-access
% page, doi at the IEEE record.
% Names are written in "Last, First" form; the parsed name parts are unchanged.
@inproceedings{DBLP:conf/cvpr/GhiasiCSQLCLZ21,
  author       = {Ghiasi, Golnaz and
                  Cui, Yin and
                  Srinivas, Aravind and
                  Qian, Rui and
                  Lin, Tsung{-}Yi and
                  Cubuk, Ekin D. and
                  Le, Quoc V. and
                  Zoph, Barret},
  title        = {Simple Copy-Paste Is a Strong Data Augmentation Method for Instance
                  Segmentation},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2021, virtual, June 19-25, 2021},
  pages        = {2918--2928},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2021},
  url          = {https://openaccess.thecvf.com/content/CVPR2021/html/Ghiasi\_Simple\_Copy-Paste\_Is\_a\_Strong\_Data\_Augmentation\_Method\_for\_Instance\_CVPR\_2021\_paper.html},
  doi          = {10.1109/CVPR46437.2021.00294},
  timestamp    = {Mon, 18 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/GhiasiCSQLCLZ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2021 paper on model families for datacenter accelerators; url points at the
% CVF open-access page, doi at the IEEE record.
% Names are written in "Last, First" form; the parsed name parts are unchanged.
@inproceedings{DBLP:conf/cvpr/0007TPLCLJ21,
  author       = {Li, Sheng and
                  Tan, Mingxing and
                  Pang, Ruoming and
                  Li, Andrew and
                  Cheng, Liqun and
                  Le, Quoc V. and
                  Jouppi, Norman P.},
  title        = {Searching for Fast Model Families on Datacenter Accelerators},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2021, virtual, June 19-25, 2021},
  pages        = {8085--8095},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2021},
  url          = {https://openaccess.thecvf.com/content/CVPR2021/html/Li\_Searching\_for\_Fast\_Model\_Families\_on\_Datacenter\_Accelerators\_CVPR\_2021\_paper.html},
  doi          = {10.1109/CVPR46437.2021.00799},
  timestamp    = {Mon, 18 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/0007TPLCLJ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Meta Pseudo Labels, CVPR 2021 paper; url points at the CVF open-access page,
% doi at the IEEE record.
% Names are written in "Last, First" form; the parsed name parts are unchanged.
@inproceedings{DBLP:conf/cvpr/PhamDXL21,
  author       = {Pham, Hieu and
                  Dai, Zihang and
                  Xie, Qizhe and
                  Le, Quoc V.},
  title        = {Meta Pseudo Labels},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2021, virtual, June 19-25, 2021},
  pages        = {11557--11568},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2021},
  url          = {https://openaccess.thecvf.com/content/CVPR2021/html/Pham\_Meta\_Pseudo\_Labels\_CVPR\_2021\_paper.html},
  doi          = {10.1109/CVPR46437.2021.01139},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/PhamDXL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/VuLLSI21,
  author       = {Tu Vu and
                  Minh{-}Thang Luong and
                  Quoc V. Le and
                  Grady Simon and
                  Mohit Iyyer},
  editor       = {Marie{-}Francine Moens and
                  Xuanjing Huang and
                  Lucia Specia and
                  Scott Wen{-}tau Yih},
  title        = {{STraTA}: Self-Training with Task Augmentation for Better Few-shot Learning},
  booktitle    = {Proceedings of the 2021 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican
                  Republic, 7-11 November, 2021},
  pages        = {5715--5731},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.emnlp-main.462},
  doi          = {10.18653/V1/2021.EMNLP-MAIN.462},
  timestamp    = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/VuLLSI21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccv/GhiasiZCLL21,
  author       = {Ghiasi, Golnaz and
                  Zoph, Barret and
                  Cubuk, Ekin D. and
                  Le, Quoc V. and
                  Lin, Tsung{-}Yi},
  title        = {Multi-Task Self-Training for Learning General Representations},
  booktitle    = {2021 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                  2021, Montreal, QC, Canada, October 10-17, 2021},
  pages        = {8836--8845},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICCV48922.2021.00873},
  doi          = {10.1109/ICCV48922.2021.00873},
  timestamp    = {Fri, 11 Mar 2022 10:01:27 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/GhiasiZCLL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/Co-ReyesMPRLLLF21,
  author       = {Co{-}Reyes, John D. and
                  Miao, Yingjie and
                  Peng, Daiyi and
                  Real, Esteban and
                  Le, Quoc V. and
                  Levine, Sergey and
                  Lee, Honglak and
                  Faust, Aleksandra},
  title        = {Evolving Reinforcement Learning Algorithms},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=0XXpJ4OtjW},
  timestamp    = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Co-ReyesMPRLLLF21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/JiaYXCPPLSLD21,
  author       = {Jia, Chao and
                  Yang, Yinfei and
                  Xia, Ye and
                  Chen, Yi{-}Ting and
                  Parekh, Zarana and
                  Pham, Hieu and
                  Le, Quoc V. and
                  Sung, Yun{-}Hsuan and
                  Li, Zhen and
                  Duerig, Tom},
  editor       = {Meila, Marina and
                  Zhang, Tong},
  title        = {Scaling Up Visual and Vision-Language Representation Learning With
                  Noisy Text Supervision},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {4904--4916},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {http://proceedings.mlr.press/v139/jia21b.html},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/JiaYXCPPLSLD21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/TanL21,
  author       = {Mingxing Tan and
                  Quoc V. Le},
  editor       = {Marina Meila and
                  Tong Zhang},
  title        = {{EfficientNetV2}: Smaller Models and Faster Training},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {10096--10106},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {http://proceedings.mlr.press/v139/tan21a.html},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/TanL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/VermaLKPL21,
  author       = {Verma, Vikas and
                  Luong, Thang and
                  Kawaguchi, Kenji and
                  Pham, Hieu and
                  Le, Quoc V.},
  editor       = {Meila, Marina and
                  Zhang, Tong},
  title        = {Towards Domain-Agnostic Contrastive Learning},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {10530--10541},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {http://proceedings.mlr.press/v139/verma21a.html},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/VermaLKPL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ipps/WongpanichPDTLY21,
  author       = {Arissa Wongpanich and
                  Hieu Pham and
                  James Demmel and
                  Mingxing Tan and
                  Quoc V. Le and
                  Yang You and
                  Sameer Kumar},
  title        = {Training {EfficientNets} at Supercomputer Scale: 83{\%} {ImageNet} Top-1
                  Accuracy in One Hour},
  booktitle    = {{IEEE} International Parallel and Distributed Processing Symposium
                  Workshops, {IPDPS} Workshops 2021, Portland, OR, USA, June 17-21,
                  2021},
  pages        = {947--950},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/IPDPSW52791.2021.00146},
  doi          = {10.1109/IPDPSW52791.2021.00146},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ipps/WongpanichPDTLY21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DaiLLT21,
  author       = {Zihang Dai and
                  Hanxiao Liu and
                  Quoc V. Le and
                  Mingxing Tan},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {{CoAtNet}: Marrying Convolution and Attention for All Data Sizes},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  pages        = {3965--3977},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/20568692db622456cc42a2e853ca21f8-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/DaiLLT21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SoMLDSL21,
  author       = {So, David R. and
                  Manke, Wojciech and
                  Liu, Hanxiao and
                  Dai, Zihang and
                  Shazeer, Noam and
                  Le, Quoc V.},
  editor       = {Ranzato, Marc'Aurelio and
                  Beygelzimer, Alina and
                  Dauphin, Yann N. and
                  Liang, Percy and
                  Vaughan, Jennifer Wortman},
  title        = {Searching for Efficient Transformers for Language Modeling},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  pages        = {6010--6022},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/2f3c6a4cd8af177f6456e7e51a916ff3-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/SoMLDSL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LiuDSL21,
  author       = {Hanxiao Liu and
                  Zihang Dai and
                  David R. So and
                  Quoc V. Le},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Pay Attention to {MLPs}},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  pages        = {9204--9215},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/4cc05b35c2f937c5bd9e7d41d3686fff-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/LiuDSL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2101-01761,
  author       = {Hieu Pham and
                  Quoc V. Le},
  title        = {{AutoDropout}: Learning Dropout Patterns to Regularize Deep Networks},
  journal      = {CoRR},
  volume       = {abs/2101.01761},
  year         = {2021},
  url          = {https://arxiv.org/abs/2101.01761},
  eprinttype   = {arXiv},
  eprint       = {2101.01761},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2101-01761.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2101-03958,
  author       = {Co{-}Reyes, John D. and
                  Miao, Yingjie and
                  Peng, Daiyi and
                  Real, Esteban and
                  Levine, Sergey and
                  Le, Quoc V. and
                  Lee, Honglak and
                  Faust, Aleksandra},
  title        = {Evolving Reinforcement Learning Algorithms},
  journal      = {CoRR},
  volume       = {abs/2101.03958},
  year         = {2021},
  url          = {https://arxiv.org/abs/2101.03958},
  eprinttype   = {arXiv},
  eprint       = {2101.03958},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2101-03958.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2101-08809,
  author       = {Daiyi Peng and
                  Xuanyi Dong and
                  Esteban Real and
                  Mingxing Tan and
                  Yifeng Lu and
                  Hanxiao Liu and
                  Gabriel Bender and
                  Adam Kraft and
                  Chen Liang and
                  Quoc V. Le},
  title        = {{PyGlove}: Symbolic Programming for Automated Machine Learning},
  journal      = {CoRR},
  volume       = {abs/2101.08809},
  year         = {2021},
  url          = {https://arxiv.org/abs/2101.08809},
  eprinttype   = {arXiv},
  eprint       = {2101.08809},
  timestamp    = {Sat, 30 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2101-08809.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-05610,
  author       = {Li, Sheng and
                  Tan, Mingxing and
                  Pang, Ruoming and
                  Li, Andrew and
                  Cheng, Liqun and
                  Le, Quoc V. and
                  Jouppi, Norman P.},
  title        = {Searching for Fast Model Families on Datacenter Accelerators},
  journal      = {CoRR},
  volume       = {abs/2102.05610},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.05610},
  eprinttype   = {arXiv},
  eprint       = {2102.05610},
  timestamp    = {Thu, 18 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-05610.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-05918,
  author       = {Jia, Chao and
                  Yang, Yinfei and
                  Xia, Ye and
                  Chen, Yi{-}Ting and
                  Parekh, Zarana and
                  Pham, Hieu and
                  Le, Quoc V. and
                  Sung, Yun{-}Hsuan and
                  Li, Zhen and
                  Duerig, Tom},
  title        = {Scaling Up Visual and Vision-Language Representation Learning With
                  Noisy Text Supervision},
  journal      = {CoRR},
  volume       = {abs/2102.05918},
  year         = {2021},
  url          = {https://arxiv.org/abs/2102.05918},
  eprinttype   = {arXiv},
  eprint       = {2102.05918},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2102-05918.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-00298,
  author       = {Mingxing Tan and
                  Quoc V. Le},
  title        = {{EfficientNetV2}: Smaller Models and Faster Training},
  journal      = {CoRR},
  volume       = {abs/2104.00298},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.00298},
  eprinttype   = {arXiv},
  eprint       = {2104.00298},
  timestamp    = {Mon, 12 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-00298.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-02133,
  author       = {William Chan and
                  Daniel S. Park and
                  Chris A. Lee and
                  Yu Zhang and
                  Quoc V. Le and
                  Mohammad Norouzi},
  title        = {{SpeechStew}: Simply Mix All Available Speech Recognition Data to Train
                  One Large Neural Network},
  journal      = {CoRR},
  volume       = {abs/2104.02133},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.02133},
  eprinttype   = {arXiv},
  eprint       = {2104.02133},
  timestamp    = {Tue, 16 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-02133.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2104-10350,
  author       = {Patterson, David A. and
                  Gonzalez, Joseph and
                  Le, Quoc V. and
                  Liang, Chen and
                  Munguia, Lluis{-}Miquel and
                  Rothchild, Daniel and
                  So, David R. and
                  Texier, Maud and
                  Dean, Jeff},
  title        = {Carbon Emissions and Large Neural Network Training},
  journal      = {CoRR},
  volume       = {abs/2104.10350},
  year         = {2021},
  url          = {https://arxiv.org/abs/2104.10350},
  eprinttype   = {arXiv},
  eprint       = {2104.10350},
  timestamp    = {Thu, 13 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2104-10350.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-08050,
  author       = {Hanxiao Liu and
                  Zihang Dai and
                  David R. So and
                  Quoc V. Le},
  title        = {Pay Attention to {MLPs}},
  journal      = {CoRR},
  volume       = {abs/2105.08050},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.08050},
  eprinttype   = {arXiv},
  eprint       = {2105.08050},
  timestamp    = {Tue, 18 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-08050.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-12842,
  author       = {Zhang, Dan and
                  Huda, Safeen and
                  Songhori, Ebrahim M. and
                  Le, Quoc V. and
                  Goldie, Anna and
                  Mirhoseini, Azalia},
  title        = {A Full-stack Accelerator Search Technique for Vision Applications},
  journal      = {CoRR},
  volume       = {abs/2105.12842},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.12842},
  eprinttype   = {arXiv},
  eprint       = {2105.12842},
  timestamp    = {Fri, 23 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-12842.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-04803,
  author       = {Zihang Dai and
                  Hanxiao Liu and
                  Quoc V. Le and
                  Mingxing Tan},
  title        = {{CoAtNet}: Marrying Convolution and Attention for All Data Sizes},
  journal      = {CoRR},
  volume       = {abs/2106.04803},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.04803},
  eprinttype   = {arXiv},
  eprint       = {2106.04803},
  timestamp    = {Tue, 15 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-04803.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2108-07732,
  author       = {Austin, Jacob and
                  Odena, Augustus and
                  Nye, Maxwell I. and
                  Bosma, Maarten and
                  Michalewski, Henryk and
                  Dohan, David and
                  Jiang, Ellen and
                  Cai, Carrie J. and
                  Terry, Michael and
                  Le, Quoc V. and
                  Sutton, Charles},
  title        = {Program Synthesis with Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2108.07732},
  year         = {2021},
  url          = {https://arxiv.org/abs/2108.07732},
  eprinttype   = {arXiv},
  eprint       = {2108.07732},
  timestamp    = {Fri, 29 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2108-07732.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2108-11353,
  author       = {Ghiasi, Golnaz and
                  Zoph, Barret and
                  Cubuk, Ekin D. and
                  Le, Quoc V. and
                  Lin, Tsung{-}Yi},
  title        = {Multi-Task Self-Training for Learning General Representations},
  journal      = {CoRR},
  volume       = {abs/2108.11353},
  year         = {2021},
  url          = {https://arxiv.org/abs/2108.11353},
  eprinttype   = {arXiv},
  eprint       = {2108.11353},
  timestamp    = {Fri, 27 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2108-11353.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-01652,
  author       = {Wei, Jason and
                  Bosma, Maarten and
                  Zhao, Vincent Y. and
                  Guu, Kelvin and
                  Yu, Adams Wei and
                  Lester, Brian and
                  Du, Nan and
                  Dai, Andrew M. and
                  Le, Quoc V.},
  title        = {Finetuned Language Models Are Zero-Shot Learners},
  journal      = {CoRR},
  volume       = {abs/2109.01652},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.01652},
  eprinttype   = {arXiv},
  eprint       = {2109.01652},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-01652.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-06270,
  author       = {Tu Vu and
                  Minh{-}Thang Luong and
                  Quoc V. Le and
                  Grady Simon and
                  Mohit Iyyer},
  title        = {{STraTA}: Self-Training with Task Augmentation for Better Few-shot Learning},
  journal      = {CoRR},
  volume       = {abs/2109.06270},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.06270},
  eprinttype   = {arXiv},
  eprint       = {2109.06270},
  timestamp    = {Tue, 21 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-06270.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-08668,
  author       = {So, David R. and
                  Manke, Wojciech and
                  Liu, Hanxiao and
                  Dai, Zihang and
                  Shazeer, Noam and
                  Le, Quoc V.},
  title        = {Primer: Searching for Efficient Transformers for Language Modeling},
  journal      = {CoRR},
  volume       = {abs/2109.08668},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.08668},
  eprinttype   = {arXiv},
  eprint       = {2109.08668},
  timestamp    = {Wed, 22 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-08668.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-13226,
  author       = {Yu Zhang and
                  Daniel S. Park and
                  Wei Han and
                  James Qin and
                  Anmol Gulati and
                  Joel Shor and
                  Aren Jansen and
                  Yuanzhong Xu and
                  Yanping Huang and
                  Shibo Wang and
                  Zongwei Zhou and
                  Bo Li and
                  Min Ma and
                  William Chan and
                  Jiahui Yu and
                  Yongqiang Wang and
                  Liangliang Cao and
                  Khe Chai Sim and
                  Bhuvana Ramabhadran and
                  Tara N. Sainath and
                  Fran{\c{c}}oise Beaufays and
                  Zhifeng Chen and
                  Quoc V. Le and
                  Chung{-}Cheng Chiu and
                  Ruoming Pang and
                  Yonghui Wu},
  title        = {{BigSSL}: Exploring the Frontier of Large-Scale Semi-Supervised Learning
                  for Automatic Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/2109.13226},
  year         = {2021},
  url          = {https://arxiv.org/abs/2109.13226},
  eprinttype   = {arXiv},
  eprint       = {2109.13226},
  timestamp    = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2109-13226.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2111-10050,
  author       = {Pham, Hieu and
                  Dai, Zihang and
                  Ghiasi, Golnaz and
                  Liu, Hanxiao and
                  Yu, Adams Wei and
                  Luong, Minh{-}Thang and
                  Tan, Mingxing and
                  Le, Quoc V.},
  title        = {Combined Scaling for Zero-shot Transfer Learning},
  journal      = {CoRR},
  volume       = {abs/2111.10050},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.10050},
  eprinttype   = {arXiv},
  eprint       = {2111.10050},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-10050.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-06905,
  author       = {Nan Du and
                  Yanping Huang and
                  Andrew M. Dai and
                  Simon Tong and
                  Dmitry Lepikhin and
                  Yuanzhong Xu and
                  Maxim Krikun and
                  Yanqi Zhou and
                  Adams Wei Yu and
                  Orhan Firat and
                  Barret Zoph and
                  Liam Fedus and
                  Maarten Bosma and
                  Zongwei Zhou and
                  Tao Wang and
                  Yu Emma Wang and
                  Kellie Webster and
                  Marie Pellat and
                  Kevin Robinson and
                  Kathy Meier{-}Hellstern and
                  Toju Duke and
                  Lucas Dixon and
                  Kun Zhang and
                  Quoc V. Le and
                  Yonghui Wu and
                  Zhifeng Chen and
                  Claire Cui},
  title        = {{GLaM}: Efficient Scaling of Language Models with Mixture-of-Experts},
  journal      = {CoRR},
  volume       = {abs/2112.06905},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.06905},
  eprinttype   = {arXiv},
  eprint       = {2112.06905},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-06905.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/XieTGWYL20,
  author       = {Xie, Cihang and
                  Tan, Mingxing and
                  Gong, Boqing and
                  Wang, Jiang and
                  Yuille, Alan L. and
                  Le, Quoc V.},
  title        = {Adversarial Examples Improve Image Recognition},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages        = {816--825},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Xie\_Adversarial\_Examples\_Improve\_Image\_Recognition\_CVPR\_2020\_paper.html},
  doi          = {10.1109/CVPR42600.2020.00090},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/XieTGWYL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/CubukZSL20,
  author       = {Cubuk, Ekin D. and
                  Zoph, Barret and
                  Shlens, Jonathon and
                  Le, Quoc V.},
  title        = {Randaugment: Practical automated data augmentation with a reduced
                  search space},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} Workshops 2020, Seattle, WA, USA, June 14-19, 2020},
  pages        = {3008--3017},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPRW\_2020/html/w40/Cubuk\_Randaugment\_Practical\_Automated\_Data\_Augmentation\_With\_a\_Reduced\_Search\_Space\_CVPRW\_2020\_paper.html},
  doi          = {10.1109/CVPRW50498.2020.00359},
  timestamp    = {Tue, 31 Aug 2021 14:00:09 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/CubukZSL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/XieLHL20,
  author       = {Qizhe Xie and
                  Minh{-}Thang Luong and
                  Eduard H. Hovy and
                  Quoc V. Le},
  title        = {Self-Training With {Noisy Student} Improves {ImageNet} Classification},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages        = {10684--10695},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Xie\_Self-Training\_With\_Noisy\_Student\_Improves\_ImageNet\_Classification\_CVPR\_2020\_paper.html},
  doi          = {10.1109/CVPR42600.2020.01070},
  timestamp    = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/XieLHL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/TanPL20,
  author       = {Mingxing Tan and
                  Ruoming Pang and
                  Quoc V. Le},
  title        = {{EfficientDet}: Scalable and Efficient Object Detection},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages        = {10778--10787},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Tan\_EfficientDet\_Scalable\_and\_Efficient\_Object\_Detection\_CVPR\_2020\_paper.html},
  doi          = {10.1109/CVPR42600.2020.01079},
  timestamp    = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/TanPL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/DuLJGTCLS20,
  author       = {Xianzhi Du and
                  Tsung{-}Yi Lin and
                  Pengchong Jin and
                  Golnaz Ghiasi and
                  Mingxing Tan and
                  Yin Cui and
                  Quoc V. Le and
                  Xiaodan Song},
  title        = {{SpineNet}: Learning Scale-Permuted Backbone for Recognition and Localization},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages        = {11589--11598},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Du\_SpineNet\_Learning\_Scale-Permuted\_Backbone\_for\_Recognition\_and\_Localization\_CVPR\_2020\_paper.html},
  doi          = {10.1109/CVPR42600.2020.01161},
  timestamp    = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/DuLJGTCLS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/ChenGLLKAL20,
  author       = {Bo Chen and
                  Golnaz Ghiasi and
                  Hanxiao Liu and
                  Tsung{-}Yi Lin and
                  Dmitry Kalenichenko and
                  Hartwig Adam and
                  Quoc V. Le},
  title        = {{MnasFPN}: Learning Latency-Aware Pyramid Architecture for Object Detection
                  on Mobile Devices},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages        = {13604--13613},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Chen\_MnasFPN\_Learning\_Latency-Aware\_Pyramid\_Architecture\_for\_Object\_Detection\_on\_Mobile\_CVPR\_2020\_paper.html},
  doi          = {10.1109/CVPR42600.2020.01362},
  timestamp    = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/ChenGLLKAL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2020 conference paper. The system name in the title is braced so
% sentence-casing styles keep its capitals; the url is stored raw, without TeX escapes.
@inproceedings{DBLP:conf/cvpr/BenderLCCCKL20,
  author       = {Gabriel Bender and
                  Hanxiao Liu and
                  Bo Chen and
                  Grace Chu and
                  Shuyang Cheng and
                  Pieter{-}Jan Kindermans and
                  Quoc V. Le},
  title        = {Can Weight Sharing Outperform Random Architecture Search? An Investigation
                  With {TuNAS}},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages        = {14311--14320},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content_CVPR_2020/html/Bender_Can_Weight_Sharing_Outperform_Random_Architecture_Search_An_Investigation_With_CVPR_2020_paper.html},
  doi          = {10.1109/CVPR42600.2020.01433},
  timestamp    = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/BenderLCCCKL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 conference paper (LNCS volume 12366). "3D" is braced against title
% recasing, and the doi/url are stored raw, without TeX escapes.
@inproceedings{DBLP:conf/eccv/ChengLCZBNSCVLL20,
  author       = {Shuyang Cheng and
                  Zhaoqi Leng and
                  Ekin Dogus Cubuk and
                  Barret Zoph and
                  Chunyan Bai and
                  Jiquan Ngiam and
                  Yang Song and
                  Benjamin Caine and
                  Vijay Vasudevan and
                  Congcong Li and
                  Quoc V. Le and
                  Jonathon Shlens and
                  Dragomir Anguelov},
  editor       = {Andrea Vedaldi and
                  Horst Bischof and
                  Thomas Brox and
                  Jan{-}Michael Frahm},
  title        = {Improving {3D} Object Detection Through Progressive Population Based
                  Augmentation},
  booktitle    = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow,
                  UK, August 23-28, 2020, Proceedings, Part {XXI}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12366},
  pages        = {279--294},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-58589-1_17},
  doi          = {10.1007/978-3-030-58589-1_17},
  timestamp    = {Thu, 12 Nov 2020 17:00:57 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/ChengLCZBNSCVLL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 conference paper (LNCS volume 12372). The second author's given names are
% spelled out as in the other records of this file; doi/url are stored raw.
@inproceedings{DBLP:conf/eccv/ZophCGLSL20,
  author       = {Barret Zoph and
                  Ekin Dogus Cubuk and
                  Golnaz Ghiasi and
                  Tsung{-}Yi Lin and
                  Jonathon Shlens and
                  Quoc V. Le},
  editor       = {Andrea Vedaldi and
                  Horst Bischof and
                  Thomas Brox and
                  Jan{-}Michael Frahm},
  title        = {Learning Data Augmentation Strategies for Object Detection},
  booktitle    = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow,
                  UK, August 23-28, 2020, Proceedings, Part {XXVII}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12372},
  pages        = {566--583},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-58583-9_34},
  doi          = {10.1007/978-3-030-58583-9_34},
  timestamp    = {Mon, 23 Nov 2020 08:37:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/ZophCGLSL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 conference paper (LNCS volume 12368). The doi and url are stored raw,
% without TeX escapes, so verbatim-field consumers resolve them correctly.
@inproceedings{DBLP:conf/eccv/DuLJCTLS20,
  author       = {Xianzhi Du and
                  Tsung{-}Yi Lin and
                  Pengchong Jin and
                  Yin Cui and
                  Mingxing Tan and
                  Quoc V. Le and
                  Xiaodan Song},
  editor       = {Andrea Vedaldi and
                  Horst Bischof and
                  Thomas Brox and
                  Jan{-}Michael Frahm},
  title        = {Efficient Scale-Permuted Backbone with Learned Resource Distribution},
  booktitle    = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow,
                  UK, August 23-28, 2020, Proceedings, Part {XXIII}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12368},
  pages        = {572--586},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-58592-1_34},
  doi          = {10.1007/978-3-030-58592-1_34},
  timestamp    = {Tue, 03 Nov 2020 17:25:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/DuLJCTLS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 conference paper (LNCS volume 12352). The last author is spelled as in the
% arXiv record of the same title, the model name is braced against title recasing,
% and the doi/url are stored raw.
@inproceedings{DBLP:conf/eccv/YuJLBKTHSPL20,
  author       = {Jiahui Yu and
                  Pengchong Jin and
                  Hanxiao Liu and
                  Gabriel Bender and
                  Pieter{-}Jan Kindermans and
                  Mingxing Tan and
                  Thomas S. Huang and
                  Xiaodan Song and
                  Ruoming Pang and
                  Quoc V. Le},
  editor       = {Andrea Vedaldi and
                  Horst Bischof and
                  Thomas Brox and
                  Jan{-}Michael Frahm},
  title        = {{BigNAS}: Scaling up Neural Architecture Search with Big Single-Stage
                  Models},
  booktitle    = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow,
                  UK, August 23-28, 2020, Proceedings, Part {VII}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12352},
  pages        = {702--717},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-58571-6_41},
  doi          = {10.1007/978-3-030-58571-6_41},
  timestamp    = {Thu, 03 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/YuJLBKTHSPL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2020 conference paper; author and editor names use the "Last, First" form.
@inproceedings{DBLP:conf/emnlp/ClarkLLM20,
  author       = {Clark, Kevin and
                  Luong, Minh{-}Thang and
                  Le, Quoc V. and
                  Manning, Christopher D.},
  editor       = {Webber, Bonnie and
                  Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Pre-Training Transformers as Energy-Based Cloze Models},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages        = {285--294},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.20},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.20},
  timestamp    = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/ClarkLLM20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 conference paper. The method name in the title is braced so
% sentence-casing styles keep its capitals.
% NOTE(review): the camel-case spelling follows the method's usual name - confirm against the paper.
@inproceedings{DBLP:conf/icassp/ParkZCCLCLW20,
  author       = {Daniel S. Park and
                  Yu Zhang and
                  Chung{-}Cheng Chiu and
                  Youzheng Chen and
                  Bo Li and
                  William Chan and
                  Quoc V. Le and
                  Yonghui Wu},
  title        = {{SpecAugment} on Large Scale Datasets},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {6879--6883},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9053205},
  doi          = {10.1109/ICASSP40776.2020.9053205},
  timestamp    = {Thu, 26 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/ParkZCCLCLW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper (OpenReview); author names use the "Last, First" form.
@inproceedings{DBLP:conf/iclr/ChenLYZSL20,
  author       = {Chen, Xinyun and
                  Liang, Chen and
                  Yu, Adams Wei and
                  Zhou, Denny and
                  Song, Dawn and
                  Le, Quoc V.},
  title        = {Neural Symbolic Reader: Scalable Integration of Distributed and Symbolic Representations for Reading Comprehension},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=ryxjnREFwH},
  timestamp    = {Thu, 07 May 2020 17:11:47 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ChenLYZSL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper (OpenReview); author names use the "Last, First" form.
@inproceedings{DBLP:conf/iclr/ClarkLLM20,
  author       = {Clark, Kevin and
                  Luong, Minh{-}Thang and
                  Le, Quoc V. and
                  Manning, Christopher D.},
  title        = {{ELECTRA:} Pre-training Text Encoders as Discriminators Rather Than Generators},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=r1xMH1BtvB},
  timestamp    = {Thu, 07 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ClarkLLM20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 conference paper (PMLR volume 119). The system name in the title is braced
% so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/icml/RealLSL20,
  author       = {Esteban Real and
                  Chen Liang and
                  David R. So and
                  Quoc V. Le},
  title        = {{AutoML-Zero}: Evolving Machine Learning Algorithms From Scratch},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {8007--8019},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v119/real20a.html},
  timestamp    = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/RealLSL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 conference paper (PMLR volume 119); author names use the "Last, First" form.
@inproceedings{DBLP:conf/icml/ZhouYCMTSLLS20,
  author       = {Zhou, Denny and
                  Ye, Mao and
                  Chen, Chen and
                  Meng, Tianjian and
                  Tan, Mingxing and
                  Song, Xiaodan and
                  Le, Quoc V. and
                  Liu, Qiang and
                  Schuurmans, Dale},
  title        = {Go Wide, Then Narrow: Efficient Training of Deep Thin Networks},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {11546--11555},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v119/zhou20f.html},
  timestamp    = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/ZhouYCMTSLLS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 conference paper; author and editor names use the "Last, First" form.
@inproceedings{DBLP:conf/interspeech/ParkZJHCLWL20,
  author       = {Park, Daniel S. and
                  Zhang, Yu and
                  Jia, Ye and
                  Han, Wei and
                  Chiu, Chung{-}Cheng and
                  Li, Bo and
                  Wu, Yonghui and
                  Le, Quoc V.},
  editor       = {Meng, Helen and
                  Xu, Bo and
                  Zheng, Thomas Fang},
  title        = {Improved Noisy Student Training for Automatic Speech Recognition},
  booktitle    = {Interspeech 2020, 21st Annual Conference of the International Speech
                  Communication Association, Virtual Event, Shanghai, China, 25-29 October
                  2020},
  pages        = {2817--2821},
  publisher    = {{ISCA}},
  year         = {2020},
  url          = {https://doi.org/10.21437/Interspeech.2020-1470},
  doi          = {10.21437/INTERSPEECH.2020-1470},
  timestamp    = {Tue, 09 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/ParkZJHCLWL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% KDD 2020 conference paper; author and editor names use the "Last, First" form.
@inproceedings{DBLP:conf/kdd/JoglekarLCXWAKL20,
  author       = {Joglekar, Manas R. and
                  Li, Cong and
                  Chen, Mei and
                  Xu, Taibai and
                  Wang, Xiaoming and
                  Adams, Jay K. and
                  Khaitan, Pranav and
                  Liu, Jiahui and
                  Le, Quoc V.},
  editor       = {Gupta, Rajesh and
                  Liu, Yan and
                  Tang, Jiliang and
                  Prakash, B. Aditya},
  title        = {Neural Input Search for Large Scale Recommendation Models},
  booktitle    = {{KDD} '20: The 26th {ACM} {SIGKDD} Conference on Knowledge Discovery
                  and Data Mining, Virtual Event, CA, USA, August 23-27, 2020},
  pages        = {2387--2397},
  publisher    = {{ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1145/3394486.3403288},
  doi          = {10.1145/3394486.3403288},
  timestamp    = {Tue, 09 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/kdd/JoglekarLCXWAKL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The last author is spelled as in the rest of this
% file; the method name and the venue acronym are braced against recasing.
@inproceedings{DBLP:conf/nips/CubukZS020,
  author       = {Ekin Dogus Cubuk and
                  Barret Zoph and
                  Jonathon Shlens and
                  Quoc V. Le},
  editor       = {Hugo Larochelle and
                  Marc'Aurelio Ranzato and
                  Raia Hadsell and
                  Maria{-}Florina Balcan and
                  Hsuan{-}Tien Lin},
  title        = {{RandAugment}: Practical Automated Data Augmentation with a Reduced
                  Search Space},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/d85b63ef0ccb114d0a3bb7b7d808028f-Abstract.html},
  timestamp    = {Mon, 02 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/CubukZS020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The last author is spelled as in the arXiv record of
% the same title; the model name and the venue acronym are braced against recasing.
@inproceedings{DBLP:conf/nips/DaiLY020,
  author       = {Zihang Dai and
                  Guokun Lai and
                  Yiming Yang and
                  Quoc V. Le},
  editor       = {Hugo Larochelle and
                  Marc'Aurelio Ranzato and
                  Raia Hadsell and
                  Maria{-}Florina Balcan and
                  Hsuan{-}Tien Lin},
  title        = {{Funnel-Transformer}: Filtering out Sequential Redundancy for Efficient
                  Language Processing},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/2cd2915e69546904e4e5d4a2ac9e1652-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DaiLY020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The second and last authors are spelled as in the
% arXiv record of the same title (DBLP:journals/corr/abs-2004-02967); the venue
% acronym is braced like the other booktitles in this file.
@inproceedings{DBLP:conf/nips/LiuBS020,
  author       = {Hanxiao Liu and
                  Andrew Brock and
                  Karen Simonyan and
                  Quoc V. Le},
  editor       = {Hugo Larochelle and
                  Marc'Aurelio Ranzato and
                  Raia Hadsell and
                  Maria{-}Florina Balcan and
                  Hsuan{-}Tien Lin},
  title        = {Evolving Normalization-Activation Layers},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/9d4c03631b8b0c85ae08bf05eda37d0f-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/LiuBS020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The last author is spelled as in the rest of this
% file; the library name and the venue acronym are braced against recasing.
@inproceedings{DBLP:conf/nips/PengDRTLBLKL020,
  author       = {Daiyi Peng and
                  Xuanyi Dong and
                  Esteban Real and
                  Mingxing Tan and
                  Yifeng Lu and
                  Gabriel Bender and
                  Hanxiao Liu and
                  Adam Kraft and
                  Chen Liang and
                  Quoc V. Le},
  editor       = {Hugo Larochelle and
                  Marc'Aurelio Ranzato and
                  Raia Hadsell and
                  Maria{-}Florina Balcan and
                  Hsuan{-}Tien Lin},
  title        = {{PyGlove}: Symbolic Programming for Automated Machine Learning},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/012a91467f210472fab4e11359bbfef6-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/PengDRTLBLKL020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The last author is spelled as in the rest of this
% file; the venue acronym is braced like the other booktitles in this file.
@inproceedings{DBLP:conf/nips/XieDHL020,
  author       = {Qizhe Xie and
                  Zihang Dai and
                  Eduard H. Hovy and
                  Thang Luong and
                  Quoc V. Le},
  editor       = {Hugo Larochelle and
                  Marc'Aurelio Ranzato and
                  Raia Hadsell and
                  Maria{-}Florina Balcan and
                  Hsuan{-}Tien Lin},
  title        = {Unsupervised Data Augmentation for Consistency Training},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/44feb0096faa8326192570788b38c1d1-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/XieDHL020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The last author is spelled as in the arXiv record of
% the same title; the venue acronym is braced like the other booktitles in this file.
@inproceedings{DBLP:conf/nips/ZophGLCLC020,
  author       = {Barret Zoph and
                  Golnaz Ghiasi and
                  Tsung{-}Yi Lin and
                  Yin Cui and
                  Hanxiao Liu and
                  Ekin Dogus Cubuk and
                  Quoc V. Le},
  editor       = {Hugo Larochelle and
                  Marc'Aurelio Ranzato and
                  Raia Hadsell and
                  Maria{-}Florina Balcan and
                  Hsuan{-}Tien Lin},
  title        = {Rethinking Pre-training and Self-training},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/27e9661e033a73a6ad8cefcde965c54d-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ZophGLCLC020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2001.09977); author names use the "Last, First" form.
@article{DBLP:journals/corr/abs-2001-09977,
  author       = {Adiwardana, Daniel and
                  Luong, Minh{-}Thang and
                  So, David R. and
                  Hall, Jamie and
                  Fiedel, Noah and
                  Thoppilan, Romal and
                  Yang, Zi and
                  Kulshreshtha, Apoorv and
                  Nemade, Gaurav and
                  Lu, Yifeng and
                  Le, Quoc V.},
  title        = {Towards a Human-like Open-Domain Chatbot},
  journal      = {CoRR},
  volume       = {abs/2001.09977},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.09977},
  eprinttype   = {arXiv},
  eprint       = {2001.09977},
  timestamp    = {Thu, 30 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-09977.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2003.03384). The system name in the title is braced so
% sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2003-03384,
  author       = {Esteban Real and
                  Chen Liang and
                  David R. So and
                  Quoc V. Le},
  title        = {{AutoML-Zero}: Evolving Machine Learning Algorithms From Scratch},
  journal      = {CoRR},
  volume       = {abs/2003.03384},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.03384},
  eprinttype   = {arXiv},
  eprint       = {2003.03384},
  timestamp    = {Tue, 10 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-03384.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2003.10555); author names use the "Last, First" form.
@article{DBLP:journals/corr/abs-2003-10555,
  author       = {Clark, Kevin and
                  Luong, Minh{-}Thang and
                  Le, Quoc V. and
                  Manning, Christopher D.},
  title        = {{ELECTRA:} Pre-training Text Encoders as Discriminators Rather Than Generators},
  journal      = {CoRR},
  volume       = {abs/2003.10555},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.10555},
  eprinttype   = {arXiv},
  eprint       = {2003.10555},
  timestamp    = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-10555.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2003.10580); author names use the "Last, First" form.
@article{DBLP:journals/corr/abs-2003-10580,
  author       = {Pham, Hieu and
                  Xie, Qizhe and
                  Dai, Zihang and
                  Le, Quoc V.},
  title        = {Meta Pseudo Labels},
  journal      = {CoRR},
  volume       = {abs/2003.10580},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.10580},
  eprinttype   = {arXiv},
  eprint       = {2003.10580},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-10580.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2003.11142). The model name in the title is braced so
% sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2003-11142,
  author       = {Jiahui Yu and
                  Pengchong Jin and
                  Hanxiao Liu and
                  Gabriel Bender and
                  Pieter{-}Jan Kindermans and
                  Mingxing Tan and
                  Thomas S. Huang and
                  Xiaodan Song and
                  Ruoming Pang and
                  Quoc V. Le},
  title        = {{BigNAS}: Scaling Up Neural Architecture Search with Big Single-Stage
                  Models},
  journal      = {CoRR},
  volume       = {abs/2003.11142},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.11142},
  eprinttype   = {arXiv},
  eprint       = {2003.11142},
  timestamp    = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-11142.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2004.00831). "3D" in the title is braced so
% sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2004-00831,
  author       = {Shuyang Cheng and
                  Zhaoqi Leng and
                  Ekin Dogus Cubuk and
                  Barret Zoph and
                  Chunyan Bai and
                  Jiquan Ngiam and
                  Yang Song and
                  Benjamin Caine and
                  Vijay Vasudevan and
                  Congcong Li and
                  Quoc V. Le and
                  Jonathon Shlens and
                  Dragomir Anguelov},
  title        = {Improving {3D} Object Detection through Progressive Population Based
                  Augmentation},
  journal      = {CoRR},
  volume       = {abs/2004.00831},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.00831},
  eprinttype   = {arXiv},
  eprint       = {2004.00831},
  timestamp    = {Wed, 08 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-00831.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2004.02967); author names use the "Last, First" form.
@article{DBLP:journals/corr/abs-2004-02967,
  author       = {Liu, Hanxiao and
                  Brock, Andrew and
                  Simonyan, Karen and
                  Le, Quoc V.},
  title        = {Evolving Normalization-Activation Layers},
  journal      = {CoRR},
  volume       = {abs/2004.02967},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.02967},
  eprinttype   = {arXiv},
  eprint       = {2004.02967},
  timestamp    = {Wed, 08 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-02967.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2004.10746); author names use the "Last, First" form.
@article{DBLP:journals/corr/abs-2004-10746,
  author       = {Mirhoseini, Azalia and
                  Goldie, Anna and
                  Yazgan, Mustafa and
                  Jiang, Joe W. J. and
                  Songhori, Ebrahim M. and
                  Wang, Shen and
                  Lee, Young{-}Joon and
                  Johnson, Eric and
                  Pathak, Omkar and
                  Bae, Sungmin and
                  Nazi, Azade and
                  Pak, Jiwoo and
                  Tong, Andy and
                  Srinivasa, Kavya and
                  Hang, William and
                  Tuncer, Emre and
                  Babu, Anand and
                  Le, Quoc V. and
                  Laudon, James and
                  Ho, Richard and
                  Carpenter, Roger and
                  Dean, Jeff},
  title        = {Chip Placement with Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2004.10746},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.10746},
  eprinttype   = {arXiv},
  eprint       = {2004.10746},
  timestamp    = {Fri, 29 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-10746.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2005.09629); author names use the "Last, First" form.
@article{DBLP:journals/corr/abs-2005-09629,
  author       = {Park, Daniel S. and
                  Zhang, Yu and
                  Jia, Ye and
                  Han, Wei and
                  Chiu, Chung{-}Cheng and
                  Li, Bo and
                  Wu, Yonghui and
                  Le, Quoc V.},
  title        = {Improved Noisy Student Training for Automatic Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/2005.09629},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.09629},
  eprinttype   = {arXiv},
  eprint       = {2005.09629},
  timestamp    = {Thu, 26 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-09629.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2006.03236). The model name in the title is braced so
% sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2006-03236,
  author       = {Zihang Dai and
                  Guokun Lai and
                  Yiming Yang and
                  Quoc V. Le},
  title        = {{Funnel-Transformer}: Filtering out Sequential Redundancy for Efficient
                  Language Processing},
  journal      = {CoRR},
  volume       = {abs/2006.03236},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.03236},
  eprinttype   = {arXiv},
  eprint       = {2006.03236},
  timestamp    = {Mon, 08 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-03236.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2006.03656). The method name in the title is braced so
% sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2006-03656,
  author       = {Xuanyi Dong and
                  Mingxing Tan and
                  Adams Wei Yu and
                  Daiyi Peng and
                  Bogdan Gabrys and
                  Quoc V. Le},
  title        = {{AutoHAS}: Differentiable Hyper-parameter and Architecture Search},
  journal      = {CoRR},
  volume       = {abs/2006.03656},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.03656},
  eprinttype   = {arXiv},
  eprint       = {2006.03656},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-03656.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2006.06882). The sixth author's given names are spelled out
% as in the NeurIPS record of the same title (DBLP:conf/nips/ZophGLCLC020).
@article{DBLP:journals/corr/abs-2006-06882,
  author       = {Barret Zoph and
                  Golnaz Ghiasi and
                  Tsung{-}Yi Lin and
                  Yin Cui and
                  Hanxiao Liu and
                  Ekin Dogus Cubuk and
                  Quoc V. Le},
  title        = {Rethinking Pre-training and Self-training},
  journal      = {CoRR},
  volume       = {abs/2006.06882},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.06882},
  eprinttype   = {arXiv},
  eprint       = {2006.06882},
  timestamp    = {Wed, 17 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-06882.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2006.14536); author names use the "Last, First" form.
@article{DBLP:journals/corr/abs-2006-14536,
  author       = {Xie, Cihang and
                  Tan, Mingxing and
                  Gong, Boqing and
                  Yuille, Alan L. and
                  Le, Quoc V.},
  title        = {Smooth Adversarial Training},
  journal      = {CoRR},
  volume       = {abs/2006.14536},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.14536},
  eprinttype   = {arXiv},
  eprint       = {2006.14536},
  timestamp    = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-14536.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2007.00811); author names use the "Last, First" form.
@article{DBLP:journals/corr/abs-2007-00811,
  author       = {Zhou, Denny and
                  Ye, Mao and
                  Chen, Chen and
                  Meng, Tianjian and
                  Tan, Mingxing and
                  Song, Xiaodan and
                  Le, Quoc V. and
                  Liu, Qiang and
                  Schuurmans, Dale},
  title        = {Go Wide, Then Narrow: Efficient Training of Deep Thin Networks},
  journal      = {CoRR},
  volume       = {abs/2007.00811},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.00811},
  eprinttype   = {arXiv},
  eprint       = {2007.00811},
  timestamp    = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-00811.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2008.06120). The last author is spelled as in the CVPR
% record of the same title (DBLP:conf/cvpr/BenderLCCCKL20); the title is stored in
% Title Case with the system name braced, so styles can downcase it safely.
@article{DBLP:journals/corr/abs-2008-06120,
  author       = {Gabriel Bender and
                  Hanxiao Liu and
                  Bo Chen and
                  Grace Chu and
                  Shuyang Cheng and
                  Pieter{-}Jan Kindermans and
                  Quoc V. Le},
  title        = {Can Weight Sharing Outperform Random Architecture Search? An Investigation
                  With {TuNAS}},
  journal      = {CoRR},
  volume       = {abs/2008.06120},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.06120},
  eprinttype   = {arXiv},
  eprint       = {2008.06120},
  timestamp    = {Mon, 31 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-06120.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2010.10504), 2020.
@article{DBLP:journals/corr/abs-2010-10504,
  author     = {Yu Zhang and James Qin and Daniel S. Park and Wei Han and
                Chung{-}Cheng Chiu and Ruoming Pang and Quoc V. Le and
                Yonghui Wu},
  title      = {Pushing the Limits of Semi-Supervised Learning for Automatic
                Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/2010.10504},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2010.10504},
  url        = {https://arxiv.org/abs/2010.10504},
  timestamp  = {Thu, 26 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-10504.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2010.11426), 2020.
@article{DBLP:journals/corr/abs-2010-11426,
  author     = {Xianzhi Du and Tsung{-}Yi Lin and Pengchong Jin and Yin Cui and
                Mingxing Tan and Quoc V. Le and Xiaodan Song},
  title      = {Efficient Scale-Permuted Backbone with Learned Resource Distribution},
  journal    = {CoRR},
  volume     = {abs/2010.11426},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2010.11426},
  url        = {https://arxiv.org/abs/2010.11426},
  timestamp  = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-11426.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2011.00071), 2020.
% {EfficientNets} and {ImageNet} are braced so sentence-casing styles keep their capitals.
@article{DBLP:journals/corr/abs-2011-00071,
  author       = {Arissa Wongpanich and
                  Hieu Pham and
                  James Demmel and
                  Mingxing Tan and
                  Quoc V. Le and
                  Yang You and
                  Sameer Kumar},
  title        = {Training {EfficientNets} at Supercomputer Scale: 83{\%} {ImageNet} Top-1
                  Accuracy in One Hour},
  journal      = {CoRR},
  volume       = {abs/2011.00071},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.00071},
  eprinttype   = {arXiv},
  eprint       = {2011.00071},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-00071.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2011.04419), 2020.
@article{DBLP:journals/corr/abs-2011-04419,
  author     = {Vikas Verma and Minh{-}Thang Luong and Kenji Kawaguchi and
                Hieu Pham and Quoc V. Le},
  title      = {Towards Domain-Agnostic Contrastive Learning},
  journal    = {CoRR},
  volume     = {abs/2011.04419},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2011.04419},
  url        = {https://arxiv.org/abs/2011.04419},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-04419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2012.07177), 2020.
@article{DBLP:journals/corr/abs-2012-07177,
  author     = {Golnaz Ghiasi and Yin Cui and Aravind Srinivas and Rui Qian and
                Tsung{-}Yi Lin and Ekin D. Cubuk and Quoc V. Le and
                Barret Zoph},
  title      = {Simple Copy-Paste is a Strong Data Augmentation Method for
                Instance Segmentation},
  journal    = {CoRR},
  volume     = {abs/2012.07177},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2012.07177},
  url        = {https://arxiv.org/abs/2012.07177},
  timestamp  = {Sat, 02 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-07177.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2012.08561), 2020.
@article{DBLP:journals/corr/abs-2012-08561,
  author     = {Kevin Clark and Minh{-}Thang Luong and Quoc V. Le and
                Christopher D. Manning},
  title      = {Pre-Training Transformers as Energy-Based Cloze Models},
  journal    = {CoRR},
  volume     = {abs/2012.08561},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2012.08561},
  url        = {https://arxiv.org/abs/2012.08561},
  timestamp  = {Sat, 02 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-08561.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 7 (2019).
% The journal name is stored in full so that a style can abbreviate it; the
% phrase {Natural Questions} in the title is braced to keep its capitals.
@article{DBLP:journals/tacl/KwiatkowskiPRCP19,
  author       = {Tom Kwiatkowski and
                  Jennimaria Palomaki and
                  Olivia Redfield and
                  Michael Collins and
                  Ankur P. Parikh and
                  Chris Alberti and
                  Danielle Epstein and
                  Illia Polosukhin and
                  Jacob Devlin and
                  Kenton Lee and
                  Kristina Toutanova and
                  Llion Jones and
                  Matthew Kelcey and
                  Ming{-}Wei Chang and
                  Andrew M. Dai and
                  Jakob Uszkoreit and
                  Quoc Le and
                  Slav Petrov},
  title        = {{Natural Questions}: a Benchmark for Question Answering Research},
  journal      = {Transactions of the Association for Computational Linguistics},
  volume       = {7},
  pages        = {452--466},
  year         = {2019},
  url          = {https://doi.org/10.1162/tacl\_a\_00276},
  doi          = {10.1162/TACL\_A\_00276},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tacl/KwiatkowskiPRCP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2019 conference paper.
@inproceedings{DBLP:conf/aaai/RealAHL19,
  author     = {Esteban Real and Alok Aggarwal and Yanping Huang and Quoc V. Le},
  title      = {Regularized Evolution for Image Classifier Architecture Search},
  booktitle  = {The Thirty-Third {AAAI} Conference on Artificial Intelligence,
                {AAAI} 2019, The Thirty-First Innovative Applications of
                Artificial Intelligence Conference, {IAAI} 2019, The Ninth
                {AAAI} Symposium on Educational Advances in Artificial
                Intelligence, {EAAI} 2019, Honolulu, Hawaii, USA, January 27 -
                February 1, 2019},
  publisher  = {{AAAI} Press},
  year       = {2019},
  pages      = {4780--4789},
  doi        = {10.1609/AAAI.V33I01.33014780},
  url        = {https://doi.org/10.1609/aaai.v33i01.33014780},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/RealAHL19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2019 conference paper; an arXiv preprint of the same title is recorded
% as DBLP:journals/corr/abs-1901-02860.
% {Transformer-XL} is braced so sentence-casing styles keep "XL" upper-case.
@inproceedings{DBLP:conf/acl/DaiYYCLS19,
  author       = {Zihang Dai and
                  Zhilin Yang and
                  Yiming Yang and
                  Jaime G. Carbonell and
                  Quoc Viet Le and
                  Ruslan Salakhutdinov},
  editor       = {Anna Korhonen and
                  David R. Traum and
                  Llu{\'{\i}}s M{\`{a}}rquez},
  title        = {{Transformer-XL}: Attentive Language Models beyond a Fixed-Length Context},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {2978--2988},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1285},
  doi          = {10.18653/V1/P19-1285},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/DaiYYCLS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2019 conference paper.
% {BAM} is braced so sentence-casing styles do not turn it into "Bam".
@inproceedings{DBLP:conf/acl/ClarkLKML19,
  author       = {Kevin Clark and
                  Minh{-}Thang Luong and
                  Urvashi Khandelwal and
                  Christopher D. Manning and
                  Quoc V. Le},
  editor       = {Anna Korhonen and
                  David R. Traum and
                  Llu{\'{\i}}s M{\`{a}}rquez},
  title        = {{BAM}! Born-Again Multi-Task Networks for Natural Language Understanding},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {5931--5937},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1595},
  doi          = {10.18653/V1/P19-1595},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ClarkLKML19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% BMVC 2019 conference paper; no DOI is recorded, the url field points at the PDF.
% {MixConv} is braced so sentence-casing styles keep the inner capital.
@inproceedings{DBLP:conf/bmvc/TanL19,
  author       = {Mingxing Tan and
                  Quoc V. Le},
  title        = {{MixConv}: Mixed Depthwise Convolutional Kernels},
  booktitle    = {30th British Machine Vision Conference 2019, {BMVC} 2019, Cardiff,
                  UK, September 9-12, 2019},
  pages        = {74},
  publisher    = {{BMVA} Press},
  year         = {2019},
  url          = {https://bmvc2019.org/wp-content/uploads/papers/0583-paper.pdf},
  timestamp    = {Wed, 03 Feb 2021 08:35:59 +0100},
  biburl       = {https://dblp.org/rec/conf/bmvc/TanL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2019 conference paper; url is the open-access CVF page, doi is the IEEE record.
% {AutoAugment} is braced so sentence-casing styles keep the inner capital.
@inproceedings{DBLP:conf/cvpr/CubukZMVL19,
  author       = {Ekin D. Cubuk and
                  Barret Zoph and
                  Dandelion Man{\'{e}} and
                  Vijay Vasudevan and
                  Quoc V. Le},
  title        = {{AutoAugment}: Learning Augmentation Strategies From Data},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2019, Long Beach, CA, USA, June 16-20, 2019},
  pages        = {113--123},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2019},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2019/html/Cubuk\_AutoAugment\_Learning\_Augmentation\_Strategies\_From\_Data\_CVPR\_2019\_paper.html},
  doi          = {10.1109/CVPR.2019.00020},
  timestamp    = {Mon, 30 Aug 2021 17:01:14 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/CubukZMVL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2019 conference paper; url is the open-access CVF page, doi is the IEEE record.
% {ImageNet} is braced so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/cvpr/KornblithSL19,
  author       = {Simon Kornblith and
                  Jonathon Shlens and
                  Quoc V. Le},
  title        = {Do Better {ImageNet} Models Transfer Better?},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2019, Long Beach, CA, USA, June 16-20, 2019},
  pages        = {2661--2671},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2019},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2019/html/Kornblith\_Do\_Better\_ImageNet\_Models\_Transfer\_Better\_CVPR\_2019\_paper.html},
  doi          = {10.1109/CVPR.2019.00277},
  timestamp    = {Mon, 20 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/KornblithSL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2019 conference paper; url is the open-access CVF page, doi is the IEEE record.
% {MnasNet} is braced so sentence-casing styles keep the inner capital.
@inproceedings{DBLP:conf/cvpr/TanCPVSHL19,
  author       = {Mingxing Tan and
                  Bo Chen and
                  Ruoming Pang and
                  Vijay Vasudevan and
                  Mark Sandler and
                  Andrew Howard and
                  Quoc V. Le},
  title        = {{MnasNet}: Platform-Aware Neural Architecture Search for Mobile},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2019, Long Beach, CA, USA, June 16-20, 2019},
  pages        = {2820--2828},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2019},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2019/html/Tan\_MnasNet\_Platform-Aware\_Neural\_Architecture\_Search\_for\_Mobile\_CVPR\_2019\_paper.html},
  doi          = {10.1109/CVPR.2019.00293},
  timestamp    = {Thu, 27 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cvpr/TanCPVSHL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2019 conference paper; an arXiv preprint of the same title is recorded
% as DBLP:journals/corr/abs-1904-07392.
@inproceedings{DBLP:conf/cvpr/GhiasiLL19,
  author       = {Golnaz Ghiasi and
                  Tsung{-}Yi Lin and
                  Quoc V. Le},
  title        = {{NAS-FPN:} Learning Scalable Feature Pyramid Architecture for Object
                  Detection},
  booktitle    = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR}
                  2019, Long Beach, CA, USA, June 16-20, 2019},
  pages        = {7036--7045},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2019},
  url          = {https://openaccess.thecvf.com/content\_CVPR\_2019/html/Ghiasi\_NAS-FPN\_Learning\_Scalable\_Feature\_Pyramid\_Architecture\_for\_Object\_Detection\_CVPR\_2019\_paper.html},
  doi          = {10.1109/CVPR.2019.00720},
  timestamp    = {Mon, 20 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/GhiasiLL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2019 conference paper; an arXiv preprint of the same title is recorded
% as DBLP:journals/corr/abs-1905-02244.
% {MobileNetV3} is braced so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/iccv/HowardPALSCWCTC19,
  author       = {Andrew Howard and
                  Ruoming Pang and
                  Hartwig Adam and
                  Quoc V. Le and
                  Mark Sandler and
                  Bo Chen and
                  Weijun Wang and
                  Liang{-}Chieh Chen and
                  Mingxing Tan and
                  Grace Chu and
                  Vijay Vasudevan and
                  Yukun Zhu},
  title        = {Searching for {MobileNetV3}},
  booktitle    = {2019 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                  2019, Seoul, Korea (South), October 27 - November 2, 2019},
  pages        = {1314--1324},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICCV.2019.00140},
  doi          = {10.1109/ICCV.2019.00140},
  timestamp    = {Thu, 27 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iccv/HowardPALSCWCTC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2019 conference paper; an arXiv preprint of the same title is recorded
% as DBLP:journals/corr/abs-1904-09925.
@inproceedings{DBLP:conf/iccv/BelloZLVS19,
  author     = {Irwan Bello and Barret Zoph and Quoc Le and Ashish Vaswani and
                Jonathon Shlens},
  title      = {Attention Augmented Convolutional Networks},
  booktitle  = {2019 {IEEE/CVF} International Conference on Computer Vision,
                {ICCV} 2019, Seoul, Korea (South), October 27 - November 2,
                2019},
  publisher  = {{IEEE}},
  year       = {2019},
  pages      = {3285--3294},
  doi        = {10.1109/ICCV.2019.00338},
  url        = {https://doi.org/10.1109/ICCV.2019.00338},
  timestamp  = {Thu, 03 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iccv/BelloZLVS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2019 conference paper; no pages or DOI are recorded, the url is the
% OpenReview forum page.
@inproceedings{DBLP:conf/iclr/RamachandranL19,
  author     = {Prajit Ramachandran and Quoc V. Le},
  title      = {Diversity and Depth in Per-Example Routing Models},
  booktitle  = {7th International Conference on Learning Representations,
                {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=BkxWJnC9tX},
  timestamp  = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/RamachandranL19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 conference paper (PMLR volume 97); an arXiv preprint of the same
% title is recorded as DBLP:journals/corr/abs-1905-03776.
@inproceedings{DBLP:conf/icml/ParkSLS19,
  author       = {Daniel S. Park and
                  Jascha Sohl{-}Dickstein and
                  Quoc V. Le and
                  Samuel L. Smith},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {The Effect of Network Width on Stochastic Gradient Descent and Generalization:
                  an Empirical Study},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {5042--5051},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v97/park19b.html},
  timestamp    = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ParkSLS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 conference paper (PMLR volume 97); an arXiv preprint of the same
% title is recorded as DBLP:journals/corr/abs-1901-11117.
% {Evolved Transformer} is braced so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/icml/SoLL19,
  author       = {David R. So and
                  Quoc V. Le and
                  Chen Liang},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {The {Evolved Transformer}},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {5877--5886},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v97/so19a.html},
  timestamp    = {Thu, 26 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/SoLL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 conference paper (PMLR volume 97); an arXiv preprint of the same
% title is recorded as DBLP:journals/corr/abs-1905-11946.
% {EfficientNet} is braced so sentence-casing styles keep the inner capital.
@inproceedings{DBLP:conf/icml/TanL19,
  author       = {Mingxing Tan and
                  Quoc V. Le},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {{EfficientNet}: Rethinking Model Scaling for Convolutional Neural Networks},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {6105--6114},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v97/tan19a.html},
  timestamp    = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/TanL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2019 conference paper; an arXiv preprint of the same title is
% recorded as DBLP:journals/corr/abs-1904-08779.
% {SpecAugment} is braced so sentence-casing styles keep the inner capital.
@inproceedings{DBLP:conf/interspeech/ParkCZCZCL19,
  author       = {Daniel S. Park and
                  William Chan and
                  Yu Zhang and
                  Chung{-}Cheng Chiu and
                  Barret Zoph and
                  Ekin D. Cubuk and
                  Quoc V. Le},
  editor       = {Gernot Kubin and
                  Zdravko Kacic},
  title        = {{SpecAugment}: {A} Simple Data Augmentation Method for Automatic Speech
                  Recognition},
  booktitle    = {Interspeech 2019, 20th Annual Conference of the International Speech
                  Communication Association, Graz, Austria, 15-19 September 2019},
  pages        = {2613--2617},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2680},
  doi          = {10.21437/INTERSPEECH.2019-2680},
  timestamp    = {Fri, 29 Jan 2021 17:41:10 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/ParkCZCZCL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper.
% The {NeurIPS} acronym in booktitle is braced like the other venue acronyms
% in this file ({ICML}, {ACL}, {CVPR}).
@inproceedings{DBLP:conf/nips/VillegasPKELL19,
  author       = {Ruben Villegas and
                  Arkanath Pathak and
                  Harini Kannan and
                  Dumitru Erhan and
                  Quoc V. Le and
                  Honglak Lee},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {High Fidelity Video Prediction with Large Stochastic Recurrent Neural
                  Networks},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {81--91},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/f7177163c833dff4b38fc8d2872f1ec6-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/VillegasPKELL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper.
% {GPipe} is braced so sentence-casing styles keep its capitals; the {NeurIPS}
% acronym in booktitle is braced like the other venue acronyms in this file.
@inproceedings{DBLP:conf/nips/HuangCBFCCLNLWC19,
  author       = {Yanping Huang and
                  Youlong Cheng and
                  Ankur Bapna and
                  Orhan Firat and
                  Dehao Chen and
                  Mia Xu Chen and
                  HyoukJoong Lee and
                  Jiquan Ngiam and
                  Quoc V. Le and
                  Yonghui Wu and
                  Zhifeng Chen},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {{GPipe}: Efficient Training of Giant Neural Networks using Pipeline
                  Parallelism},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {103--112},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/093f65e080a295f8076b1c5722a46aa2-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/HuangCBFCCLNLWC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper.
% The {NeurIPS} acronym in booktitle is braced like the other venue acronyms
% in this file ({ICML}, {ACL}, {CVPR}).
@inproceedings{DBLP:conf/nips/ElsayedKL19,
  author       = {Gamaleldin F. Elsayed and
                  Simon Kornblith and
                  Quoc V. Le},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {Saccader: Improving Accuracy of Hard Attention Models for Vision},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {700--712},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/8dd48d6a2e2cad213179a3992c0be53c-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ElsayedKL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper.
% {CondConv} is braced so sentence-casing styles keep the inner capital; the
% {NeurIPS} acronym in booktitle is braced like the other venue acronyms here.
@inproceedings{DBLP:conf/nips/YangBLN19,
  author       = {Brandon Yang and
                  Gabriel Bender and
                  Quoc V. Le and
                  Jiquan Ngiam},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {{CondConv}: Conditionally Parameterized Convolutions for Efficient Inference},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {1305--1316},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/f2201f5191c4e92cc5af043eebfd0946-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YangBLN19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper.
% {XLNet} is braced so sentence-casing styles keep its capitals; the {NeurIPS}
% acronym in booktitle is braced like the other venue acronyms in this file.
@inproceedings{DBLP:conf/nips/YangDYCSL19,
  author       = {Zhilin Yang and
                  Zihang Dai and
                  Yiming Yang and
                  Jaime G. Carbonell and
                  Ruslan Salakhutdinov and
                  Quoc V. Le},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {{XLNet}: Generalized Autoregressive Pretraining for Language Understanding},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {5754--5764},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/dc6a7e655d7e5840e66733e9ee67cc69-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YangDYCSL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper.
% The {NeurIPS} acronym in booktitle is braced like the other venue acronyms
% in this file ({ICML}, {ACL}, {CVPR}).
@inproceedings{DBLP:conf/nips/YangLSL19,
  author       = {Zhilin Yang and
                  Thang Luong and
                  Ruslan Salakhutdinov and
                  Quoc V. Le},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {Mixtape: Breaking the Softmax Bottleneck Efficiently},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {15922--15930},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/512fc3c5227f637e41437c999a2d3169-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YangLSL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1901.02860), 2019; the ACL 2019 paper of the same
% title is recorded as DBLP:conf/acl/DaiYYCLS19.
% {Transformer-XL} is braced so sentence-casing styles keep "XL" upper-case.
@article{DBLP:journals/corr/abs-1901-02860,
  author       = {Zihang Dai and
                  Zhilin Yang and
                  Yiming Yang and
                  Jaime G. Carbonell and
                  Quoc V. Le and
                  Ruslan Salakhutdinov},
  title        = {{Transformer-XL}: Attentive Language Models Beyond a Fixed-Length Context},
  journal      = {CoRR},
  volume       = {abs/1901.02860},
  year         = {2019},
  url          = {https://arxiv.org/abs/1901.02860},
  eprinttype   = {arXiv},
  eprint       = {1901.02860},
  timestamp    = {Fri, 01 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-02860.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1901.11117), 2019; the ICML 2019 paper of the same
% title is recorded as DBLP:conf/icml/SoLL19.
% {Evolved Transformer} is braced so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-1901-11117,
  author       = {David R. So and
                  Chen Liang and
                  Quoc V. Le},
  title        = {The {Evolved Transformer}},
  journal      = {CoRR},
  volume       = {abs/1901.11117},
  year         = {2019},
  url          = {https://arxiv.org/abs/1901.11117},
  eprinttype   = {arXiv},
  eprint       = {1901.11117},
  timestamp    = {Mon, 04 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-11117.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1904.04971), 2019.
@article{DBLP:journals/corr/abs-1904-04971,
  author       = {Brandon Yang and
                  Gabriel Bender and
                  Quoc V. Le and
                  Jiquan Ngiam},
  title        = {Soft Conditional Computation},
  journal      = {CoRR},
  volume       = {abs/1904.04971},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.04971},
  eprinttype   = {arXiv},
  eprint       = {1904.04971},
  timestamp    = {Thu, 25 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-04971.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1904.07392), 2019; the CVPR 2019 paper of the same
% title is recorded as DBLP:conf/cvpr/GhiasiLL19.
@article{DBLP:journals/corr/abs-1904-07392,
  author       = {Golnaz Ghiasi and
                  Tsung{-}Yi Lin and
                  Ruoming Pang and
                  Quoc V. Le},
  title        = {{NAS-FPN:} Learning Scalable Feature Pyramid Architecture for Object
                  Detection},
  journal      = {CoRR},
  volume       = {abs/1904.07392},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.07392},
  eprinttype   = {arXiv},
  eprint       = {1904.07392},
  timestamp    = {Thu, 25 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-07392.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1904.08779), 2019; the Interspeech 2019 paper of the
% same title is recorded as DBLP:conf/interspeech/ParkCZCZCL19.
% {SpecAugment} is braced so sentence-casing styles keep the inner capital.
@article{DBLP:journals/corr/abs-1904-08779,
  author       = {Daniel S. Park and
                  William Chan and
                  Yu Zhang and
                  Chung{-}Cheng Chiu and
                  Barret Zoph and
                  Ekin D. Cubuk and
                  Quoc V. Le},
  title        = {{SpecAugment}: {A} Simple Data Augmentation Method for Automatic Speech
                  Recognition},
  journal      = {CoRR},
  volume       = {abs/1904.08779},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.08779},
  eprinttype   = {arXiv},
  eprint       = {1904.08779},
  timestamp    = {Tue, 27 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-08779.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1904.09925), 2019; the ICCV 2019 paper of the same
% title is recorded as DBLP:conf/iccv/BelloZLVS19.
@article{DBLP:journals/corr/abs-1904-09925,
  author       = {Irwan Bello and
                  Barret Zoph and
                  Ashish Vaswani and
                  Jonathon Shlens and
                  Quoc V. Le},
  title        = {Attention Augmented Convolutional Networks},
  journal      = {CoRR},
  volume       = {abs/1904.09925},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.09925},
  eprinttype   = {arXiv},
  eprint       = {1904.09925},
  timestamp    = {Fri, 26 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-09925.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1904.10076), 2019.
@article{DBLP:journals/corr/abs-1904-10076,
  author       = {Keren Gu and
                  Brandon Yang and
                  Jiquan Ngiam and
                  Quoc V. Le and
                  Jonathon Shlens},
  title        = {Using Videos to Evaluate Image Model Robustness},
  journal      = {CoRR},
  volume       = {abs/1904.10076},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.10076},
  eprinttype   = {arXiv},
  eprint       = {1904.10076},
  timestamp    = {Sat, 27 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-10076.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/1904.12848), 2019.
@article{DBLP:journals/corr/abs-1904-12848,
  author       = {Qizhe Xie and
                  Zihang Dai and
                  Eduard H. Hovy and
                  Minh{-}Thang Luong and
                  Quoc V. Le},
  title        = {Unsupervised Data Augmentation},
  journal      = {CoRR},
  volume       = {abs/1904.12848},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.12848},
  eprinttype   = {arXiv},
  eprint       = {1904.12848},
  timestamp    = {Thu, 02 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-12848.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1905.02244, listed under CoRR.
% {MobileNetV3} is braced so sentence-casing styles keep the model name's capitals.
@article{DBLP:journals/corr/abs-1905-02244,
  author       = {Andrew Howard and
                  Mark Sandler and
                  Grace Chu and
                  Liang{-}Chieh Chen and
                  Bo Chen and
                  Mingxing Tan and
                  Weijun Wang and
                  Yukun Zhu and
                  Ruoming Pang and
                  Vijay Vasudevan and
                  Quoc V. Le and
                  Hartwig Adam},
  title        = {Searching for {MobileNetV3}},
  journal      = {CoRR},
  volume       = {abs/1905.02244},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.02244},
  eprinttype   = {arXiv},
  eprint       = {1905.02244},
  timestamp    = {Thu, 27 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-02244.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1905.03776, listed under CoRR.
@article{DBLP:journals/corr/abs-1905-03776,
  author       = {Daniel S. Park and
                  Jascha Sohl{-}Dickstein and
                  Quoc V. Le and
                  Samuel L. Smith},
  title        = {The Effect of Network Width on Stochastic Gradient Descent and Generalization:
                  an Empirical Study},
  journal      = {CoRR},
  volume       = {abs/1905.03776},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.03776},
  eprinttype   = {arXiv},
  eprint       = {1905.03776},
  timestamp    = {Mon, 27 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-03776.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1905.11946, listed under CoRR.
% {EfficientNet} is braced so sentence-casing styles keep the inner capital N.
@article{DBLP:journals/corr/abs-1905-11946,
  author       = {Mingxing Tan and
                  Quoc V. Le},
  title        = {{EfficientNet}: Rethinking Model Scaling for Convolutional Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1905.11946},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.11946},
  eprinttype   = {arXiv},
  eprint       = {1905.11946},
  timestamp    = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-11946.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1906.02940, listed under CoRR.
@article{DBLP:journals/corr/abs-1906-02940,
  author       = {Trieu H. Trinh and
                  Minh{-}Thang Luong and
                  Quoc V. Le},
  title        = {Selfie: Self-supervised Pretraining for Image Embedding},
  journal      = {CoRR},
  volume       = {abs/1906.02940},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.02940},
  eprinttype   = {arXiv},
  eprint       = {1906.02940},
  timestamp    = {Fri, 14 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-02940.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1906.08237, listed under CoRR.
% {XLNet} is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-1906-08237,
  author       = {Zhilin Yang and
                  Zihang Dai and
                  Yiming Yang and
                  Jaime G. Carbonell and
                  Ruslan Salakhutdinov and
                  Quoc V. Le},
  title        = {{XLNet}: Generalized Autoregressive Pretraining for Language Understanding},
  journal      = {CoRR},
  volume       = {abs/1906.08237},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.08237},
  eprinttype   = {arXiv},
  eprint       = {1906.08237},
  timestamp    = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-08237.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1906.11172, listed under CoRR.
@article{DBLP:journals/corr/abs-1906-11172,
  author       = {Barret Zoph and
                  Ekin D. Cubuk and
                  Golnaz Ghiasi and
                  Tsung{-}Yi Lin and
                  Jonathon Shlens and
                  Quoc V. Le},
  title        = {Learning Data Augmentation Strategies for Object Detection},
  journal      = {CoRR},
  volume       = {abs/1906.11172},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.11172},
  eprinttype   = {arXiv},
  eprint       = {1906.11172},
  timestamp    = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-11172.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.04471, listed under CoRR.
@article{DBLP:journals/corr/abs-1907-04471,
  author       = {Manas R. Joglekar and
                  Cong Li and
                  Jay K. Adams and
                  Pranav Khaitan and
                  Quoc V. Le},
  title        = {Neural Input Search for Large Scale Recommendation Models},
  journal      = {CoRR},
  volume       = {abs/1907.04471},
  year         = {2019},
  url          = {http://arxiv.org/abs/1907.04471},
  eprinttype   = {arXiv},
  eprint       = {1907.04471},
  timestamp    = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-04471.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.04829, listed under CoRR.
% {BAM} and {Born-Again} are braced: BibTeX only restarts capitalisation after a
% colon, so both would otherwise be lowercased by sentence-casing styles.
@article{DBLP:journals/corr/abs-1907-04829,
  author       = {Kevin Clark and
                  Minh{-}Thang Luong and
                  Urvashi Khandelwal and
                  Christopher D. Manning and
                  Quoc V. Le},
  title        = {{BAM}! {Born-Again} Multi-Task Networks for Natural Language Understanding},
  journal      = {CoRR},
  volume       = {abs/1907.04829},
  year         = {2019},
  url          = {http://arxiv.org/abs/1907.04829},
  eprinttype   = {arXiv},
  eprint       = {1907.04829},
  timestamp    = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-04829.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1907.09595, listed under CoRR.
% {MixConv} is braced so sentence-casing styles keep the inner capital C.
@article{DBLP:journals/corr/abs-1907-09595,
  author       = {Mingxing Tan and
                  Quoc V. Le},
  title        = {{MixConv}: Mixed Depthwise Convolutional Kernels},
  journal      = {CoRR},
  volume       = {abs/1907.09595},
  year         = {2019},
  url          = {http://arxiv.org/abs/1907.09595},
  eprinttype   = {arXiv},
  eprint       = {1907.09595},
  timestamp    = {Fri, 02 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-09595.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1908.07644, listed under CoRR.
@article{DBLP:journals/corr/abs-1908-07644,
  author       = {Gamaleldin F. Elsayed and
                  Simon Kornblith and
                  Quoc V. Le},
  title        = {Saccader: Improving Accuracy of Hard Attention Models for Vision},
  journal      = {CoRR},
  volume       = {abs/1908.07644},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.07644},
  eprinttype   = {arXiv},
  eprint       = {1908.07644},
  timestamp    = {Mon, 26 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-07644.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1909.13719, listed under CoRR.
% {RandAugment} is braced so sentence-casing styles keep the inner capital A.
@article{DBLP:journals/corr/abs-1909-13719,
  author       = {Ekin D. Cubuk and
                  Barret Zoph and
                  Jonathon Shlens and
                  Quoc V. Le},
  title        = {{RandAugment}: Practical data augmentation with no separate search},
  journal      = {CoRR},
  volume       = {abs/1909.13719},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.13719},
  eprinttype   = {arXiv},
  eprint       = {1909.13719},
  timestamp    = {Wed, 02 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-13719.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1911.01655, listed under CoRR.
@article{DBLP:journals/corr/abs-1911-01655,
  author       = {Ruben Villegas and
                  Arkanath Pathak and
                  Harini Kannan and
                  Dumitru Erhan and
                  Quoc V. Le and
                  Honglak Lee},
  title        = {High Fidelity Video Prediction with Large Stochastic Recurrent Neural
                  Networks},
  journal      = {CoRR},
  volume       = {abs/1911.01655},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.01655},
  eprinttype   = {arXiv},
  eprint       = {1911.01655},
  timestamp    = {Mon, 11 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-01655.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1911.04252, listed under CoRR.
% {Noisy} {Student} and {ImageNet} are braced so sentence-casing styles keep
% their capitals.
@article{DBLP:journals/corr/abs-1911-04252,
  author       = {Qizhe Xie and
                  Eduard H. Hovy and
                  Minh{-}Thang Luong and
                  Quoc V. Le},
  title        = {Self-training with {Noisy} {Student} improves {ImageNet} classification},
  journal      = {CoRR},
  volume       = {abs/1911.04252},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.04252},
  eprinttype   = {arXiv},
  eprint       = {1911.04252},
  timestamp    = {Sun, 01 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-04252.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1911.09070, listed under CoRR.
% {EfficientDet} is braced so sentence-casing styles keep the inner capital D.
@article{DBLP:journals/corr/abs-1911-09070,
  author       = {Mingxing Tan and
                  Ruoming Pang and
                  Quoc V. Le},
  title        = {{EfficientDet}: Scalable and Efficient Object Detection},
  journal      = {CoRR},
  volume       = {abs/1911.09070},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.09070},
  eprinttype   = {arXiv},
  eprint       = {1911.09070},
  timestamp    = {Tue, 03 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-09070.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1911.09665, listed under CoRR.
@article{DBLP:journals/corr/abs-1911-09665,
  author       = {Cihang Xie and
                  Mingxing Tan and
                  Boqing Gong and
                  Jiang Wang and
                  Alan L. Yuille and
                  Quoc V. Le},
  title        = {Adversarial Examples Improve Image Recognition},
  journal      = {CoRR},
  volume       = {abs/1911.09665},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.09665},
  eprinttype   = {arXiv},
  eprint       = {1911.09665},
  timestamp    = {Tue, 13 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-09665.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1912.01106, listed under CoRR.
% {MnasFPN} is braced so sentence-casing styles keep the capitals in FPN.
@article{DBLP:journals/corr/abs-1912-01106,
  author       = {Bo Chen and
                  Golnaz Ghiasi and
                  Hanxiao Liu and
                  Tsung{-}Yi Lin and
                  Dmitry Kalenichenko and
                  Hartwig Adam and
                  Quoc V. Le},
  title        = {{MnasFPN}: Learning Latency-aware Pyramid Architecture for Object Detection
                  on Mobile Devices},
  journal      = {CoRR},
  volume       = {abs/1912.01106},
  year         = {2019},
  url          = {http://arxiv.org/abs/1912.01106},
  eprinttype   = {arXiv},
  eprint       = {1912.01106},
  timestamp    = {Mon, 31 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-01106.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1912.05027, listed under CoRR.
% {SpineNet} is braced so sentence-casing styles keep the inner capital N.
@article{DBLP:journals/corr/abs-1912-05027,
  author       = {Xianzhi Du and
                  Tsung{-}Yi Lin and
                  Pengchong Jin and
                  Golnaz Ghiasi and
                  Mingxing Tan and
                  Yin Cui and
                  Quoc V. Le and
                  Xiaodan Song},
  title        = {{SpineNet}: Learning Scale-Permuted Backbone for Recognition and Localization},
  journal      = {CoRR},
  volume       = {abs/1912.05027},
  year         = {2019},
  url          = {http://arxiv.org/abs/1912.05027},
  eprinttype   = {arXiv},
  eprint       = {1912.05027},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-05027.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1912.05533, listed under CoRR.
% {SpecAugment} is braced so sentence-casing styles keep the inner capital A.
@article{DBLP:journals/corr/abs-1912-05533,
  author       = {Daniel S. Park and
                  Yu Zhang and
                  Chung{-}Cheng Chiu and
                  Youzheng Chen and
                  Bo Li and
                  William Chan and
                  Quoc V. Le and
                  Yonghui Wu},
  title        = {{SpecAugment} on Large Scale Datasets},
  journal      = {CoRR},
  volume       = {abs/1912.05533},
  year         = {2019},
  url          = {http://arxiv.org/abs/1912.05533},
  eprinttype   = {arXiv},
  eprint       = {1912.05533},
  timestamp    = {Tue, 07 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-05533.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 1 (2018). The journal name is stored unabbreviated so
% that any abbreviation is left to the bibliography style.
@article{DBLP:journals/npjdm/RajkomarO0DHHLL18,
  author       = {Alvin Rajkomar and
                  Eyal Oren and
                  Kai Chen and
                  Andrew M. Dai and
                  Nissan Hajaj and
                  Michaela Hardt and
                  Peter J. Liu and
                  Xiaobing Liu and
                  Jake Marcus and
                  Mimi Sun and
                  Patrik Sundberg and
                  Hector Yee and
                  Kun Zhang and
                  Yi Zhang and
                  Gerardo Flores and
                  Gavin E. Duggan and
                  Jamie Irvine and
                  Quoc Le and
                  Kurt Litsch and
                  Alexander Mossin and
                  Justin Tansuwan and
                  De Wang and
                  James Wexler and
                  Jimbo Wilson and
                  Dana Ludwig and
                  Samuel L. Volchenboum and
                  Katherine Chou and
                  Michael Pearson and
                  Srinivasan Madabushi and
                  Nigam H. Shah and
                  Atul J. Butte and
                  Michael D. Howell and
                  Claire Cui and
                  Gregory S. Corrado and
                  Jeffrey Dean},
  title        = {Scalable and accurate deep learning with electronic health records},
  journal      = {npj Digital Medicine},
  volume       = {1},
  year         = {2018},
  url          = {https://doi.org/10.1038/s41746-018-0029-1},
  doi          = {10.1038/S41746-018-0029-1},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/npjdm/RajkomarO0DHHLL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2018 conference paper. The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/cvpr/ZophVSL18,
  author       = {Barret Zoph and
                  Vijay Vasudevan and
                  Jonathon Shlens and
                  Quoc V. Le},
  title        = {Learning Transferable Architectures for Scalable Image Recognition},
  booktitle    = {2018 {IEEE} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2018, Salt Lake City, UT, USA, June 18--22, 2018},
  pages        = {8697--8710},
  publisher    = {Computer Vision Foundation / {IEEE} Computer Society},
  year         = {2018},
  url          = {http://openaccess.thecvf.com/content\_cvpr\_2018/html/Zoph\_Learning\_Transferable\_Architectures\_CVPR\_2018\_paper.html},
  doi          = {10.1109/CVPR.2018.00907},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/ZophVSL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2018 conference paper. The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/emnlp/ClarkLML18,
  author       = {Kevin Clark and
                  Minh{-}Thang Luong and
                  Christopher D. Manning and
                  Quoc V. Le},
  editor       = {Ellen Riloff and
                  David Chiang and
                  Julia Hockenmaier and
                  Jun'ichi Tsujii},
  title        = {Semi-Supervised Sequence Modeling with Cross-View Training},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                  Language Processing, Brussels, Belgium, October 31 -- November 4, 2018},
  pages        = {1914--1925},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1217},
  doi          = {10.18653/V1/D18-1217},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ClarkLML18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2018 conference paper.
% {AirDialogue} is braced so sentence-casing styles keep the inner capital D;
% the date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/emnlp/WeiLDL18,
  author       = {Wei Wei and
                  Quoc V. Le and
                  Andrew M. Dai and
                  Jia Li},
  editor       = {Ellen Riloff and
                  David Chiang and
                  Julia Hockenmaier and
                  Jun'ichi Tsujii},
  title        = {{AirDialogue}: An Environment for Goal-Oriented Dialogue Research},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                  Language Processing, Brussels, Belgium, October 31 -- November 4, 2018},
  pages        = {3844--3854},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1419},
  doi          = {10.18653/V1/D18-1419},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/WeiLDL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% GECCO 2018 companion-volume paper. The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/gecco/DohanSL18,
  author       = {David Dohan and
                  David R. So and
                  Quoc V. Le},
  editor       = {Hern{\'{a}}n E. Aguirre and
                  Keiki Takadama},
  title        = {Evolving modular neural sequence architectures with genetic programming},
  booktitle    = {Proceedings of the Genetic and Evolutionary Computation Conference
                  Companion, {GECCO} 2018, Kyoto, Japan, July 15--19, 2018},
  pages        = {37--38},
  publisher    = {{ACM}},
  year         = {2018},
  url          = {https://doi.org/10.1145/3205651.3208782},
  doi          = {10.1145/3205651.3208782},
  timestamp    = {Mon, 04 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/gecco/DohanSL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 workshop-track paper. The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/iclr/CubukZSL18,
  author       = {Ekin Dogus Cubuk and
                  Barret Zoph and
                  Samuel S. Schoenholz and
                  Quoc V. Le},
  title        = {Intriguing Properties of Adversarial Examples},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 -- May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=Skz1zaRLz},
  timestamp    = {Thu, 04 Apr 2019 13:20:09 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/CubukZSL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper. The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/iclr/MirhoseiniGPSLD18,
  author       = {Azalia Mirhoseini and
                  Anna Goldie and
                  Hieu Pham and
                  Benoit Steiner and
                  Quoc V. Le and
                  Jeff Dean},
  title        = {A Hierarchical Model for Device Placement},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 -- May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=Hkc-TeZ0W},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/MirhoseiniGPSLD18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 workshop-track paper. The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/iclr/PhamGZLD18,
  author       = {Hieu Pham and
                  Melody Y. Guan and
                  Barret Zoph and
                  Quoc V. Le and
                  Jeff Dean},
  title        = {Faster Discovery of Neural Architectures by Searching for Paths in
                  a Large Model},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 -- May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=rJkCq4JvM},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/PhamGZLD18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 workshop-track paper.
% {Erdos-Selfridge-Spencer} is braced so sentence-casing styles keep the
% capitals of the three surnames; the date range in booktitle uses "--".
@inproceedings{DBLP:conf/iclr/RaghuIAKLK18,
  author       = {Maithra Raghu and
                  Alex Irpan and
                  Jacob Andreas and
                  Robert Kleinberg and
                  Quoc V. Le and
                  Jon M. Kleinberg},
  title        = {Can Deep Reinforcement Learning solve {Erdos-Selfridge-Spencer} Games?},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 -- May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=SJbKi81wf},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/RaghuIAKLK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 workshop-track paper. The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/iclr/RamachandranZL18,
  author       = {Prajit Ramachandran and
                  Barret Zoph and
                  Quoc V. Le},
  title        = {Searching for Activation Functions},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 -- May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=Hkuq2EkPf},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/RamachandranZL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper. The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/iclr/SmithKYL18,
  author       = {Samuel L. Smith and
                  Pieter{-}Jan Kindermans and
                  Chris Ying and
                  Quoc V. Le},
  title        = {Don't Decay the Learning Rate, Increase the Batch Size},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 -- May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=B1Yy1BxCZ},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/SmithKYL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper.
% {Bayesian} is braced so sentence-casing styles keep the proper adjective
% capitalised; the date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/iclr/SmithL18,
  author       = {Samuel L. Smith and
                  Quoc V. Le},
  title        = {A {Bayesian} Perspective on Generalization and Stochastic Gradient Descent},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 -- May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=BJij4yg0Z},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/SmithL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 workshop-track paper.
% {RNNs} is braced so sentence-casing styles do not lowercase the acronym;
% the date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/iclr/TrinhDLL18,
  author       = {Trieu H. Trinh and
                  Andrew M. Dai and
                  Minh{-}Thang Luong and
                  Quoc V. Le},
  title        = {Learning Longer-term Dependencies in {RNNs} with Auxiliary Losses},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 -- May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=Hy9xDwyPM},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/TrinhDLL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2018 conference-track paper.
% {QANet} is braced so sentence-casing styles keep its capitals; the date
% range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/iclr/YuDLZ00L18,
  author       = {Adams Wei Yu and
                  David Dohan and
                  Minh{-}Thang Luong and
                  Rui Zhao and
                  Kai Chen and
                  Mohammad Norouzi and
                  Quoc V. Le},
  title        = {{QANet}: Combining Local Convolution with Global Self-Attention for
                  Reading Comprehension},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 -- May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=B14TlG-RW},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/YuDLZ00L18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2018 paper (PMLR volume 80). The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/icml/BenderKZVL18,
  author       = {Gabriel Bender and
                  Pieter{-}Jan Kindermans and
                  Barret Zoph and
                  Vijay Vasudevan and
                  Quoc V. Le},
  editor       = {Jennifer G. Dy and
                  Andreas Krause},
  title        = {Understanding and Simplifying One-Shot Architecture Search},
  booktitle    = {Proceedings of the 35th International Conference on Machine Learning,
                  {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                  10--15, 2018},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {549--558},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {http://proceedings.mlr.press/v80/bender18a.html},
  timestamp    = {Wed, 03 Apr 2019 18:17:30 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/BenderKZVL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2018 paper (PMLR volume 80). The date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/icml/PhamGZLD18,
  author       = {Hieu Pham and
                  Melody Y. Guan and
                  Barret Zoph and
                  Quoc V. Le and
                  Jeff Dean},
  editor       = {Jennifer G. Dy and
                  Andreas Krause},
  title        = {Efficient Neural Architecture Search via Parameter Sharing},
  booktitle    = {Proceedings of the 35th International Conference on Machine Learning,
                  {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                  10--15, 2018},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {4092--4101},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {http://proceedings.mlr.press/v80/pham18a.html},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/PhamGZLD18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2018 paper (PMLR volume 80).
% {Erdos-Selfridge-Spencer} is braced so sentence-casing styles keep the
% capitals of the three surnames; the date range in booktitle uses "--".
@inproceedings{DBLP:conf/icml/RaghuIAKLK18,
  author       = {Maithra Raghu and
                  Alex Irpan and
                  Jacob Andreas and
                  Robert Kleinberg and
                  Quoc V. Le and
                  Jon M. Kleinberg},
  editor       = {Jennifer G. Dy and
                  Andreas Krause},
  title        = {Can Deep Reinforcement Learning Solve {Erdos-Selfridge-Spencer} Games?},
  booktitle    = {Proceedings of the 35th International Conference on Machine Learning,
                  {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                  10--15, 2018},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {4235--4243},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {http://proceedings.mlr.press/v80/raghu18a.html},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/RaghuIAKLK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2018 paper (PMLR volume 80).
% {RNNs} is braced so sentence-casing styles do not lowercase the acronym;
% the date range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/icml/TrinhDLL18,
  author       = {Trieu H. Trinh and
                  Andrew M. Dai and
                  Thang Luong and
                  Quoc V. Le},
  editor       = {Jennifer G. Dy and
                  Andreas Krause},
  title        = {Learning Longer-term Dependencies in {RNNs} with Auxiliary Losses},
  booktitle    = {Proceedings of the 35th International Conference on Machine Learning,
                  {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                  10--15, 2018},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {4972--4981},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {http://proceedings.mlr.press/v80/trinh18a.html},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/TrinhDLL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 conference paper.
% {NeurIPS} is braced like the other venue acronyms in this file, and the date
% range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/nips/LiangNBLL18,
  author       = {Chen Liang and
                  Mohammad Norouzi and
                  Jonathan Berant and
                  Quoc V. Le and
                  Ni Lao},
  editor       = {Samy Bengio and
                  Hanna M. Wallach and
                  Hugo Larochelle and
                  Kristen Grauman and
                  Nicol{\`{o}} Cesa{-}Bianchi and
                  Roman Garnett},
  title        = {Memory Augmented Policy Optimization for Program Synthesis and Semantic
                  Parsing},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, {NeurIPS} 2018, December
                  3--8, 2018, Montr{\'{e}}al, Canada},
  pages        = {10015--10027},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/f4e369c0a468d3aeeda0593ba90b5e55-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/LiangNBLL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 conference paper.
% {DropBlock} is braced so sentence-casing styles keep the inner capital B.
% {NeurIPS} is braced like the other venue acronyms in this file, and the date
% range in booktitle uses "--" (en dash).
@inproceedings{DBLP:conf/nips/GhiasiLL18,
  author       = {Golnaz Ghiasi and
                  Tsung{-}Yi Lin and
                  Quoc V. Le},
  editor       = {Samy Bengio and
                  Hanna M. Wallach and
                  Hugo Larochelle and
                  Kristen Grauman and
                  Nicol{\`{o}} Cesa{-}Bianchi and
                  Roman Garnett},
  title        = {{DropBlock}: {A} regularization method for convolutional networks},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, {NeurIPS} 2018, December
                  3--8, 2018, Montr{\'{e}}al, Canada},
  pages        = {10750--10760},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/7edcfb2d8f6a659ef4cd1e6c9b6d7079-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/GhiasiLL18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1801.03526, listed under CoRR.
@article{DBLP:journals/corr/abs-1801-03526,
  author       = {Daniel A. Abolafia and
                  Mohammad Norouzi and
                  Quoc V. Le},
  title        = {Neural Program Synthesis with Priority Queue Training},
  journal      = {CoRR},
  volume       = {abs/1801.03526},
  year         = {2018},
  url          = {http://arxiv.org/abs/1801.03526},
  eprinttype   = {arXiv},
  eprint       = {1801.03526},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-03526.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1801-07860,
  author       = {Alvin Rajkomar and
                  Eyal Oren and
                  Kai Chen and
                  Andrew M. Dai and
                  Nissan Hajaj and
                  Peter J. Liu and
                  Xiaobing Liu and
                  Mimi Sun and
                  Patrik Sundberg and
                  Hector Yee and
                  Kun Zhang and
                  Gavin E. Duggan and
                  Gerardo Flores and
                  Michaela Hardt and
                  Jamie Irvine and
                  Quoc V. Le and
                  Kurt Litsch and
                  Jake Marcus and
                  Alexander Mossin and
                  Justin Tansuwan and
                  De Wang and
                  James Wexler and
                  Jimbo Wilson and
                  Dana Ludwig and
                  Samuel L. Volchenboum and
                  Katherine Chou and
                  Michael Pearson and
                  Srinivasan Madabushi and
                  Nigam H. Shah and
                  Atul J. Butte and
                  Michael D. Howell and
                  Claire Cui and
                  Greg Corrado and
                  Jeff Dean},
  title        = {Scalable and accurate deep learning for electronic health records},
  journal      = {CoRR},
  volume       = {abs/1801.07860},
  year         = {2018},
  url          = {http://arxiv.org/abs/1801.07860},
  eprinttype   = {arXiv},
  eprint       = {1801.07860},
  timestamp    = {Fri, 14 Apr 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-07860.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-01548,
  author       = {Esteban Real and
                  Alok Aggarwal and
                  Yanping Huang and
                  Quoc V. Le},
  title        = {Regularized Evolution for Image Classifier Architecture Search},
  journal      = {CoRR},
  volume       = {abs/1802.01548},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.01548},
  eprinttype   = {arXiv},
  eprint       = {1802.01548},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-01548.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-03268,
  author       = {Hieu Pham and
                  Melody Y. Guan and
                  Barret Zoph and
                  Quoc V. Le and
                  Jeff Dean},
  title        = {Efficient Neural Architecture Search via Parameter Sharing},
  journal      = {CoRR},
  volume       = {abs/1802.03268},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.03268},
  eprinttype   = {arXiv},
  eprint       = {1802.03268},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-03268.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The acronym RNNs is braced so sentence-casing styles do not print it as "rnns".
@article{DBLP:journals/corr/abs-1803-00144,
  author       = {Trieu H. Trinh and
                  Andrew M. Dai and
                  Thang Luong and
                  Quoc V. Le},
  title        = {Learning Longer-term Dependencies in {RNNs} with Auxiliary Losses},
  journal      = {CoRR},
  volume       = {abs/1803.00144},
  year         = {2018},
  url          = {http://arxiv.org/abs/1803.00144},
  eprinttype   = {arXiv},
  eprint       = {1803.00144},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1803-00144.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% QANet is braced so sentence-casing styles do not print it as "Qanet".
@article{DBLP:journals/corr/abs-1804-09541,
  author       = {Adams Wei Yu and
                  David Dohan and
                  Minh{-}Thang Luong and
                  Rui Zhao and
                  Kai Chen and
                  Mohammad Norouzi and
                  Quoc V. Le},
  title        = {{QANet}: Combining Local Convolution with Global Self-Attention for
                  Reading Comprehension},
  journal      = {CoRR},
  volume       = {abs/1804.09541},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.09541},
  eprinttype   = {arXiv},
  eprint       = {1804.09541},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-09541.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ImageNet is braced so sentence-casing styles do not print it as "imagenet".
@article{DBLP:journals/corr/abs-1805-08974,
  author       = {Simon Kornblith and
                  Jonathon Shlens and
                  Quoc V. Le},
  title        = {Do Better {ImageNet} Models Transfer Better?},
  journal      = {CoRR},
  volume       = {abs/1805.08974},
  year         = {2018},
  url          = {http://arxiv.org/abs/1805.08974},
  eprinttype   = {arXiv},
  eprint       = {1805.08974},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-08974.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AutoAugment is braced so sentence-casing styles do not print it as "Autoaugment".
@article{DBLP:journals/corr/abs-1805-09501,
  author       = {Ekin Dogus Cubuk and
                  Barret Zoph and
                  Dandelion Man{\'{e}} and
                  Vijay Vasudevan and
                  Quoc V. Le},
  title        = {{AutoAugment}: Learning Augmentation Policies from Data},
  journal      = {CoRR},
  volume       = {abs/1805.09501},
  year         = {2018},
  url          = {http://arxiv.org/abs/1805.09501},
  eprinttype   = {arXiv},
  eprint       = {1805.09501},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-09501.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-02847,
  author       = {Trieu H. Trinh and
                  Quoc V. Le},
  title        = {A Simple Method for Commonsense Reasoning},
  journal      = {CoRR},
  volume       = {abs/1806.02847},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.02847},
  eprinttype   = {arXiv},
  eprint       = {1806.02847},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-02847.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-09597,
  author       = {Samuel L. Smith and
                  Daniel Duckworth and
                  Quoc V. Le and
                  Jascha Sohl{-}Dickstein},
  title        = {Stochastic natural gradient descent draws posterior samples in function
                  space},
  journal      = {CoRR},
  volume       = {abs/1806.09597},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.09597},
  eprinttype   = {arXiv},
  eprint       = {1806.09597},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-09597.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-02322,
  author       = {Chen Liang and
                  Mohammad Norouzi and
                  Jonathan Berant and
                  Quoc V. Le and
                  Ni Lao},
  title        = {Memory Augmented Policy Optimization for Program Synthesis with Generalization},
  journal      = {CoRR},
  volume       = {abs/1807.02322},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.02322},
  eprinttype   = {arXiv},
  eprint       = {1807.02322},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-02322.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% MnasNet is braced so sentence-casing styles do not print it as "Mnasnet".
@article{DBLP:journals/corr/abs-1807-11626,
  author       = {Mingxing Tan and
                  Bo Chen and
                  Ruoming Pang and
                  Vijay Vasudevan and
                  Quoc V. Le},
  title        = {{MnasNet}: Platform-Aware Neural Architecture Search for Mobile},
  journal      = {CoRR},
  volume       = {abs/1807.11626},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.11626},
  eprinttype   = {arXiv},
  eprint       = {1807.11626},
  timestamp    = {Mon, 31 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-11626.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-02822,
  author       = {Maximilian Alber and
                  Irwan Bello and
                  Barret Zoph and
                  Pieter{-}Jan Kindermans and
                  Prajit Ramachandran and
                  Quoc V. Le},
  title        = {Backprop Evolution},
  journal      = {CoRR},
  volume       = {abs/1808.02822},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.02822},
  eprinttype   = {arXiv},
  eprint       = {1808.02822},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-02822.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-08370,
  author       = {Kevin Clark and
                  Minh{-}Thang Luong and
                  Christopher D. Manning and
                  Quoc V. Le},
  title        = {Semi-Supervised Sequence Modeling with Cross-View Training},
  journal      = {CoRR},
  volume       = {abs/1809.08370},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.08370},
  eprinttype   = {arXiv},
  eprint       = {1809.08370},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-08370.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; the NeurIPS 2018 version of the same paper is recorded as
% DBLP:conf/nips/GhiasiLL18.
% DropBlock is braced so sentence-casing styles do not print it as "Dropblock".
@article{DBLP:journals/corr/abs-1810-12890,
  author       = {Golnaz Ghiasi and
                  Tsung{-}Yi Lin and
                  Quoc V. Le},
  title        = {{DropBlock}: {A} regularization method for convolutional networks},
  journal      = {CoRR},
  volume       = {abs/1810.12890},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.12890},
  eprinttype   = {arXiv},
  eprint       = {1810.12890},
  timestamp    = {Thu, 08 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-12890.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% GPipe is braced so sentence-casing styles do not print it as "Gpipe".
@article{DBLP:journals/corr/abs-1811-06965,
  author       = {Yanping Huang and
                  Yonglong Cheng and
                  Dehao Chen and
                  HyoukJoong Lee and
                  Jiquan Ngiam and
                  Quoc V. Le and
                  Zhifeng Chen},
  title        = {{GPipe}: Efficient Training of Giant Neural Networks using Pipeline
                  Parallelism},
  journal      = {CoRR},
  volume       = {abs/1811.06965},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.06965},
  eprinttype   = {arXiv},
  eprint       = {1811.06965},
  timestamp    = {Sun, 25 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-06965.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-07056,
  author       = {Jiquan Ngiam and
                  Daiyi Peng and
                  Vijay Vasudevan and
                  Simon Kornblith and
                  Quoc V. Le and
                  Ruoming Pang},
  title        = {Domain Adaptive Transfer Learning with Specialist Models},
  journal      = {CoRR},
  volume       = {abs/1811.07056},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.07056},
  eprinttype   = {arXiv},
  eprint       = {1811.07056},
  timestamp    = {Sun, 25 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-07056.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% url and doi hold the raw identifier with plain underscores: url- and doi-aware
% styles typeset these fields verbatim, so a backslash-escaped underscore would
% leak a literal backslash into the printed text and the hyperlink target.
@article{DBLP:journals/tacl/JohnsonSLKWCTVW17,
  author       = {Melvin Johnson and
                  Mike Schuster and
                  Quoc V. Le and
                  Maxim Krikun and
                  Yonghui Wu and
                  Zhifeng Chen and
                  Nikhil Thorat and
                  Fernanda B. Vi{\'{e}}gas and
                  Martin Wattenberg and
                  Greg Corrado and
                  Macduff Hughes and
                  Jeffrey Dean},
  title        = {Google's Multilingual Neural Machine Translation System: Enabling
                  Zero-Shot Translation},
  journal      = {Trans. Assoc. Comput. Linguistics},
  volume       = {5},
  pages        = {339--351},
  year         = {2017},
  url          = {https://doi.org/10.1162/tacl_a_00065},
  doi          = {10.1162/TACL_A_00065},
  timestamp    = {Fri, 10 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tacl/JohnsonSLKWCTVW17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Freebase is braced so sentence-casing styles do not print it as "freebase".
@inproceedings{DBLP:conf/acl/LiangBLFL17,
  author       = {Chen Liang and
                  Jonathan Berant and
                  Quoc V. Le and
                  Kenneth D. Forbus and
                  Ni Lao},
  editor       = {Regina Barzilay and
                  Min{-}Yen Kan},
  title        = {Neural Symbolic Machines: Learning Semantic Parsers on {Freebase} with
                  Weak Supervision},
  booktitle    = {Proceedings of the 55th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume
                  1: Long Papers},
  pages        = {23--33},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/P17-1003},
  doi          = {10.18653/V1/P17-1003},
  timestamp    = {Fri, 06 Aug 2021 00:40:58 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LiangBLFL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2017 long paper (Volume 1). The arXiv preprint with the same title and
% authors is recorded separately as DBLP:journals/corr/YuLL17.
@inproceedings{DBLP:conf/acl/YuLL17,
  author       = {Adams Wei Yu and
                  Hongrae Lee and
                  Quoc V. Le},
  editor       = {Regina Barzilay and
                  Min{-}Yen Kan},
  title        = {Learning to Skim Text},
  booktitle    = {Proceedings of the 55th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume
                  1: Long Papers},
  pages        = {1880--1890},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/P17-1172},
  doi          = {10.18653/V1/P17-1172},
  timestamp    = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/YuLL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2017 conference paper. The url spells the paper id in lowercase
% (d17-1039) while the doi field is upper-cased; DOIs are case-insensitive,
% so both identify the same record.
@inproceedings{DBLP:conf/emnlp/RamachandranLL17,
  author       = {Prajit Ramachandran and
                  Peter J. Liu and
                  Quoc V. Le},
  editor       = {Martha Palmer and
                  Rebecca Hwa and
                  Sebastian Riedel},
  title        = {Unsupervised Pretraining for Sequence to Sequence Learning},
  booktitle    = {Proceedings of the 2017 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2017, Copenhagen, Denmark, September
                  9-11, 2017},
  pages        = {383--391},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/d17-1039},
  doi          = {10.18653/V1/D17-1039},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/RamachandranLL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 Workshop Track paper (see booktitle). The entry carries no pages
% or doi field; the OpenReview url is its only locator.
@inproceedings{DBLP:conf/iclr/BelloPL0B17,
  author       = {Irwan Bello and
                  Hieu Pham and
                  Quoc V. Le and
                  Mohammad Norouzi and
                  Samy Bengio},
  title        = {Neural Combinatorial Optimization with Reinforcement Learning},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=Bk9mxlSFx},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/BelloPL0B17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 Conference Track paper. The entry carries no pages or doi field;
% the OpenReview url is its only locator.
@inproceedings{DBLP:conf/iclr/ChanZLJ17,
  author       = {William Chan and
                  Yu Zhang and
                  Quoc V. Le and
                  Navdeep Jaitly},
  title        = {Latent Sequence Decompositions},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=SyQq185lg},
  timestamp    = {Tue, 09 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/ChanZLJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 Conference Track paper; no pages or doi field is recorded.
% HyperNetworks is braced so sentence-casing styles do not print it as
% "Hypernetworks".
@inproceedings{DBLP:conf/iclr/HaDL17,
  author       = {David Ha and
                  Andrew M. Dai and
                  Quoc V. Le},
  title        = {{HyperNetworks}},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=rkpACe1lx},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/HaDL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 Conference Track paper. The entry carries no pages or doi field;
% the OpenReview url is its only locator.
@inproceedings{DBLP:conf/iclr/NeelakantanLAMA17,
  author       = {Arvind Neelakantan and
                  Quoc V. Le and
                  Mart{\'{\i}}n Abadi and
                  Andrew McCallum and
                  Dario Amodei},
  title        = {Learning a Natural Language Interface with Neural Programmer},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=ry2YOrcge},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/NeelakantanLAMA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 Conference Track paper. The arXiv preprint with the same title and
% authors is recorded separately as DBLP:journals/corr/ShazeerMMDLHD17.
@inproceedings{DBLP:conf/iclr/ShazeerMMDLHD17,
  author       = {Noam Shazeer and
                  Azalia Mirhoseini and
                  Krzysztof Maziarz and
                  Andy Davis and
                  Quoc V. Le and
                  Geoffrey E. Hinton and
                  Jeff Dean},
  title        = {Outrageously Large Neural Networks: The Sparsely-Gated Mixture-of-Experts
                  Layer},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=B1ckMDqlg},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ShazeerMMDLHD17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 Conference Track paper. The entry carries no pages or doi field;
% the OpenReview url is its only locator.
@inproceedings{DBLP:conf/iclr/ZophL17,
  author       = {Barret Zoph and
                  Quoc V. Le},
  title        = {Neural Architecture Search with Reinforcement Learning},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=r1Ue8Hcxg},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZophL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2017 paper; volume 70 is the volume of the series field (Proceedings of
% Machine Learning Research). The arXiv preprint with the same title and
% authors is recorded separately as DBLP:journals/corr/abs-1709-07417.
@inproceedings{DBLP:conf/icml/BelloZVL17,
  author       = {Irwan Bello and
                  Barret Zoph and
                  Vijay Vasudevan and
                  Quoc V. Le},
  editor       = {Doina Precup and
                  Yee Whye Teh},
  title        = {Neural Optimizer Search with Reinforcement Learning},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {459--468},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {http://proceedings.mlr.press/v70/bello17a.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/BelloZVL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2017 paper; volume 70 is the volume of the series field (Proceedings of
% Machine Learning Research). The arXiv preprint with the same title and
% authors is recorded separately as DBLP:journals/corr/MirhoseiniPLSLZ17.
@inproceedings{DBLP:conf/icml/MirhoseiniPLSLZ17,
  author       = {Azalia Mirhoseini and
                  Hieu Pham and
                  Quoc V. Le and
                  Benoit Steiner and
                  Rasmus Larsen and
                  Yuefeng Zhou and
                  Naveen Kumar and
                  Mohammad Norouzi and
                  Samy Bengio and
                  Jeff Dean},
  editor       = {Doina Precup and
                  Yee Whye Teh},
  title        = {Device Placement Optimization with Reinforcement Learning},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {2430--2439},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {http://proceedings.mlr.press/v70/mirhoseini17a.html},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/MirhoseiniPLSLZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2017 paper; volume 70 is the volume of the series field (Proceedings of
% Machine Learning Research). The arXiv record with the same title is
% DBLP:journals/corr/RealMSSSLK17; that record lists seven authors (Jie Tan is
% absent) and spells the last author "Alex Kurakin".
@inproceedings{DBLP:conf/icml/RealMSSSTLK17,
  author       = {Esteban Real and
                  Sherry Moore and
                  Andrew Selle and
                  Saurabh Saxena and
                  Yutaka I. Leon{-}Suematsu and
                  Jie Tan and
                  Quoc V. Le and
                  Alexey Kurakin},
  editor       = {Doina Precup and
                  Yee Whye Teh},
  title        = {Large-Scale Evolution of Image Classifiers},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {2902--2911},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {http://proceedings.mlr.press/v70/real17a.html},
  timestamp    = {Tue, 04 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/RealMSSSTLK17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2017 paper. NOTE(review): DBLP:journals/corr/WangSSWWJYXCBLA17
% has the identical author list but a different title; presumably it is the
% arXiv preprint of this paper - confirm before treating the two as one work.
@inproceedings{DBLP:conf/interspeech/WangSSWWJYXCBLA17,
  author       = {Yuxuan Wang and
                  R. J. Skerry{-}Ryan and
                  Daisy Stanton and
                  Yonghui Wu and
                  Ron J. Weiss and
                  Navdeep Jaitly and
                  Zongheng Yang and
                  Ying Xiao and
                  Zhifeng Chen and
                  Samy Bengio and
                  Quoc V. Le and
                  Yannis Agiomyrgiannakis and
                  Rob Clark and
                  Rif A. Saurous},
  editor       = {Francisco Lacerda},
  title        = {Tacotron: Towards End-to-End Speech Synthesis},
  booktitle    = {Interspeech 2017, 18th Annual Conference of the International Speech
                  Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages        = {4006--4010},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-1452},
  doi          = {10.21437/INTERSPEECH.2017-1452},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/WangSSWWJYXCBLA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% WMT 2017 (Second Conference on Machine Translation) paper. The url spells the
% paper id in lowercase (w17-4712) while the doi field is upper-cased; DOIs are
% case-insensitive, so both identify the same record.
@inproceedings{DBLP:conf/wmt/BritzLP17,
  author       = {Denny Britz and
                  Quoc V. Le and
                  Reid Pryzant},
  editor       = {Ondrej Bojar and
                  Christian Buck and
                  Rajen Chatterjee and
                  Christian Federmann and
                  Yvette Graham and
                  Barry Haddow and
                  Matthias Huck and
                  Antonio Jimeno{-}Yepes and
                  Philipp Koehn and
                  Julia Kreutzer},
  title        = {Effective Domain Mixing for Neural Machine Translation},
  booktitle    = {Proceedings of the Second Conference on Machine Translation, {WMT}
                  2017, Copenhagen, Denmark, September 7-8, 2017},
  pages        = {118--126},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/w17-4712},
  doi          = {10.18653/V1/W17-4712},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/wmt/BritzLP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; the ICLR 2017 version with the same title and authors is
% recorded as DBLP:conf/iclr/ShazeerMMDLHD17.
@article{DBLP:journals/corr/ShazeerMMDLHD17,
  author       = {Noam Shazeer and
                  Azalia Mirhoseini and
                  Krzysztof Maziarz and
                  Andy Davis and
                  Quoc V. Le and
                  Geoffrey E. Hinton and
                  Jeff Dean},
  title        = {Outrageously Large Neural Networks: The Sparsely-Gated Mixture-of-Experts
                  Layer},
  journal      = {CoRR},
  volume       = {abs/1701.06538},
  year         = {2017},
  url          = {http://arxiv.org/abs/1701.06538},
  eprinttype   = {arXiv},
  eprint       = {1701.06538},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ShazeerMMDLHD17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record; the ICML 2017 record with the same title is
% DBLP:conf/icml/RealMSSSTLK17, which additionally lists Jie Tan and spells the
% last author "Alexey Kurakin".
@article{DBLP:journals/corr/RealMSSSLK17,
  author       = {Esteban Real and
                  Sherry Moore and
                  Andrew Selle and
                  Saurabh Saxena and
                  Yutaka I. Leon{-}Suematsu and
                  Quoc V. Le and
                  Alex Kurakin},
  title        = {Large-Scale Evolution of Image Classifiers},
  journal      = {CoRR},
  volume       = {abs/1703.01041},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.01041},
  eprinttype   = {arXiv},
  eprint       = {1703.01041},
  timestamp    = {Tue, 04 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RealMSSSLK17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BritzGLL17,
  author       = {Denny Britz and
                  Anna Goldie and
                  Minh{-}Thang Luong and
                  Quoc V. Le},
  title        = {Massive Exploration of Neural Machine Translation Architectures},
  journal      = {CoRR},
  volume       = {abs/1703.03906},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.03906},
  eprinttype   = {arXiv},
  eprint       = {1703.03906},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BritzGLL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv record. NOTE(review): DBLP:conf/interspeech/WangSSWWJYXCBLA17 has the
% identical author list but a different title; presumably the published version
% of this preprint - confirm before treating the two as one work.
@article{DBLP:journals/corr/WangSSWWJYXCBLA17,
  author       = {Yuxuan Wang and
                  R. J. Skerry{-}Ryan and
                  Daisy Stanton and
                  Yonghui Wu and
                  Ron J. Weiss and
                  Navdeep Jaitly and
                  Zongheng Yang and
                  Ying Xiao and
                  Zhifeng Chen and
                  Samy Bengio and
                  Quoc V. Le and
                  Yannis Agiomyrgiannakis and
                  Rob Clark and
                  Rif A. Saurous},
  title        = {Tacotron: {A} Fully End-to-End Text-To-Speech Synthesis Model},
  journal      = {CoRR},
  volume       = {abs/1703.10135},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.10135},
  eprinttype   = {arXiv},
  eprint       = {1703.10135},
  timestamp    = {Mon, 25 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/WangSSWWJYXCBLA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; the ACL 2017 version with the same title and authors is
% recorded as DBLP:conf/acl/YuLL17.
@article{DBLP:journals/corr/YuLL17,
  author       = {Adams Wei Yu and
                  Hongrae Lee and
                  Quoc V. Le},
  title        = {Learning to Skim Text},
  journal      = {CoRR},
  volume       = {abs/1704.06877},
  year         = {2017},
  url          = {http://arxiv.org/abs/1704.06877},
  eprinttype   = {arXiv},
  eprint       = {1704.06877},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/YuLL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; the ICML 2017 version with the same title and authors is
% recorded as DBLP:conf/icml/MirhoseiniPLSLZ17.
@article{DBLP:journals/corr/MirhoseiniPLSLZ17,
  author       = {Azalia Mirhoseini and
                  Hieu Pham and
                  Quoc V. Le and
                  Benoit Steiner and
                  Rasmus Larsen and
                  Yuefeng Zhou and
                  Naveen Kumar and
                  Mohammad Norouzi and
                  Samy Bengio and
                  Jeff Dean},
  title        = {Device Placement Optimization with Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1706.04972},
  year         = {2017},
  url          = {http://arxiv.org/abs/1706.04972},
  eprinttype   = {arXiv},
  eprint       = {1706.04972},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/MirhoseiniPLSLZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZophVSL17,
  author       = {Barret Zoph and
                  Vijay Vasudevan and
                  Jonathon Shlens and
                  Quoc V. Le},
  title        = {Learning Transferable Architectures for Scalable Image Recognition},
  journal      = {CoRR},
  volume       = {abs/1707.07012},
  year         = {2017},
  url          = {http://arxiv.org/abs/1707.07012},
  eprinttype   = {arXiv},
  eprint       = {1707.07012},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ZophVSL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint; the ICML 2017 version with the same title and authors is
% recorded as DBLP:conf/icml/BelloZVL17.
@article{DBLP:journals/corr/abs-1709-07417,
  author       = {Irwan Bello and
                  Barret Zoph and
                  Vijay Vasudevan and
                  Quoc V. Le},
  title        = {Neural Optimizer Search with Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1709.07417},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.07417},
  eprinttype   = {arXiv},
  eprint       = {1709.07417},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-07417.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1710-05941,
  author       = {Ramachandran, Prajit and
                  Zoph, Barret and
                  Le, Quoc V.},
  title        = {Searching for Activation Functions},
  journal      = {CoRR},
  volume       = {abs/1710.05941},
  year         = {2017},
  url          = {http://arxiv.org/abs/1710.05941},
  eprinttype   = {arXiv},
  eprint       = {1710.05941},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-05941.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1710-06451,
  author       = {Smith, Samuel L. and
                  Le, Quoc V.},
  title        = {A {Bayesian} Perspective on Generalization and Stochastic Gradient Descent},
  journal      = {CoRR},
  volume       = {abs/1710.06451},
  year         = {2017},
  url          = {http://arxiv.org/abs/1710.06451},
  eprinttype   = {arXiv},
  eprint       = {1710.06451},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-06451.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-00489,
  author       = {Smith, Samuel L. and
                  Kindermans, Pieter{-}Jan and
                  Le, Quoc V.},
  title        = {Don't Decay the Learning Rate, Increase the Batch Size},
  journal      = {CoRR},
  volume       = {abs/1711.00489},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.00489},
  eprinttype   = {arXiv},
  eprint       = {1711.00489},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-00489.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-02301,
  author       = {Raghu, Maithra and
                  Irpan, Alex and
                  Andreas, Jacob and
                  Kleinberg, Robert and
                  Le, Quoc V. and
                  Kleinberg, Jon M.},
  title        = {Can Deep Reinforcement Learning Solve {Erdos-Selfridge-Spencer} Games?},
  journal      = {CoRR},
  volume       = {abs/1711.02301},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.02301},
  eprinttype   = {arXiv},
  eprint       = {1711.02301},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-02301.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-02846,
  author       = {Cubuk, Ekin Dogus and
                  Zoph, Barret and
                  Schoenholz, Samuel S. and
                  Le, Quoc V.},
  title        = {Intriguing Properties of Adversarial Examples},
  journal      = {CoRR},
  volume       = {abs/1711.02846},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.02846},
  eprinttype   = {arXiv},
  eprint       = {1711.02846},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-02846.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ChanJLV16,
  author       = {Chan, William and
                  Jaitly, Navdeep and
                  Le, Quoc V. and
                  Vinyals, Oriol},
  title        = {Listen, attend and spell: {A} neural network for large vocabulary
                  conversational speech recognition},
  booktitle    = {2016 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages        = {4960--4964},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/ICASSP.2016.7472621},
  doi          = {10.1109/ICASSP.2016.7472621},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ChanJLV16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/JaitlyLVSSB16,
  author       = {Jaitly, Navdeep and
                  Le, Quoc V. and
                  Vinyals, Oriol and
                  Sutskever, Ilya and
                  Sussillo, David and
                  Bengio, Samy},
  editor       = {Lee, Daniel D. and
                  Sugiyama, Masashi and
                  von Luxburg, Ulrike and
                  Guyon, Isabelle and
                  Garnett, Roman},
  title        = {An Online Sequence-to-Sequence Model Using Partial Conditioning},
  booktitle    = {Advances in Neural Information Processing Systems 29: Annual Conference
                  on Neural Information Processing Systems 2016, December 5-10, 2016,
                  Barcelona, Spain},
  pages        = {5067--5075},
  year         = {2016},
  url          = {https://proceedings.neurips.cc/paper/2016/hash/312351bff07989769097660a56395065-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/JaitlyLVSSB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssw/Le16,
  author       = {Le, Quoc V.},
  title        = {End-to-end Learning for Text and Speech},
  booktitle    = {The 9th {ISCA} Speech Synthesis Workshop, Sunnyvale, CA, USA, 13-15
                  September 2016},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {http://www.isca-speech.org/archive/SSW\_2016/abstracts/ssw9\_KN3\_Le.html},
  timestamp    = {Mon, 28 Aug 2023 21:17:54 +0200},
  biburl       = {https://dblp.org/rec/conf/ssw/Le16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/LuongLSVK15,
  author       = {Luong, Minh{-}Thang and
                  Le, Quoc V. and
                  Sutskever, Ilya and
                  Vinyals, Oriol and
                  Kaiser, Lukasz},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Multi-task Sequence to Sequence Learning},
  booktitle    = {4th International Conference on Learning Representations, {ICLR} 2016,
                  San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year         = {2016},
  url          = {http://arxiv.org/abs/1511.06114},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LuongLSVK15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/NeelakantanLS15,
  author       = {Neelakantan, Arvind and
                  Le, Quoc V. and
                  Sutskever, Ilya},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Neural Programmer: Inducing Latent Programs with Gradient Descent},
  booktitle    = {4th International Conference on Learning Representations, {ICLR} 2016,
                  San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year         = {2016},
  url          = {http://arxiv.org/abs/1511.04834},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/NeelakantanLS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/WuSCLNMKCGMKSJL16,
  author       = {Wu, Yonghui and
                  Schuster, Mike and
                  Chen, Zhifeng and
                  Le, Quoc V. and
                  Norouzi, Mohammad and
                  Macherey, Wolfgang and
                  Krikun, Maxim and
                  Cao, Yuan and
                  Gao, Qin and
                  Macherey, Klaus and
                  Klingner, Jeff and
                  Shah, Apurva and
                  Johnson, Melvin and
                  Liu, Xiaobing and
                  Kaiser, Lukasz and
                  Gouws, Stephan and
                  Kato, Yoshikiyo and
                  Kudo, Taku and
                  Kazawa, Hideto and
                  Stevens, Keith and
                  Kurian, George and
                  Patil, Nishant and
                  Wang, Wei and
                  Young, Cliff and
                  Smith, Jason and
                  Riesa, Jason and
                  Rudnick, Alex and
                  Vinyals, Oriol and
                  Corrado, Greg and
                  Hughes, Macduff and
                  Dean, Jeffrey},
  title        = {Google's Neural Machine Translation System: Bridging the Gap between
                  Human and Machine Translation},
  journal      = {CoRR},
  volume       = {abs/1609.08144},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.08144},
  eprinttype   = {arXiv},
  eprint       = {1609.08144},
  timestamp    = {Thu, 14 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/WuSCLNMKCGMKSJL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HaDL16,
  author       = {Ha, David and
                  Dai, Andrew M. and
                  Le, Quoc V.},
  title        = {{HyperNetworks}},
  journal      = {CoRR},
  volume       = {abs/1609.09106},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.09106},
  eprinttype   = {arXiv},
  eprint       = {1609.09106},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HaDL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChanZLJ16,
  author       = {Chan, William and
                  Zhang, Yu and
                  Le, Quoc V. and
                  Jaitly, Navdeep},
  title        = {Latent Sequence Decompositions},
  journal      = {CoRR},
  volume       = {abs/1610.03035},
  year         = {2016},
  url          = {http://arxiv.org/abs/1610.03035},
  eprinttype   = {arXiv},
  eprint       = {1610.03035},
  timestamp    = {Tue, 09 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/ChanZLJ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LiangBLFL16,
  author       = {Liang, Chen and
                  Berant, Jonathan and
                  Le, Quoc V. and
                  Forbus, Kenneth D. and
                  Lao, Ni},
  title        = {Neural Symbolic Machines: Learning Semantic Parsers on {Freebase} with
                  Weak Supervision},
  journal      = {CoRR},
  volume       = {abs/1611.00020},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.00020},
  eprinttype   = {arXiv},
  eprint       = {1611.00020},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LiangBLFL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZophL16,
  author       = {Zoph, Barret and
                  Le, Quoc V.},
  title        = {Neural Architecture Search with Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1611.01578},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.01578},
  eprinttype   = {arXiv},
  eprint       = {1611.01578},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ZophL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/RamachandranLL16,
  author       = {Ramachandran, Prajit and
                  Liu, Peter J. and
                  Le, Quoc V.},
  title        = {Unsupervised Pretraining for Sequence to Sequence Learning},
  journal      = {CoRR},
  volume       = {abs/1611.02683},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.02683},
  eprinttype   = {arXiv},
  eprint       = {1611.02683},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RamachandranLL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/JohnsonSLKWCTVW16,
  author       = {Johnson, Melvin and
                  Schuster, Mike and
                  Le, Quoc V. and
                  Krikun, Maxim and
                  Wu, Yonghui and
                  Chen, Zhifeng and
                  Thorat, Nikhil and
                  Vi{\'{e}}gas, Fernanda B. and
                  Wattenberg, Martin and
                  Corrado, Greg and
                  Hughes, Macduff and
                  Dean, Jeffrey},
  title        = {Google's Multilingual Neural Machine Translation System: Enabling
                  Zero-Shot Translation},
  journal      = {CoRR},
  volume       = {abs/1611.04558},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.04558},
  eprinttype   = {arXiv},
  eprint       = {1611.04558},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/JohnsonSLKWCTVW16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/NeelakantanLAMA16,
  author       = {Neelakantan, Arvind and
                  Le, Quoc V. and
                  Abadi, Mart{\'{\i}}n and
                  McCallum, Andrew and
                  Amodei, Dario},
  title        = {Learning a Natural Language Interface with Neural Programmer},
  journal      = {CoRR},
  volume       = {abs/1611.08945},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.08945},
  eprinttype   = {arXiv},
  eprint       = {1611.08945},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/NeelakantanLAMA16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BelloPLNB16,
  author       = {Bello, Irwan and
                  Pham, Hieu and
                  Le, Quoc V. and
                  Norouzi, Mohammad and
                  Bengio, Samy},
  title        = {Neural Combinatorial Optimization with Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1611.09940},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.09940},
  eprinttype   = {arXiv},
  eprint       = {1611.09940},
  timestamp    = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/BelloPLNB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LiangBLFL16a,
  author       = {Liang, Chen and
                  Berant, Jonathan and
                  Le, Quoc V. and
                  Forbus, Kenneth D. and
                  Lao, Ni},
  title        = {Neural Symbolic Machines: Learning Semantic Parsers on {Freebase} with
                  Weak Supervision (Short Version)},
  journal      = {CoRR},
  volume       = {abs/1612.01197},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.01197},
  eprinttype   = {arXiv},
  eprint       = {1612.01197},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LiangBLFL16a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/LuongSLVZ15,
  author       = {Luong, Thang and
                  Sutskever, Ilya and
                  Le, Quoc V. and
                  Vinyals, Oriol and
                  Zaremba, Wojciech},
  title        = {Addressing the Rare Word Problem in Neural Machine Translation},
  booktitle    = {Proceedings of the 53rd Annual Meeting of the Association for Computational
                  Linguistics and the 7th International Joint Conference on Natural
                  Language Processing of the Asian Federation of Natural Language Processing,
                  {ACL} 2015, July 26-31, 2015, Beijing, China, Volume 1: Long Papers},
  pages        = {11--19},
  publisher    = {The Association for Computational Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.3115/v1/p15-1002},
  doi          = {10.3115/V1/P15-1002},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LuongSLVZ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DaiL15,
  author       = {Dai, Andrew M. and
                  Le, Quoc V.},
  editor       = {Cortes, Corinna and
                  Lawrence, Neil D. and
                  Lee, Daniel D. and
                  Sugiyama, Masashi and
                  Garnett, Roman},
  title        = {Semi-supervised Sequence Learning},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {3079--3087},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/7137debd45ae4d0ab9aa953017286b20-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/DaiL15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LeJH15,
  author       = {Le, Quoc V. and
                  Jaitly, Navdeep and
                  Hinton, Geoffrey E.},
  title        = {A Simple Way to Initialize Recurrent Networks of Rectified Linear
                  Units},
  journal      = {CoRR},
  volume       = {abs/1504.00941},
  year         = {2015},
  url          = {http://arxiv.org/abs/1504.00941},
  eprinttype   = {arXiv},
  eprint       = {1504.00941},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LeJH15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/VinyalsL15,
  author       = {Vinyals, Oriol and
                  Le, Quoc V.},
  title        = {A Neural Conversational Model},
  journal      = {CoRR},
  volume       = {abs/1506.05869},
  year         = {2015},
  url          = {http://arxiv.org/abs/1506.05869},
  eprinttype   = {arXiv},
  eprint       = {1506.05869},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/VinyalsL15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/DaiOL15,
  author       = {Dai, Andrew M. and
                  Olah, Christopher and
                  Le, Quoc V.},
  title        = {Document Embedding with Paragraph Vectors},
  journal      = {CoRR},
  volume       = {abs/1507.07998},
  year         = {2015},
  url          = {http://arxiv.org/abs/1507.07998},
  eprinttype   = {arXiv},
  eprint       = {1507.07998},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DaiOL15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChanJLV15,
  author       = {Chan, William and
                  Jaitly, Navdeep and
                  Le, Quoc V. and
                  Vinyals, Oriol},
  title        = {Listen, Attend and Spell},
  journal      = {CoRR},
  volume       = {abs/1508.01211},
  year         = {2015},
  url          = {http://arxiv.org/abs/1508.01211},
  eprinttype   = {arXiv},
  eprint       = {1508.01211},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChanJLV15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/DaiL15a,
  author       = {Dai, Andrew M. and
                  Le, Quoc V.},
  title        = {Semi-supervised Sequence Learning},
  journal      = {CoRR},
  volume       = {abs/1511.01432},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.01432},
  eprinttype   = {arXiv},
  eprint       = {1511.01432},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DaiL15a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/JaitlyLVSB15,
  author       = {Jaitly, Navdeep and
                  Le, Quoc V. and
                  Vinyals, Oriol and
                  Sutskever, Ilya and
                  Bengio, Samy},
  title        = {An Online Sequence-to-Sequence Model Using Partial Conditioning},
  journal      = {CoRR},
  volume       = {abs/1511.04868},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.04868},
  eprinttype   = {arXiv},
  eprint       = {1511.04868},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/JaitlyLVSB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/NeelakantanVLSK15,
  author       = {Neelakantan, Arvind and
                  Vilnis, Luke and
                  Le, Quoc V. and
                  Sutskever, Ilya and
                  Kaiser, Lukasz and
                  Kurach, Karol and
                  Martens, James},
  title        = {Adding Gradient Noise Improves Learning for Very Deep Networks},
  journal      = {CoRR},
  volume       = {abs/1511.06807},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.06807},
  eprinttype   = {arXiv},
  eprint       = {1511.06807},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/NeelakantanVLSK15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tacl/SocherKLMN14,
  author       = {Socher, Richard and
                  Karpathy, Andrej and
                  Le, Quoc V. and
                  Manning, Christopher D. and
                  Ng, Andrew Y.},
  title        = {Grounded Compositional Semantics for Finding and Describing Images
                  with Sentences},
  journal      = {Transactions of the Association for Computational Linguistics},
  volume       = {2},
  pages        = {207--218},
  year         = {2014},
  url          = {https://doi.org/10.1162/tacl\_a\_00177},
  doi          = {10.1162/TACL\_A\_00177},
  timestamp    = {Fri, 10 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tacl/SocherKLMN14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LeM14,
  author       = {Le, Quoc V. and
                  Mikolov, Tom{\'{a}}s},
  title        = {Distributed Representations of Sentences and Documents},
  booktitle    = {Proceedings of the 31st International Conference on Machine Learning,
                  {ICML} 2014, Beijing, China, 21-26 June 2014},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {32},
  pages        = {1188--1196},
  publisher    = {JMLR.org},
  year         = {2014},
  url          = {http://proceedings.mlr.press/v32/le14.html},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/LeM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SutskeverVL14,
  author       = {Sutskever, Ilya and
                  Vinyals, Oriol and
                  Le, Quoc V.},
  editor       = {Ghahramani, Zoubin and
                  Welling, Max and
                  Cortes, Corinna and
                  Lawrence, Neil D. and
                  Weinberger, Kilian Q.},
  title        = {Sequence to Sequence Learning with Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 27: Annual Conference
                  on Neural Information Processing Systems 2014, December 8-13 2014,
                  Montreal, Quebec, Canada},
  pages        = {3104--3112},
  year         = {2014},
  url          = {https://proceedings.neurips.cc/paper/2014/hash/a14ac55a4f27472c5d894ec1c3c743d2-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/SutskeverVL14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LeM14,
  author       = {Le, Quoc V. and
                  Mikolov, Tom{\'{a}}s},
  title        = {Distributed Representations of Sentences and Documents},
  journal      = {CoRR},
  volume       = {abs/1405.4053},
  year         = {2014},
  url          = {http://arxiv.org/abs/1405.4053},
  eprinttype   = {arXiv},
  eprint       = {1405.4053},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/LeM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LeSS14,
  author       = {Le, Quoc Viet and
                  Sarl{\'{o}}s, Tam{\'{a}}s and
                  Smola, Alexander Johannes},
  title        = {Fastfood: Approximate Kernel Expansions in Loglinear Time},
  journal      = {CoRR},
  volume       = {abs/1408.3060},
  year         = {2014},
  url          = {http://arxiv.org/abs/1408.3060},
  eprinttype   = {arXiv},
  eprint       = {1408.3060},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LeSS14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SutskeverVL14,
  author       = {Sutskever, Ilya and
                  Vinyals, Oriol and
                  Le, Quoc V.},
  title        = {Sequence to Sequence Learning with Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1409.3215},
  year         = {2014},
  url          = {http://arxiv.org/abs/1409.3215},
  eprinttype   = {arXiv},
  eprint       = {1409.3215},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SutskeverVL14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LuongSLVZ14,
  author       = {Luong, Thang and
                  Sutskever, Ilya and
                  Le, Quoc V. and
                  Vinyals, Oriol and
                  Zaremba, Wojciech},
  title        = {Addressing the Rare Word Problem in Neural Machine Translation},
  journal      = {CoRR},
  volume       = {abs/1410.8206},
  year         = {2014},
  url          = {http://arxiv.org/abs/1410.8206},
  eprinttype   = {arXiv},
  eprint       = {1410.8206},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LuongSLVZ14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@phdthesis{DBLP:phd/us/Le13a,
  author       = {Le, Quoc V.},
  title        = {Scalable feature learning},
  school       = {Stanford University, {USA}},
  year         = {2013},
  url          = {https://searchworks.stanford.edu/view/10164968},
  timestamp    = {Fri, 02 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/phd/us/Le13a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ZeilerRMMYLNSVDH13,
  author       = {Zeiler, Matthew D. and
                  Ranzato, Marc'Aurelio and
                  Monga, Rajat and
                  Mao, Mark Z. and
                  Yang, K. and
                  Le, Quoc Viet and
                  Nguyen, Patrick and
                  Senior, Andrew W. and
                  Vanhoucke, Vincent and
                  Dean, Jeffrey and
                  Hinton, Geoffrey E.},
  title        = {On rectified linear units for speech processing},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {3517--3521},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6638312},
  doi          = {10.1109/ICASSP.2013.6638312},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/ZeilerRMMYLNSVDH13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/Le13,
  author       = {Le, Quoc V.},
  title        = {Building high-level features using large scale unsupervised learning},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages        = {8595--8598},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/ICASSP.2013.6639343},
  doi          = {10.1109/ICASSP.2013.6639343},
  timestamp    = {Fri, 19 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/Le13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LeSS13,
  author       = {Le, Quoc V. and
                  Sarl{\'{o}}s, Tam{\'{a}}s and
                  Smola, Alexander J.},
  title        = {Fastfood - Computing {Hilbert} Space Expansions in loglinear time},
  booktitle    = {Proceedings of the 30th International Conference on Machine Learning,
                  {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {28},
  pages        = {244--252},
  publisher    = {JMLR.org},
  year         = {2013},
  url          = {http://proceedings.mlr.press/v28/le13.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LeSS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MikolovLS13,
  author       = {Mikolov, Tom{\'{a}}s and
                  Le, Quoc V. and
                  Sutskever, Ilya},
  title        = {Exploiting Similarities among Languages for Machine Translation},
  journal      = {CoRR},
  volume       = {abs/1309.4168},
  year         = {2013},
  url          = {http://arxiv.org/abs/1309.4168},
  eprinttype   = {arXiv},
  eprint       = {1309.4168},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/MikolovLS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BengioDEILRSS13,
  author       = {Bengio, Samy and
                  Dean, Jeffrey and
                  Erhan, Dumitru and
                  Ie, Eugene and
                  Le, Quoc V. and
                  Rabinovich, Andrew and
                  Shlens, Jonathon and
                  Singer, Yoram},
  title        = {Using Web Co-occurrence Statistics for Improving Image Categorization},
  journal      = {CoRR},
  volume       = {abs/1312.5697},
  year         = {2013},
  url          = {http://arxiv.org/abs/1312.5697},
  eprinttype   = {arXiv},
  eprint       = {1312.5697},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioDEILRSS13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LeRMDCCDN12,
  author       = {Le, Quoc V. and
                  Ranzato, Marc'Aurelio and
                  Monga, Rajat and
                  Devin, Matthieu and
                  Corrado, Greg and
                  Chen, Kai and
                  Dean, Jeffrey and
                  Ng, Andrew Y.},
  title        = {Building high-level features using large scale unsupervised learning},
  booktitle    = {Proceedings of the 29th International Conference on Machine Learning,
                  {ICML} 2012, Edinburgh, Scotland, UK, June 26 - July 1, 2012},
  publisher    = {icml.cc / Omnipress},
  year         = {2012},
  url          = {http://icml.cc/2012/papers/73.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LeRMDCCDN12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/MaasLOVNN12,
  author    = {Andrew L. Maas and
               Quoc V. Le and
               Tyler M. O'Neil and
               Oriol Vinyals and
               Patrick Nguyen and
               Andrew Y. Ng},
  title     = {Recurrent Neural Networks for Noise Reduction in Robust {ASR}},
  booktitle = {{INTERSPEECH} 2012, 13th Annual Conference of the International Speech Communication Association, Portland, Oregon, USA, September 9-13, 2012},
  pages     = {22--25},
  publisher = {{ISCA}},
  year      = {2012},
  url       = {https://doi.org/10.21437/Interspeech.2012-6},
  doi       = {10.21437/INTERSPEECH.2012-6},
  timestamp = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/MaasLOVNN12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isbi/LeHGSBP12,
  author    = {Quoc V. Le and
               Ju Han and
               Joe W. Gray and
               Paul T. Spellman and
               Alexander Borowsky and
               Bahram Parvin},
  title     = {Learning invariant features of tumor signatures},
  booktitle = {9th {IEEE} International Symposium on Biomedical Imaging: From Nano to Macro, {ISBI} 2012, May 2-5, 2012, Barcelona, Spain, Proceedings},
  pages     = {302--305},
  publisher = {{IEEE}},
  year      = {2012},
  url       = {https://doi.org/10.1109/ISBI.2012.6235544},
  doi       = {10.1109/ISBI.2012.6235544},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/isbi/LeHGSBP12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DeanCMCDLMRSTYN12,
  author    = {Jeffrey Dean and
               Greg Corrado and
               Rajat Monga and
               Kai Chen and
               Matthieu Devin and
               Quoc V. Le and
               Mark Z. Mao and
               Marc'Aurelio Ranzato and
               Andrew W. Senior and
               Paul A. Tucker and
               Ke Yang and
               Andrew Y. Ng},
  editor    = {Peter L. Bartlett and
               Fernando C. N. Pereira and
               Christopher J. C. Burges and
               L{\'{e}}on Bottou and
               Kilian Q. Weinberger},
  title     = {Large Scale Distributed Deep Networks},
  booktitle = {Advances in Neural Information Processing Systems 25: 26th Annual Conference on Neural Information Processing Systems 2012. Proceedings of a meeting held December 3-6, 2012, Lake Tahoe, Nevada, United States},
  pages     = {1232--1240},
  year      = {2012},
  url       = {https://proceedings.neurips.cc/paper/2012/hash/6aca97005c68f1206823815f66102863-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/DeanCMCDLMRSTYN12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/LeZYN11,
  author    = {Quoc V. Le and
               Will Y. Zou and
               Serena Y. Yeung and
               Andrew Y. Ng},
  title     = {Learning hierarchical invariant spatio-temporal features for action recognition with independent subspace analysis},
  booktitle = {The 24th {IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2011, Colorado Springs, CO, USA, 20-25 June 2011},
  pages     = {3361--3368},
  publisher = {{IEEE} Computer Society},
  year      = {2011},
  url       = {https://doi.org/10.1109/CVPR.2011.5995496},
  doi       = {10.1109/CVPR.2011.5995496},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cvpr/LeZYN11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NOTE(review): fourth author spelled "Abhik Lahiri" to match the published paper; the export had "Ahbik" - confirm against the PDF.
@inproceedings{DBLP:conf/icml/LeNCLPN11,
  author       = {Quoc V. Le and
                  Jiquan Ngiam and
                  Adam Coates and
                  Abhik Lahiri and
                  Bobby Prochnow and
                  Andrew Y. Ng},
  editor       = {Lise Getoor and
                  Tobias Scheffer},
  title        = {On optimization methods for deep learning},
  booktitle    = {Proceedings of the 28th International Conference on Machine Learning,
                  {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011},
  pages        = {265--272},
  publisher    = {Omnipress},
  year         = {2011},
  url          = {https://icml.cc/2011/papers/210\_icmlpaper.pdf},
  timestamp    = {Mon, 23 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/LeNCLPN11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LeKNN11,
  author    = {Quoc V. Le and
               Alexandre Karpenko and
               Jiquan Ngiam and
               Andrew Y. Ng},
  editor    = {John Shawe{-}Taylor and
               Richard S. Zemel and
               Peter L. Bartlett and
               Fernando C. N. Pereira and
               Kilian Q. Weinberger},
  title     = {{ICA} with Reconstruction Cost for Efficient Overcomplete Feature Learning},
  booktitle = {Advances in Neural Information Processing Systems 24: 25th Annual Conference on Neural Information Processing Systems 2011. Proceedings of a meeting held 12-14 December 2011, Granada, Spain},
  pages     = {1017--1025},
  year      = {2011},
  url       = {https://proceedings.neurips.cc/paper/2011/hash/233509073ed3432027d48b1a83f5fbd2-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/LeKNN11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1112-6209,
  author     = {Quoc V. Le and
                Rajat Monga and
                Matthieu Devin and
                Greg Corrado and
                Kai Chen and
                Marc'Aurelio Ranzato and
                Jeffrey Dean and
                Andrew Y. Ng},
  title      = {Building high-level features using large scale unsupervised learning},
  journal    = {CoRR},
  volume     = {abs/1112.6209},
  year       = {2011},
  url        = {http://arxiv.org/abs/1112.6209},
  eprinttype = {arXiv},
  eprint     = {1112.6209},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1112-6209.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/TeoVSL10,
  author    = {Choon Hui Teo and
               S. V. N. Vishwanathan and
               Alexander J. Smola and
               Quoc V. Le},
  title     = {Bundle Methods for Regularized Risk Minimization},
  journal   = {J. Mach. Learn. Res.},
  volume    = {11},
  pages     = {311--365},
  year      = {2010},
  url       = {https://dl.acm.org/doi/10.5555/1756006.1756016},
  doi       = {10.5555/1756006.1756016},
  timestamp = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/TeoVSL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/LeKKN10,
  author    = {Quoc V. Le and
               David Kamm and
               Arda F. Kara and
               Andrew Y. Ng},
  title     = {Learning to grasp objects with multiple contact points},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2010, Anchorage, Alaska, USA, 3-7 May 2010},
  pages     = {5062--5069},
  publisher = {{IEEE}},
  year      = {2010},
  url       = {https://doi.org/10.1109/ROBOT.2010.5509508},
  doi       = {10.1109/ROBOT.2010.5509508},
  timestamp = {Wed, 03 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/LeKKN10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/RaoLPQSN10,
  author    = {Deepak Rao and
               Quoc V. Le and
               Thanathorn Phoka and
               Morgan Quigley and
               Attawith Sudsang and
               Andrew Y. Ng},
  title     = {Grasping novel objects with depth segmentation},
  booktitle = {2010 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 18-22, 2010, Taipei, Taiwan},
  pages     = {2578--2585},
  publisher = {{IEEE}},
  year      = {2010},
  url       = {https://doi.org/10.1109/IROS.2010.5650493},
  doi       = {10.1109/IROS.2010.5650493},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/iros/RaoLPQSN10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/QuigleyBSPLN10,
  author    = {Morgan Quigley and
               Reuben D. Brewer and
               Sai Prashanth Soundararaj and
               Vijay Pradeep and
               Quoc V. Le and
               Andrew Y. Ng},
  title     = {Low-cost accelerometers for robotic manipulator perception},
  booktitle = {2010 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 18-22, 2010, Taipei, Taiwan},
  pages     = {6168--6174},
  publisher = {{IEEE}},
  year      = {2010},
  url       = {https://doi.org/10.1109/IROS.2010.5649804},
  doi       = {10.1109/IROS.2010.5649804},
  timestamp = {Mon, 22 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iros/QuigleyBSPLN10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "Chia, Daniel Jin hao" is in comma form so BibTeX does not read the lowercase "hao" as a von particle of the surname.
@inproceedings{DBLP:conf/nips/LeNCCKN10,
  author       = {Quoc V. Le and
                  Jiquan Ngiam and
                  Zhenghao Chen and
                  Chia, Daniel Jin hao and
                  Pang Wei Koh and
                  Andrew Y. Ng},
  editor       = {John D. Lafferty and
                  Christopher K. I. Williams and
                  John Shawe{-}Taylor and
                  Richard S. Zemel and
                  Aron Culotta},
  title        = {Tiled convolutional neural networks},
  booktitle    = {Advances in Neural Information Processing Systems 23: 24th Annual
                  Conference on Neural Information Processing Systems 2010. Proceedings
                  of a meeting held 6-9 December 2010, Vancouver, British Columbia,
                  Canada},
  pages        = {1279--1287},
  publisher    = {Curran Associates, Inc.},
  year         = {2010},
  url          = {https://proceedings.neurips.cc/paper/2010/hash/01f78be6f7cad02658508fe4616098a9-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/LeNCCKN10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/QuadriantoSCL09,
  author    = {Novi Quadrianto and
               Alexander J. Smola and
               Tib{\'{e}}rio S. Caetano and
               Quoc V. Le},
  title     = {Estimating Labels from Label Proportions},
  journal   = {J. Mach. Learn. Res.},
  volume    = {10},
  pages     = {2349--2374},
  year      = {2009},
  url       = {https://dl.acm.org/doi/10.5555/1577069.1755865},
  doi       = {10.5555/1577069.1755865},
  timestamp = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/QuadriantoSCL09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pami/CaetanoMCLS09,
  author    = {Tib{\'{e}}rio S. Caetano and
               Julian J. McAuley and
               Li Cheng and
               Quoc V. Le and
               Alexander J. Smola},
  title     = {Learning Graph Matching},
  journal   = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume    = {31},
  number    = {6},
  pages     = {1048--1058},
  year      = {2009},
  url       = {https://doi.org/10.1109/TPAMI.2009.28},
  doi       = {10.1109/TPAMI.2009.28},
  timestamp = {Mon, 07 Sep 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/pami/CaetanoMCLS09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/DoLF09,
  author    = {Chuong B. Do and
               Quoc V. Le and
               Chuan{-}Sheng Foo},
  editor    = {Andrea Pohoreckyj Danyluk and
               L{\'{e}}on Bottou and
               Michael L. Littman},
  title     = {Proximal regularization for online and batch learning},
  booktitle = {Proceedings of the 26th Annual International Conference on Machine Learning, {ICML} 2009, Montreal, Quebec, Canada, June 14-18, 2009},
  series    = {{ACM} International Conference Proceeding Series},
  volume    = {382},
  pages     = {257--264},
  publisher = {{ACM}},
  year      = {2009},
  url       = {https://doi.org/10.1145/1553374.1553407},
  doi       = {10.1145/1553374.1553407},
  timestamp = {Tue, 06 Nov 2018 16:58:29 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/DoLF09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% {3D} is braced so that sentence-casing bibliography styles do not lowercase it to "3d".
@inproceedings{DBLP:conf/icra/QuigleyBGKLWN09,
  author       = {Morgan Quigley and
                  Siddharth Batra and
                  Stephen Gould and
                  Ellen Klingbeil and
                  Quoc V. Le and
                  Ashley Wellman and
                  Andrew Y. Ng},
  title        = {High-accuracy {3D} sensing for mobile manipulation: Improving object
                  detection and door opening},
  booktitle    = {2009 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2009, Kobe, Japan, May 12-17, 2009},
  pages        = {2816--2822},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/ROBOT.2009.5152750},
  doi          = {10.1109/ROBOT.2009.5152750},
  timestamp    = {Mon, 22 May 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/QuigleyBGKLWN09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/LeN09,
  author    = {Quoc V. Le and
               Andrew Y. Ng},
  title     = {Joint calibration of multiple sensors},
  booktitle = {2009 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 11-15, 2009, St. Louis, MO, {USA}},
  pages     = {3651--3658},
  publisher = {{IEEE}},
  year      = {2009},
  url       = {https://doi.org/10.1109/IROS.2009.5354272},
  doi       = {10.1109/IROS.2009.5354272},
  timestamp = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl    = {https://dblp.org/rec/conf/iros/LeN09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/CoatesBLN09,
  author    = {Adam Coates and
               Paul Baumstarck and
               Quoc V. Le and
               Andrew Y. Ng},
  title     = {Scalable learning for object detection with {GPU} hardware},
  booktitle = {2009 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 11-15, 2009, St. Louis, MO, {USA}},
  pages     = {4287--4293},
  publisher = {{IEEE}},
  year      = {2009},
  url       = {https://doi.org/10.1109/IROS.2009.5354084},
  doi       = {10.1109/IROS.2009.5354084},
  timestamp = {Mon, 23 Jan 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iros/CoatesBLN09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GoodfellowLSLN09,
  author    = {Ian J. Goodfellow and
               Quoc V. Le and
               Andrew M. Saxe and
               Honglak Lee and
               Andrew Y. Ng},
  editor    = {Yoshua Bengio and
               Dale Schuurmans and
               John D. Lafferty and
               Christopher K. I. Williams and
               Aron Culotta},
  title     = {Measuring Invariances in Deep Networks},
  booktitle = {Advances in Neural Information Processing Systems 22: 23rd Annual Conference on Neural Information Processing Systems 2009. Proceedings of a meeting held 7-10 December 2009, Vancouver, British Columbia, Canada},
  pages     = {646--654},
  publisher = {Curran Associates, Inc.},
  year      = {2009},
  url       = {https://proceedings.neurips.cc/paper/2009/hash/428fca9bc1921c25c5121f9da7815cde-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/GoodfellowLSLN09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/QuadriantoSCL08,
  author    = {Novi Quadrianto and
               Alexander J. Smola and
               Tib{\'{e}}rio S. Caetano and
               Quoc V. Le},
  editor    = {William W. Cohen and
               Andrew McCallum and
               Sam T. Roweis},
  title     = {Estimating labels from label proportions},
  booktitle = {Machine Learning, Proceedings of the Twenty-Fifth International Conference {(ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  series    = {{ACM} International Conference Proceeding Series},
  volume    = {307},
  pages     = {776--783},
  publisher = {{ACM}},
  year      = {2008},
  url       = {https://doi.org/10.1145/1390156.1390254},
  doi       = {10.1145/1390156.1390254},
  timestamp = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/QuadriantoSCL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChapelleDLST08,
  author    = {Olivier Chapelle and
               Chuong B. Do and
               Quoc V. Le and
               Alexander J. Smola and
               Choon Hui Teo},
  editor    = {Daphne Koller and
               Dale Schuurmans and
               Yoshua Bengio and
               L{\'{e}}on Bottou},
  title     = {Tighter Bounds for Structured Estimation},
  booktitle = {Advances in Neural Information Processing Systems 21, Proceedings of the Twenty-Second Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 8-11, 2008},
  pages     = {281--288},
  publisher = {Curran Associates, Inc.},
  year      = {2008},
  url       = {https://proceedings.neurips.cc/paper/2008/hash/6bc24fc1ab650b25b4114e93a98f1eba-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/ChapelleDLST08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-0806-2890,
  author     = {Tib{\'{e}}rio S. Caetano and
                Julian J. McAuley and
                Li Cheng and
                Quoc V. Le and
                Alexander J. Smola},
  title      = {Learning Graph Matching},
  journal    = {CoRR},
  volume     = {abs/0806.2890},
  year       = {2008},
  url        = {http://arxiv.org/abs/0806.2890},
  eprinttype = {arXiv},
  eprint     = {0806.2890},
  timestamp  = {Mon, 07 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-0806-2890.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccv/CaetanoCLS07,
  author    = {Tib{\'{e}}rio S. Caetano and
               Li Cheng and
               Quoc V. Le and
               Alexander J. Smola},
  title     = {Learning Graph Matching},
  booktitle = {{IEEE} 11th International Conference on Computer Vision, {ICCV} 2007, Rio de Janeiro, Brazil, October 14-20, 2007},
  pages     = {1--8},
  publisher = {{IEEE} Computer Society},
  year      = {2007},
  url       = {https://doi.org/10.1109/ICCV.2007.4408838},
  doi       = {10.1109/ICCV.2007.4408838},
  timestamp = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iccv/CaetanoCLS07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/kdd/TeoSVL07,
  author    = {Choon Hui Teo and
               Alexander J. Smola and
               S. V. N. Vishwanathan and
               Quoc V. Le},
  editor    = {Pavel Berkhin and
               Rich Caruana and
               Xindong Wu},
  title     = {A scalable modular convex solver for regularized risk minimization},
  booktitle = {Proceedings of the 13th {ACM} {SIGKDD} International Conference on Knowledge Discovery and Data Mining, San Jose, California, USA, August 12-15, 2007},
  pages     = {727--736},
  publisher = {{ACM}},
  year      = {2007},
  url       = {https://doi.org/10.1145/1281192.1281270},
  doi       = {10.1145/1281192.1281270},
  timestamp = {Fri, 10 Mar 2023 14:55:31 +0100},
  biburl    = {https://dblp.org/rec/conf/kdd/TeoSVL07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SmolaVL07,
  author    = {Alexander J. Smola and
               S. V. N. Vishwanathan and
               Quoc V. Le},
  editor    = {John C. Platt and
               Daphne Koller and
               Yoram Singer and
               Sam T. Roweis},
  title     = {Bundle Methods for Machine Learning},
  booktitle = {Advances in Neural Information Processing Systems 20, Proceedings of the Twenty-First Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages     = {1377--1384},
  publisher = {Curran Associates, Inc.},
  year      = {2007},
  url       = {https://proceedings.neurips.cc/paper/2007/hash/26337353b7962f533d78c762373b3318-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/SmolaVL07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The title dash is written as "--" (en dash) rather than a spaced hyphen.
@inproceedings{DBLP:conf/nips/WeimerKLS07,
  author       = {Markus Weimer and
                  Alexandros Karatzoglou and
                  Quoc V. Le and
                  Alexander J. Smola},
  editor       = {John C. Platt and
                  Daphne Koller and
                  Yoram Singer and
                  Sam T. Roweis},
  title        = {{COFI} {RANK} -- Maximum Margin Matrix Factorization for Collaborative
                  Ranking},
  booktitle    = {Advances in Neural Information Processing Systems 20, Proceedings
                  of the Twenty-First Annual Conference on Neural Information Processing
                  Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages        = {1593--1600},
  publisher    = {Curran Associates, Inc.},
  year         = {2007},
  url          = {https://proceedings.neurips.cc/paper/2007/hash/f76a89f0cb91bc419542ce9fa43902dc-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/WeimerKLS07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-0704-3359,
  author     = {Quoc V. Le and
                Alexander J. Smola},
  title      = {Direct Optimization of Ranking Measures},
  journal    = {CoRR},
  volume     = {abs/0704.3359},
  year       = {2007},
  url        = {http://arxiv.org/abs/0704.3359},
  eprinttype = {arXiv},
  eprint     = {0704.3359},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-0704-3359.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/TakeuchiLSS06,
  author    = {Ichiro Takeuchi and
               Quoc V. Le and
               Tim D. Sears and
               Alexander J. Smola},
  title     = {Nonparametric Quantile Estimation},
  journal   = {J. Mach. Learn. Res.},
  volume    = {7},
  pages     = {1231--1264},
  year      = {2006},
  url       = {http://jmlr.org/papers/v7/takeuchi06a.html},
  timestamp = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/TakeuchiLSS06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% {Gaussian} is braced so that sentence-casing bibliography styles keep the capital of the proper adjective.
@inproceedings{DBLP:conf/ecml/LeSGA06,
  author       = {Quoc V. Le and
                  Alexander J. Smola and
                  Thomas G{\"{a}}rtner and
                  Yasemin Altun},
  editor       = {Johannes F{\"{u}}rnkranz and
                  Tobias Scheffer and
                  Myra Spiliopoulou},
  title        = {Transductive {Gaussian} Process Regression with Automatic Model Selection},
  booktitle    = {Machine Learning: {ECML} 2006, 17th European Conference on Machine
                  Learning, Berlin, Germany, September 18-22, 2006, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4212},
  pages        = {306--317},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/11871842\_31},
  doi          = {10.1007/11871842\_31},
  timestamp    = {Thu, 05 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ecml/LeSGA06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LeSG06,
  author    = {Quoc V. Le and
               Alexander J. Smola and
               Thomas G{\"{a}}rtner},
  editor    = {William W. Cohen and
               Andrew W. Moore},
  title     = {Simpler knowledge-based support vector machines},
  booktitle = {Machine Learning, Proceedings of the Twenty-Third International Conference {(ICML} 2006), Pittsburgh, Pennsylvania, USA, June 25-29, 2006},
  series    = {{ACM} International Conference Proceeding Series},
  volume    = {148},
  pages     = {521--528},
  publisher = {{ACM}},
  year      = {2006},
  url       = {https://doi.org/10.1145/1143844.1143910},
  doi       = {10.1145/1143844.1143910},
  timestamp = {Thu, 05 Dec 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/LeSG06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BurgesRL06,
  author    = {Christopher J. C. Burges and
               Robert Ragno and
               Quoc Viet Le},
  editor    = {Bernhard Sch{\"{o}}lkopf and
               John C. Platt and
               Thomas Hofmann},
  title     = {Learning to Rank with Nonsmooth Cost Functions},
  booktitle = {Advances in Neural Information Processing Systems 19, Proceedings of the Twentieth Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 4-7, 2006},
  pages     = {193--200},
  publisher = {{MIT} Press},
  year      = {2006},
  url       = {https://proceedings.neurips.cc/paper/2006/hash/af44c4c56f385c43f2529f9b1b018f6a-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/BurgesRL06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% {Gaussian} is braced against sentence-casing styles; editor "De Raedt, Luc" is in comma form so the two-word surname is not split.
@inproceedings{DBLP:conf/icml/LeSC05,
  author       = {Quoc V. Le and
                  Alexander J. Smola and
                  St{\'{e}}phane Canu},
  editor       = {De Raedt, Luc and
                  Stefan Wrobel},
  title        = {Heteroscedastic {Gaussian} process regression},
  booktitle    = {Machine Learning, Proceedings of the Twenty-Second International Conference
                  {(ICML} 2005), Bonn, Germany, August 7-11, 2005},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {119},
  pages        = {489--496},
  publisher    = {{ACM}},
  year         = {2005},
  url          = {https://doi.org/10.1145/1102351.1102413},
  doi          = {10.1145/1102351.1102413},
  timestamp    = {Wed, 25 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LeSC05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GartnerLBSV05,
  author    = {Thomas G{\"{a}}rtner and
               Quoc V. Le and
               Simon Burton and
               Alexander J. Smola and
               S. V. N. Vishwanathan},
  title     = {Large-Scale Multiclass Transduction},
  booktitle = {Advances in Neural Information Processing Systems 18 [Neural Information Processing Systems, {NIPS} 2005, December 5-8, 2005, Vancouver, British Columbia, Canada]},
  pages     = {411--418},
  year      = {2005},
  url       = {https://proceedings.neurips.cc/paper/2005/hash/445e1050156c6ae8c082a8422bb7dfc0-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/GartnerLBSV05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/vldb/McCannALNVD05,
  author    = {Robert McCann and
               Bedoor K. AlShebli and
               Quoc Le and
               Hoa Nguyen and
               Long H. Vu and
               AnHai Doan},
  editor    = {Klemens B{\"{o}}hm and
               Christian S. Jensen and
               Laura M. Haas and
               Martin L. Kersten and
               Per{-}{\AA}ke Larson and
               Beng Chin Ooi},
  title     = {Mapping Maintenance for Data Integration Systems},
  booktitle = {Proceedings of the 31st International Conference on Very Large Data Bases, Trondheim, Norway, August 30 - September 2, 2005},
  pages     = {1018--1030},
  publisher = {{ACM}},
  year      = {2005},
  url       = {http://www.vldb.org/archives/website/2005/program/paper/fri/p1018-mccann.pdf},
  timestamp = {Thu, 03 Dec 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/vldb/McCannALNVD05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
A service of Schloss Dagstuhl - Leibniz Center for Informatics