Stop the war!
Остановите войну!
for scientists:
default search action
BibTeX records: Quoc V. Le
% Journal article. The journal name is stored in full; abbreviation is left to the bibliography style.
@article{DBLP:journals/nature/TrinhWLHL24,
  author     = {Trieu H. Trinh and Yuhuai Wu and Quoc V. Le and He He and Thang Luong},
  title      = {Solving olympiad geometry without human demonstrations},
  journal    = {Nature},
  volume     = {625},
  number     = {7995},
  pages      = {476--482},
  year       = {2024},
  url        = {https://doi.org/10.1038/s41586-023-06747-5},
  doi        = {10.1038/S41586-023-06747-5},
  timestamp  = {Fri, 08 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/nature/TrinhWLHL24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2402.03620. The method name Self-Discover is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2402-03620,
  author     = {Pei Zhou and Jay Pujara and Xiang Ren and Xinyun Chen and Heng{-}Tze Cheng and Quoc V. Le and Ed H. Chi and Denny Zhou and Swaroop Mishra and Huaixiu Steven Zheng},
  title      = {{Self-Discover}: Large Language Models Self-Compose Reasoning Structures},
  journal    = {CoRR},
  volume     = {abs/2402.03620},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.03620},
  doi        = {10.48550/ARXIV.2402.03620},
  eprinttype = {arXiv},
  eprint     = {2402.03620},
  timestamp  = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-03620.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (Neurocomputing, volume 555); the pages field holds a single number, not a range.
@article{DBLP:journals/ijon/PhamDGKLYYCLWTL23,
  author     = {Hieu Pham and Zihang Dai and Golnaz Ghiasi and Kenji Kawaguchi and Hanxiao Liu and Adams Wei Yu and Jiahui Yu and Yi{-}Ting Chen and Minh{-}Thang Luong and Yonghui Wu and Mingxing Tan and Quoc V. Le},
  title      = {Combined scaling for zero-shot transfer learning},
  journal    = {Neurocomputing},
  volume     = {555},
  pages      = {126658},
  year       = {2023},
  url        = {https://doi.org/10.1016/j.neucom.2023.126658},
  doi        = {10.1016/J.NEUCOM.2023.126658},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ijon/PhamDGKLYYCLWTL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Findings of ACL 2023 paper. BIG-Bench is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/acl/SuzgunSSGTCCLCZ23,
  author     = {Mirac Suzgun and Nathan Scales and Nathanael Sch{\"{a}}rli and Sebastian Gehrmann and Yi Tay and Hyung Won Chung and Aakanksha Chowdhery and Quoc V. Le and Ed H. Chi and Denny Zhou and Jason Wei},
  editor     = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title      = {Challenging {BIG-Bench} Tasks and Whether Chain-of-Thought Can Solve Them},
  booktitle  = {Findings of the Association for Computational Linguistics: {ACL} 2023, Toronto, Canada, July 9-14, 2023},
  pages      = {13003--13051},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.findings-acl.824},
  doi        = {10.18653/V1/2023.FINDINGS-ACL.824},
  timestamp  = {Mon, 29 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/SuzgunSSGTCCLCZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ASPLOS 2023 paper.
% NOTE(review): the editor surname is entered as the compound Enright Jerger in comma form, so BibTeX does not
% treat Enright as a given name; confirm against the proceedings front matter.
@inproceedings{DBLP:conf/asplos/LiACCGHLLLLLLNP23,
  author     = {Sheng Li and Garrett Andersen and Tao Chen and Liqun Cheng and Julian Grady and Da Huang and Quoc V. Le and Andrew Li and Xin Li and Yang Li and Chen Liang and Yifeng Lu and Yun Ni and Ruoming Pang and Mingxing Tan and Martin Wicke and Gang Wu and Shengqi Zhu and Parthasarathy Ranganathan and Norman P. Jouppi},
  editor     = {Tor M. Aamodt and {Enright Jerger}, Natalie D. and Michael M. Swift},
  title      = {Hyperscale Hardware Optimized Neural Architecture Search},
  booktitle  = {Proceedings of the 28th {ACM} International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 3, {ASPLOS} 2023, Vancouver, BC, Canada, March 25-29, 2023},
  pages      = {343--358},
  publisher  = {{ACM}},
  year       = {2023},
  url        = {https://doi.org/10.1145/3582016.3582049},
  doi        = {10.1145/3582016.3582049},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/asplos/LiACCGHLLLLLLNP23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2023 paper; an arXiv record with the same title is keyed DBLP:journals/corr/abs-2305-08298.
@inproceedings{DBLP:conf/emnlp/WeiHLCHTCLZ0L23,
  author     = {Jerry W. Wei and Le Hou and Andrew K. Lampinen and Xiangning Chen and Da Huang and Yi Tay and Xinyun Chen and Yifeng Lu and Denny Zhou and Tengyu Ma and Quoc V. Le},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {Symbol tuning improves in-context learning in language models},
  booktitle  = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages      = {968--979},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://aclanthology.org/2023.emnlp-main.61},
  timestamp  = {Wed, 13 Dec 2023 17:20:20 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/WeiHLCHTCLZ0L23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2023 paper; the percent sign in the title is escaped for LaTeX.
@inproceedings{DBLP:conf/emnlp/TayWC0SSGZRCZMP23,
  author     = {Yi Tay and Jason Wei and Hyung Won Chung and Vinh Q. Tran and David R. So and Siamak Shakeri and Xavier Garcia and Huaixiu Steven Zheng and Jinfeng Rao and Aakanksha Chowdhery and Denny Zhou and Donald Metzler and Slav Petrov and Neil Houlsby and Quoc V. Le and Mostafa Dehghani},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {Transcending Scaling Laws with 0.1{\%} Extra Compute},
  booktitle  = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages      = {1471--1486},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://aclanthology.org/2023.emnlp-main.91},
  timestamp  = {Thu, 14 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/TayWC0SSGZRCZMP23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2023 paper. U-Shaped is brace-protected so the letter U stays capitalised under sentence-casing styles.
@inproceedings{DBLP:conf/emnlp/WeiKTL23,
  author     = {Jason Wei and Najoung Kim and Yi Tay and Quoc V. Le},
  editor     = {Houda Bouamor and Juan Pino and Kalika Bali},
  title      = {Inverse Scaling Can Become {U-Shaped}},
  booktitle  = {Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2023, Singapore, December 6-10, 2023},
  pages      = {15580--15591},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://aclanthology.org/2023.emnlp-main.963},
  timestamp  = {Thu, 14 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/WeiKTL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2023 paper; no pages or DOI are recorded, only the OpenReview URL.
@inproceedings{DBLP:conf/iclr/0002WSLCNCZ23,
  author     = {Xuezhi Wang and Jason Wei and Dale Schuurmans and Quoc V. Le and Ed H. Chi and Sharan Narang and Aakanksha Chowdhery and Denny Zhou},
  title      = {Self-Consistency Improves Chain of Thought Reasoning in Language Models},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/pdf?id=1PL1NIMMrw},
  timestamp  = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/0002WSLCNCZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2023 paper; no pages or DOI are recorded, only the OpenReview URL.
@inproceedings{DBLP:conf/iclr/ZhouSHWS0SCBLC23,
  author     = {Denny Zhou and Nathanael Sch{\"{a}}rli and Le Hou and Jason Wei and Nathan Scales and Xuezhi Wang and Dale Schuurmans and Claire Cui and Olivier Bousquet and Quoc V. Le and Ed H. Chi},
  title      = {Least-to-Most Prompting Enables Complex Reasoning in Large Language Models},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/pdf?id=WZH7099tgfM},
  timestamp  = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ZhouSHWS0SCBLC23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2023 paper (PMLR volume 202). Flan is brace-protected so sentence-casing styles keep it capitalised.
% An arXiv record with the same title is keyed DBLP:journals/corr/abs-2301-13688.
@inproceedings{DBLP:conf/icml/LongpreHVWCTZLZ23,
  author     = {Shayne Longpre and Le Hou and Tu Vu and Albert Webson and Hyung Won Chung and Yi Tay and Denny Zhou and Quoc V. Le and Barret Zoph and Jason Wei and Adam Roberts},
  editor     = {Andreas Krause and Emma Brunskill and Kyunghyun Cho and Barbara Engelhardt and Sivan Sabato and Jonathan Scarlett},
  title      = {The {Flan} Collection: Designing Data and Methods for Effective Instruction Tuning},
  booktitle  = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {22631--22648},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/longpre23a.html},
  timestamp  = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LongpreHVWCTZLZ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2023 paper (PMLR volume 202); an arXiv record with the same title is keyed DBLP:journals/corr/abs-2306-00008.
@inproceedings{DBLP:conf/icml/ZhouDHPLHSSDLCL23,
  author     = {Yanqi Zhou and Nan Du and Yanping Huang and Daiyi Peng and Chang Lan and Da Huang and Siamak Shakeri and David R. So and Andrew M. Dai and Yifeng Lu and Zhifeng Chen and Quoc V. Le and Claire Cui and James Laudon and Jeff Dean},
  editor     = {Andreas Krause and Emma Brunskill and Kyunghyun Cho and Barbara Engelhardt and Sivan Sabato and Jonathan Scarlett},
  title      = {Brainformers: Trading Simplicity for Efficiency},
  booktitle  = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {42531--42542},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/zhou23c.html},
  timestamp  = {Fri, 01 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/ZhouDHPLHSSDLCL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 paper; an arXiv record with the same title is keyed DBLP:journals/corr/abs-2302-06675.
% The underscore in the url is backslash-escaped as exported.
@inproceedings{DBLP:conf/nips/ChenLHRW0DLHLL23,
  author     = {Xiangning Chen and Chen Liang and Da Huang and Esteban Real and Kaiyuan Wang and Hieu Pham and Xuanyi Dong and Thang Luong and Cho{-}Jui Hsieh and Yifeng Lu and Quoc V. Le},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {Symbolic Discovery of Optimization Algorithms},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/9a39b4925e35cf447ccba8757137d84f-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/ChenLHRW0DLHLL23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 paper. DoReMi is brace-protected so sentence-casing styles keep its mixed capitalisation.
% An arXiv record with the same title is keyed DBLP:journals/corr/abs-2305-10429.
@inproceedings{DBLP:conf/nips/Xie0DDLLLL0Y23,
  author     = {Sang Michael Xie and Hieu Pham and Xuanyi Dong and Nan Du and Hanxiao Liu and Yifeng Lu and Percy Liang and Quoc V. Le and Tengyu Ma and Adams Wei Yu},
  editor     = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title      = {{DoReMi}: Optimizing Data Mixtures Speeds Up Language Model Pretraining},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/dcba6be91359358c2355cd920da3fcbd-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/Xie0DDLLLL0Y23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2301.13688. Flan is brace-protected so sentence-casing styles keep it capitalised.
% A conference record with the same title is keyed DBLP:conf/icml/LongpreHVWCTZLZ23.
@article{DBLP:journals/corr/abs-2301-13688,
  author     = {Shayne Longpre and Le Hou and Tu Vu and Albert Webson and Hyung Won Chung and Yi Tay and Denny Zhou and Quoc V. Le and Barret Zoph and Jason Wei and Adam Roberts},
  title      = {The {Flan} Collection: Designing Data and Methods for Effective Instruction Tuning},
  journal    = {CoRR},
  volume     = {abs/2301.13688},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.13688},
  doi        = {10.48550/ARXIV.2301.13688},
  eprinttype = {arXiv},
  eprint     = {2301.13688},
  timestamp  = {Thu, 02 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-13688.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2302.01918. PyGlove is brace-protected, like ML, so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2302-01918,
  author     = {Daiyi Peng and Xuanyi Dong and Esteban Real and Yifeng Lu and Quoc V. Le},
  title      = {{PyGlove}: Efficiently Exchanging {ML} Ideas as Code},
  journal    = {CoRR},
  volume     = {abs/2302.01918},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.01918},
  doi        = {10.48550/ARXIV.2302.01918},
  eprinttype = {arXiv},
  eprint     = {2302.01918},
  timestamp  = {Fri, 10 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-01918.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2302.03917. Noise2Music is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2302-03917,
  author     = {Qingqing Huang and Daniel S. Park and Tao Wang and Timo I. Denk and Andy Ly and Nanxin Chen and Zhengdong Zhang and Zhishuai Zhang and Jiahui Yu and Christian Havn{\o} Frank and Jesse H. Engel and Quoc V. Le and William Chan and Wei Han},
  title      = {{Noise2Music}: Text-conditioned Music Generation with Diffusion Models},
  journal    = {CoRR},
  volume     = {abs/2302.03917},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.03917},
  doi        = {10.48550/ARXIV.2302.03917},
  eprinttype = {arXiv},
  eprint     = {2302.03917},
  timestamp  = {Fri, 10 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-03917.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2302.05433, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2302-05433,
  author     = {Ryan Gillard and Stephen Jonany and Yingjie Miao and Michael Munn and Connal de Souza and Jonathan Dungay and Chen Liang and David R. So and Quoc V. Le and Esteban Real},
  title      = {Unified Functional Hashing in Automatic Machine Learning},
  journal    = {CoRR},
  volume     = {abs/2302.05433},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.05433},
  doi        = {10.48550/ARXIV.2302.05433},
  eprinttype = {arXiv},
  eprint     = {2302.05433},
  timestamp  = {Mon, 13 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-05433.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2302.06675; a conference record with the same title is keyed DBLP:conf/nips/ChenLHRW0DLHLL23.
@article{DBLP:journals/corr/abs-2302-06675,
  author     = {Xiangning Chen and Chen Liang and Da Huang and Esteban Real and Kaiyuan Wang and Yao Liu and Hieu Pham and Xuanyi Dong and Thang Luong and Cho{-}Jui Hsieh and Yifeng Lu and Quoc V. Le},
  title      = {Symbolic Discovery of Optimization Algorithms},
  journal    = {CoRR},
  volume     = {abs/2302.06675},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.06675},
  doi        = {10.48550/ARXIV.2302.06675},
  eprinttype = {arXiv},
  eprint     = {2302.06675},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-06675.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2305.08298; a conference record with the same title is keyed DBLP:conf/emnlp/WeiHLCHTCLZ0L23.
@article{DBLP:journals/corr/abs-2305-08298,
  author     = {Jerry W. Wei and Le Hou and Andrew K. Lampinen and Xiangning Chen and Da Huang and Yi Tay and Xinyun Chen and Yifeng Lu and Denny Zhou and Tengyu Ma and Quoc V. Le},
  title      = {Symbol tuning improves in-context learning in language models},
  journal    = {CoRR},
  volume     = {abs/2305.08298},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.08298},
  doi        = {10.48550/ARXIV.2305.08298},
  eprinttype = {arXiv},
  eprint     = {2305.08298},
  timestamp  = {Thu, 01 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-08298.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2305.10429. DoReMi is brace-protected so sentence-casing styles keep its mixed capitalisation.
% A conference record with the same title is keyed DBLP:conf/nips/Xie0DDLLLL0Y23.
@article{DBLP:journals/corr/abs-2305-10429,
  author     = {Sang Michael Xie and Hieu Pham and Xuanyi Dong and Nan Du and Hanxiao Liu and Yifeng Lu and Percy Liang and Quoc V. Le and Tengyu Ma and Adams Wei Yu},
  title      = {{DoReMi}: Optimizing Data Mixtures Speeds Up Language Model Pretraining},
  journal    = {CoRR},
  volume     = {abs/2305.10429},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.10429},
  doi        = {10.48550/ARXIV.2305.10429},
  eprinttype = {arXiv},
  eprint     = {2305.10429},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-10429.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2306.00008; a conference record with the same title is keyed DBLP:conf/icml/ZhouDHPLHSSDLCL23.
@article{DBLP:journals/corr/abs-2306-00008,
  author     = {Yanqi Zhou and Nan Du and Yanping Huang and Daiyi Peng and Chang Lan and Da Huang and Siamak Shakeri and David R. So and Andrew M. Dai and Yifeng Lu and Zhifeng Chen and Quoc V. Le and Claire Cui and James Laudon and Jeff Dean},
  title      = {Brainformers: Trading Simplicity for Efficiency},
  journal    = {CoRR},
  volume     = {abs/2306.00008},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.00008},
  doi        = {10.48550/ARXIV.2306.00008},
  eprinttype = {arXiv},
  eprint     = {2306.00008},
  timestamp  = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-00008.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2308.03290. Only the acronym FLIQS is braced; the colon sits outside the braces so that
% sentence-casing styles still recognise it and keep the first letter of the subtitle capitalised.
@article{DBLP:journals/corr/abs-2308-03290,
  author     = {Jordan Dotzel and Gang Wu and Andrew Li and Muhammad Umar and Yun Ni and Mohamed S. Abdelfattah and Zhiru Zhang and Liqun Cheng and Martin G. Dixon and Norman P. Jouppi and Quoc V. Le and Sheng Li},
  title      = {{FLIQS}: One-Shot Mixed-Precision Floating-Point and Integer Quantization Search},
  journal    = {CoRR},
  volume     = {abs/2308.03290},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.03290},
  doi        = {10.48550/ARXIV.2308.03290},
  eprinttype = {arXiv},
  eprint     = {2308.03290},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-03290.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2308.03958, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2308-03958,
  author     = {Jerry W. Wei and Da Huang and Yifeng Lu and Denny Zhou and Quoc V. Le},
  title      = {Simple synthetic data reduces sycophancy in large language models},
  journal    = {CoRR},
  volume     = {abs/2308.03958},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.03958},
  doi        = {10.48550/ARXIV.2308.03958},
  eprinttype = {arXiv},
  eprint     = {2308.03958},
  timestamp  = {Tue, 22 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-03958.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2309.03409, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2309-03409,
  author     = {Chengrun Yang and Xuezhi Wang and Yifeng Lu and Hanxiao Liu and Quoc V. Le and Denny Zhou and Xinyun Chen},
  title      = {Large Language Models as Optimizers},
  journal    = {CoRR},
  volume     = {abs/2309.03409},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.03409},
  doi        = {10.48550/ARXIV.2309.03409},
  eprinttype = {arXiv},
  eprint     = {2309.03409},
  timestamp  = {Tue, 12 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-03409.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2310.03214. FreshLLMs is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2310-03214,
  author     = {Tu Vu and Mohit Iyyer and Xuezhi Wang and Noah Constant and Jerry W. Wei and Jason Wei and Chris Tar and Yun{-}Hsuan Sung and Denny Zhou and Quoc V. Le and Thang Luong},
  title      = {{FreshLLMs}: Refreshing Large Language Models with Search Engine Augmentation},
  journal    = {CoRR},
  volume     = {abs/2310.03214},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.03214},
  doi        = {10.48550/ARXIV.2310.03214},
  eprinttype = {arXiv},
  eprint     = {2310.03214},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-03214.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2310.06117, recorded as a CoRR article.
@article{DBLP:journals/corr/abs-2310-06117,
  author     = {Huaixiu Steven Zheng and Swaroop Mishra and Xinyun Chen and Heng{-}Tze Cheng and Ed H. Chi and Quoc V. Le and Denny Zhou},
  title      = {Take a Step Back: Evoking Reasoning via Abstraction in Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2310.06117},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.06117},
  doi        = {10.48550/ARXIV.2310.06117},
  eprinttype = {arXiv},
  eprint     = {2310.06117},
  timestamp  = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-06117.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2312.00763. ChatBots and ExploreLLM are brace-protected so sentence-casing styles keep their capitals.
@article{DBLP:journals/corr/abs-2312-00763,
  author     = {Xiao Ma and Swaroop Mishra and Ariel Liu and Sophie Su and Jilin Chen and Chinmay Kulkarni and Heng{-}Tze Cheng and Quoc V. Le and Ed H. Chi},
  title      = {Beyond {ChatBots}: {ExploreLLM} for Structured Thoughts and Personalized Model Responses},
  journal    = {CoRR},
  volume     = {abs/2312.00763},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2312.00763},
  doi        = {10.48550/ARXIV.2312.00763},
  eprinttype = {arXiv},
  eprint     = {2312.00763},
  timestamp  = {Mon, 11 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2312-00763.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2312.08472. AutoNumerics-Zero is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2312-08472,
  author     = {Esteban Real and Yao Chen and Mirko Rossini and Connal de Souza and Manav Garg and Akhil Verghese and Moritz Firsching and Quoc V. Le and Ekin Dogus Cubuk and David H. Park},
  title      = {{AutoNumerics-Zero}: Automated Discovery of State-of-the-Art Mathematical Functions},
  journal    = {CoRR},
  volume     = {abs/2312.08472},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2312.08472},
  doi        = {10.48550/ARXIV.2312.08472},
  eprinttype = {arXiv},
  eprint     = {2312.08472},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2312-08472.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article (Computer, volume 55, number 7).
@article{DBLP:journals/computer/PattersonGHLLMR22,
  author     = {David A. Patterson and Joseph Gonzalez and Urs H{\"{o}}lzle and Quoc V. Le and Chen Liang and Lluis{-}Miquel Munguia and Daniel Rothchild and David R. So and Maud Texier and Jeff Dean},
  title      = {The Carbon Footprint of Machine Learning Training Will Plateau, Then Shrink},
  journal    = {Computer},
  volume     = {55},
  number     = {7},
  pages      = {18--28},
  year       = {2022},
  url        = {https://doi.org/10.1109/MC.2022.3148714},
  doi        = {10.1109/MC.2022.3148714},
  timestamp  = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/computer/PattersonGHLLMR22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article. BigSSL is brace-protected against sentence-casing, and the journal name is stored in full
% rather than in abbreviated form.
@article{DBLP:journals/jstsp/ZhangPHQGSJXHWZ22,
  author     = {Yu Zhang and Daniel S. Park and Wei Han and James Qin and Anmol Gulati and Joel Shor and Aren Jansen and Yuanzhong Xu and Yanping Huang and Shibo Wang and Zongwei Zhou and Bo Li and Min Ma and William Chan and Jiahui Yu and Yongqiang Wang and Liangliang Cao and Khe Chai Sim and Bhuvana Ramabhadran and Tara N. Sainath and Fran{\c{c}}oise Beaufays and Zhifeng Chen and Quoc V. Le and Chung{-}Cheng Chiu and Ruoming Pang and Yonghui Wu},
  title      = {{BigSSL}: Exploring the Frontier of Large-Scale Semi-Supervised Learning for Automatic Speech Recognition},
  journal    = {{IEEE} Journal of Selected Topics in Signal Processing},
  volume     = {16},
  number     = {6},
  pages      = {1519--1532},
  year       = {2022},
  url        = {https://doi.org/10.1109/JSTSP.2022.3182537},
  doi        = {10.1109/JSTSP.2022.3182537},
  timestamp  = {Sun, 13 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jstsp/ZhangPHQGSJXHWZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ASPLOS '22 paper.
@inproceedings{DBLP:conf/asplos/ZhangHSPLGM22,
  author     = {Dan Zhang and Safeen Huda and Ebrahim M. Songhori and Kartik Prabhu and Quoc V. Le and Anna Goldie and Azalia Mirhoseini},
  editor     = {Babak Falsafi and Michael Ferdman and Shan Lu and Thomas F. Wenisch},
  title      = {A full-stack search technique for domain optimized deep learning accelerators},
  booktitle  = {{ASPLOS} '22: 27th {ACM} International Conference on Architectural Support for Programming Languages and Operating Systems, Lausanne, Switzerland, 28 February 2022 - 4 March 2022},
  pages      = {27--42},
  publisher  = {{ACM}},
  year       = {2022},
  url        = {https://doi.org/10.1145/3503222.3507767},
  doi        = {10.1145/3503222.3507767},
  timestamp  = {Fri, 23 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/asplos/ZhangHSPLGM22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CVPR 2022 paper. DeepFusion and 3D are brace-protected so sentence-casing styles keep their capitals.
% An arXiv record with the same title is keyed DBLP:journals/corr/abs-2203-08195.
@inproceedings{DBLP:conf/cvpr/LiYMCNPSLZLYT22,
  author     = {Yingwei Li and Adams Wei Yu and Tianjian Meng and Benjamin Caine and Jiquan Ngiam and Daiyi Peng and Junyang Shen and Yifeng Lu and Denny Zhou and Quoc V. Le and Alan L. Yuille and Mingxing Tan},
  title      = {{DeepFusion}: Lidar-Camera Deep Fusion for Multi-Modal {3D} Object Detection},
  booktitle  = {{IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2022, New Orleans, LA, USA, June 18-24, 2022},
  pages      = {17161--17170},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/CVPR52688.2022.01667},
  doi        = {10.1109/CVPR52688.2022.01667},
  timestamp  = {Wed, 05 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/LiYMCNPSLZLYT22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2022 paper; no pages or DOI are recorded, only the OpenReview URL.
@inproceedings{DBLP:conf/iclr/WeiBZGYLDDL22,
  author     = {Jason Wei and Maarten Bosma and Vincent Y. Zhao and Kelvin Guu and Adams Wei Yu and Brian Lester and Nan Du and Andrew M. Dai and Quoc V. Le},
  title      = {Finetuned Language Models are Zero-Shot Learners},
  booktitle  = {The Tenth International Conference on Learning Representations, {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher  = {OpenReview.net},
  year       = {2022},
  url        = {https://openreview.net/forum?id=gEZrGCozdqR},
  timestamp  = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/WeiBZGYLDDL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2022 paper (PMLR volume 162). GLaM is brace-protected so sentence-casing styles keep its mixed capitalisation.
@inproceedings{DBLP:conf/icml/DuHDTLXKZYFZFBZ22,
  author     = {Nan Du and Yanping Huang and Andrew M. Dai and Simon Tong and Dmitry Lepikhin and Yuanzhong Xu and Maxim Krikun and Yanqi Zhou and Adams Wei Yu and Orhan Firat and Barret Zoph and Liam Fedus and Maarten P. Bosma and Zongwei Zhou and Tao Wang and Yu Emma Wang and Kellie Webster and Marie Pellat and Kevin Robinson and Kathleen S. Meier{-}Hellstern and Toju Duke and Lucas Dixon and Kun Zhang and Quoc V. Le and Yonghui Wu and Zhifeng Chen and Claire Cui},
  editor     = {Kamalika Chaudhuri and Stefanie Jegelka and Le Song and Csaba Szepesv{\'{a}}ri and Gang Niu and Sivan Sabato},
  title      = {{GLaM}: Efficient Scaling of Language Models with Mixture-of-Experts},
  booktitle  = {International Conference on Machine Learning, {ICML} 2022, 17-23 July 2022, Baltimore, Maryland, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {162},
  pages      = {5547--5569},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v162/du22c.html},
  timestamp  = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/DuHDTLXKZYFZFBZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2022 paper (PMLR volume 162); an arXiv record with the same title is keyed DBLP:journals/corr/abs-2202-10447.
@inproceedings{DBLP:conf/icml/HuaDLL22,
  author     = {Weizhe Hua and Zihang Dai and Hanxiao Liu and Quoc V. Le},
  editor     = {Kamalika Chaudhuri and Stefanie Jegelka and Le Song and Csaba Szepesv{\'{a}}ri and Gang Niu and Sivan Sabato},
  title      = {Transformer Quality in Linear Time},
  booktitle  = {International Conference on Machine Learning, {ICML} 2022, 17-23 July 2022, Baltimore, Maryland, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {162},
  pages      = {9099--9117},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v162/hua22a.html},
  timestamp  = {Tue, 12 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/HuaDLL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2022 paper. Editor given names are written out in full instead of initials, matching the other editors.
% NOTE(review): expanded editor names should be confirmed against the proceedings front matter.
% An arXiv record for this work is keyed DBLP:journals/corr/abs-2201-11903.
@inproceedings{DBLP:conf/nips/Wei0SBIXCLZ22,
  author     = {Jason Wei and Xuezhi Wang and Dale Schuurmans and Maarten Bosma and Brian Ichter and Fei Xia and Ed H. Chi and Quoc V. Le and Denny Zhou},
  editor     = {Sanmi Koyejo and Shakir Mohamed and Alekh Agarwal and Danielle Belgrave and Kyunghyun Cho and Alice Oh},
  title      = {Chain-of-Thought Prompting Elicits Reasoning in Large Language Models},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/9d5609613524ecf4f15af0f7b31abca4-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/Wei0SBIXCLZ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2022 paper. TabNAS is brace-protected against sentence-casing, and editor given names are written
% out in full instead of initials.
% NOTE(review): expanded editor names should be confirmed against the proceedings front matter.
@inproceedings{DBLP:conf/nips/YangBLKULLH22,
  author     = {Chengrun Yang and Gabriel Bender and Hanxiao Liu and Pieter{-}Jan Kindermans and Madeleine Udell and Yifeng Lu and Quoc V. Le and Da Huang},
  editor     = {Sanmi Koyejo and Shakir Mohamed and Alekh Agarwal and Danielle Belgrave and Kyunghyun Cho and Alice Oh},
  title      = {{TabNAS}: Rejection Sampling for Neural Architecture Search on Tabular Datasets},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/4e392aa9bc70ed731d3c9c32810f92fb-Abstract-Conference.html},
  timestamp  = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/YangBLKULLH22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2022 paper. Editor given names are written out in full instead of initials, matching the other editors.
% NOTE(review): expanded editor names should be confirmed against the proceedings front matter.
% An arXiv record with the same title is keyed DBLP:journals/corr/abs-2202-09368.
@inproceedings{DBLP:conf/nips/ZhouLLDHZDCLL22,
  author     = {Yanqi Zhou and Tao Lei and Hanxiao Liu and Nan Du and Yanping Huang and Vincent Y. Zhao and Andrew M. Dai and Zhifeng Chen and Quoc V. Le and James Laudon},
  editor     = {Sanmi Koyejo and Shakir Mohamed and Alekh Agarwal and Danielle Belgrave and Kyunghyun Cho and Alice Oh},
  title      = {Mixture-of-Experts with Expert Choice Routing},
  booktitle  = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year       = {2022},
  url        = {http://papers.nips.cc/paper\_files/paper/2022/hash/2f00ecd787b432c1d36f3de9800728eb-Abstract-Conference.html},
  timestamp  = {Tue, 27 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/ZhouLLDHZDCLL22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% SLT 2022 paper. G-Augment is brace-protected against sentence-casing, and the second author is spelled
% Ekin Dogus Cubuk to match the form used in DBLP:journals/corr/abs-2312-08472.
% NOTE(review): the booktitle gives January 2023 as the event date while year is 2022; left as exported.
@inproceedings{DBLP:conf/slt/WangCRCWRMLP22,
  author     = {Gary Wang and Ekin Dogus Cubuk and Andrew Rosenberg and Shuyang Cheng and Ron J. Weiss and Bhuvana Ramabhadran and Pedro J. Moreno and Quoc V. Le and Daniel S. Park},
  title      = {{G-Augment}: Searching for the Meta-Structure of Data Augmentation Policies for {ASR}},
  booktitle  = {{IEEE} Spoken Language Technology Workshop, {SLT} 2022, Doha, Qatar, January 9-12, 2023},
  pages      = {23--30},
  publisher  = {{IEEE}},
  year       = {2022},
  url        = {https://doi.org/10.1109/SLT54892.2023.10022748},
  doi        = {10.1109/SLT54892.2023.10022748},
  timestamp  = {Mon, 06 Feb 2023 22:19:30 +0100},
  biburl     = {https://dblp.org/rec/conf/slt/WangCRCWRMLP22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2201.08239. LaMDA is brace-protected against sentence-casing.
% Compound surnames are entered in comma form with the surname braced, so BibTeX does not treat the
% lowercase y as a von particle or a surname word as a given name.
% NOTE(review): the De Freitas and Delos Santos surname splits should be confirmed against the paper.
% The last author is spelled Quoc V. Le, the form used by the other records in this file.
@article{DBLP:journals/corr/abs-2201-08239,
  author     = {Romal Thoppilan and {De Freitas}, Daniel and Jamie Hall and Noam Shazeer and Apoorv Kulshreshtha and Heng{-}Tze Cheng and Alicia Jin and Taylor Bos and Leslie Baker and Yu Du and YaGuang Li and Hongrae Lee and Huaixiu Steven Zheng and Amin Ghafouri and Marcelo Menegali and Yanping Huang and Maxim Krikun and Dmitry Lepikhin and James Qin and Dehao Chen and Yuanzhong Xu and Zhifeng Chen and Adam Roberts and Maarten Bosma and Yanqi Zhou and Chung{-}Ching Chang and Igor Krivokon and Will Rusch and Marc Pickett and Kathleen S. Meier{-}Hellstern and Meredith Ringel Morris and Tulsee Doshi and {Delos Santos}, Renelito and Toju Duke and Johnny Soraker and Ben Zevenbergen and Vinodkumar Prabhakaran and Mark Diaz and Ben Hutchinson and Kristen Olson and Alejandra Molina and Erin Hoffman{-}John and Josh Lee and Lora Aroyo and Ravi Rajakumar and Alena Butryna and Matthew Lamm and Viktoriya Kuzmina and Joe Fenton and Aaron Cohen and Rachel Bernstein and Ray Kurzweil and {Ag{\"{u}}era y Arcas}, Blaise and Claire Cui and Marian Croak and Ed H. Chi and Quoc V. Le},
  title      = {{LaMDA}: Language Models for Dialog Applications},
  journal    = {CoRR},
  volume     = {abs/2201.08239},
  year       = {2022},
  url        = {https://arxiv.org/abs/2201.08239},
  eprinttype = {arXiv},
  eprint     = {2201.08239},
  timestamp  = {Fri, 16 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2201-08239.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2201.11903 (DBLP CoRR record).
% Author normalised from "Quoc Le" to "Quoc V. Le", the spelling used by the
% other records in this file, so styles do not list one person under two names.
@article{DBLP:journals/corr/abs-2201-11903,
  author     = {Jason Wei and Xuezhi Wang and Dale Schuurmans and Maarten Bosma and Ed H. Chi and Quoc V. Le and Denny Zhou},
  title      = {Chain of Thought Prompting Elicits Reasoning in Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2201.11903},
  year       = {2022},
  url        = {https://arxiv.org/abs/2201.11903},
  eprinttype = {arXiv},
  eprint     = {2201.11903},
  timestamp  = {Fri, 22 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2201-11903.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.09368 (DBLP CoRR record).
% Author normalised from "Quoc Le" to "Quoc V. Le", the spelling used by the
% other records in this file, so styles do not list one person under two names.
@article{DBLP:journals/corr/abs-2202-09368,
  author     = {Yanqi Zhou and Tao Lei and Hanxiao Liu and Nan Du and Yanping Huang and Vincent Y. Zhao and Andrew M. Dai and Zhifeng Chen and Quoc V. Le and James Laudon},
  title      = {Mixture-of-Experts with Expert Choice Routing},
  journal    = {CoRR},
  volume     = {abs/2202.09368},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.09368},
  eprinttype = {arXiv},
  eprint     = {2202.09368},
  timestamp  = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-09368.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.10447 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2202-10447,
  author     = {Weizhe Hua and Zihang Dai and Hanxiao Liu and Quoc V. Le},
  title      = {Transformer Quality in Linear Time},
  journal    = {CoRR},
  volume     = {abs/2202.10447},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.10447},
  eprinttype = {arXiv},
  eprint     = {2202.10447},
  timestamp  = {Wed, 02 Mar 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-10447.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.08195 (DBLP CoRR record).
% "DeepFusion" and "3D" are braced so that sentence-casing styles keep
% their capitalisation.
@article{DBLP:journals/corr/abs-2203-08195,
  author     = {Yingwei Li and Adams Wei Yu and Tianjian Meng and Benjamin Caine and Jiquan Ngiam and Daiyi Peng and Junyang Shen and Bo Wu and Yifeng Lu and Denny Zhou and Quoc V. Le and Alan L. Yuille and Mingxing Tan},
  title      = {{DeepFusion}: Lidar-Camera Deep Fusion for Multi-Modal {3D} Object Detection},
  journal    = {CoRR},
  volume     = {abs/2203.08195},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.08195},
  doi        = {10.48550/ARXIV.2203.08195},
  eprinttype = {arXiv},
  eprint     = {2203.08195},
  timestamp  = {Mon, 28 Mar 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-08195.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.11171 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2203-11171,
  author     = {Xuezhi Wang and Jason Wei and Dale Schuurmans and Quoc V. Le and Ed H. Chi and Denny Zhou},
  title      = {Self-Consistency Improves Chain of Thought Reasoning in Language Models},
  journal    = {CoRR},
  volume     = {abs/2203.11171},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.11171},
  doi        = {10.48550/ARXIV.2203.11171},
  eprinttype = {arXiv},
  eprint     = {2203.11171},
  timestamp  = {Fri, 22 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-11171.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2203.12683 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2203-12683,
  author     = {Tianjian Meng and Golnaz Ghiasi and Reza Mahjourian and Quoc V. Le and Mingxing Tan},
  title      = {Revisiting Multi-Scale Feature Fusion for Semantic Segmentation},
  journal    = {CoRR},
  volume     = {abs/2203.12683},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2203.12683},
  doi        = {10.48550/ARXIV.2203.12683},
  eprinttype = {arXiv},
  eprint     = {2203.12683},
  timestamp  = {Tue, 29 Mar 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2203-12683.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.05149 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2204-05149,
  author     = {David A. Patterson and Joseph Gonzalez and Urs H{\"{o}}lzle and Quoc V. Le and Chen Liang and Lluis{-}Miquel Munguia and Daniel Rothchild and David R. So and Maud Texier and Jeff Dean},
  title      = {The Carbon Footprint of Machine Learning Training Will Plateau, Then Shrink},
  journal    = {CoRR},
  volume     = {abs/2204.05149},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.05149},
  doi        = {10.48550/ARXIV.2204.05149},
  eprinttype = {arXiv},
  eprint     = {2204.05149},
  timestamp  = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-05149.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.07615 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2204-07615,
  author     = {Chengrun Yang and Gabriel Bender and Hanxiao Liu and Pieter{-}Jan Kindermans and Madeleine Udell and Yifeng Lu and Quoc V. Le and Da Huang},
  title      = {Resource-Constrained Neural Architecture Search on Tabular Datasets},
  journal    = {CoRR},
  volume     = {abs/2204.07615},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.07615},
  doi        = {10.48550/ARXIV.2204.07615},
  eprinttype = {arXiv},
  eprint     = {2204.07615},
  timestamp  = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-07615.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.10625 (DBLP CoRR record).
% Author normalised from "Quoc Le" to "Quoc V. Le", the spelling used by the
% other records in this file, so styles do not list one person under two names.
@article{DBLP:journals/corr/abs-2205-10625,
  author     = {Denny Zhou and Nathanael Sch{\"{a}}rli and Le Hou and Jason Wei and Nathan Scales and Xuezhi Wang and Dale Schuurmans and Olivier Bousquet and Quoc V. Le and Ed H. Chi},
  title      = {Least-to-Most Prompting Enables Complex Reasoning in Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2205.10625},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.10625},
  doi        = {10.48550/ARXIV.2205.10625},
  eprinttype = {arXiv},
  eprint     = {2205.10625},
  timestamp  = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-10625.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2207.00747 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2207-00747,
  author     = {Xuezhi Wang and Jason Wei and Dale Schuurmans and Quoc V. Le and Ed H. Chi and Denny Zhou},
  title      = {Rationale-Augmented Ensembles in Language Models},
  journal    = {CoRR},
  volume     = {abs/2207.00747},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2207.00747},
  doi        = {10.48550/ARXIV.2207.00747},
  eprinttype = {arXiv},
  eprint     = {2207.00747},
  timestamp  = {Wed, 06 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2207-00747.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.09261 (DBLP CoRR record).
% The benchmark name "BIG-Bench" is braced so that sentence-casing styles
% keep its capitalisation.
@article{DBLP:journals/corr/abs-2210-09261,
  author     = {Mirac Suzgun and Nathan Scales and Nathanael Sch{\"{a}}rli and Sebastian Gehrmann and Yi Tay and Hyung Won Chung and Aakanksha Chowdhery and Quoc V. Le and Ed H. Chi and Denny Zhou and Jason Wei},
  title      = {Challenging {BIG-Bench} Tasks and Whether Chain-of-Thought Can Solve Them},
  journal    = {CoRR},
  volume     = {abs/2210.09261},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.09261},
  doi        = {10.48550/ARXIV.2210.09261},
  eprinttype = {arXiv},
  eprint     = {2210.09261},
  timestamp  = {Wed, 19 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-09261.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.10879 (DBLP CoRR record).
% The method name in the title is braced so that sentence-casing styles do
% not turn it into "G-augment".
@article{DBLP:journals/corr/abs-2210-10879,
  author     = {Gary Wang and Ekin D. Cubuk and Andrew Rosenberg and Shuyang Cheng and Ron J. Weiss and Bhuvana Ramabhadran and Pedro J. Moreno and Quoc V. Le and Daniel S. Park},
  title      = {{G-Augment}: Searching for the Meta-Structure of Data Augmentation Policies for {ASR}},
  journal    = {CoRR},
  volume     = {abs/2210.10879},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.10879},
  doi        = {10.48550/ARXIV.2210.10879},
  eprinttype = {arXiv},
  eprint     = {2210.10879},
  timestamp  = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-10879.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.11399 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2210-11399,
  author     = {Yi Tay and Jason Wei and Hyung Won Chung and Vinh Q. Tran and David R. So and Siamak Shakeri and Xavier Garcia and Huaixiu Steven Zheng and Jinfeng Rao and Aakanksha Chowdhery and Denny Zhou and Donald Metzler and Slav Petrov and Neil Houlsby and Quoc V. Le and Mostafa Dehghani},
  title      = {Transcending Scaling Laws with 0.1{\%} Extra Compute},
  journal    = {CoRR},
  volume     = {abs/2210.11399},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.11399},
  doi        = {10.48550/ARXIV.2210.11399},
  eprinttype = {arXiv},
  eprint     = {2210.11399},
  timestamp  = {Tue, 25 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-11399.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.11416 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2210-11416,
  author     = {Hyung Won Chung and Le Hou and Shayne Longpre and Barret Zoph and Yi Tay and William Fedus and Eric Li and Xuezhi Wang and Mostafa Dehghani and Siddhartha Brahma and Albert Webson and Shixiang Shane Gu and Zhuyun Dai and Mirac Suzgun and Xinyun Chen and Aakanksha Chowdhery and Sharan Narang and Gaurav Mishra and Adams Yu and Vincent Y. Zhao and Yanping Huang and Andrew M. Dai and Hongkun Yu and Slav Petrov and Ed H. Chi and Jeff Dean and Jacob Devlin and Adam Roberts and Denny Zhou and Quoc V. Le and Jason Wei},
  title      = {Scaling Instruction-Finetuned Language Models},
  journal    = {CoRR},
  volume     = {abs/2210.11416},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.11416},
  doi        = {10.48550/ARXIV.2210.11416},
  eprinttype = {arXiv},
  eprint     = {2210.11416},
  timestamp  = {Mon, 04 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-11416.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.02011 (DBLP CoRR record).
% "U-shaped" is braced so that sentence-casing styles do not print "u-shaped".
@article{DBLP:journals/corr/abs-2211-02011,
  author     = {Jason Wei and Yi Tay and Quoc V. Le},
  title      = {Inverse scaling can become {U-shaped}},
  journal    = {CoRR},
  volume     = {abs/2211.02011},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.02011},
  doi        = {10.48550/ARXIV.2211.02011},
  eprinttype = {arXiv},
  eprint     = {2211.02011},
  timestamp  = {Fri, 04 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-02011.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 594, issue 7862.
% The journal name is written out in full instead of the abbreviation "Nat.";
% abbreviating is a presentation choice that belongs to the style.
@article{DBLP:journals/nature/MirhoseiniGYJSW21,
  author     = {Azalia Mirhoseini and Anna Goldie and Mustafa Yazgan and Joe Wenjie Jiang and Ebrahim M. Songhori and Shen Wang and Young{-}Joon Lee and Eric Johnson and Omkar Pathak and Azade Nazi and Jiwoo Pak and Andy Tong and Kavya Srinivasa and William Hang and Emre Tuncer and Quoc V. Le and James Laudon and Richard Ho and Roger Carpenter and Jeff Dean},
  title      = {A graph placement methodology for fast chip design},
  journal    = {Nature},
  volume     = {594},
  number     = {7862},
  pages      = {207--212},
  year       = {2021},
  url        = {https://doi.org/10.1038/s41586-021-03544-w},
  doi        = {10.1038/S41586-021-03544-W},
  timestamp  = {Mon, 05 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/nature/MirhoseiniGYJSW21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2021 paper.
% The method name "AutoDropout" is braced so that sentence-casing styles
% keep its internal capital.
@inproceedings{DBLP:conf/aaai/PhamL21,
  author     = {Hieu Pham and Quoc V. Le},
  title      = {{AutoDropout}: Learning Dropout Patterns to Regularize Deep Networks},
  booktitle  = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021, Thirty-Third Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9, 2021},
  pages      = {9351--9359},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://doi.org/10.1609/aaai.v35i11.17127},
  doi        = {10.1609/AAAI.V35I11.17127},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/aaai/PhamL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2021 paper. The url keeps its backslash-escaped underscores exactly
% as exported.
@inproceedings{DBLP:conf/cvpr/GhiasiCSQLCLZ21,
  author     = {Golnaz Ghiasi and Yin Cui and Aravind Srinivas and Rui Qian and Tsung{-}Yi Lin and Ekin D. Cubuk and Quoc V. Le and Barret Zoph},
  title      = {Simple Copy-Paste Is a Strong Data Augmentation Method for Instance Segmentation},
  booktitle  = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2021, virtual, June 19-25, 2021},
  pages      = {2918--2928},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2021},
  url        = {https://openaccess.thecvf.com/content/CVPR2021/html/Ghiasi\_Simple\_Copy-Paste\_Is\_a\_Strong\_Data\_Augmentation\_Method\_for\_Instance\_CVPR\_2021\_paper.html},
  doi        = {10.1109/CVPR46437.2021.00294},
  timestamp  = {Mon, 18 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/GhiasiCSQLCLZ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2021 paper. The url keeps its backslash-escaped underscores exactly
% as exported.
@inproceedings{DBLP:conf/cvpr/0007TPLCLJ21,
  author     = {Sheng Li and Mingxing Tan and Ruoming Pang and Andrew Li and Liqun Cheng and Quoc V. Le and Norman P. Jouppi},
  title      = {Searching for Fast Model Families on Datacenter Accelerators},
  booktitle  = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2021, virtual, June 19-25, 2021},
  pages      = {8085--8095},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2021},
  url        = {https://openaccess.thecvf.com/content/CVPR2021/html/Li\_Searching\_for\_Fast\_Model\_Families\_on\_Datacenter\_Accelerators\_CVPR\_2021\_paper.html},
  doi        = {10.1109/CVPR46437.2021.00799},
  timestamp  = {Mon, 18 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/0007TPLCLJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2021 paper. The url keeps its backslash-escaped underscores exactly
% as exported.
@inproceedings{DBLP:conf/cvpr/PhamDXL21,
  author     = {Hieu Pham and Zihang Dai and Qizhe Xie and Quoc V. Le},
  title      = {Meta Pseudo Labels},
  booktitle  = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2021, virtual, June 19-25, 2021},
  pages      = {11557--11568},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2021},
  url        = {https://openaccess.thecvf.com/content/CVPR2021/html/Pham\_Meta\_Pseudo\_Labels\_CVPR\_2021\_paper.html},
  doi        = {10.1109/CVPR46437.2021.01139},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/cvpr/PhamDXL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2021 paper.
% The method name "STraTA" is braced so that sentence-casing styles keep
% its mixed capitalisation.
@inproceedings{DBLP:conf/emnlp/VuLLSI21,
  author     = {Tu Vu and Minh{-}Thang Luong and Quoc V. Le and Grady Simon and Mohit Iyyer},
  editor     = {Marie{-}Francine Moens and Xuanjing Huang and Lucia Specia and Scott Wen{-}tau Yih},
  title      = {{STraTA}: Self-Training with Task Augmentation for Better Few-shot Learning},
  booktitle  = {Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2021, Virtual Event / Punta Cana, Dominican Republic, 7-11 November, 2021},
  pages      = {5715--5731},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.emnlp-main.462},
  doi        = {10.18653/V1/2021.EMNLP-MAIN.462},
  timestamp  = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/VuLLSI21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2021 paper.
@inproceedings{DBLP:conf/iccv/GhiasiZCLL21,
  author     = {Golnaz Ghiasi and Barret Zoph and Ekin D. Cubuk and Quoc V. Le and Tsung{-}Yi Lin},
  title      = {Multi-Task Self-Training for Learning General Representations},
  booktitle  = {2021 {IEEE/CVF} International Conference on Computer Vision, {ICCV} 2021, Montreal, QC, Canada, October 10-17, 2021},
  pages      = {8836--8845},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICCV48922.2021.00873},
  doi        = {10.1109/ICCV48922.2021.00873},
  timestamp  = {Fri, 11 Mar 2022 10:01:27 +0100},
  biburl     = {https://dblp.org/rec/conf/iccv/GhiasiZCLL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper; the record has no pages or doi, only the OpenReview url.
@inproceedings{DBLP:conf/iclr/Co-ReyesMPRLLLF21,
  author     = {John D. Co{-}Reyes and Yingjie Miao and Daiyi Peng and Esteban Real and Quoc V. Le and Sergey Levine and Honglak Lee and Aleksandra Faust},
  title      = {Evolving Reinforcement Learning Algorithms},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=0XXpJ4OtjW},
  timestamp  = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/Co-ReyesMPRLLLF21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper (Proceedings of Machine Learning Research, volume 139).
@inproceedings{DBLP:conf/icml/JiaYXCPPLSLD21,
  author     = {Chao Jia and Yinfei Yang and Ye Xia and Yi{-}Ting Chen and Zarana Parekh and Hieu Pham and Quoc V. Le and Yun{-}Hsuan Sung and Zhen Li and Tom Duerig},
  editor     = {Marina Meila and Tong Zhang},
  title      = {Scaling Up Visual and Vision-Language Representation Learning With Noisy Text Supervision},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {4904--4916},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/jia21b.html},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/JiaYXCPPLSLD21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper (Proceedings of Machine Learning Research, volume 139).
% The model name "EfficientNetV2" is braced so that sentence-casing styles
% keep its internal capitals.
@inproceedings{DBLP:conf/icml/TanL21,
  author     = {Mingxing Tan and Quoc V. Le},
  editor     = {Marina Meila and Tong Zhang},
  title      = {{EfficientNetV2}: Smaller Models and Faster Training},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {10096--10106},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/tan21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/TanL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper (Proceedings of Machine Learning Research, volume 139).
@inproceedings{DBLP:conf/icml/VermaLKPL21,
  author     = {Vikas Verma and Thang Luong and Kenji Kawaguchi and Hieu Pham and Quoc V. Le},
  editor     = {Marina Meila and Tong Zhang},
  title      = {Towards Domain-Agnostic Contrastive Learning},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {10530--10541},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/verma21a.html},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/VermaLKPL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IPDPS Workshops 2021 paper.
% "EfficientNets" and "ImageNet" are braced so that sentence-casing styles
% keep their internal capitals.
@inproceedings{DBLP:conf/ipps/WongpanichPDTLY21,
  author     = {Arissa Wongpanich and Hieu Pham and James Demmel and Mingxing Tan and Quoc V. Le and Yang You and Sameer Kumar},
  title      = {Training {EfficientNets} at Supercomputer Scale: 83{\%} {ImageNet} Top-1 Accuracy in One Hour},
  booktitle  = {{IEEE} International Parallel and Distributed Processing Symposium Workshops, {IPDPS} Workshops 2021, Portland, OR, USA, June 17-21, 2021},
  pages      = {947--950},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/IPDPSW52791.2021.00146},
  doi        = {10.1109/IPDPSW52791.2021.00146},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ipps/WongpanichPDTLY21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper.
% The model name "CoAtNet" is braced so that sentence-casing styles keep
% its mixed capitalisation.
@inproceedings{DBLP:conf/nips/DaiLLT21,
  author     = {Zihang Dai and Hanxiao Liu and Quoc V. Le and Mingxing Tan},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {{CoAtNet}: Marrying Convolution and Attention for All Data Sizes},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {3965--3977},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/20568692db622456cc42a2e853ca21f8-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/DaiLLT21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper.
@inproceedings{DBLP:conf/nips/SoMLDSL21,
  author     = {David R. So and Wojciech Manke and Hanxiao Liu and Zihang Dai and Noam Shazeer and Quoc V. Le},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Searching for Efficient Transformers for Language Modeling},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {6010--6022},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/2f3c6a4cd8af177f6456e7e51a916ff3-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/SoMLDSL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper.
% The acronym "MLPs" is braced so that sentence-casing styles do not print
% "mlps".
@inproceedings{DBLP:conf/nips/LiuDSL21,
  author     = {Hanxiao Liu and Zihang Dai and David R. So and Quoc V. Le},
  editor     = {Marc'Aurelio Ranzato and Alina Beygelzimer and Yann N. Dauphin and Percy Liang and Jennifer Wortman Vaughan},
  title      = {Pay Attention to {MLPs}},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {9204--9215},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/4cc05b35c2f937c5bd9e7d41d3686fff-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/LiuDSL21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2101.01761 (DBLP CoRR record).
% The method name "AutoDropout" is braced so that sentence-casing styles
% keep its internal capital.
@article{DBLP:journals/corr/abs-2101-01761,
  author     = {Hieu Pham and Quoc V. Le},
  title      = {{AutoDropout}: Learning Dropout Patterns to Regularize Deep Networks},
  journal    = {CoRR},
  volume     = {abs/2101.01761},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.01761},
  eprinttype = {arXiv},
  eprint     = {2101.01761},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-01761.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2101.03958 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2101-03958,
  author     = {John D. Co{-}Reyes and Yingjie Miao and Daiyi Peng and Esteban Real and Sergey Levine and Quoc V. Le and Honglak Lee and Aleksandra Faust},
  title      = {Evolving Reinforcement Learning Algorithms},
  journal    = {CoRR},
  volume     = {abs/2101.03958},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.03958},
  eprinttype = {arXiv},
  eprint     = {2101.03958},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-03958.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2101.08809 (DBLP CoRR record).
% The library name "PyGlove" is braced so that sentence-casing styles keep
% its internal capital.
@article{DBLP:journals/corr/abs-2101-08809,
  author     = {Daiyi Peng and Xuanyi Dong and Esteban Real and Mingxing Tan and Yifeng Lu and Hanxiao Liu and Gabriel Bender and Adam Kraft and Chen Liang and Quoc V. Le},
  title      = {{PyGlove}: Symbolic Programming for Automated Machine Learning},
  journal    = {CoRR},
  volume     = {abs/2101.08809},
  year       = {2021},
  url        = {https://arxiv.org/abs/2101.08809},
  eprinttype = {arXiv},
  eprint     = {2101.08809},
  timestamp  = {Sat, 30 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-08809.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.05610 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2102-05610,
  author     = {Sheng Li and Mingxing Tan and Ruoming Pang and Andrew Li and Liqun Cheng and Quoc V. Le and Norman P. Jouppi},
  title      = {Searching for Fast Model Families on Datacenter Accelerators},
  journal    = {CoRR},
  volume     = {abs/2102.05610},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.05610},
  eprinttype = {arXiv},
  eprint     = {2102.05610},
  timestamp  = {Thu, 18 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-05610.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.05918 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2102-05918,
  author     = {Chao Jia and Yinfei Yang and Ye Xia and Yi{-}Ting Chen and Zarana Parekh and Hieu Pham and Quoc V. Le and Yun{-}Hsuan Sung and Zhen Li and Tom Duerig},
  title      = {Scaling Up Visual and Vision-Language Representation Learning With Noisy Text Supervision},
  journal    = {CoRR},
  volume     = {abs/2102.05918},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.05918},
  eprinttype = {arXiv},
  eprint     = {2102.05918},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-05918.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.00298 (DBLP CoRR record).
% The model name "EfficientNetV2" is braced so that sentence-casing styles
% keep its internal capitals.
@article{DBLP:journals/corr/abs-2104-00298,
  author     = {Mingxing Tan and Quoc V. Le},
  title      = {{EfficientNetV2}: Smaller Models and Faster Training},
  journal    = {CoRR},
  volume     = {abs/2104.00298},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.00298},
  eprinttype = {arXiv},
  eprint     = {2104.00298},
  timestamp  = {Mon, 12 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-00298.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.02133 (DBLP CoRR record).
% The system name "SpeechStew" is braced so that sentence-casing styles
% keep its internal capital.
@article{DBLP:journals/corr/abs-2104-02133,
  author     = {William Chan and Daniel S. Park and Chris A. Lee and Yu Zhang and Quoc V. Le and Mohammad Norouzi},
  title      = {{SpeechStew}: Simply Mix All Available Speech Recognition Data to Train One Large Neural Network},
  journal    = {CoRR},
  volume     = {abs/2104.02133},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.02133},
  eprinttype = {arXiv},
  eprint     = {2104.02133},
  timestamp  = {Tue, 16 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-02133.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.10350 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2104-10350,
  author     = {David A. Patterson and Joseph Gonzalez and Quoc V. Le and Chen Liang and Lluis{-}Miquel Munguia and Daniel Rothchild and David R. So and Maud Texier and Jeff Dean},
  title      = {Carbon Emissions and Large Neural Network Training},
  journal    = {CoRR},
  volume     = {abs/2104.10350},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.10350},
  eprinttype = {arXiv},
  eprint     = {2104.10350},
  timestamp  = {Thu, 13 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-10350.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2105.08050 (DBLP CoRR record).
% The acronym "MLPs" is braced so that sentence-casing styles do not print
% "mlps".
@article{DBLP:journals/corr/abs-2105-08050,
  author     = {Hanxiao Liu and Zihang Dai and David R. So and Quoc V. Le},
  title      = {Pay Attention to {MLPs}},
  journal    = {CoRR},
  volume     = {abs/2105.08050},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.08050},
  eprinttype = {arXiv},
  eprint     = {2105.08050},
  timestamp  = {Tue, 18 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-08050.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2105.12842 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2105-12842,
  author     = {Dan Zhang and Safeen Huda and Ebrahim M. Songhori and Quoc V. Le and Anna Goldie and Azalia Mirhoseini},
  title      = {A Full-stack Accelerator Search Technique for Vision Applications},
  journal    = {CoRR},
  volume     = {abs/2105.12842},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.12842},
  eprinttype = {arXiv},
  eprint     = {2105.12842},
  timestamp  = {Fri, 23 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-12842.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.04803 (DBLP CoRR record).
% The model name "CoAtNet" is braced so that sentence-casing styles keep
% its mixed capitalisation.
@article{DBLP:journals/corr/abs-2106-04803,
  author     = {Zihang Dai and Hanxiao Liu and Quoc V. Le and Mingxing Tan},
  title      = {{CoAtNet}: Marrying Convolution and Attention for All Data Sizes},
  journal    = {CoRR},
  volume     = {abs/2106.04803},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.04803},
  eprinttype = {arXiv},
  eprint     = {2106.04803},
  timestamp  = {Tue, 15 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-04803.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2108.07732 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2108-07732,
  author     = {Jacob Austin and Augustus Odena and Maxwell I. Nye and Maarten Bosma and Henryk Michalewski and David Dohan and Ellen Jiang and Carrie J. Cai and Michael Terry and Quoc V. Le and Charles Sutton},
  title      = {Program Synthesis with Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2108.07732},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.07732},
  eprinttype = {arXiv},
  eprint     = {2108.07732},
  timestamp  = {Fri, 29 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-07732.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2108.11353 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2108-11353,
  author     = {Golnaz Ghiasi and Barret Zoph and Ekin D. Cubuk and Quoc V. Le and Tsung{-}Yi Lin},
  title      = {Multi-Task Self-Training for Learning General Representations},
  journal    = {CoRR},
  volume     = {abs/2108.11353},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.11353},
  eprinttype = {arXiv},
  eprint     = {2108.11353},
  timestamp  = {Fri, 27 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-11353.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2109.01652 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2109-01652,
  author     = {Jason Wei and Maarten Bosma and Vincent Y. Zhao and Kelvin Guu and Adams Wei Yu and Brian Lester and Nan Du and Andrew M. Dai and Quoc V. Le},
  title      = {Finetuned Language Models Are Zero-Shot Learners},
  journal    = {CoRR},
  volume     = {abs/2109.01652},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.01652},
  eprinttype = {arXiv},
  eprint     = {2109.01652},
  timestamp  = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-01652.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2109.06270 (DBLP CoRR record).
% The method name "STraTA" is braced so that sentence-casing styles keep
% its mixed capitalisation.
@article{DBLP:journals/corr/abs-2109-06270,
  author     = {Tu Vu and Minh{-}Thang Luong and Quoc V. Le and Grady Simon and Mohit Iyyer},
  title      = {{STraTA}: Self-Training with Task Augmentation for Better Few-shot Learning},
  journal    = {CoRR},
  volume     = {abs/2109.06270},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.06270},
  eprinttype = {arXiv},
  eprint     = {2109.06270},
  timestamp  = {Tue, 21 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-06270.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2109.08668 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2109-08668,
  author     = {David R. So and Wojciech Manke and Hanxiao Liu and Zihang Dai and Noam Shazeer and Quoc V. Le},
  title      = {Primer: Searching for Efficient Transformers for Language Modeling},
  journal    = {CoRR},
  volume     = {abs/2109.08668},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.08668},
  eprinttype = {arXiv},
  eprint     = {2109.08668},
  timestamp  = {Wed, 22 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-08668.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2109.13226 (DBLP CoRR record).
% The name "BigSSL" is braced so that sentence-casing styles do not print
% "Bigssl".
@article{DBLP:journals/corr/abs-2109-13226,
  author     = {Yu Zhang and Daniel S. Park and Wei Han and James Qin and Anmol Gulati and Joel Shor and Aren Jansen and Yuanzhong Xu and Yanping Huang and Shibo Wang and Zongwei Zhou and Bo Li and Min Ma and William Chan and Jiahui Yu and Yongqiang Wang and Liangliang Cao and Khe Chai Sim and Bhuvana Ramabhadran and Tara N. Sainath and Fran{\c{c}}oise Beaufays and Zhifeng Chen and Quoc V. Le and Chung{-}Cheng Chiu and Ruoming Pang and Yonghui Wu},
  title      = {{BigSSL}: Exploring the Frontier of Large-Scale Semi-Supervised Learning for Automatic Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/2109.13226},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.13226},
  eprinttype = {arXiv},
  eprint     = {2109.13226},
  timestamp  = {Wed, 20 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-13226.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2111.10050 (DBLP CoRR record).
@article{DBLP:journals/corr/abs-2111-10050,
  author     = {Hieu Pham and Zihang Dai and Golnaz Ghiasi and Hanxiao Liu and Adams Wei Yu and Minh{-}Thang Luong and Mingxing Tan and Quoc V. Le},
  title      = {Combined Scaling for Zero-shot Transfer Learning},
  journal    = {CoRR},
  volume     = {abs/2111.10050},
  year       = {2021},
  url        = {https://arxiv.org/abs/2111.10050},
  eprinttype = {arXiv},
  eprint     = {2111.10050},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-10050.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2112.06905 (DBLP CoRR record).
% The model name "GLaM" is braced so that sentence-casing styles do not
% print "Glam".
@article{DBLP:journals/corr/abs-2112-06905,
  author     = {Nan Du and Yanping Huang and Andrew M. Dai and Simon Tong and Dmitry Lepikhin and Yuanzhong Xu and Maxim Krikun and Yanqi Zhou and Adams Wei Yu and Orhan Firat and Barret Zoph and Liam Fedus and Maarten Bosma and Zongwei Zhou and Tao Wang and Yu Emma Wang and Kellie Webster and Marie Pellat and Kevin Robinson and Kathy Meier{-}Hellstern and Toju Duke and Lucas Dixon and Kun Zhang and Quoc V. Le and Yonghui Wu and Zhifeng Chen and Claire Cui},
  title      = {{GLaM}: Efficient Scaling of Language Models with Mixture-of-Experts},
  journal    = {CoRR},
  volume     = {abs/2112.06905},
  year       = {2021},
  url        = {https://arxiv.org/abs/2112.06905},
  eprinttype = {arXiv},
  eprint     = {2112.06905},
  timestamp  = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2112-06905.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2020 conference paper.
@inproceedings{DBLP:conf/cvpr/XieTGWYL20,
  author     = {Cihang Xie and
                Mingxing Tan and
                Boqing Gong and
                Jiang Wang and
                Alan L. Yuille and
                Quoc V. Le},
  title      = {Adversarial Examples Improve Image Recognition},
  booktitle  = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages      = {816--825},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2020},
  url        = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Xie\_Adversarial\_Examples\_Improve\_Image\_Recognition\_CVPR\_2020\_paper.html},
  doi        = {10.1109/CVPR42600.2020.00090},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/XieTGWYL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR Workshops 2020 paper. The method name is spelled "RandAugment" and
% braced so that sentence-casing bibliography styles keep its capitals.
@inproceedings{DBLP:conf/cvpr/CubukZSL20,
  author     = {Ekin D. Cubuk and
                Barret Zoph and
                Jonathon Shlens and
                Quoc V. Le},
  title      = {{RandAugment}: Practical automated data augmentation with a reduced search space},
  booktitle  = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} Workshops 2020, Seattle, WA, USA, June 14-19, 2020},
  pages      = {3008--3017},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2020},
  url        = {https://openaccess.thecvf.com/content\_CVPRW\_2020/html/w40/Cubuk\_Randaugment\_Practical\_Automated\_Data\_Augmentation\_With\_a\_Reduced\_Search\_Space\_CVPRW\_2020\_paper.html},
  doi        = {10.1109/CVPRW50498.2020.00359},
  timestamp  = {Tue, 31 Aug 2021 14:00:09 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/CubukZSL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2020 conference paper. "ImageNet" is braced so that sentence-casing
% bibliography styles keep its capitals.
@inproceedings{DBLP:conf/cvpr/XieLHL20,
  author     = {Qizhe Xie and
                Minh{-}Thang Luong and
                Eduard H. Hovy and
                Quoc V. Le},
  title      = {Self-Training With Noisy Student Improves {ImageNet} Classification},
  booktitle  = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages      = {10684--10695},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2020},
  url        = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Xie\_Self-Training\_With\_Noisy\_Student\_Improves\_ImageNet\_Classification\_CVPR\_2020\_paper.html},
  doi        = {10.1109/CVPR42600.2020.01070},
  timestamp  = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/XieLHL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2020 conference paper. The model name in the title is braced so that
% sentence-casing bibliography styles keep its capitals.
@inproceedings{DBLP:conf/cvpr/TanPL20,
  author     = {Mingxing Tan and
                Ruoming Pang and
                Quoc V. Le},
  title      = {{EfficientDet}: Scalable and Efficient Object Detection},
  booktitle  = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages      = {10778--10787},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2020},
  url        = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Tan\_EfficientDet\_Scalable\_and\_Efficient\_Object\_Detection\_CVPR\_2020\_paper.html},
  doi        = {10.1109/CVPR42600.2020.01079},
  timestamp  = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/TanPL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2020 conference paper. The model name in the title is braced so that
% sentence-casing bibliography styles keep its capitals.
@inproceedings{DBLP:conf/cvpr/DuLJGTCLS20,
  author     = {Xianzhi Du and
                Tsung{-}Yi Lin and
                Pengchong Jin and
                Golnaz Ghiasi and
                Mingxing Tan and
                Yin Cui and
                Quoc V. Le and
                Xiaodan Song},
  title      = {{SpineNet}: Learning Scale-Permuted Backbone for Recognition and Localization},
  booktitle  = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages      = {11589--11598},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2020},
  url        = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Du\_SpineNet\_Learning\_Scale-Permuted\_Backbone\_for\_Recognition\_and\_Localization\_CVPR\_2020\_paper.html},
  doi        = {10.1109/CVPR42600.2020.01161},
  timestamp  = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/DuLJGTCLS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2020 conference paper. The model name in the title is braced so that
% sentence-casing bibliography styles keep its capitals.
@inproceedings{DBLP:conf/cvpr/ChenGLLKAL20,
  author     = {Bo Chen and
                Golnaz Ghiasi and
                Hanxiao Liu and
                Tsung{-}Yi Lin and
                Dmitry Kalenichenko and
                Hartwig Adam and
                Quoc V. Le},
  title      = {{MnasFPN}: Learning Latency-Aware Pyramid Architecture for Object Detection on Mobile Devices},
  booktitle  = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages      = {13604--13613},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2020},
  url        = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Chen\_MnasFPN\_Learning\_Latency-Aware\_Pyramid\_Architecture\_for\_Object\_Detection\_on\_Mobile\_CVPR\_2020\_paper.html},
  doi        = {10.1109/CVPR42600.2020.01362},
  timestamp  = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/ChenGLLKAL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2020 conference paper. "TuNAS" is braced so that sentence-casing
% bibliography styles keep its capitals.
@inproceedings{DBLP:conf/cvpr/BenderLCCCKL20,
  author     = {Gabriel Bender and
                Hanxiao Liu and
                Bo Chen and
                Grace Chu and
                Shuyang Cheng and
                Pieter{-}Jan Kindermans and
                Quoc V. Le},
  title      = {Can Weight Sharing Outperform Random Architecture Search? An Investigation With {TuNAS}},
  booktitle  = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition, {CVPR} 2020, Seattle, WA, USA, June 13-19, 2020},
  pages      = {14311--14320},
  publisher  = {Computer Vision Foundation / {IEEE}},
  year       = {2020},
  url        = {https://openaccess.thecvf.com/content\_CVPR\_2020/html/Bender\_Can\_Weight\_Sharing\_Outperform\_Random\_Architecture\_Search\_An\_Investigation\_With\_CVPR\_2020\_paper.html},
  doi        = {10.1109/CVPR42600.2020.01433},
  timestamp  = {Mon, 30 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/cvpr/BenderLCCCKL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 conference paper (LNCS 12366). "3D" is braced so that
% sentence-casing bibliography styles do not turn it into "3d".
@inproceedings{DBLP:conf/eccv/ChengLCZBNSCVLL20,
  author     = {Shuyang Cheng and
                Zhaoqi Leng and
                Ekin Dogus Cubuk and
                Barret Zoph and
                Chunyan Bai and
                Jiquan Ngiam and
                Yang Song and
                Benjamin Caine and
                Vijay Vasudevan and
                Congcong Li and
                Quoc V. Le and
                Jonathon Shlens and
                Dragomir Anguelov},
  editor     = {Andrea Vedaldi and
                Horst Bischof and
                Thomas Brox and
                Jan{-}Michael Frahm},
  title      = {Improving {3D} Object Detection Through Progressive Population Based Augmentation},
  booktitle  = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part {XXI}},
  series     = {Lecture Notes in Computer Science},
  volume     = {12366},
  pages      = {279--294},
  publisher  = {Springer},
  year       = {2020},
  url        = {https://doi.org/10.1007/978-3-030-58589-1\_17},
  doi        = {10.1007/978-3-030-58589-1\_17},
  timestamp  = {Thu, 12 Nov 2020 17:00:57 +0100},
  biburl     = {https://dblp.org/rec/conf/eccv/ChengLCZBNSCVLL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 conference paper (LNCS 12372).
@inproceedings{DBLP:conf/eccv/ZophCGLSL20,
  author     = {Barret Zoph and
                Ekin D. Cubuk and
                Golnaz Ghiasi and
                Tsung{-}Yi Lin and
                Jonathon Shlens and
                Quoc V. Le},
  editor     = {Andrea Vedaldi and
                Horst Bischof and
                Thomas Brox and
                Jan{-}Michael Frahm},
  title      = {Learning Data Augmentation Strategies for Object Detection},
  booktitle  = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part {XXVII}},
  series     = {Lecture Notes in Computer Science},
  volume     = {12372},
  pages      = {566--583},
  publisher  = {Springer},
  year       = {2020},
  url        = {https://doi.org/10.1007/978-3-030-58583-9\_34},
  doi        = {10.1007/978-3-030-58583-9\_34},
  timestamp  = {Mon, 23 Nov 2020 08:37:00 +0100},
  biburl     = {https://dblp.org/rec/conf/eccv/ZophCGLSL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 conference paper (LNCS 12368).
@inproceedings{DBLP:conf/eccv/DuLJCTLS20,
  author     = {Xianzhi Du and
                Tsung{-}Yi Lin and
                Pengchong Jin and
                Yin Cui and
                Mingxing Tan and
                Quoc V. Le and
                Xiaodan Song},
  editor     = {Andrea Vedaldi and
                Horst Bischof and
                Thomas Brox and
                Jan{-}Michael Frahm},
  title      = {Efficient Scale-Permuted Backbone with Learned Resource Distribution},
  booktitle  = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part {XXIII}},
  series     = {Lecture Notes in Computer Science},
  volume     = {12368},
  pages      = {572--586},
  publisher  = {Springer},
  year       = {2020},
  url        = {https://doi.org/10.1007/978-3-030-58592-1\_34},
  doi        = {10.1007/978-3-030-58592-1\_34},
  timestamp  = {Tue, 03 Nov 2020 17:25:00 +0100},
  biburl     = {https://dblp.org/rec/conf/eccv/DuLJCTLS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 conference paper (LNCS 12352). The model name in the title is
% braced so that sentence-casing styles keep its capitals; the last author is
% written "Quoc V. Le", matching the spelling used by most records in this file.
@inproceedings{DBLP:conf/eccv/YuJLBKTHSPL20,
  author     = {Jiahui Yu and
                Pengchong Jin and
                Hanxiao Liu and
                Gabriel Bender and
                Pieter{-}Jan Kindermans and
                Mingxing Tan and
                Thomas S. Huang and
                Xiaodan Song and
                Ruoming Pang and
                Quoc V. Le},
  editor     = {Andrea Vedaldi and
                Horst Bischof and
                Thomas Brox and
                Jan{-}Michael Frahm},
  title      = {{BigNAS}: Scaling up Neural Architecture Search with Big Single-Stage Models},
  booktitle  = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow, UK, August 23-28, 2020, Proceedings, Part {VII}},
  series     = {Lecture Notes in Computer Science},
  volume     = {12352},
  pages      = {702--717},
  publisher  = {Springer},
  year       = {2020},
  url        = {https://doi.org/10.1007/978-3-030-58571-6\_41},
  doi        = {10.1007/978-3-030-58571-6\_41},
  timestamp  = {Thu, 03 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/eccv/YuJLBKTHSPL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2020 conference paper.
@inproceedings{DBLP:conf/emnlp/ClarkLLM20,
  author     = {Kevin Clark and
                Minh{-}Thang Luong and
                Quoc V. Le and
                Christopher D. Manning},
  editor     = {Bonnie Webber and
                Trevor Cohn and
                Yulan He and
                Yang Liu},
  title      = {Pre-Training Transformers as Energy-Based Cloze Models},
  booktitle  = {Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages      = {285--294},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.emnlp-main.20},
  doi        = {10.18653/V1/2020.EMNLP-MAIN.20},
  timestamp  = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ClarkLLM20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 conference paper. The method name is spelled "SpecAugment" and
% braced so that sentence-casing bibliography styles keep its capitals.
@inproceedings{DBLP:conf/icassp/ParkZCCLCLW20,
  author     = {Daniel S. Park and
                Yu Zhang and
                Chung{-}Cheng Chiu and
                Youzheng Chen and
                Bo Li and
                William Chan and
                Quoc V. Le and
                Yonghui Wu},
  title      = {{SpecAugment} on Large Scale Datasets},
  booktitle  = {2020 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages      = {6879--6883},
  publisher  = {{IEEE}},
  year       = {2020},
  url        = {https://doi.org/10.1109/ICASSP40776.2020.9053205},
  doi        = {10.1109/ICASSP40776.2020.9053205},
  timestamp  = {Thu, 26 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/ParkZCCLCLW20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper.
@inproceedings{DBLP:conf/iclr/ChenLYZSL20,
  author     = {Xinyun Chen and
                Chen Liang and
                Adams Wei Yu and
                Denny Zhou and
                Dawn Song and
                Quoc V. Le},
  title      = {Neural Symbolic Reader: Scalable Integration of Distributed and Symbolic Representations for Reading Comprehension},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=ryxjnREFwH},
  timestamp  = {Thu, 07 May 2020 17:11:47 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ChenLYZSL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 conference paper.
@inproceedings{DBLP:conf/iclr/ClarkLLM20,
  author     = {Kevin Clark and
                Minh{-}Thang Luong and
                Quoc V. Le and
                Christopher D. Manning},
  title      = {{ELECTRA:} Pre-training Text Encoders as Discriminators Rather Than Generators},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=r1xMH1BtvB},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ClarkLLM20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 conference paper (PMLR 119). The system name in the title is
% braced so that sentence-casing bibliography styles keep its capitals.
@inproceedings{DBLP:conf/icml/RealLSL20,
  author     = {Esteban Real and
                Chen Liang and
                David R. So and
                Quoc V. Le},
  title      = {{AutoML-Zero}: Evolving Machine Learning Algorithms From Scratch},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {8007--8019},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/real20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/RealLSL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 conference paper (PMLR 119).
@inproceedings{DBLP:conf/icml/ZhouYCMTSLLS20,
  author     = {Denny Zhou and
                Mao Ye and
                Chen Chen and
                Tianjian Meng and
                Mingxing Tan and
                Xiaodan Song and
                Quoc V. Le and
                Qiang Liu and
                Dale Schuurmans},
  title      = {Go Wide, Then Narrow: Efficient Training of Deep Thin Networks},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {11546--11555},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/zhou20f.html},
  timestamp  = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/ZhouYCMTSLLS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2020 conference paper.
@inproceedings{DBLP:conf/interspeech/ParkZJHCLWL20,
  author     = {Daniel S. Park and
                Yu Zhang and
                Ye Jia and
                Wei Han and
                Chung{-}Cheng Chiu and
                Bo Li and
                Yonghui Wu and
                Quoc V. Le},
  editor     = {Helen Meng and
                Bo Xu and
                Thomas Fang Zheng},
  title      = {Improved Noisy Student Training for Automatic Speech Recognition},
  booktitle  = {Interspeech 2020, 21st Annual Conference of the International Speech Communication Association, Virtual Event, Shanghai, China, 25-29 October 2020},
  pages      = {2817--2821},
  publisher  = {{ISCA}},
  year       = {2020},
  url        = {https://doi.org/10.21437/Interspeech.2020-1470},
  doi        = {10.21437/INTERSPEECH.2020-1470},
  timestamp  = {Tue, 09 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/interspeech/ParkZJHCLWL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% KDD 2020 conference paper.
@inproceedings{DBLP:conf/kdd/JoglekarLCXWAKL20,
  author     = {Manas R. Joglekar and
                Cong Li and
                Mei Chen and
                Taibai Xu and
                Xiaoming Wang and
                Jay K. Adams and
                Pranav Khaitan and
                Jiahui Liu and
                Quoc V. Le},
  editor     = {Rajesh Gupta and
                Yan Liu and
                Jiliang Tang and
                B. Aditya Prakash},
  title      = {Neural Input Search for Large Scale Recommendation Models},
  booktitle  = {{KDD} '20: The 26th {ACM} {SIGKDD} Conference on Knowledge Discovery and Data Mining, Virtual Event, CA, USA, August 23-27, 2020},
  pages      = {2387--2397},
  publisher  = {{ACM}},
  year       = {2020},
  url        = {https://doi.org/10.1145/3394486.3403288},
  doi        = {10.1145/3394486.3403288},
  timestamp  = {Tue, 09 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/kdd/JoglekarLCXWAKL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The method name and the venue acronym are
% braced to keep their capitals; the last author is written "Quoc V. Le",
% matching the spelling used by most records in this file.
@inproceedings{DBLP:conf/nips/CubukZS020,
  author     = {Ekin Dogus Cubuk and
                Barret Zoph and
                Jonathon Shlens and
                Quoc V. Le},
  editor     = {Hugo Larochelle and
                Marc'Aurelio Ranzato and
                Raia Hadsell and
                Maria{-}Florina Balcan and
                Hsuan{-}Tien Lin},
  title      = {{RandAugment}: Practical Automated Data Augmentation with a Reduced Search Space},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, {NeurIPS} 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/d85b63ef0ccb114d0a3bb7b7d808028f-Abstract.html},
  timestamp  = {Mon, 02 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/CubukZS020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The model name and the venue acronym are
% braced to keep their capitals; the last author is written "Quoc V. Le",
% matching the spelling used by most records in this file.
@inproceedings{DBLP:conf/nips/DaiLY020,
  author     = {Zihang Dai and
                Guokun Lai and
                Yiming Yang and
                Quoc V. Le},
  editor     = {Hugo Larochelle and
                Marc'Aurelio Ranzato and
                Raia Hadsell and
                Maria{-}Florina Balcan and
                Hsuan{-}Tien Lin},
  title      = {{Funnel-Transformer}: Filtering out Sequential Redundancy for Efficient Language Processing},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, {NeurIPS} 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/2cd2915e69546904e4e5d4a2ac9e1652-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/DaiLY020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The venue acronym is braced to keep its
% capitals; the last author is written "Quoc V. Le", matching the spelling
% used by most records in this file.
@inproceedings{DBLP:conf/nips/LiuBS020,
  author     = {Hanxiao Liu and
                Andy Brock and
                Karen Simonyan and
                Quoc V. Le},
  editor     = {Hugo Larochelle and
                Marc'Aurelio Ranzato and
                Raia Hadsell and
                Maria{-}Florina Balcan and
                Hsuan{-}Tien Lin},
  title      = {Evolving Normalization-Activation Layers},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, {NeurIPS} 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/9d4c03631b8b0c85ae08bf05eda37d0f-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LiuBS020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The library name and the venue acronym are
% braced to keep their capitals; the last author is written "Quoc V. Le",
% matching the spelling used by most records in this file.
@inproceedings{DBLP:conf/nips/PengDRTLBLKL020,
  author     = {Daiyi Peng and
                Xuanyi Dong and
                Esteban Real and
                Mingxing Tan and
                Yifeng Lu and
                Gabriel Bender and
                Hanxiao Liu and
                Adam Kraft and
                Chen Liang and
                Quoc V. Le},
  editor     = {Hugo Larochelle and
                Marc'Aurelio Ranzato and
                Raia Hadsell and
                Maria{-}Florina Balcan and
                Hsuan{-}Tien Lin},
  title      = {{PyGlove}: Symbolic Programming for Automated Machine Learning},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, {NeurIPS} 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/012a91467f210472fab4e11359bbfef6-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/PengDRTLBLKL020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The venue acronym is braced to keep its
% capitals; the last author is written "Quoc V. Le", matching the spelling
% used by most records in this file.
@inproceedings{DBLP:conf/nips/XieDHL020,
  author     = {Qizhe Xie and
                Zihang Dai and
                Eduard H. Hovy and
                Thang Luong and
                Quoc V. Le},
  editor     = {Hugo Larochelle and
                Marc'Aurelio Ranzato and
                Raia Hadsell and
                Maria{-}Florina Balcan and
                Hsuan{-}Tien Lin},
  title      = {Unsupervised Data Augmentation for Consistency Training},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, {NeurIPS} 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/44feb0096faa8326192570788b38c1d1-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/XieDHL020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 conference paper. The venue acronym is braced to keep its
% capitals; the last author is written "Quoc V. Le", matching the spelling
% used by most records in this file.
@inproceedings{DBLP:conf/nips/ZophGLCLC020,
  author     = {Barret Zoph and
                Golnaz Ghiasi and
                Tsung{-}Yi Lin and
                Yin Cui and
                Hanxiao Liu and
                Ekin Dogus Cubuk and
                Quoc V. Le},
  editor     = {Hugo Larochelle and
                Marc'Aurelio Ranzato and
                Raia Hadsell and
                Maria{-}Florina Balcan and
                Hsuan{-}Tien Lin},
  title      = {Rethinking Pre-training and Self-training},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, {NeurIPS} 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/27e9661e033a73a6ad8cefcde965c54d-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/ZophGLCLC020.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2001-09977,
  author     = {Daniel Adiwardana and
                Minh{-}Thang Luong and
                David R. So and
                Jamie Hall and
                Noah Fiedel and
                Romal Thoppilan and
                Zi Yang and
                Apoorv Kulshreshtha and
                Gaurav Nemade and
                Yifeng Lu and
                Quoc V. Le},
  title      = {Towards a Human-like Open-Domain Chatbot},
  journal    = {CoRR},
  volume     = {abs/2001.09977},
  year       = {2020},
  url        = {https://arxiv.org/abs/2001.09977},
  eprinttype = {arXiv},
  eprint     = {2001.09977},
  timestamp  = {Thu, 30 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2001-09977.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020. The system name in the title is braced so that
% sentence-casing bibliography styles keep its capitals.
@article{DBLP:journals/corr/abs-2003-03384,
  author     = {Esteban Real and
                Chen Liang and
                David R. So and
                Quoc V. Le},
  title      = {{AutoML-Zero}: Evolving Machine Learning Algorithms From Scratch},
  journal    = {CoRR},
  volume     = {abs/2003.03384},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.03384},
  eprinttype = {arXiv},
  eprint     = {2003.03384},
  timestamp  = {Tue, 10 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-03384.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2003-10555,
  author     = {Kevin Clark and
                Minh{-}Thang Luong and
                Quoc V. Le and
                Christopher D. Manning},
  title      = {{ELECTRA:} Pre-training Text Encoders as Discriminators Rather Than Generators},
  journal    = {CoRR},
  volume     = {abs/2003.10555},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.10555},
  eprinttype = {arXiv},
  eprint     = {2003.10555},
  timestamp  = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-10555.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2003-10580,
  author     = {Hieu Pham and
                Qizhe Xie and
                Zihang Dai and
                Quoc V. Le},
  title      = {Meta Pseudo Labels},
  journal    = {CoRR},
  volume     = {abs/2003.10580},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.10580},
  eprinttype = {arXiv},
  eprint     = {2003.10580},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-10580.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020. The model name in the title is braced so that
% sentence-casing bibliography styles keep its capitals.
@article{DBLP:journals/corr/abs-2003-11142,
  author     = {Jiahui Yu and
                Pengchong Jin and
                Hanxiao Liu and
                Gabriel Bender and
                Pieter{-}Jan Kindermans and
                Mingxing Tan and
                Thomas S. Huang and
                Xiaodan Song and
                Ruoming Pang and
                Quoc V. Le},
  title      = {{BigNAS}: Scaling Up Neural Architecture Search with Big Single-Stage Models},
  journal    = {CoRR},
  volume     = {abs/2003.11142},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.11142},
  eprinttype = {arXiv},
  eprint     = {2003.11142},
  timestamp  = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-11142.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020. "3D" is braced so that sentence-casing bibliography
% styles do not turn it into "3d".
@article{DBLP:journals/corr/abs-2004-00831,
  author     = {Shuyang Cheng and
                Zhaoqi Leng and
                Ekin Dogus Cubuk and
                Barret Zoph and
                Chunyan Bai and
                Jiquan Ngiam and
                Yang Song and
                Benjamin Caine and
                Vijay Vasudevan and
                Congcong Li and
                Quoc V. Le and
                Jonathon Shlens and
                Dragomir Anguelov},
  title      = {Improving {3D} Object Detection through Progressive Population Based Augmentation},
  journal    = {CoRR},
  volume     = {abs/2004.00831},
  year       = {2020},
  url        = {https://arxiv.org/abs/2004.00831},
  eprinttype = {arXiv},
  eprint     = {2004.00831},
  timestamp  = {Wed, 08 Apr 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2004-00831.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2004-02967,
  author     = {Hanxiao Liu and
                Andrew Brock and
                Karen Simonyan and
                Quoc V. Le},
  title      = {Evolving Normalization-Activation Layers},
  journal    = {CoRR},
  volume     = {abs/2004.02967},
  year       = {2020},
  url        = {https://arxiv.org/abs/2004.02967},
  eprinttype = {arXiv},
  eprint     = {2004.02967},
  timestamp  = {Wed, 08 Apr 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2004-02967.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2004-10746,
  author     = {Azalia Mirhoseini and
                Anna Goldie and
                Mustafa Yazgan and
                Joe W. J. Jiang and
                Ebrahim M. Songhori and
                Shen Wang and
                Young{-}Joon Lee and
                Eric Johnson and
                Omkar Pathak and
                Sungmin Bae and
                Azade Nazi and
                Jiwoo Pak and
                Andy Tong and
                Kavya Srinivasa and
                William Hang and
                Emre Tuncer and
                Anand Babu and
                Quoc V. Le and
                James Laudon and
                Richard Ho and
                Roger Carpenter and
                Jeff Dean},
  title      = {Chip Placement with Deep Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2004.10746},
  year       = {2020},
  url        = {https://arxiv.org/abs/2004.10746},
  eprinttype = {arXiv},
  eprint     = {2004.10746},
  timestamp  = {Fri, 29 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2004-10746.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2005-09629,
  author     = {Daniel S. Park and
                Yu Zhang and
                Ye Jia and
                Wei Han and
                Chung{-}Cheng Chiu and
                Bo Li and
                Yonghui Wu and
                Quoc V. Le},
  title      = {Improved Noisy Student Training for Automatic Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/2005.09629},
  year       = {2020},
  url        = {https://arxiv.org/abs/2005.09629},
  eprinttype = {arXiv},
  eprint     = {2005.09629},
  timestamp  = {Thu, 26 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2005-09629.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020. The model name in the title is braced so that
% sentence-casing bibliography styles keep its capitals.
@article{DBLP:journals/corr/abs-2006-03236,
  author     = {Zihang Dai and
                Guokun Lai and
                Yiming Yang and
                Quoc V. Le},
  title      = {{Funnel-Transformer}: Filtering out Sequential Redundancy for Efficient Language Processing},
  journal    = {CoRR},
  volume     = {abs/2006.03236},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.03236},
  eprinttype = {arXiv},
  eprint     = {2006.03236},
  timestamp  = {Mon, 08 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-03236.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020. The method name in the title is braced so that
% sentence-casing bibliography styles keep its capitals.
@article{DBLP:journals/corr/abs-2006-03656,
  author     = {Xuanyi Dong and
                Mingxing Tan and
                Adams Wei Yu and
                Daiyi Peng and
                Bogdan Gabrys and
                Quoc V. Le},
  title      = {{AutoHAS}: Differentiable Hyper-parameter and Architecture Search},
  journal    = {CoRR},
  volume     = {abs/2006.03656},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.03656},
  eprinttype = {arXiv},
  eprint     = {2006.03656},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-03656.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2006-06882,
  author     = {Barret Zoph and
                Golnaz Ghiasi and
                Tsung{-}Yi Lin and
                Yin Cui and
                Hanxiao Liu and
                Ekin D. Cubuk and
                Quoc V. Le},
  title      = {Rethinking Pre-training and Self-training},
  journal    = {CoRR},
  volume     = {abs/2006.06882},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.06882},
  eprinttype = {arXiv},
  eprint     = {2006.06882},
  timestamp  = {Wed, 17 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-06882.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2006-14536,
  author     = {Cihang Xie and
                Mingxing Tan and
                Boqing Gong and
                Alan L. Yuille and
                Quoc V. Le},
  title      = {Smooth Adversarial Training},
  journal    = {CoRR},
  volume     = {abs/2006.14536},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.14536},
  eprinttype = {arXiv},
  eprint     = {2006.14536},
  timestamp  = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-14536.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2007-00811,
  author     = {Denny Zhou and
                Mao Ye and
                Chen Chen and
                Tianjian Meng and
                Mingxing Tan and
                Xiaodan Song and
                Quoc V. Le and
                Qiang Liu and
                Dale Schuurmans},
  title      = {Go Wide, Then Narrow: Efficient Training of Deep Thin Networks},
  journal    = {CoRR},
  volume     = {abs/2007.00811},
  year       = {2020},
  url        = {https://arxiv.org/abs/2007.00811},
  eprinttype = {arXiv},
  eprint     = {2007.00811},
  timestamp  = {Wed, 15 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2007-00811.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020. "TuNAS" is braced so that sentence-casing styles keep
% its capitals; the last author is written "Quoc V. Le", matching the
% spelling used by most records in this file.
@article{DBLP:journals/corr/abs-2008-06120,
  author     = {Gabriel Bender and
                Hanxiao Liu and
                Bo Chen and
                Grace Chu and
                Shuyang Cheng and
                Pieter{-}Jan Kindermans and
                Quoc V. Le},
  title      = {Can weight sharing outperform random architecture search? An investigation with {TuNAS}},
  journal    = {CoRR},
  volume     = {abs/2008.06120},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.06120},
  eprinttype = {arXiv},
  eprint     = {2008.06120},
  timestamp  = {Mon, 31 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-06120.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2010-10504,
  author     = {Yu Zhang and
                James Qin and
                Daniel S. Park and
                Wei Han and
                Chung{-}Cheng Chiu and
                Ruoming Pang and
                Quoc V. Le and
                Yonghui Wu},
  title      = {Pushing the Limits of Semi-Supervised Learning for Automatic Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/2010.10504},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.10504},
  eprinttype = {arXiv},
  eprint     = {2010.10504},
  timestamp  = {Thu, 26 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-10504.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2010-11426,
  author     = {Xianzhi Du and
                Tsung{-}Yi Lin and
                Pengchong Jin and
                Yin Cui and
                Mingxing Tan and
                Quoc V. Le and
                Xiaodan Song},
  title      = {Efficient Scale-Permuted Backbone with Learned Resource Distribution},
  journal    = {CoRR},
  volume     = {abs/2010.11426},
  year       = {2020},
  url        = {https://arxiv.org/abs/2010.11426},
  eprinttype = {arXiv},
  eprint     = {2010.11426},
  timestamp  = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-11426.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020. "EfficientNets" and "ImageNet" are braced so that
% sentence-casing bibliography styles keep their capitals.
@article{DBLP:journals/corr/abs-2011-00071,
  author     = {Arissa Wongpanich and
                Hieu Pham and
                James Demmel and
                Mingxing Tan and
                Quoc V. Le and
                Yang You and
                Sameer Kumar},
  title      = {Training {EfficientNets} at Supercomputer Scale: 83{\%} {ImageNet} Top-1 Accuracy in One Hour},
  journal    = {CoRR},
  volume     = {abs/2011.00071},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.00071},
  eprinttype = {arXiv},
  eprint     = {2011.00071},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-00071.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2011-04419,
  author     = {Vikas Verma and
                Minh{-}Thang Luong and
                Kenji Kawaguchi and
                Hieu Pham and
                Quoc V. Le},
  title      = {Towards Domain-Agnostic Contrastive Learning},
  journal    = {CoRR},
  volume     = {abs/2011.04419},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.04419},
  eprinttype = {arXiv},
  eprint     = {2011.04419},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-04419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2012-07177,
  author     = {Golnaz Ghiasi and
                Yin Cui and
                Aravind Srinivas and
                Rui Qian and
                Tsung{-}Yi Lin and
                Ekin D. Cubuk and
                Quoc V. Le and
                Barret Zoph},
  title      = {Simple Copy-Paste is a Strong Data Augmentation Method for Instance Segmentation},
  journal    = {CoRR},
  volume     = {abs/2012.07177},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.07177},
  eprinttype = {arXiv},
  eprint     = {2012.07177},
  timestamp  = {Sat, 02 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-07177.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint, 2020.
@article{DBLP:journals/corr/abs-2012-08561,
  author     = {Kevin Clark and
                Minh{-}Thang Luong and
                Quoc V. Le and
                Christopher D. Manning},
  title      = {Pre-Training Transformers as Energy-Based Cloze Models},
  journal    = {CoRR},
  volume     = {abs/2012.08561},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.08561},
  eprinttype = {arXiv},
  eprint     = {2012.08561},
  timestamp  = {Sat, 02 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-08561.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article. The journal is stored under its full name rather than the
% DBLP abbreviation, and the dataset name in the title is brace-protected.
@article{DBLP:journals/tacl/KwiatkowskiPRCP19,
  author    = {Tom Kwiatkowski and Jennimaria Palomaki and Olivia Redfield and Michael Collins and
               Ankur P. Parikh and Chris Alberti and Danielle Epstein and Illia Polosukhin and
               Jacob Devlin and Kenton Lee and Kristina Toutanova and Llion Jones and
               Matthew Kelcey and Ming{-}Wei Chang and Andrew M. Dai and Jakob Uszkoreit and
               Quoc Le and Slav Petrov},
  title     = {{Natural Questions}: a Benchmark for Question Answering Research},
  journal   = {Transactions of the Association for Computational Linguistics},
  volume    = {7},
  pages     = {452--466},
  year      = {2019},
  url       = {https://doi.org/10.1162/tacl\_a\_00276},
  doi       = {10.1162/TACL\_A\_00276},
  timestamp = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/tacl/KwiatkowskiPRCP19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2019 conference paper record from DBLP, laid out one field per line.
@inproceedings{DBLP:conf/aaai/RealAHL19,
  author    = {Esteban Real and Alok Aggarwal and Yanping Huang and Quoc V. Le},
  title     = {Regularized Evolution for Image Classifier Architecture Search},
  booktitle = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI} 2019,
               The Thirty-First Innovative Applications of Artificial Intelligence Conference, {IAAI} 2019,
               The Ninth {AAAI} Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2019,
               Honolulu, Hawaii, USA, January 27 - February 1, 2019},
  pages     = {4780--4789},
  publisher = {{AAAI} Press},
  year      = {2019},
  url       = {https://doi.org/10.1609/aaai.v33i01.33014780},
  doi       = {10.1609/AAAI.V33I01.33014780},
  timestamp = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/RealAHL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2019 conference paper. The model name is brace-protected against
% sentence-casing, and the date range spacing in the booktitle is normalised.
@inproceedings{DBLP:conf/acl/DaiYYCLS19,
  author    = {Zihang Dai and Zhilin Yang and Yiming Yang and Jaime G. Carbonell and Quoc Viet Le and Ruslan Salakhutdinov},
  editor    = {Anna Korhonen and David R. Traum and Llu{\'{\i}}s M{\`{a}}rquez},
  title     = {{Transformer-XL}: Attentive Language Models beyond a Fixed-Length Context},
  booktitle = {Proceedings of the 57th Conference of the Association for Computational Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019, Volume 1: Long Papers},
  pages     = {2978--2988},
  publisher = {Association for Computational Linguistics},
  year      = {2019},
  url       = {https://doi.org/10.18653/v1/p19-1285},
  doi       = {10.18653/V1/P19-1285},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/DaiYYCLS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2019 conference paper. The acronym in the title is brace-protected
% against sentence-casing, and the date range spacing in the booktitle is normalised.
@inproceedings{DBLP:conf/acl/ClarkLKML19,
  author    = {Kevin Clark and Minh{-}Thang Luong and Urvashi Khandelwal and Christopher D. Manning and Quoc V. Le},
  editor    = {Anna Korhonen and David R. Traum and Llu{\'{\i}}s M{\`{a}}rquez},
  title     = {{BAM}! Born-Again Multi-Task Networks for Natural Language Understanding},
  booktitle = {Proceedings of the 57th Conference of the Association for Computational Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019, Volume 1: Long Papers},
  pages     = {5931--5937},
  publisher = {Association for Computational Linguistics},
  year      = {2019},
  url       = {https://doi.org/10.18653/v1/p19-1595},
  doi       = {10.18653/V1/P19-1595},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/ClarkLKML19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% BMVC 2019 conference paper. The camel-case model name is brace-protected
% so sentence-casing styles do not render it as "Mixconv".
@inproceedings{DBLP:conf/bmvc/TanL19,
  author    = {Mingxing Tan and Quoc V. Le},
  title     = {{MixConv}: Mixed Depthwise Convolutional Kernels},
  booktitle = {30th British Machine Vision Conference 2019, {BMVC} 2019, Cardiff, UK, September 9-12, 2019},
  pages     = {74},
  publisher = {{BMVA} Press},
  year      = {2019},
  url       = {https://bmvc2019.org/wp-content/uploads/papers/0583-paper.pdf},
  timestamp = {Wed, 03 Feb 2021 08:35:59 +0100},
  biburl    = {https://dblp.org/rec/conf/bmvc/TanL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2019 conference paper. The camel-case method name is brace-protected
% against sentence-casing styles.
@inproceedings{DBLP:conf/cvpr/CubukZMVL19,
  author    = {Ekin D. Cubuk and Barret Zoph and Dandelion Man{\'{e}} and Vijay Vasudevan and Quoc V. Le},
  title     = {{AutoAugment}: Learning Augmentation Strategies From Data},
  booktitle = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2019, Long Beach, CA, USA, June 16-20, 2019},
  pages     = {113--123},
  publisher = {Computer Vision Foundation / {IEEE}},
  year      = {2019},
  url       = {http://openaccess.thecvf.com/content\_CVPR\_2019/html/Cubuk\_AutoAugment\_Learning\_Augmentation\_Strategies\_From\_Data\_CVPR\_2019\_paper.html},
  doi       = {10.1109/CVPR.2019.00020},
  timestamp = {Mon, 30 Aug 2021 17:01:14 +0200},
  biburl    = {https://dblp.org/rec/conf/cvpr/CubukZMVL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2019 conference paper. The dataset name is brace-protected so
% sentence-casing styles do not render it as "imagenet".
@inproceedings{DBLP:conf/cvpr/KornblithSL19,
  author    = {Simon Kornblith and Jonathon Shlens and Quoc V. Le},
  title     = {Do Better {ImageNet} Models Transfer Better?},
  booktitle = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2019, Long Beach, CA, USA, June 16-20, 2019},
  pages     = {2661--2671},
  publisher = {Computer Vision Foundation / {IEEE}},
  year      = {2019},
  url       = {http://openaccess.thecvf.com/content\_CVPR\_2019/html/Kornblith\_Do\_Better\_ImageNet\_Models\_Transfer\_Better\_CVPR\_2019\_paper.html},
  doi       = {10.1109/CVPR.2019.00277},
  timestamp = {Mon, 20 Jan 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cvpr/KornblithSL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2019 conference paper. The camel-case model name is brace-protected
% against sentence-casing styles.
@inproceedings{DBLP:conf/cvpr/TanCPVSHL19,
  author    = {Mingxing Tan and Bo Chen and Ruoming Pang and Vijay Vasudevan and Mark Sandler and Andrew Howard and Quoc V. Le},
  title     = {{MnasNet}: Platform-Aware Neural Architecture Search for Mobile},
  booktitle = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2019, Long Beach, CA, USA, June 16-20, 2019},
  pages     = {2820--2828},
  publisher = {Computer Vision Foundation / {IEEE}},
  year      = {2019},
  url       = {http://openaccess.thecvf.com/content\_CVPR\_2019/html/Tan\_MnasNet\_Platform-Aware\_Neural\_Architecture\_Search\_for\_Mobile\_CVPR\_2019\_paper.html},
  doi       = {10.1109/CVPR.2019.00293},
  timestamp = {Thu, 27 May 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/cvpr/TanCPVSHL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2019 conference paper record from DBLP, laid out one field per line.
@inproceedings{DBLP:conf/cvpr/GhiasiLL19,
  author    = {Golnaz Ghiasi and Tsung{-}Yi Lin and Quoc V. Le},
  title     = {{NAS-FPN:} Learning Scalable Feature Pyramid Architecture for Object Detection},
  booktitle = {{IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2019, Long Beach, CA, USA, June 16-20, 2019},
  pages     = {7036--7045},
  publisher = {Computer Vision Foundation / {IEEE}},
  year      = {2019},
  url       = {http://openaccess.thecvf.com/content\_CVPR\_2019/html/Ghiasi\_NAS-FPN\_Learning\_Scalable\_Feature\_Pyramid\_Architecture\_for\_Object\_Detection\_CVPR\_2019\_paper.html},
  doi       = {10.1109/CVPR.2019.00720},
  timestamp = {Mon, 20 Jan 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/cvpr/GhiasiLL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2019 conference paper. The camel-case model name is brace-protected
% against sentence-casing styles.
@inproceedings{DBLP:conf/iccv/HowardPALSCWCTC19,
  author    = {Andrew Howard and Ruoming Pang and Hartwig Adam and Quoc V. Le and Mark Sandler and Bo Chen and
               Weijun Wang and Liang{-}Chieh Chen and Mingxing Tan and Grace Chu and Vijay Vasudevan and Yukun Zhu},
  title     = {Searching for {MobileNetV3}},
  booktitle = {2019 {IEEE/CVF} International Conference on Computer Vision, {ICCV} 2019, Seoul, Korea (South), October 27 - November 2, 2019},
  pages     = {1314--1324},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/ICCV.2019.00140},
  doi       = {10.1109/ICCV.2019.00140},
  timestamp = {Thu, 27 May 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iccv/HowardPALSCWCTC19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2019 conference paper record from DBLP, laid out one field per line.
@inproceedings{DBLP:conf/iccv/BelloZLVS19,
  author    = {Irwan Bello and Barret Zoph and Quoc Le and Ashish Vaswani and Jonathon Shlens},
  title     = {Attention Augmented Convolutional Networks},
  booktitle = {2019 {IEEE/CVF} International Conference on Computer Vision, {ICCV} 2019, Seoul, Korea (South), October 27 - November 2, 2019},
  pages     = {3285--3294},
  publisher = {{IEEE}},
  year      = {2019},
  url       = {https://doi.org/10.1109/ICCV.2019.00338},
  doi       = {10.1109/ICCV.2019.00338},
  timestamp = {Thu, 03 Dec 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/iccv/BelloZLVS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2019 conference paper record from DBLP, laid out one field per line.
@inproceedings{DBLP:conf/iclr/RamachandranL19,
  author    = {Prajit Ramachandran and Quoc V. Le},
  title     = {Diversity and Depth in Per-Example Routing Models},
  booktitle = {7th International Conference on Learning Representations, {ICLR} 2019, New Orleans, LA, USA, May 6-9, 2019},
  publisher = {OpenReview.net},
  year      = {2019},
  url       = {https://openreview.net/forum?id=BkxWJnC9tX},
  timestamp = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/RamachandranL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 conference paper record from DBLP, laid out one field per line.
@inproceedings{DBLP:conf/icml/ParkSLS19,
  author    = {Daniel S. Park and Jascha Sohl{-}Dickstein and Quoc V. Le and Samuel L. Smith},
  editor    = {Kamalika Chaudhuri and Ruslan Salakhutdinov},
  title     = {The Effect of Network Width on Stochastic Gradient Descent and Generalization: an Empirical Study},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {97},
  pages     = {5042--5051},
  publisher = {{PMLR}},
  year      = {2019},
  url       = {http://proceedings.mlr.press/v97/park19b.html},
  timestamp = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/ParkSLS19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 conference paper record from DBLP, laid out one field per line.
@inproceedings{DBLP:conf/icml/SoLL19,
  author    = {David R. So and Quoc V. Le and Chen Liang},
  editor    = {Kamalika Chaudhuri and Ruslan Salakhutdinov},
  title     = {The Evolved Transformer},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {97},
  pages     = {5877--5886},
  publisher = {{PMLR}},
  year      = {2019},
  url       = {http://proceedings.mlr.press/v97/so19a.html},
  timestamp = {Thu, 26 Sep 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/SoLL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 conference paper. The camel-case model name is brace-protected
% so sentence-casing styles do not render it as "Efficientnet".
@inproceedings{DBLP:conf/icml/TanL19,
  author    = {Mingxing Tan and Quoc V. Le},
  editor    = {Kamalika Chaudhuri and Ruslan Salakhutdinov},
  title     = {{EfficientNet}: Rethinking Model Scaling for Convolutional Neural Networks},
  booktitle = {Proceedings of the 36th International Conference on Machine Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {97},
  pages     = {6105--6114},
  publisher = {{PMLR}},
  year      = {2019},
  url       = {http://proceedings.mlr.press/v97/tan19a.html},
  timestamp = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/TanL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2019 conference paper. The camel-case method name is
% brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/interspeech/ParkCZCZCL19,
  author    = {Daniel S. Park and William Chan and Yu Zhang and Chung{-}Cheng Chiu and Barret Zoph and Ekin D. Cubuk and Quoc V. Le},
  editor    = {Gernot Kubin and Zdravko Kacic},
  title     = {{SpecAugment}: {A} Simple Data Augmentation Method for Automatic Speech Recognition},
  booktitle = {Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019},
  pages     = {2613--2617},
  publisher = {{ISCA}},
  year      = {2019},
  url       = {https://doi.org/10.21437/Interspeech.2019-2680},
  doi       = {10.21437/INTERSPEECH.2019-2680},
  timestamp = {Fri, 29 Jan 2021 17:41:10 +0100},
  biburl    = {https://dblp.org/rec/conf/interspeech/ParkCZCZCL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper record from DBLP, laid out one field per line.
@inproceedings{DBLP:conf/nips/VillegasPKELL19,
  author    = {Ruben Villegas and Arkanath Pathak and Harini Kannan and Dumitru Erhan and Quoc V. Le and Honglak Lee},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {High Fidelity Video Prediction with Large Stochastic Recurrent Neural Networks},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {81--91},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/f7177163c833dff4b38fc8d2872f1ec6-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/VillegasPKELL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper. The system name is brace-protected so
% sentence-casing styles do not render it as "Gpipe".
@inproceedings{DBLP:conf/nips/HuangCBFCCLNLWC19,
  author    = {Yanping Huang and Youlong Cheng and Ankur Bapna and Orhan Firat and Dehao Chen and Mia Xu Chen and
               HyoukJoong Lee and Jiquan Ngiam and Quoc V. Le and Yonghui Wu and Zhifeng Chen},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {{GPipe}: Efficient Training of Giant Neural Networks using Pipeline Parallelism},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {103--112},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/093f65e080a295f8076b1c5722a46aa2-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/HuangCBFCCLNLWC19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper record from DBLP, laid out one field per line.
@inproceedings{DBLP:conf/nips/ElsayedKL19,
  author    = {Gamaleldin F. Elsayed and Simon Kornblith and Quoc V. Le},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {Saccader: Improving Accuracy of Hard Attention Models for Vision},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {700--712},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/8dd48d6a2e2cad213179a3992c0be53c-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/ElsayedKL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper. The camel-case method name is
% brace-protected so sentence-casing styles do not render it as "Condconv".
@inproceedings{DBLP:conf/nips/YangBLN19,
  author    = {Brandon Yang and Gabriel Bender and Quoc V. Le and Jiquan Ngiam},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {{CondConv}: Conditionally Parameterized Convolutions for Efficient Inference},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {1305--1316},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/f2201f5191c4e92cc5af043eebfd0946-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/YangBLN19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper. The model name is brace-protected so
% sentence-casing styles do not render it as "Xlnet".
@inproceedings{DBLP:conf/nips/YangDYCSL19,
  author    = {Zhilin Yang and Zihang Dai and Yiming Yang and Jaime G. Carbonell and Ruslan Salakhutdinov and Quoc V. Le},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {{XLNet}: Generalized Autoregressive Pretraining for Language Understanding},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {5754--5764},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/dc6a7e655d7e5840e66733e9ee67cc69-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/YangDYCSL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 conference paper record from DBLP, laid out one field per line.
@inproceedings{DBLP:conf/nips/YangLSL19,
  author    = {Zhilin Yang and Thang Luong and Ruslan Salakhutdinov and Quoc V. Le},
  editor    = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title     = {Mixtape: Breaking the Softmax Bottleneck Efficiently},
  booktitle = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages     = {15922--15930},
  year      = {2019},
  url       = {https://proceedings.neurips.cc/paper/2019/hash/512fc3c5227f637e41437c999a2d3169-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/YangLSL19.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The model name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1901-02860,
  author     = {Zihang Dai and Zhilin Yang and Yiming Yang and Jaime G. Carbonell and Quoc V. Le and Ruslan Salakhutdinov},
  title      = {{Transformer-XL}: Attentive Language Models Beyond a Fixed-Length Context},
  journal    = {CoRR},
  volume     = {abs/1901.02860},
  year       = {2019},
  url        = {https://arxiv.org/abs/1901.02860},
  eprinttype = {arXiv},
  eprint     = {1901.02860},
  timestamp  = {Fri, 01 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1901-02860.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1901-11117,
  author     = {David R. So and Chen Liang and Quoc V. Le},
  title      = {The Evolved Transformer},
  journal    = {CoRR},
  volume     = {abs/1901.11117},
  year       = {2019},
  url        = {https://arxiv.org/abs/1901.11117},
  eprinttype = {arXiv},
  eprint     = {1901.11117},
  timestamp  = {Mon, 04 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1901-11117.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1904-04971,
  author     = {Brandon Yang and Gabriel Bender and Quoc V. Le and Jiquan Ngiam},
  title      = {Soft Conditional Computation},
  journal    = {CoRR},
  volume     = {abs/1904.04971},
  year       = {2019},
  url        = {https://arxiv.org/abs/1904.04971},
  eprinttype = {arXiv},
  eprint     = {1904.04971},
  timestamp  = {Thu, 25 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-04971.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1904-07392,
  author     = {Golnaz Ghiasi and Tsung{-}Yi Lin and Ruoming Pang and Quoc V. Le},
  title      = {{NAS-FPN:} Learning Scalable Feature Pyramid Architecture for Object Detection},
  journal    = {CoRR},
  volume     = {abs/1904.07392},
  year       = {2019},
  url        = {https://arxiv.org/abs/1904.07392},
  eprinttype = {arXiv},
  eprint     = {1904.07392},
  timestamp  = {Thu, 25 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-07392.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The method name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1904-08779,
  author     = {Daniel S. Park and William Chan and Yu Zhang and Chung{-}Cheng Chiu and Barret Zoph and Ekin D. Cubuk and Quoc V. Le},
  title      = {{SpecAugment}: {A} Simple Data Augmentation Method for Automatic Speech Recognition},
  journal    = {CoRR},
  volume     = {abs/1904.08779},
  year       = {2019},
  url        = {https://arxiv.org/abs/1904.08779},
  eprinttype = {arXiv},
  eprint     = {1904.08779},
  timestamp  = {Tue, 27 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-08779.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1904-09925,
  author     = {Irwan Bello and Barret Zoph and Ashish Vaswani and Jonathon Shlens and Quoc V. Le},
  title      = {Attention Augmented Convolutional Networks},
  journal    = {CoRR},
  volume     = {abs/1904.09925},
  year       = {2019},
  url        = {https://arxiv.org/abs/1904.09925},
  eprinttype = {arXiv},
  eprint     = {1904.09925},
  timestamp  = {Fri, 26 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-09925.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1904-10076,
  author     = {Keren Gu and Brandon Yang and Jiquan Ngiam and Quoc V. Le and Jonathon Shlens},
  title      = {Using Videos to Evaluate Image Model Robustness},
  journal    = {CoRR},
  volume     = {abs/1904.10076},
  year       = {2019},
  url        = {https://arxiv.org/abs/1904.10076},
  eprinttype = {arXiv},
  eprint     = {1904.10076},
  timestamp  = {Sat, 27 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-10076.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1904-12848,
  author     = {Qizhe Xie and Zihang Dai and Eduard H. Hovy and Minh{-}Thang Luong and Quoc V. Le},
  title      = {Unsupervised Data Augmentation},
  journal    = {CoRR},
  volume     = {abs/1904.12848},
  year       = {2019},
  url        = {https://arxiv.org/abs/1904.12848},
  eprinttype = {arXiv},
  eprint     = {1904.12848},
  timestamp  = {Thu, 02 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-12848.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The model name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1905-02244,
  author     = {Andrew Howard and Mark Sandler and Grace Chu and Liang{-}Chieh Chen and Bo Chen and Mingxing Tan and
                Weijun Wang and Yukun Zhu and Ruoming Pang and Vijay Vasudevan and Quoc V. Le and Hartwig Adam},
  title      = {Searching for {MobileNetV3}},
  journal    = {CoRR},
  volume     = {abs/1905.02244},
  year       = {2019},
  url        = {https://arxiv.org/abs/1905.02244},
  eprinttype = {arXiv},
  eprint     = {1905.02244},
  timestamp  = {Thu, 27 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-02244.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1905-03776,
  author     = {Daniel S. Park and Jascha Sohl{-}Dickstein and Quoc V. Le and Samuel L. Smith},
  title      = {The Effect of Network Width on Stochastic Gradient Descent and Generalization: an Empirical Study},
  journal    = {CoRR},
  volume     = {abs/1905.03776},
  year       = {2019},
  url        = {https://arxiv.org/abs/1905.03776},
  eprinttype = {arXiv},
  eprint     = {1905.03776},
  timestamp  = {Mon, 27 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-03776.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The model name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1905-11946,
  author     = {Mingxing Tan and Quoc V. Le},
  title      = {{EfficientNet}: Rethinking Model Scaling for Convolutional Neural Networks},
  journal    = {CoRR},
  volume     = {abs/1905.11946},
  year       = {2019},
  url        = {https://arxiv.org/abs/1905.11946},
  eprinttype = {arXiv},
  eprint     = {1905.11946},
  timestamp  = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-11946.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1906-02940,
  author     = {Trieu H. Trinh and Minh{-}Thang Luong and Quoc V. Le},
  title      = {Selfie: Self-supervised Pretraining for Image Embedding},
  journal    = {CoRR},
  volume     = {abs/1906.02940},
  year       = {2019},
  url        = {https://arxiv.org/abs/1906.02940},
  eprinttype = {arXiv},
  eprint     = {1906.02940},
  timestamp  = {Fri, 14 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-02940.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The model name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1906-08237,
  author     = {Zhilin Yang and Zihang Dai and Yiming Yang and Jaime G. Carbonell and Ruslan Salakhutdinov and Quoc V. Le},
  title      = {{XLNet}: Generalized Autoregressive Pretraining for Language Understanding},
  journal    = {CoRR},
  volume     = {abs/1906.08237},
  year       = {2019},
  url        = {https://arxiv.org/abs/1906.08237},
  eprinttype = {arXiv},
  eprint     = {1906.08237},
  timestamp  = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-08237.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1906-11172,
  author     = {Barret Zoph and Ekin D. Cubuk and Golnaz Ghiasi and Tsung{-}Yi Lin and Jonathon Shlens and Quoc V. Le},
  title      = {Learning Data Augmentation Strategies for Object Detection},
  journal    = {CoRR},
  volume     = {abs/1906.11172},
  year       = {2019},
  url        = {https://arxiv.org/abs/1906.11172},
  eprinttype = {arXiv},
  eprint     = {1906.11172},
  timestamp  = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-11172.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1907-04471,
  author     = {Manas R. Joglekar and Cong Li and Jay K. Adams and Pranav Khaitan and Quoc V. Le},
  title      = {Neural Input Search for Large Scale Recommendation Models},
  journal    = {CoRR},
  volume     = {abs/1907.04471},
  year       = {2019},
  url        = {https://arxiv.org/abs/1907.04471},
  eprinttype = {arXiv},
  eprint     = {1907.04471},
  timestamp  = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-04471.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The acronym is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1907-04829,
  author     = {Kevin Clark and Minh{-}Thang Luong and Urvashi Khandelwal and Christopher D. Manning and Quoc V. Le},
  title      = {{BAM}! Born-Again Multi-Task Networks for Natural Language Understanding},
  journal    = {CoRR},
  volume     = {abs/1907.04829},
  year       = {2019},
  url        = {https://arxiv.org/abs/1907.04829},
  eprinttype = {arXiv},
  eprint     = {1907.04829},
  timestamp  = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-04829.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The model name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1907-09595,
  author     = {Mingxing Tan and Quoc V. Le},
  title      = {{MixConv}: Mixed Depthwise Convolutional Kernels},
  journal    = {CoRR},
  volume     = {abs/1907.09595},
  year       = {2019},
  url        = {https://arxiv.org/abs/1907.09595},
  eprinttype = {arXiv},
  eprint     = {1907.09595},
  timestamp  = {Fri, 02 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-09595.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1908-07644,
  author     = {Gamaleldin F. Elsayed and Simon Kornblith and Quoc V. Le},
  title      = {Saccader: Improving Accuracy of Hard Attention Models for Vision},
  journal    = {CoRR},
  volume     = {abs/1908.07644},
  year       = {2019},
  url        = {https://arxiv.org/abs/1908.07644},
  eprinttype = {arXiv},
  eprint     = {1908.07644},
  timestamp  = {Mon, 26 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1908-07644.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The method name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1909-13719,
  author     = {Ekin D. Cubuk and Barret Zoph and Jonathon Shlens and Quoc V. Le},
  title      = {{RandAugment}: Practical data augmentation with no separate search},
  journal    = {CoRR},
  volume     = {abs/1909.13719},
  year       = {2019},
  url        = {https://arxiv.org/abs/1909.13719},
  eprinttype = {arXiv},
  eprint     = {1909.13719},
  timestamp  = {Wed, 02 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1909-13719.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1911-01655,
  author     = {Ruben Villegas and Arkanath Pathak and Harini Kannan and Dumitru Erhan and Quoc V. Le and Honglak Lee},
  title      = {High Fidelity Video Prediction with Large Stochastic Recurrent Neural Networks},
  journal    = {CoRR},
  volume     = {abs/1911.01655},
  year       = {2019},
  url        = {https://arxiv.org/abs/1911.01655},
  eprinttype = {arXiv},
  eprint     = {1911.01655},
  timestamp  = {Mon, 11 Nov 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-01655.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The method and dataset names are brace-protected against
% sentence-casing, and the arXiv link uses https like the 2020 preprint records.
@article{DBLP:journals/corr/abs-1911-04252,
  author     = {Qizhe Xie and Eduard H. Hovy and Minh{-}Thang Luong and Quoc V. Le},
  title      = {Self-training with {Noisy Student} improves {ImageNet} classification},
  journal    = {CoRR},
  volume     = {abs/1911.04252},
  year       = {2019},
  url        = {https://arxiv.org/abs/1911.04252},
  eprinttype = {arXiv},
  eprint     = {1911.04252},
  timestamp  = {Sun, 01 Dec 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-04252.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The model name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1911-09070,
  author     = {Mingxing Tan and Ruoming Pang and Quoc V. Le},
  title      = {{EfficientDet}: Scalable and Efficient Object Detection},
  journal    = {CoRR},
  volume     = {abs/1911.09070},
  year       = {2019},
  url        = {https://arxiv.org/abs/1911.09070},
  eprinttype = {arXiv},
  eprint     = {1911.09070},
  timestamp  = {Tue, 03 Dec 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-09070.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1911-09665,
  author     = {Cihang Xie and Mingxing Tan and Boqing Gong and Jiang Wang and Alan L. Yuille and Quoc V. Le},
  title      = {Adversarial Examples Improve Image Recognition},
  journal    = {CoRR},
  volume     = {abs/1911.09665},
  year       = {2019},
  url        = {https://arxiv.org/abs/1911.09665},
  eprinttype = {arXiv},
  eprint     = {1911.09665},
  timestamp  = {Tue, 13 Oct 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-09665.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The model name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1912-01106,
  author     = {Bo Chen and Golnaz Ghiasi and Hanxiao Liu and Tsung{-}Yi Lin and Dmitry Kalenichenko and Hartwig Adam and Quoc V. Le},
  title      = {{MnasFPN}: Learning Latency-aware Pyramid Architecture for Object Detection on Mobile Devices},
  journal    = {CoRR},
  volume     = {abs/1912.01106},
  year       = {2019},
  url        = {https://arxiv.org/abs/1912.01106},
  eprinttype = {arXiv},
  eprint     = {1912.01106},
  timestamp  = {Mon, 31 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-01106.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The model name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1912-05027,
  author     = {Xianzhi Du and Tsung{-}Yi Lin and Pengchong Jin and Golnaz Ghiasi and Mingxing Tan and Yin Cui and Quoc V. Le and Xiaodan Song},
  title      = {{SpineNet}: Learning Scale-Permuted Backbone for Recognition and Localization},
  journal    = {CoRR},
  volume     = {abs/1912.05027},
  year       = {2019},
  url        = {https://arxiv.org/abs/1912.05027},
  eprinttype = {arXiv},
  eprint     = {1912.05027},
  timestamp  = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-05027.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The method name is brace-protected against sentence-casing,
% and the arXiv link uses https like the 2020 preprint records in this file.
@article{DBLP:journals/corr/abs-1912-05533,
  author     = {Daniel S. Park and Yu Zhang and Chung{-}Cheng Chiu and Youzheng Chen and Bo Li and William Chan and Quoc V. Le and Yonghui Wu},
  title      = {{SpecAugment} on Large Scale Datasets},
  journal    = {CoRR},
  volume     = {abs/1912.05533},
  year       = {2019},
  url        = {https://arxiv.org/abs/1912.05533},
  eprinttype = {arXiv},
  eprint     = {1912.05533},
  timestamp  = {Tue, 07 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-05533.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article. The journal is stored under its full name rather than the
% DBLP abbreviation. The record carries no pages or article number.
@article{DBLP:journals/npjdm/RajkomarO0DHHLL18,
  author    = {Alvin Rajkomar and Eyal Oren and Kai Chen and Andrew M. Dai and Nissan Hajaj and
               Michaela Hardt and Peter J. Liu and Xiaobing Liu and Jake Marcus and Mimi Sun and
               Patrik Sundberg and Hector Yee and Kun Zhang and Yi Zhang and Gerardo Flores and
               Gavin E. Duggan and Jamie Irvine and Quoc Le and Kurt Litsch and Alexander Mossin and
               Justin Tansuwan and De Wang and James Wexler and Jimbo Wilson and Dana Ludwig and
               Samuel L. Volchenboum and Katherine Chou and Michael Pearson and Srinivasan Madabushi and
               Nigam H. Shah and Atul J. Butte and Michael D. Howell and Claire Cui and
               Gregory S. Corrado and Jeffrey Dean},
  title     = {Scalable and accurate deep learning with electronic health records},
  journal   = {npj Digital Medicine},
  volume    = {1},
  year      = {2018},
  url       = {https://doi.org/10.1038/s41746-018-0029-1},
  doi       = {10.1038/S41746-018-0029-1},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/npjdm/RajkomarO0DHHLL18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CVPR 2018 paper. The url field holds the raw address: the backslash escapes
% before underscores were removed because url-aware styles and biblatex treat
% this field verbatim (NOTE(review): re-escape if the target style prints url as plain text).
@inproceedings{DBLP:conf/cvpr/ZophVSL18,
  author     = {Barret Zoph and Vijay Vasudevan and Jonathon Shlens and Quoc V. Le},
  title      = {Learning Transferable Architectures for Scalable Image Recognition},
  booktitle  = {2018 {IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2018, Salt Lake City, UT, USA, June 18-22, 2018},
  pages      = {8697--8710},
  publisher  = {Computer Vision Foundation / {IEEE} Computer Society},
  year       = {2018},
  url        = {http://openaccess.thecvf.com/content_cvpr_2018/html/Zoph_Learning_Transferable_Architectures_CVPR_2018_paper.html},
  doi        = {10.1109/CVPR.2018.00907},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/cvpr/ZophVSL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2018 paper, pages 1914--1925.
@inproceedings{DBLP:conf/emnlp/ClarkLML18,
  author     = {Kevin Clark and Minh{-}Thang Luong and Christopher D. Manning and Quoc V. Le},
  editor     = {Ellen Riloff and David Chiang and Julia Hockenmaier and Jun'ichi Tsujii},
  title      = {Semi-Supervised Sequence Modeling with Cross-View Training},
  booktitle  = {Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages      = {1914--1925},
  publisher  = {Association for Computational Linguistics},
  year       = {2018},
  url        = {https://doi.org/10.18653/v1/d18-1217},
  doi        = {10.18653/V1/D18-1217},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/ClarkLML18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2018 paper, pages 3844--3854. AirDialogue is brace-protected so that
% sentence-casing styles keep its internal capital.
@inproceedings{DBLP:conf/emnlp/WeiLDL18,
  author     = {Wei Wei and Quoc V. Le and Andrew M. Dai and Jia Li},
  editor     = {Ellen Riloff and David Chiang and Julia Hockenmaier and Jun'ichi Tsujii},
  title      = {{AirDialogue}: An Environment for Goal-Oriented Dialogue Research},
  booktitle  = {Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages      = {3844--3854},
  publisher  = {Association for Computational Linguistics},
  year       = {2018},
  url        = {https://doi.org/10.18653/v1/d18-1419},
  doi        = {10.18653/V1/D18-1419},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/WeiLDL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% GECCO 2018 companion-volume paper, pages 37--38.
@inproceedings{DBLP:conf/gecco/DohanSL18,
  author     = {David Dohan and David R. So and Quoc V. Le},
  editor     = {Hern{\'{a}}n E. Aguirre and Keiki Takadama},
  title      = {Evolving modular neural sequence architectures with genetic programming},
  booktitle  = {Proceedings of the Genetic and Evolutionary Computation Conference Companion, {GECCO} 2018, Kyoto, Japan, July 15-19, 2018},
  pages      = {37--38},
  publisher  = {{ACM}},
  year       = {2018},
  url        = {https://doi.org/10.1145/3205651.3208782},
  doi        = {10.1145/3205651.3208782},
  timestamp  = {Mon, 04 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/gecco/DohanSL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 workshop-track paper; the url points to OpenReview.
@inproceedings{DBLP:conf/iclr/CubukZSL18,
  author     = {Ekin Dogus Cubuk and Barret Zoph and Samuel S. Schoenholz and Quoc V. Le},
  title      = {Intriguing Properties of Adversarial Examples},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=Skz1zaRLz},
  timestamp  = {Thu, 04 Apr 2019 13:20:09 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/CubukZSL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 conference-track paper; the url points to OpenReview.
@inproceedings{DBLP:conf/iclr/MirhoseiniGPSLD18,
  author     = {Azalia Mirhoseini and Anna Goldie and Hieu Pham and Benoit Steiner and
                Quoc V. Le and Jeff Dean},
  title      = {A Hierarchical Model for Device Placement},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=Hkc-TeZ0W},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iclr/MirhoseiniGPSLD18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 workshop-track paper; the url points to OpenReview.
@inproceedings{DBLP:conf/iclr/PhamGZLD18,
  author     = {Hieu Pham and Melody Y. Guan and Barret Zoph and Quoc V. Le and Jeff Dean},
  title      = {Faster Discovery of Neural Architectures by Searching for Paths in a Large Model},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=rJkCq4JvM},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iclr/PhamGZLD18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 workshop-track paper. The proper-noun compound Erdos-Selfridge-Spencer
% is brace-protected so that sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/iclr/RaghuIAKLK18,
  author     = {Maithra Raghu and Alex Irpan and Jacob Andreas and Robert Kleinberg and
                Quoc V. Le and Jon M. Kleinberg},
  title      = {Can Deep Reinforcement Learning solve {Erdos-Selfridge-Spencer} Games?},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=SJbKi81wf},
  timestamp  = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/RaghuIAKLK18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 workshop-track paper; the url points to OpenReview.
@inproceedings{DBLP:conf/iclr/RamachandranZL18,
  author     = {Prajit Ramachandran and Barret Zoph and Quoc V. Le},
  title      = {Searching for Activation Functions},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=Hkuq2EkPf},
  timestamp  = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/RamachandranZL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 conference-track paper; the url points to OpenReview.
@inproceedings{DBLP:conf/iclr/SmithKYL18,
  author     = {Samuel L. Smith and Pieter{-}Jan Kindermans and Chris Ying and Quoc V. Le},
  title      = {Don't Decay the Learning Rate, Increase the Batch Size},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=B1Yy1BxCZ},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/SmithKYL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 conference-track paper. Bayesian is brace-protected so that
% sentence-casing styles keep the capital of the proper adjective.
@inproceedings{DBLP:conf/iclr/SmithL18,
  author     = {Samuel L. Smith and Quoc V. Le},
  title      = {A {Bayesian} Perspective on Generalization and Stochastic Gradient Descent},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=BJij4yg0Z},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/SmithL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 workshop-track paper. The acronym RNNs is brace-protected so that
% sentence-casing styles do not lower-case it.
@inproceedings{DBLP:conf/iclr/TrinhDLL18,
  author     = {Trieu H. Trinh and Andrew M. Dai and Minh{-}Thang Luong and Quoc V. Le},
  title      = {Learning Longer-term Dependencies in {RNNs} with Auxiliary Losses},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=Hy9xDwyPM},
  timestamp  = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/TrinhDLL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2018 conference-track paper. The model name QANet is brace-protected so
% that sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/iclr/YuDLZ00L18,
  author     = {Adams Wei Yu and David Dohan and Minh{-}Thang Luong and Rui Zhao and
                Kai Chen and Mohammad Norouzi and Quoc V. Le},
  title      = {{QANet}: Combining Local Convolution with Global Self-Attention for Reading Comprehension},
  booktitle  = {6th International Conference on Learning Representations, {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2018},
  url        = {https://openreview.net/forum?id=B14TlG-RW},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/YuDLZ00L18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2018 paper, PMLR volume 80, pages 549--558.
@inproceedings{DBLP:conf/icml/BenderKZVL18,
  author     = {Gabriel Bender and Pieter{-}Jan Kindermans and Barret Zoph and
                Vijay Vasudevan and Quoc V. Le},
  editor     = {Jennifer G. Dy and Andreas Krause},
  title      = {Understanding and Simplifying One-Shot Architecture Search},
  booktitle  = {Proceedings of the 35th International Conference on Machine Learning, {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July 10-15, 2018},
  series     = {Proceedings of Machine Learning Research},
  volume     = {80},
  pages      = {549--558},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v80/bender18a.html},
  timestamp  = {Wed, 03 Apr 2019 18:17:30 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/BenderKZVL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2018 paper, PMLR volume 80, pages 4092--4101.
@inproceedings{DBLP:conf/icml/PhamGZLD18,
  author     = {Hieu Pham and Melody Y. Guan and Barret Zoph and Quoc V. Le and Jeff Dean},
  editor     = {Jennifer G. Dy and Andreas Krause},
  title      = {Efficient Neural Architecture Search via Parameter Sharing},
  booktitle  = {Proceedings of the 35th International Conference on Machine Learning, {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July 10-15, 2018},
  series     = {Proceedings of Machine Learning Research},
  volume     = {80},
  pages      = {4092--4101},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v80/pham18a.html},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/PhamGZLD18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2018 paper, PMLR volume 80. The proper-noun compound Erdos-Selfridge-Spencer
% is brace-protected so that sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/icml/RaghuIAKLK18,
  author     = {Maithra Raghu and Alex Irpan and Jacob Andreas and Robert Kleinberg and
                Quoc V. Le and Jon M. Kleinberg},
  editor     = {Jennifer G. Dy and Andreas Krause},
  title      = {Can Deep Reinforcement Learning Solve {Erdos-Selfridge-Spencer} Games?},
  booktitle  = {Proceedings of the 35th International Conference on Machine Learning, {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July 10-15, 2018},
  series     = {Proceedings of Machine Learning Research},
  volume     = {80},
  pages      = {4235--4243},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v80/raghu18a.html},
  timestamp  = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/RaghuIAKLK18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2018 paper, PMLR volume 80. The acronym RNNs is brace-protected so that
% sentence-casing styles do not lower-case it.
@inproceedings{DBLP:conf/icml/TrinhDLL18,
  author     = {Trieu H. Trinh and Andrew M. Dai and Thang Luong and Quoc V. Le},
  editor     = {Jennifer G. Dy and Andreas Krause},
  title      = {Learning Longer-term Dependencies in {RNNs} with Auxiliary Losses},
  booktitle  = {Proceedings of the 35th International Conference on Machine Learning, {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July 10-15, 2018},
  series     = {Proceedings of Machine Learning Research},
  volume     = {80},
  pages      = {4972--4981},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v80/trinh18a.html},
  timestamp  = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/TrinhDLL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2018 paper, pages 10015--10027.
@inproceedings{DBLP:conf/nips/LiangNBLL18,
  author     = {Chen Liang and Mohammad Norouzi and Jonathan Berant and Quoc V. Le and Ni Lao},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and
                Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {Memory Augmented Policy Optimization for Program Synthesis and Semantic Parsing},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {10015--10027},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/f4e369c0a468d3aeeda0593ba90b5e55-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/LiangNBLL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2018 paper, pages 10750--10760. DropBlock is brace-protected so that
% sentence-casing styles keep its internal capital.
@inproceedings{DBLP:conf/nips/GhiasiLL18,
  author     = {Golnaz Ghiasi and Tsung{-}Yi Lin and Quoc V. Le},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and
                Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {{DropBlock}: {A} regularization method for convolutional networks},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {10750--10760},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/7edcfb2d8f6a659ef4cd1e6c9b6d7079-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/GhiasiLL18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1801.03526).
@article{DBLP:journals/corr/abs-1801-03526,
  author     = {Daniel A. Abolafia and Mohammad Norouzi and Quoc V. Le},
  title      = {Neural Program Synthesis with Priority Queue Training},
  journal    = {CoRR},
  volume     = {abs/1801.03526},
  year       = {2018},
  url        = {http://arxiv.org/abs/1801.03526},
  eprinttype = {arXiv},
  eprint     = {1801.03526},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1801-03526.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1801.07860).
@article{DBLP:journals/corr/abs-1801-07860,
  author     = {Alvin Rajkomar and Eyal Oren and Kai Chen and Andrew M. Dai and
                Nissan Hajaj and Peter J. Liu and Xiaobing Liu and Mimi Sun and
                Patrik Sundberg and Hector Yee and Kun Zhang and Gavin E. Duggan and
                Gerardo Flores and Michaela Hardt and Jamie Irvine and Quoc V. Le and
                Kurt Litsch and Jake Marcus and Alexander Mossin and Justin Tansuwan and
                De Wang and James Wexler and Jimbo Wilson and Dana Ludwig and
                Samuel L. Volchenboum and Katherine Chou and Michael Pearson and
                Srinivasan Madabushi and Nigam H. Shah and Atul J. Butte and
                Michael D. Howell and Claire Cui and Greg Corrado and Jeff Dean},
  title      = {Scalable and accurate deep learning for electronic health records},
  journal    = {CoRR},
  volume     = {abs/1801.07860},
  year       = {2018},
  url        = {http://arxiv.org/abs/1801.07860},
  eprinttype = {arXiv},
  eprint     = {1801.07860},
  timestamp  = {Fri, 14 Apr 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1801-07860.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1802.01548).
@article{DBLP:journals/corr/abs-1802-01548,
  author     = {Esteban Real and Alok Aggarwal and Yanping Huang and Quoc V. Le},
  title      = {Regularized Evolution for Image Classifier Architecture Search},
  journal    = {CoRR},
  volume     = {abs/1802.01548},
  year       = {2018},
  url        = {http://arxiv.org/abs/1802.01548},
  eprinttype = {arXiv},
  eprint     = {1802.01548},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1802-01548.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1802.03268).
@article{DBLP:journals/corr/abs-1802-03268,
  author     = {Hieu Pham and Melody Y. Guan and Barret Zoph and Quoc V. Le and Jeff Dean},
  title      = {Efficient Neural Architecture Search via Parameter Sharing},
  journal    = {CoRR},
  volume     = {abs/1802.03268},
  year       = {2018},
  url        = {http://arxiv.org/abs/1802.03268},
  eprinttype = {arXiv},
  eprint     = {1802.03268},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1802-03268.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1803.00144). The acronym RNNs is brace-protected so
% that sentence-casing styles do not lower-case it.
@article{DBLP:journals/corr/abs-1803-00144,
  author     = {Trieu H. Trinh and Andrew M. Dai and Thang Luong and Quoc V. Le},
  title      = {Learning Longer-term Dependencies in {RNNs} with Auxiliary Losses},
  journal    = {CoRR},
  volume     = {abs/1803.00144},
  year       = {2018},
  url        = {http://arxiv.org/abs/1803.00144},
  eprinttype = {arXiv},
  eprint     = {1803.00144},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1803-00144.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1804.09541). The model name QANet is brace-protected
% so that sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-1804-09541,
  author     = {Adams Wei Yu and David Dohan and Minh{-}Thang Luong and Rui Zhao and
                Kai Chen and Mohammad Norouzi and Quoc V. Le},
  title      = {{QANet}: Combining Local Convolution with Global Self-Attention for Reading Comprehension},
  journal    = {CoRR},
  volume     = {abs/1804.09541},
  year       = {2018},
  url        = {http://arxiv.org/abs/1804.09541},
  eprinttype = {arXiv},
  eprint     = {1804.09541},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1804-09541.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1805.08974). The dataset name ImageNet is
% brace-protected so that sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-1805-08974,
  author     = {Simon Kornblith and Jonathon Shlens and Quoc V. Le},
  title      = {Do Better {ImageNet} Models Transfer Better?},
  journal    = {CoRR},
  volume     = {abs/1805.08974},
  year       = {2018},
  url        = {http://arxiv.org/abs/1805.08974},
  eprinttype = {arXiv},
  eprint     = {1805.08974},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1805-08974.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1805.09501). AutoAugment is brace-protected so that
% sentence-casing styles keep its internal capital.
@article{DBLP:journals/corr/abs-1805-09501,
  author     = {Ekin Dogus Cubuk and Barret Zoph and Dandelion Man{\'{e}} and
                Vijay Vasudevan and Quoc V. Le},
  title      = {{AutoAugment}: Learning Augmentation Policies from Data},
  journal    = {CoRR},
  volume     = {abs/1805.09501},
  year       = {2018},
  url        = {http://arxiv.org/abs/1805.09501},
  eprinttype = {arXiv},
  eprint     = {1805.09501},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1805-09501.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1806.02847).
@article{DBLP:journals/corr/abs-1806-02847,
  author     = {Trieu H. Trinh and Quoc V. Le},
  title      = {A Simple Method for Commonsense Reasoning},
  journal    = {CoRR},
  volume     = {abs/1806.02847},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.02847},
  eprinttype = {arXiv},
  eprint     = {1806.02847},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-02847.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1806.09597).
@article{DBLP:journals/corr/abs-1806-09597,
  author     = {Samuel L. Smith and Daniel Duckworth and Quoc V. Le and Jascha Sohl{-}Dickstein},
  title      = {Stochastic natural gradient descent draws posterior samples in function space},
  journal    = {CoRR},
  volume     = {abs/1806.09597},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.09597},
  eprinttype = {arXiv},
  eprint     = {1806.09597},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-09597.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1807.02322).
@article{DBLP:journals/corr/abs-1807-02322,
  author     = {Chen Liang and Mohammad Norouzi and Jonathan Berant and Quoc V. Le and Ni Lao},
  title      = {Memory Augmented Policy Optimization for Program Synthesis with Generalization},
  journal    = {CoRR},
  volume     = {abs/1807.02322},
  year       = {2018},
  url        = {http://arxiv.org/abs/1807.02322},
  eprinttype = {arXiv},
  eprint     = {1807.02322},
  timestamp  = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1807-02322.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1807.11626). MnasNet is brace-protected so that
% sentence-casing styles keep its internal capital.
@article{DBLP:journals/corr/abs-1807-11626,
  author     = {Mingxing Tan and Bo Chen and Ruoming Pang and Vijay Vasudevan and Quoc V. Le},
  title      = {{MnasNet}: Platform-Aware Neural Architecture Search for Mobile},
  journal    = {CoRR},
  volume     = {abs/1807.11626},
  year       = {2018},
  url        = {http://arxiv.org/abs/1807.11626},
  eprinttype = {arXiv},
  eprint     = {1807.11626},
  timestamp  = {Mon, 31 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1807-11626.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1808.02822).
@article{DBLP:journals/corr/abs-1808-02822,
  author     = {Maximilian Alber and Irwan Bello and Barret Zoph and Pieter{-}Jan Kindermans and
                Prajit Ramachandran and Quoc V. Le},
  title      = {Backprop Evolution},
  journal    = {CoRR},
  volume     = {abs/1808.02822},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.02822},
  eprinttype = {arXiv},
  eprint     = {1808.02822},
  timestamp  = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-02822.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1809.08370).
@article{DBLP:journals/corr/abs-1809-08370,
  author     = {Kevin Clark and Minh{-}Thang Luong and Christopher D. Manning and Quoc V. Le},
  title      = {Semi-Supervised Sequence Modeling with Cross-View Training},
  journal    = {CoRR},
  volume     = {abs/1809.08370},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.08370},
  eprinttype = {arXiv},
  eprint     = {1809.08370},
  timestamp  = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-08370.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1810.12890). DropBlock is brace-protected so that
% sentence-casing styles keep its internal capital.
@article{DBLP:journals/corr/abs-1810-12890,
  author     = {Golnaz Ghiasi and Tsung{-}Yi Lin and Quoc V. Le},
  title      = {{DropBlock}: {A} regularization method for convolutional networks},
  journal    = {CoRR},
  volume     = {abs/1810.12890},
  year       = {2018},
  url        = {http://arxiv.org/abs/1810.12890},
  eprinttype = {arXiv},
  eprint     = {1810.12890},
  timestamp  = {Thu, 08 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-12890.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1811.06965). GPipe is brace-protected so that
% sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-1811-06965,
  author     = {Yanping Huang and Yonglong Cheng and Dehao Chen and HyoukJoong Lee and
                Jiquan Ngiam and Quoc V. Le and Zhifeng Chen},
  title      = {{GPipe}: Efficient Training of Giant Neural Networks using Pipeline Parallelism},
  journal    = {CoRR},
  volume     = {abs/1811.06965},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.06965},
  eprinttype = {arXiv},
  eprint     = {1811.06965},
  timestamp  = {Sun, 25 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-06965.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/1811.07056).
@article{DBLP:journals/corr/abs-1811-07056,
  author     = {Jiquan Ngiam and Daiyi Peng and Vijay Vasudevan and Simon Kornblith and
                Quoc V. Le and Ruoming Pang},
  title      = {Domain Adaptive Transfer Learning with Specialist Models},
  journal    = {CoRR},
  volume     = {abs/1811.07056},
  year       = {2018},
  url        = {http://arxiv.org/abs/1811.07056},
  eprinttype = {arXiv},
  eprint     = {1811.07056},
  timestamp  = {Sun, 25 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1811-07056.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, volume 5, pages 339--351. The journal is stored under its full
% name, and doi/url hold the raw identifier without backslash-escaped underscores
% (NOTE(review): re-escape if the target style prints these fields as plain text).
@article{DBLP:journals/tacl/JohnsonSLKWCTVW17,
  author     = {Melvin Johnson and Mike Schuster and Quoc V. Le and Maxim Krikun and
                Yonghui Wu and Zhifeng Chen and Nikhil Thorat and Fernanda B. Vi{\'{e}}gas and
                Martin Wattenberg and Greg Corrado and Macduff Hughes and Jeffrey Dean},
  title      = {Google's Multilingual Neural Machine Translation System: Enabling Zero-Shot Translation},
  journal    = {Transactions of the Association for Computational Linguistics},
  volume     = {5},
  pages      = {339--351},
  year       = {2017},
  url        = {https://doi.org/10.1162/tacl_a_00065},
  doi        = {10.1162/TACL_A_00065},
  timestamp  = {Fri, 10 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tacl/JohnsonSLKWCTVW17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ACL 2017 long paper, pages 23--33. The proper noun Freebase is brace-protected
% so that sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/acl/LiangBLFL17,
  author     = {Chen Liang and Jonathan Berant and Quoc V. Le and Kenneth D. Forbus and Ni Lao},
  editor     = {Regina Barzilay and Min{-}Yen Kan},
  title      = {Neural Symbolic Machines: Learning Semantic Parsers on {Freebase} with Weak Supervision},
  booktitle  = {Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume 1: Long Papers},
  pages      = {23--33},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/P17-1003},
  doi        = {10.18653/V1/P17-1003},
  timestamp  = {Fri, 06 Aug 2021 00:40:58 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/LiangBLFL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ACL 2017 long paper, pages 1880--1890.
@inproceedings{DBLP:conf/acl/YuLL17,
  author     = {Adams Wei Yu and Hongrae Lee and Quoc V. Le},
  editor     = {Regina Barzilay and Min{-}Yen Kan},
  title      = {Learning to Skim Text},
  booktitle  = {Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume 1: Long Papers},
  pages      = {1880--1890},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/P17-1172},
  doi        = {10.18653/V1/P17-1172},
  timestamp  = {Tue, 20 Aug 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/YuLL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% EMNLP 2017 paper, pages 383--391.
@inproceedings{DBLP:conf/emnlp/RamachandranLL17,
  author     = {Prajit Ramachandran and Peter J. Liu and Quoc V. Le},
  editor     = {Martha Palmer and Rebecca Hwa and Sebastian Riedel},
  title      = {Unsupervised Pretraining for Sequence to Sequence Learning},
  booktitle  = {Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2017, Copenhagen, Denmark, September 9-11, 2017},
  pages      = {383--391},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/d17-1039},
  doi        = {10.18653/V1/D17-1039},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/RamachandranLL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2017 workshop-track paper; the url points to OpenReview.
@inproceedings{DBLP:conf/iclr/BelloPL0B17,
  author     = {Irwan Bello and Hieu Pham and Quoc V. Le and Mohammad Norouzi and Samy Bengio},
  title      = {Neural Combinatorial Optimization with Reinforcement Learning},
  booktitle  = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Workshop Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2017},
  url        = {https://openreview.net/forum?id=Bk9mxlSFx},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iclr/BelloPL0B17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2017 conference-track paper; the url points to OpenReview.
@inproceedings{DBLP:conf/iclr/ChanZLJ17,
  author     = {William Chan and Yu Zhang and Quoc V. Le and Navdeep Jaitly},
  title      = {Latent Sequence Decompositions},
  booktitle  = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2017},
  url        = {https://openreview.net/forum?id=SyQq185lg},
  timestamp  = {Tue, 09 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iclr/ChanZLJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2017 conference-track paper. HyperNetworks is brace-protected so that
% sentence-casing styles keep its internal capital.
@inproceedings{DBLP:conf/iclr/HaDL17,
  author     = {David Ha and Andrew M. Dai and Quoc V. Le},
  title      = {{HyperNetworks}},
  booktitle  = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2017},
  url        = {https://openreview.net/forum?id=rkpACe1lx},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/HaDL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2017 conference-track paper. Neural Programmer is brace-protected on the
% assumption that it is the name of a system (NOTE(review): confirm), so that
% sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/iclr/NeelakantanLAMA17,
  author     = {Arvind Neelakantan and Quoc V. Le and Mart{\'{\i}}n Abadi and Andrew McCallum and
                Dario Amodei},
  title      = {Learning a Natural Language Interface with {Neural Programmer}},
  booktitle  = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2017},
  url        = {https://openreview.net/forum?id=ry2YOrcge},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/NeelakantanLAMA17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2017 conference-track paper; the url points to OpenReview.
@inproceedings{DBLP:conf/iclr/ShazeerMMDLHD17,
  author     = {Noam Shazeer and Azalia Mirhoseini and Krzysztof Maziarz and Andy Davis and
                Quoc V. Le and Geoffrey E. Hinton and Jeff Dean},
  title      = {Outrageously Large Neural Networks: The Sparsely-Gated Mixture-of-Experts Layer},
  booktitle  = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2017},
  url        = {https://openreview.net/forum?id=B1ckMDqlg},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ShazeerMMDLHD17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2017 conference-track paper; the url points to OpenReview.
@inproceedings{DBLP:conf/iclr/ZophL17,
  author     = {Barret Zoph and Quoc V. Le},
  title      = {Neural Architecture Search with Reinforcement Learning},
  booktitle  = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher  = {OpenReview.net},
  year       = {2017},
  url        = {https://openreview.net/forum?id=r1Ue8Hcxg},
  timestamp  = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ZophL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2017 paper, PMLR volume 70, pages 459--468.
@inproceedings{DBLP:conf/icml/BelloZVL17,
  author     = {Irwan Bello and Barret Zoph and Vijay Vasudevan and Quoc V. Le},
  editor     = {Doina Precup and Yee Whye Teh},
  title      = {Neural Optimizer Search with Reinforcement Learning},
  booktitle  = {Proceedings of the 34th International Conference on Machine Learning, {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series     = {Proceedings of Machine Learning Research},
  volume     = {70},
  pages      = {459--468},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v70/bello17a.html},
  timestamp  = {Wed, 29 May 2019 08:41:45 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/BelloZVL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2017 paper, PMLR volume 70, pages 2430--2439.
@inproceedings{DBLP:conf/icml/MirhoseiniPLSLZ17,
  author     = {Azalia Mirhoseini and Hieu Pham and Quoc V. Le and Benoit Steiner and
                Rasmus Larsen and Yuefeng Zhou and Naveen Kumar and Mohammad Norouzi and
                Samy Bengio and Jeff Dean},
  editor     = {Doina Precup and Yee Whye Teh},
  title      = {Device Placement Optimization with Reinforcement Learning},
  booktitle  = {Proceedings of the 34th International Conference on Machine Learning, {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series     = {Proceedings of Machine Learning Research},
  volume     = {70},
  pages      = {2430--2439},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v70/mirhoseini17a.html},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/MirhoseiniPLSLZ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2017 paper, PMLR volume 70, pages 2902--2911.
@inproceedings{DBLP:conf/icml/RealMSSSTLK17,
  author     = {Esteban Real and Sherry Moore and Andrew Selle and Saurabh Saxena and
                Yutaka I. Leon{-}Suematsu and Jie Tan and Quoc V. Le and Alexey Kurakin},
  editor     = {Doina Precup and Yee Whye Teh},
  title      = {Large-Scale Evolution of Image Classifiers},
  booktitle  = {Proceedings of the 34th International Conference on Machine Learning, {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series     = {Proceedings of Machine Learning Research},
  volume     = {70},
  pages      = {2902--2911},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v70/real17a.html},
  timestamp  = {Tue, 04 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/RealMSSSTLK17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/WangSSWWJYXCBLA17,
  author     = {Yuxuan Wang and R. J. Skerry{-}Ryan and Daisy Stanton and Yonghui Wu and Ron J. Weiss and Navdeep Jaitly and Zongheng Yang and Ying Xiao and Zhifeng Chen and Samy Bengio and Quoc V. Le and Yannis Agiomyrgiannakis and Rob Clark and Rif A. Saurous},
  editor     = {Francisco Lacerda},
  title      = {Tacotron: Towards End-to-End Speech Synthesis},
  booktitle  = {Interspeech 2017, 18th Annual Conference of the International Speech Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages      = {4006--4010},
  publisher  = {{ISCA}},
  year       = {2017},
  url        = {https://doi.org/10.21437/Interspeech.2017-1452},
  doi        = {10.21437/INTERSPEECH.2017-1452},
  timestamp  = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/WangSSWWJYXCBLA17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/wmt/BritzLP17,
  author     = {Denny Britz and Quoc V. Le and Reid Pryzant},
  editor     = {Ondrej Bojar and Christian Buck and Rajen Chatterjee and Christian Federmann and Yvette Graham and Barry Haddow and Matthias Huck and Antonio Jimeno{-}Yepes and Philipp Koehn and Julia Kreutzer},
  title      = {Effective Domain Mixing for Neural Machine Translation},
  booktitle  = {Proceedings of the Second Conference on Machine Translation, {WMT} 2017, Copenhagen, Denmark, September 7-8, 2017},
  pages      = {118--126},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/w17-4712},
  doi        = {10.18653/V1/W17-4712},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/wmt/BritzLP17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ShazeerMMDLHD17,
  author     = {Noam Shazeer and Azalia Mirhoseini and Krzysztof Maziarz and Andy Davis and Quoc V. Le and Geoffrey E. Hinton and Jeff Dean},
  title      = {Outrageously Large Neural Networks: The Sparsely-Gated Mixture-of-Experts Layer},
  journal    = {CoRR},
  volume     = {abs/1701.06538},
  year       = {2017},
  url        = {http://arxiv.org/abs/1701.06538},
  eprinttype = {arXiv},
  eprint     = {1701.06538},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ShazeerMMDLHD17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/RealMSSSLK17,
  author     = {Esteban Real and Sherry Moore and Andrew Selle and Saurabh Saxena and Yutaka I. Leon{-}Suematsu and Quoc V. Le and Alex Kurakin},
  title      = {Large-Scale Evolution of Image Classifiers},
  journal    = {CoRR},
  volume     = {abs/1703.01041},
  year       = {2017},
  url        = {http://arxiv.org/abs/1703.01041},
  eprinttype = {arXiv},
  eprint     = {1703.01041},
  timestamp  = {Tue, 04 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/RealMSSSLK17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BritzGLL17,
  author     = {Denny Britz and Anna Goldie and Minh{-}Thang Luong and Quoc V. Le},
  title      = {Massive Exploration of Neural Machine Translation Architectures},
  journal    = {CoRR},
  volume     = {abs/1703.03906},
  year       = {2017},
  url        = {http://arxiv.org/abs/1703.03906},
  eprinttype = {arXiv},
  eprint     = {1703.03906},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BritzGLL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/WangSSWWJYXCBLA17,
  author     = {Yuxuan Wang and R. J. Skerry{-}Ryan and Daisy Stanton and Yonghui Wu and Ron J. Weiss and Navdeep Jaitly and Zongheng Yang and Ying Xiao and Zhifeng Chen and Samy Bengio and Quoc V. Le and Yannis Agiomyrgiannakis and Rob Clark and Rif A. Saurous},
  title      = {Tacotron: {A} Fully End-to-End Text-To-Speech Synthesis Model},
  journal    = {CoRR},
  volume     = {abs/1703.10135},
  year       = {2017},
  url        = {http://arxiv.org/abs/1703.10135},
  eprinttype = {arXiv},
  eprint     = {1703.10135},
  timestamp  = {Mon, 25 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/WangSSWWJYXCBLA17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/YuLL17,
  author     = {Adams Wei Yu and Hongrae Lee and Quoc V. Le},
  title      = {Learning to Skim Text},
  journal    = {CoRR},
  volume     = {abs/1704.06877},
  year       = {2017},
  url        = {http://arxiv.org/abs/1704.06877},
  eprinttype = {arXiv},
  eprint     = {1704.06877},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/YuLL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MirhoseiniPLSLZ17,
  author     = {Azalia Mirhoseini and Hieu Pham and Quoc V. Le and Benoit Steiner and Rasmus Larsen and Yuefeng Zhou and Naveen Kumar and Mohammad Norouzi and Samy Bengio and Jeff Dean},
  title      = {Device Placement Optimization with Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1706.04972},
  year       = {2017},
  url        = {http://arxiv.org/abs/1706.04972},
  eprinttype = {arXiv},
  eprint     = {1706.04972},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/MirhoseiniPLSLZ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZophVSL17,
  author     = {Barret Zoph and Vijay Vasudevan and Jonathon Shlens and Quoc V. Le},
  title      = {Learning Transferable Architectures for Scalable Image Recognition},
  journal    = {CoRR},
  volume     = {abs/1707.07012},
  year       = {2017},
  url        = {http://arxiv.org/abs/1707.07012},
  eprinttype = {arXiv},
  eprint     = {1707.07012},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ZophVSL17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1709-07417,
  author     = {Irwan Bello and Barret Zoph and Vijay Vasudevan and Quoc V. Le},
  title      = {Neural Optimizer Search with Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1709.07417},
  year       = {2017},
  url        = {http://arxiv.org/abs/1709.07417},
  eprinttype = {arXiv},
  eprint     = {1709.07417},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1709-07417.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1710-05941,
  author     = {Prajit Ramachandran and Barret Zoph and Quoc V. Le},
  title      = {Searching for Activation Functions},
  journal    = {CoRR},
  volume     = {abs/1710.05941},
  year       = {2017},
  url        = {http://arxiv.org/abs/1710.05941},
  eprinttype = {arXiv},
  eprint     = {1710.05941},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1710-05941.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The braces around "Bayesian" in the title keep the proper
% adjective capitalised under styles that sentence-case titles.
@article{DBLP:journals/corr/abs-1710-06451,
  author     = {Samuel L. Smith and Quoc V. Le},
  title      = {A {Bayesian} Perspective on Generalization and Stochastic Gradient Descent},
  journal    = {CoRR},
  volume     = {abs/1710.06451},
  year       = {2017},
  url        = {http://arxiv.org/abs/1710.06451},
  eprinttype = {arXiv},
  eprint     = {1710.06451},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1710-06451.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-00489,
  author     = {Samuel L. Smith and Pieter{-}Jan Kindermans and Quoc V. Le},
  title      = {Don't Decay the Learning Rate, Increase the Batch Size},
  journal    = {CoRR},
  volume     = {abs/1711.00489},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.00489},
  eprinttype = {arXiv},
  eprint     = {1711.00489},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-00489.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The personal names in the title are braced as one unit so
% sentence-casing styles do not lowercase "Selfridge" and "Spencer".
@article{DBLP:journals/corr/abs-1711-02301,
  author     = {Maithra Raghu and Alex Irpan and Jacob Andreas and Robert Kleinberg and Quoc V. Le and Jon M. Kleinberg},
  title      = {Can Deep Reinforcement Learning Solve {Erdos-Selfridge-Spencer} Games?},
  journal    = {CoRR},
  volume     = {abs/1711.02301},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.02301},
  eprinttype = {arXiv},
  eprint     = {1711.02301},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-02301.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-02846,
  author     = {Ekin Dogus Cubuk and Barret Zoph and Samuel S. Schoenholz and Quoc V. Le},
  title      = {Intriguing Properties of Adversarial Examples},
  journal    = {CoRR},
  volume     = {abs/1711.02846},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.02846},
  eprinttype = {arXiv},
  eprint     = {1711.02846},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-02846.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ChanJLV16,
  author     = {William Chan and Navdeep Jaitly and Quoc V. Le and Oriol Vinyals},
  title      = {Listen, attend and spell: {A} neural network for large vocabulary conversational speech recognition},
  booktitle  = {2016 {IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages      = {4960--4964},
  publisher  = {{IEEE}},
  year       = {2016},
  url        = {https://doi.org/10.1109/ICASSP.2016.7472621},
  doi        = {10.1109/ICASSP.2016.7472621},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ChanJLV16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/JaitlyLVSSB16,
  author     = {Navdeep Jaitly and Quoc V. Le and Oriol Vinyals and Ilya Sutskever and David Sussillo and Samy Bengio},
  editor     = {Daniel D. Lee and Masashi Sugiyama and Ulrike von Luxburg and Isabelle Guyon and Roman Garnett},
  title      = {An Online Sequence-to-Sequence Model Using Partial Conditioning},
  booktitle  = {Advances in Neural Information Processing Systems 29: Annual Conference on Neural Information Processing Systems 2016, December 5-10, 2016, Barcelona, Spain},
  pages      = {5067--5075},
  year       = {2016},
  url        = {https://proceedings.neurips.cc/paper/2016/hash/312351bff07989769097660a56395065-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/JaitlyLVSSB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ssw/Le16,
  author     = {Quoc V. Le},
  title      = {End-to-end Learning for Text and Speech},
  booktitle  = {The 9th {ISCA} Speech Synthesis Workshop, Sunnyvale, CA, USA, 13-15 September 2016},
  publisher  = {{ISCA}},
  year       = {2016},
  url        = {http://www.isca-speech.org/archive/SSW\_2016/abstracts/ssw9\_KN3\_Le.html},
  timestamp  = {Mon, 28 Aug 2023 21:17:54 +0200},
  biburl     = {https://dblp.org/rec/conf/ssw/Le16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/LuongLSVK15,
  author     = {Minh{-}Thang Luong and Quoc V. Le and Ilya Sutskever and Oriol Vinyals and Lukasz Kaiser},
  editor     = {Yoshua Bengio and Yann LeCun},
  title      = {Multi-task Sequence to Sequence Learning},
  booktitle  = {4th International Conference on Learning Representations, {ICLR} 2016, San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year       = {2016},
  url        = {http://arxiv.org/abs/1511.06114},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LuongLSVK15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/NeelakantanLS15,
  author     = {Arvind Neelakantan and Quoc V. Le and Ilya Sutskever},
  editor     = {Yoshua Bengio and Yann LeCun},
  title      = {Neural Programmer: Inducing Latent Programs with Gradient Descent},
  booktitle  = {4th International Conference on Learning Representations, {ICLR} 2016, San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year       = {2016},
  url        = {http://arxiv.org/abs/1511.04834},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/NeelakantanLS15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/WuSCLNMKCGMKSJL16,
  author     = {Yonghui Wu and Mike Schuster and Zhifeng Chen and Quoc V. Le and Mohammad Norouzi and Wolfgang Macherey and Maxim Krikun and Yuan Cao and Qin Gao and Klaus Macherey and Jeff Klingner and Apurva Shah and Melvin Johnson and Xiaobing Liu and Lukasz Kaiser and Stephan Gouws and Yoshikiyo Kato and Taku Kudo and Hideto Kazawa and Keith Stevens and George Kurian and Nishant Patil and Wei Wang and Cliff Young and Jason Smith and Jason Riesa and Alex Rudnick and Oriol Vinyals and Greg Corrado and Macduff Hughes and Jeffrey Dean},
  title      = {Google's Neural Machine Translation System: Bridging the Gap between Human and Machine Translation},
  journal    = {CoRR},
  volume     = {abs/1609.08144},
  year       = {2016},
  url        = {http://arxiv.org/abs/1609.08144},
  eprinttype = {arXiv},
  eprint     = {1609.08144},
  timestamp  = {Thu, 14 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/WuSCLNMKCGMKSJL16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint. The one-word camelCase title is braced so sentence-casing
% styles do not render it as "Hypernetworks".
@article{DBLP:journals/corr/HaDL16,
  author     = {David Ha and Andrew M. Dai and Quoc V. Le},
  title      = {{HyperNetworks}},
  journal    = {CoRR},
  volume     = {abs/1609.09106},
  year       = {2016},
  url        = {http://arxiv.org/abs/1609.09106},
  eprinttype = {arXiv},
  eprint     = {1609.09106},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/HaDL16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChanZLJ16,
  author     = {William Chan and Yu Zhang and Quoc V. Le and Navdeep Jaitly},
  title      = {Latent Sequence Decompositions},
  journal    = {CoRR},
  volume     = {abs/1610.03035},
  year       = {2016},
  url        = {http://arxiv.org/abs/1610.03035},
  eprinttype = {arXiv},
  eprint     = {1610.03035},
  timestamp  = {Tue, 09 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/ChanZLJ16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (long version). "Freebase" is braced in the title so
% sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/corr/LiangBLFL16,
  author     = {Chen Liang and Jonathan Berant and Quoc V. Le and Kenneth D. Forbus and Ni Lao},
  title      = {Neural Symbolic Machines: Learning Semantic Parsers on {Freebase} with Weak Supervision},
  journal    = {CoRR},
  volume     = {abs/1611.00020},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.00020},
  eprinttype = {arXiv},
  eprint     = {1611.00020},
  timestamp  = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LiangBLFL16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZophL16,
  author     = {Barret Zoph and Quoc V. Le},
  title      = {Neural Architecture Search with Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1611.01578},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.01578},
  eprinttype = {arXiv},
  eprint     = {1611.01578},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ZophL16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/RamachandranLL16,
  author     = {Prajit Ramachandran and Peter J. Liu and Quoc V. Le},
  title      = {Unsupervised Pretraining for Sequence to Sequence Learning},
  journal    = {CoRR},
  volume     = {abs/1611.02683},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.02683},
  eprinttype = {arXiv},
  eprint     = {1611.02683},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/RamachandranLL16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/JohnsonSLKWCTVW16,
  author     = {Melvin Johnson and Mike Schuster and Quoc V. Le and Maxim Krikun and Yonghui Wu and Zhifeng Chen and Nikhil Thorat and Fernanda B. Vi{\'{e}}gas and Martin Wattenberg and Greg Corrado and Macduff Hughes and Jeffrey Dean},
  title      = {Google's Multilingual Neural Machine Translation System: Enabling Zero-Shot Translation},
  journal    = {CoRR},
  volume     = {abs/1611.04558},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.04558},
  eprinttype = {arXiv},
  eprint     = {1611.04558},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/JohnsonSLKWCTVW16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/NeelakantanLAMA16,
  author     = {Arvind Neelakantan and Quoc V. Le and Mart{\'{\i}}n Abadi and Andrew McCallum and Dario Amodei},
  title      = {Learning a Natural Language Interface with Neural Programmer},
  journal    = {CoRR},
  volume     = {abs/1611.08945},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.08945},
  eprinttype = {arXiv},
  eprint     = {1611.08945},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/NeelakantanLAMA16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BelloPLNB16,
  author     = {Irwan Bello and Hieu Pham and Quoc V. Le and Mohammad Norouzi and Samy Bengio},
  title      = {Neural Combinatorial Optimization with Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/1611.09940},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.09940},
  eprinttype = {arXiv},
  eprint     = {1611.09940},
  timestamp  = {Thu, 11 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/BelloPLNB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (short version). "Freebase" is braced in the title so
% sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/corr/LiangBLFL16a,
  author     = {Chen Liang and Jonathan Berant and Quoc V. Le and Kenneth D. Forbus and Ni Lao},
  title      = {Neural Symbolic Machines: Learning Semantic Parsers on {Freebase} with Weak Supervision (Short Version)},
  journal    = {CoRR},
  volume     = {abs/1612.01197},
  year       = {2016},
  url        = {http://arxiv.org/abs/1612.01197},
  eprinttype = {arXiv},
  eprint     = {1612.01197},
  timestamp  = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LiangBLFL16a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2015 long paper. The publisher is given under the society's name,
% "Association for Computational Linguistics", as in the other ACL-published
% entries of this file.
@inproceedings{DBLP:conf/acl/LuongSLVZ15,
  author     = {Thang Luong and Ilya Sutskever and Quoc V. Le and Oriol Vinyals and Wojciech Zaremba},
  title      = {Addressing the Rare Word Problem in Neural Machine Translation},
  booktitle  = {Proceedings of the 53rd Annual Meeting of the Association for Computational Linguistics and the 7th International Joint Conference on Natural Language Processing of the Asian Federation of Natural Language Processing, {ACL} 2015, July 26-31, 2015, Beijing, China, Volume 1: Long Papers},
  pages      = {11--19},
  publisher  = {Association for Computational Linguistics},
  year       = {2015},
  url        = {https://doi.org/10.3115/v1/p15-1002},
  doi        = {10.3115/V1/P15-1002},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/LuongSLVZ15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DaiL15,
  author     = {Andrew M. Dai and Quoc V. Le},
  editor     = {Corinna Cortes and Neil D. Lawrence and Daniel D. Lee and Masashi Sugiyama and Roman Garnett},
  title      = {Semi-supervised Sequence Learning},
  booktitle  = {Advances in Neural Information Processing Systems 28: Annual Conference on Neural Information Processing Systems 2015, December 7-12, 2015, Montreal, Quebec, Canada},
  pages      = {3079--3087},
  year       = {2015},
  url        = {https://proceedings.neurips.cc/paper/2015/hash/7137debd45ae4d0ab9aa953017286b20-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/DaiL15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LeJH15,
  author     = {Quoc V. Le and Navdeep Jaitly and Geoffrey E. Hinton},
  title      = {A Simple Way to Initialize Recurrent Networks of Rectified Linear Units},
  journal    = {CoRR},
  volume     = {abs/1504.00941},
  year       = {2015},
  url        = {http://arxiv.org/abs/1504.00941},
  eprinttype = {arXiv},
  eprint     = {1504.00941},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LeJH15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/VinyalsL15,
  author     = {Oriol Vinyals and Quoc V. Le},
  title      = {A Neural Conversational Model},
  journal    = {CoRR},
  volume     = {abs/1506.05869},
  year       = {2015},
  url        = {http://arxiv.org/abs/1506.05869},
  eprinttype = {arXiv},
  eprint     = {1506.05869},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/VinyalsL15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/DaiOL15,
  author     = {Andrew M. Dai and Christopher Olah and Quoc V. Le},
  title      = {Document Embedding with Paragraph Vectors},
  journal    = {CoRR},
  volume     = {abs/1507.07998},
  year       = {2015},
  url        = {http://arxiv.org/abs/1507.07998},
  eprinttype = {arXiv},
  eprint     = {1507.07998},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/DaiOL15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChanJLV15,
  author     = {William Chan and Navdeep Jaitly and Quoc V. Le and Oriol Vinyals},
  title      = {Listen, Attend and Spell},
  journal    = {CoRR},
  volume     = {abs/1508.01211},
  year       = {2015},
  url        = {http://arxiv.org/abs/1508.01211},
  eprinttype = {arXiv},
  eprint     = {1508.01211},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ChanJLV15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/DaiL15a,
  author     = {Andrew M. Dai and Quoc V. Le},
  title      = {Semi-supervised Sequence Learning},
  journal    = {CoRR},
  volume     = {abs/1511.01432},
  year       = {2015},
  url        = {http://arxiv.org/abs/1511.01432},
  eprinttype = {arXiv},
  eprint     = {1511.01432},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/DaiL15a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/JaitlyLVSB15,
  author     = {Navdeep Jaitly and Quoc V. Le and Oriol Vinyals and Ilya Sutskever and Samy Bengio},
  title      = {An Online Sequence-to-Sequence Model Using Partial Conditioning},
  journal    = {CoRR},
  volume     = {abs/1511.04868},
  year       = {2015},
  url        = {http://arxiv.org/abs/1511.04868},
  eprinttype = {arXiv},
  eprint     = {1511.04868},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/JaitlyLVSB15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/NeelakantanVLSK15,
  author     = {Arvind Neelakantan and Luke Vilnis and Quoc V. Le and Ilya Sutskever and Lukasz Kaiser and Karol Kurach and James Martens},
  title      = {Adding Gradient Noise Improves Learning for Very Deep Networks},
  journal    = {CoRR},
  volume     = {abs/1511.06807},
  year       = {2015},
  url        = {http://arxiv.org/abs/1511.06807},
  eprinttype = {arXiv},
  eprint     = {1511.06807},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/NeelakantanVLSK15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% TACL journal article. The journal name is stored in full so that the
% bibliography style, not the database, decides whether to abbreviate it.
@article{DBLP:journals/tacl/SocherKLMN14,
  author     = {Richard Socher and Andrej Karpathy and Quoc V. Le and Christopher D. Manning and Andrew Y. Ng},
  title      = {Grounded Compositional Semantics for Finding and Describing Images with Sentences},
  journal    = {Transactions of the Association for Computational Linguistics},
  volume     = {2},
  pages      = {207--218},
  year       = {2014},
  url        = {https://doi.org/10.1162/tacl\_a\_00177},
  doi        = {10.1162/TACL\_A\_00177},
  timestamp  = {Fri, 10 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tacl/SocherKLMN14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference version (ICML 2014); the CoRR preprint of the same title is
% DBLP:journals/corr/LeM14.
@inproceedings{DBLP:conf/icml/LeM14,
  author     = {Quoc V. Le and Tom{\'{a}}s Mikolov},
  title      = {Distributed Representations of Sentences and Documents},
  booktitle  = {Proceedings of the 31st International Conference on Machine Learning, {ICML} 2014, Beijing, China, 21-26 June 2014},
  series     = {{JMLR} Workshop and Conference Proceedings},
  volume     = {32},
  pages      = {1188--1196},
  publisher  = {JMLR.org},
  year       = {2014},
  url        = {http://proceedings.mlr.press/v32/le14.html},
  timestamp  = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/LeM14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SutskeverVL14,
  author     = {Ilya Sutskever and Oriol Vinyals and Quoc V. Le},
  editor     = {Zoubin Ghahramani and Max Welling and Corinna Cortes and Neil D. Lawrence and Kilian Q. Weinberger},
  title      = {Sequence to Sequence Learning with Neural Networks},
  booktitle  = {Advances in Neural Information Processing Systems 27: Annual Conference on Neural Information Processing Systems 2014, December 8-13 2014, Montreal, Quebec, Canada},
  pages      = {3104--3112},
  year       = {2014},
  url        = {https://proceedings.neurips.cc/paper/2014/hash/a14ac55a4f27472c5d894ec1c3c743d2-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/SutskeverVL14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LeM14,
  author     = {Quoc V. Le and Tom{\'{a}}s Mikolov},
  title      = {Distributed Representations of Sentences and Documents},
  journal    = {CoRR},
  volume     = {abs/1405.4053},
  year       = {2014},
  url        = {http://arxiv.org/abs/1405.4053},
  eprinttype = {arXiv},
  eprint     = {1405.4053},
  timestamp  = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/LeM14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LeSS14,
  author     = {Quoc Viet Le and Tam{\'{a}}s Sarl{\'{o}}s and Alexander Johannes Smola},
  title      = {Fastfood: Approximate Kernel Expansions in Loglinear Time},
  journal    = {CoRR},
  volume     = {abs/1408.3060},
  year       = {2014},
  url        = {http://arxiv.org/abs/1408.3060},
  eprinttype = {arXiv},
  eprint     = {1408.3060},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LeSS14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SutskeverVL14,
  author     = {Ilya Sutskever and Oriol Vinyals and Quoc V. Le},
  title      = {Sequence to Sequence Learning with Neural Networks},
  journal    = {CoRR},
  volume     = {abs/1409.3215},
  year       = {2014},
  url        = {http://arxiv.org/abs/1409.3215},
  eprinttype = {arXiv},
  eprint     = {1409.3215},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SutskeverVL14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LuongSLVZ14,
  author     = {Thang Luong and Ilya Sutskever and Quoc V. Le and Oriol Vinyals and Wojciech Zaremba},
  title      = {Addressing the Rare Word Problem in Neural Machine Translation},
  journal    = {CoRR},
  volume     = {abs/1410.8206},
  year       = {2014},
  url        = {http://arxiv.org/abs/1410.8206},
  eprinttype = {arXiv},
  eprint     = {1410.8206},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LuongSLVZ14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@phdthesis{DBLP:phd/us/Le13a,
  author     = {Quoc V. Le},
  title      = {Scalable feature learning},
  school     = {Stanford University, {USA}},
  year       = {2013},
  url        = {https://searchworks.stanford.edu/view/10164968},
  timestamp  = {Fri, 02 Sep 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/phd/us/Le13a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/ZeilerRMMYLNSVDH13,
  author     = {Matthew D. Zeiler and Marc'Aurelio Ranzato and Rajat Monga and Mark Z. Mao and K. Yang and Quoc Viet Le and Patrick Nguyen and Andrew W. Senior and Vincent Vanhoucke and Jeffrey Dean and Geoffrey E. Hinton},
  title      = {On rectified linear units for speech processing},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages      = {3517--3521},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/ICASSP.2013.6638312},
  doi        = {10.1109/ICASSP.2013.6638312},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ZeilerRMMYLNSVDH13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/Le13,
  author     = {Quoc V. Le},
  title      = {Building high-level features using large scale unsupervised learning},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages      = {8595--8598},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/ICASSP.2013.6639343},
  doi        = {10.1109/ICASSP.2013.6639343},
  timestamp  = {Fri, 19 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/Le13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2013 paper. "Hilbert" is braced in the title so sentence-casing
% styles keep the proper name capitalised.
@inproceedings{DBLP:conf/icml/LeSS13,
  author     = {Quoc V. Le and Tam{\'{a}}s Sarl{\'{o}}s and Alexander J. Smola},
  title      = {Fastfood - Computing {Hilbert} Space Expansions in loglinear time},
  booktitle  = {Proceedings of the 30th International Conference on Machine Learning, {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series     = {{JMLR} Workshop and Conference Proceedings},
  volume     = {28},
  pages      = {244--252},
  publisher  = {JMLR.org},
  year       = {2013},
  url        = {http://proceedings.mlr.press/v28/le13.html},
  timestamp  = {Wed, 29 May 2019 08:41:45 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LeSS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MikolovLS13,
  author     = {Tom{\'{a}}s Mikolov and Quoc V. Le and Ilya Sutskever},
  title      = {Exploiting Similarities among Languages for Machine Translation},
  journal    = {CoRR},
  volume     = {abs/1309.4168},
  year       = {2013},
  url        = {http://arxiv.org/abs/1309.4168},
  eprinttype = {arXiv},
  eprint     = {1309.4168},
  timestamp  = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/MikolovLS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BengioDEILRSS13,
  author     = {Samy Bengio and Jeffrey Dean and Dumitru Erhan and Eugene Ie and Quoc V. Le and Andrew Rabinovich and Jonathon Shlens and Yoram Singer},
  title      = {Using Web Co-occurrence Statistics for Improving Image Categorization},
  journal    = {CoRR},
  volume     = {abs/1312.5697},
  year       = {2013},
  url        = {http://arxiv.org/abs/1312.5697},
  eprinttype = {arXiv},
  eprint     = {1312.5697},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/BengioDEILRSS13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LeRMDCCDN12,
  author     = {Quoc V. Le and Marc'Aurelio Ranzato and Rajat Monga and Matthieu Devin and Greg Corrado and Kai Chen and Jeffrey Dean and Andrew Y. Ng},
  title      = {Building high-level features using large scale unsupervised learning},
  booktitle  = {Proceedings of the 29th International Conference on Machine Learning, {ICML} 2012, Edinburgh, Scotland, UK, June 26 - July 1, 2012},
  publisher  = {icml.cc / Omnipress},
  year       = {2012},
  url        = {http://icml.cc/2012/papers/73.pdf},
  timestamp  = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LeRMDCCDN12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/MaasLOVNN12,
  author     = {Andrew L. Maas and Quoc V. Le and Tyler M. O'Neil and Oriol Vinyals and Patrick Nguyen and Andrew Y. Ng},
  title      = {Recurrent Neural Networks for Noise Reduction in Robust {ASR}},
  booktitle  = {{INTERSPEECH} 2012, 13th Annual Conference of the International Speech Communication Association, Portland, Oregon, USA, September 9-13, 2012},
  pages      = {22--25},
  publisher  = {{ISCA}},
  year       = {2012},
  url        = {https://doi.org/10.21437/Interspeech.2012-6},
  doi        = {10.21437/INTERSPEECH.2012-6},
  timestamp  = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/MaasLOVNN12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isbi/LeHGSBP12,
  author     = {Quoc V. Le and Ju Han and Joe W. Gray and Paul T. Spellman and Alexander Borowsky and Bahram Parvin},
  title      = {Learning invariant features of tumor signatures},
  booktitle  = {9th {IEEE} International Symposium on Biomedical Imaging: From Nano to Macro, {ISBI} 2012, May 2-5, 2012, Barcelona, Spain, Proceedings},
  pages      = {302--305},
  publisher  = {{IEEE}},
  year       = {2012},
  url        = {https://doi.org/10.1109/ISBI.2012.6235544},
  doi        = {10.1109/ISBI.2012.6235544},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/isbi/LeHGSBP12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DeanCMCDLMRSTYN12,
  author     = {Jeffrey Dean and Greg Corrado and Rajat Monga and Kai Chen and Matthieu Devin and Quoc V. Le and Mark Z. Mao and Marc'Aurelio Ranzato and Andrew W. Senior and Paul A. Tucker and Ke Yang and Andrew Y. Ng},
  editor     = {Peter L. Bartlett and Fernando C. N. Pereira and Christopher J. C. Burges and L{\'{e}}on Bottou and Kilian Q. Weinberger},
  title      = {Large Scale Distributed Deep Networks},
  booktitle  = {Advances in Neural Information Processing Systems 25: 26th Annual Conference on Neural Information Processing Systems 2012. Proceedings of a meeting held December 3-6, 2012, Lake Tahoe, Nevada, United States},
  pages      = {1232--1240},
  year       = {2012},
  url        = {https://proceedings.neurips.cc/paper/2012/hash/6aca97005c68f1206823815f66102863-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/DeanCMCDLMRSTYN12.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/cvpr/LeZYN11,
  author     = {Quoc V. Le and Will Y. Zou and Serena Y. Yeung and Andrew Y. Ng},
  title      = {Learning hierarchical invariant spatio-temporal features for action recognition with independent subspace analysis},
  booktitle  = {The 24th {IEEE} Conference on Computer Vision and Pattern Recognition, {CVPR} 2011, Colorado Springs, CO, USA, 20-25 June 2011},
  pages      = {3361--3368},
  publisher  = {{IEEE} Computer Society},
  year       = {2011},
  url        = {https://doi.org/10.1109/CVPR.2011.5995496},
  doi        = {10.1109/CVPR.2011.5995496},
  timestamp  = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/cvpr/LeZYN11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% NOTE(review): the author given name Ahbik may be a transposition of Abhik; confirm against the paper before citing.
@inproceedings{DBLP:conf/icml/LeNCLPN11,
  author     = {Quoc V. Le and Jiquan Ngiam and Adam Coates and Ahbik Lahiri and Bobby Prochnow and Andrew Y. Ng},
  editor     = {Lise Getoor and Tobias Scheffer},
  title      = {On optimization methods for deep learning},
  booktitle  = {Proceedings of the 28th International Conference on Machine Learning, {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011},
  pages      = {265--272},
  publisher  = {Omnipress},
  year       = {2011},
  url        = {https://icml.cc/2011/papers/210\_icmlpaper.pdf},
  timestamp  = {Mon, 23 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/LeNCLPN11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/LeKNN11,
  author     = {Quoc V. Le and Alexandre Karpenko and Jiquan Ngiam and Andrew Y. Ng},
  editor     = {John Shawe{-}Taylor and Richard S. Zemel and Peter L. Bartlett and Fernando C. N. Pereira and Kilian Q. Weinberger},
  title      = {{ICA} with Reconstruction Cost for Efficient Overcomplete Feature Learning},
  booktitle  = {Advances in Neural Information Processing Systems 24: 25th Annual Conference on Neural Information Processing Systems 2011. Proceedings of a meeting held 12-14 December 2011, Granada, Spain},
  pages      = {1017--1025},
  year       = {2011},
  url        = {https://proceedings.neurips.cc/paper/2011/hash/233509073ed3432027d48b1a83f5fbd2-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/LeKNN11.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record; the ICML 2012 record DBLP:conf/icml/LeRMDCCDN12 carries the same title.
@article{DBLP:journals/corr/abs-1112-6209,
  author     = {Quoc V. Le and Rajat Monga and Matthieu Devin and Greg Corrado and Kai Chen and Marc'Aurelio Ranzato and Jeffrey Dean and Andrew Y. Ng},
  title      = {Building high-level features using large scale unsupervised learning},
  journal    = {CoRR},
  volume     = {abs/1112.6209},
  year       = {2011},
  url        = {http://arxiv.org/abs/1112.6209},
  eprinttype = {arXiv},
  eprint     = {1112.6209},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1112-6209.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jmlr/TeoVSL10,
  author     = {Choon Hui Teo and S. V. N. Vishwanathan and Alexander J. Smola and Quoc V. Le},
  title      = {Bundle Methods for Regularized Risk Minimization},
  journal    = {J. Mach. Learn. Res.},
  volume     = {11},
  pages      = {311--365},
  year       = {2010},
  url        = {https://dl.acm.org/doi/10.5555/1756006.1756016},
  doi        = {10.5555/1756006.1756016},
  timestamp  = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jmlr/TeoVSL10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icra/LeKKN10,
  author     = {Quoc V. Le and David Kamm and Arda F. Kara and Andrew Y. Ng},
  title      = {Learning to grasp objects with multiple contact points},
  booktitle  = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2010, Anchorage, Alaska, USA, 3-7 May 2010},
  pages      = {5062--5069},
  publisher  = {{IEEE}},
  year       = {2010},
  url        = {https://doi.org/10.1109/ROBOT.2010.5509508},
  doi        = {10.1109/ROBOT.2010.5509508},
  timestamp  = {Wed, 03 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/LeKKN10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iros/RaoLPQSN10,
  author     = {Deepak Rao and Quoc V. Le and Thanathorn Phoka and Morgan Quigley and Attawith Sudsang and Andrew Y. Ng},
  title      = {Grasping novel objects with depth segmentation},
  booktitle  = {2010 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 18-22, 2010, Taipei, Taiwan},
  pages      = {2578--2585},
  publisher  = {{IEEE}},
  year       = {2010},
  url        = {https://doi.org/10.1109/IROS.2010.5650493},
  doi        = {10.1109/IROS.2010.5650493},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/iros/RaoLPQSN10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iros/QuigleyBSPLN10,
  author     = {Morgan Quigley and Reuben D. Brewer and Sai Prashanth Soundararaj and Vijay Pradeep and Quoc V. Le and Andrew Y. Ng},
  title      = {Low-cost accelerometers for robotic manipulator perception},
  booktitle  = {2010 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 18-22, 2010, Taipei, Taiwan},
  pages      = {6168--6174},
  publisher  = {{IEEE}},
  year       = {2010},
  url        = {https://doi.org/10.1109/IROS.2010.5649804},
  doi        = {10.1109/IROS.2010.5649804},
  timestamp  = {Mon, 22 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iros/QuigleyBSPLN10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% The fifth author is written surname-first: in first-name-first form the lowercase
% word hao would be parsed as a von particle and split off from the given names.
@inproceedings{DBLP:conf/nips/LeNCCKN10,
  author     = {Quoc V. Le and Jiquan Ngiam and Zhenghao Chen and Chia, Daniel Jin hao and Pang Wei Koh and Andrew Y. Ng},
  editor     = {John D. Lafferty and Christopher K. I. Williams and John Shawe{-}Taylor and Richard S. Zemel and Aron Culotta},
  title      = {Tiled convolutional neural networks},
  booktitle  = {Advances in Neural Information Processing Systems 23: 24th Annual Conference on Neural Information Processing Systems 2010. Proceedings of a meeting held 6-9 December 2010, Vancouver, British Columbia, Canada},
  pages      = {1279--1287},
  publisher  = {Curran Associates, Inc.},
  year       = {2010},
  url        = {https://proceedings.neurips.cc/paper/2010/hash/01f78be6f7cad02658508fe4616098a9-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/LeNCCKN10.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% JMLR journal record; the ICML 2008 record DBLP:conf/icml/QuadriantoSCL08 has the same title apart from capitalisation.
@article{DBLP:journals/jmlr/QuadriantoSCL09,
  author     = {Novi Quadrianto and Alexander J. Smola and Tib{\'{e}}rio S. Caetano and Quoc V. Le},
  title      = {Estimating Labels from Label Proportions},
  journal    = {J. Mach. Learn. Res.},
  volume     = {10},
  pages      = {2349--2374},
  year       = {2009},
  url        = {https://dl.acm.org/doi/10.5555/1577069.1755865},
  doi        = {10.5555/1577069.1755865},
  timestamp  = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jmlr/QuadriantoSCL09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% TPAMI journal record; the CoRR record DBLP:journals/corr/abs-0806-2890 and the ICCV 2007 record DBLP:conf/iccv/CaetanoCLS07 carry the same title.
@article{DBLP:journals/pami/CaetanoMCLS09,
  author     = {Tib{\'{e}}rio S. Caetano and Julian J. McAuley and Li Cheng and Quoc V. Le and Alexander J. Smola},
  title      = {Learning Graph Matching},
  journal    = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume     = {31},
  number     = {6},
  pages      = {1048--1058},
  year       = {2009},
  url        = {https://doi.org/10.1109/TPAMI.2009.28},
  doi        = {10.1109/TPAMI.2009.28},
  timestamp  = {Mon, 07 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/pami/CaetanoMCLS09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/DoLF09,
  author     = {Chuong B. Do and Quoc V. Le and Chuan{-}Sheng Foo},
  editor     = {Andrea Pohoreckyj Danyluk and L{\'{e}}on Bottou and Michael L. Littman},
  title      = {Proximal regularization for online and batch learning},
  booktitle  = {Proceedings of the 26th Annual International Conference on Machine Learning, {ICML} 2009, Montreal, Quebec, Canada, June 14-18, 2009},
  series     = {{ACM} International Conference Proceeding Series},
  volume     = {382},
  pages      = {257--264},
  publisher  = {{ACM}},
  year       = {2009},
  url        = {https://doi.org/10.1145/1553374.1553407},
  doi        = {10.1145/1553374.1553407},
  timestamp  = {Tue, 06 Nov 2018 16:58:29 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/DoLF09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% 3D in the title is brace-protected so that sentence-casing bibliography styles do not lowercase it to 3d.
@inproceedings{DBLP:conf/icra/QuigleyBGKLWN09,
  author     = {Morgan Quigley and Siddharth Batra and Stephen Gould and Ellen Klingbeil and Quoc V. Le and Ashley Wellman and Andrew Y. Ng},
  title      = {High-accuracy {3D} sensing for mobile manipulation: Improving object detection and door opening},
  booktitle  = {2009 {IEEE} International Conference on Robotics and Automation, {ICRA} 2009, Kobe, Japan, May 12-17, 2009},
  pages      = {2816--2822},
  publisher  = {{IEEE}},
  year       = {2009},
  url        = {https://doi.org/10.1109/ROBOT.2009.5152750},
  doi        = {10.1109/ROBOT.2009.5152750},
  timestamp  = {Mon, 22 May 2017 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icra/QuigleyBGKLWN09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iros/LeN09,
  author     = {Quoc V. Le and Andrew Y. Ng},
  title      = {Joint calibration of multiple sensors},
  booktitle  = {2009 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 11-15, 2009, St. Louis, MO, {USA}},
  pages      = {3651--3658},
  publisher  = {{IEEE}},
  year       = {2009},
  url        = {https://doi.org/10.1109/IROS.2009.5354272},
  doi        = {10.1109/IROS.2009.5354272},
  timestamp  = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl     = {https://dblp.org/rec/conf/iros/LeN09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iros/CoatesBLN09,
  author     = {Adam Coates and Paul Baumstarck and Quoc V. Le and Andrew Y. Ng},
  title      = {Scalable learning for object detection with {GPU} hardware},
  booktitle  = {2009 {IEEE/RSJ} International Conference on Intelligent Robots and Systems, October 11-15, 2009, St. Louis, MO, {USA}},
  pages      = {4287--4293},
  publisher  = {{IEEE}},
  year       = {2009},
  url        = {https://doi.org/10.1109/IROS.2009.5354084},
  doi        = {10.1109/IROS.2009.5354084},
  timestamp  = {Mon, 23 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iros/CoatesBLN09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/GoodfellowLSLN09,
  author     = {Ian J. Goodfellow and Quoc V. Le and Andrew M. Saxe and Honglak Lee and Andrew Y. Ng},
  editor     = {Yoshua Bengio and Dale Schuurmans and John D. Lafferty and Christopher K. I. Williams and Aron Culotta},
  title      = {Measuring Invariances in Deep Networks},
  booktitle  = {Advances in Neural Information Processing Systems 22: 23rd Annual Conference on Neural Information Processing Systems 2009. Proceedings of a meeting held 7-10 December 2009, Vancouver, British Columbia, Canada},
  pages      = {646--654},
  publisher  = {Curran Associates, Inc.},
  year       = {2009},
  url        = {https://proceedings.neurips.cc/paper/2009/hash/428fca9bc1921c25c5121f9da7815cde-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/GoodfellowLSLN09.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2008 proceedings record; the JMLR record DBLP:journals/jmlr/QuadriantoSCL09 has the same title apart from capitalisation.
@inproceedings{DBLP:conf/icml/QuadriantoSCL08,
  author     = {Novi Quadrianto and Alexander J. Smola and Tib{\'{e}}rio S. Caetano and Quoc V. Le},
  editor     = {William W. Cohen and Andrew McCallum and Sam T. Roweis},
  title      = {Estimating labels from label proportions},
  booktitle  = {Machine Learning, Proceedings of the Twenty-Fifth International Conference {(ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  series     = {{ACM} International Conference Proceeding Series},
  volume     = {307},
  pages      = {776--783},
  publisher  = {{ACM}},
  year       = {2008},
  url        = {https://doi.org/10.1145/1390156.1390254},
  doi        = {10.1145/1390156.1390254},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/QuadriantoSCL08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/ChapelleDLST08,
  author     = {Olivier Chapelle and Chuong B. Do and Quoc V. Le and Alexander J. Smola and Choon Hui Teo},
  editor     = {Daphne Koller and Dale Schuurmans and Yoshua Bengio and L{\'{e}}on Bottou},
  title      = {Tighter Bounds for Structured Estimation},
  booktitle  = {Advances in Neural Information Processing Systems 21, Proceedings of the Twenty-Second Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 8-11, 2008},
  pages      = {281--288},
  publisher  = {Curran Associates, Inc.},
  year       = {2008},
  url        = {https://proceedings.neurips.cc/paper/2008/hash/6bc24fc1ab650b25b4114e93a98f1eba-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/ChapelleDLST08.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record; the TPAMI record DBLP:journals/pami/CaetanoMCLS09 and the ICCV 2007 record DBLP:conf/iccv/CaetanoCLS07 carry the same title.
@article{DBLP:journals/corr/abs-0806-2890,
  author     = {Tib{\'{e}}rio S. Caetano and Julian J. McAuley and Li Cheng and Quoc V. Le and Alexander J. Smola},
  title      = {Learning Graph Matching},
  journal    = {CoRR},
  volume     = {abs/0806.2890},
  year       = {2008},
  url        = {http://arxiv.org/abs/0806.2890},
  eprinttype = {arXiv},
  eprint     = {0806.2890},
  timestamp  = {Mon, 07 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-0806-2890.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICCV 2007 proceedings record; the TPAMI record DBLP:journals/pami/CaetanoMCLS09 and the CoRR record DBLP:journals/corr/abs-0806-2890 carry the same title.
@inproceedings{DBLP:conf/iccv/CaetanoCLS07,
  author     = {Tib{\'{e}}rio S. Caetano and Li Cheng and Quoc V. Le and Alexander J. Smola},
  title      = {Learning Graph Matching},
  booktitle  = {{IEEE} 11th International Conference on Computer Vision, {ICCV} 2007, Rio de Janeiro, Brazil, October 14-20, 2007},
  pages      = {1--8},
  publisher  = {{IEEE} Computer Society},
  year       = {2007},
  url        = {https://doi.org/10.1109/ICCV.2007.4408838},
  doi        = {10.1109/ICCV.2007.4408838},
  timestamp  = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iccv/CaetanoCLS07.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/kdd/TeoSVL07,
  author     = {Choon Hui Teo and Alexander J. Smola and S. V. N. Vishwanathan and Quoc V. Le},
  editor     = {Pavel Berkhin and Rich Caruana and Xindong Wu},
  title      = {A scalable modular convex solver for regularized risk minimization},
  booktitle  = {Proceedings of the 13th {ACM} {SIGKDD} International Conference on Knowledge Discovery and Data Mining, San Jose, California, USA, August 12-15, 2007},
  pages      = {727--736},
  publisher  = {{ACM}},
  year       = {2007},
  url        = {https://doi.org/10.1145/1281192.1281270},
  doi        = {10.1145/1281192.1281270},
  timestamp  = {Fri, 10 Mar 2023 14:55:31 +0100},
  biburl     = {https://dblp.org/rec/conf/kdd/TeoSVL07.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/SmolaVL07,
  author     = {Alexander J. Smola and S. V. N. Vishwanathan and Quoc V. Le},
  editor     = {John C. Platt and Daphne Koller and Yoram Singer and Sam T. Roweis},
  title      = {Bundle Methods for Machine Learning},
  booktitle  = {Advances in Neural Information Processing Systems 20, Proceedings of the Twenty-First Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages      = {1377--1384},
  publisher  = {Curran Associates, Inc.},
  year       = {2007},
  url        = {https://proceedings.neurips.cc/paper/2007/hash/26337353b7962f533d78c762373b3318-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/SmolaVL07.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/WeimerKLS07,
  author     = {Markus Weimer and Alexandros Karatzoglou and Quoc V. Le and Alexander J. Smola},
  editor     = {John C. Platt and Daphne Koller and Yoram Singer and Sam T. Roweis},
  title      = {{COFI} {RANK} - Maximum Margin Matrix Factorization for Collaborative Ranking},
  booktitle  = {Advances in Neural Information Processing Systems 20, Proceedings of the Twenty-First Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages      = {1593--1600},
  publisher  = {Curran Associates, Inc.},
  year       = {2007},
  url        = {https://proceedings.neurips.cc/paper/2007/hash/f76a89f0cb91bc419542ce9fa43902dc-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/WeimerKLS07.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-0704-3359,
  author     = {Quoc V. Le and Alexander J. Smola},
  title      = {Direct Optimization of Ranking Measures},
  journal    = {CoRR},
  volume     = {abs/0704.3359},
  year       = {2007},
  url        = {http://arxiv.org/abs/0704.3359},
  eprinttype = {arXiv},
  eprint     = {0704.3359},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-0704-3359.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jmlr/TakeuchiLSS06,
  author     = {Ichiro Takeuchi and Quoc V. Le and Tim D. Sears and Alexander J. Smola},
  title      = {Nonparametric Quantile Estimation},
  journal    = {J. Mach. Learn. Res.},
  volume     = {7},
  pages      = {1231--1264},
  year       = {2006},
  url        = {http://jmlr.org/papers/v7/takeuchi06a.html},
  timestamp  = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/jmlr/TakeuchiLSS06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Gaussian in the title is brace-protected so that sentence-casing bibliography styles keep its capital letter.
@inproceedings{DBLP:conf/ecml/LeSGA06,
  author     = {Quoc V. Le and Alexander J. Smola and Thomas G{\"{a}}rtner and Yasemin Altun},
  editor     = {Johannes F{\"{u}}rnkranz and Tobias Scheffer and Myra Spiliopoulou},
  title      = {Transductive {Gaussian} Process Regression with Automatic Model Selection},
  booktitle  = {Machine Learning: {ECML} 2006, 17th European Conference on Machine Learning, Berlin, Germany, September 18-22, 2006, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {4212},
  pages      = {306--317},
  publisher  = {Springer},
  year       = {2006},
  url        = {https://doi.org/10.1007/11871842\_31},
  doi        = {10.1007/11871842\_31},
  timestamp  = {Thu, 05 Dec 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/ecml/LeSGA06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/LeSG06,
  author     = {Quoc V. Le and Alexander J. Smola and Thomas G{\"{a}}rtner},
  editor     = {William W. Cohen and Andrew W. Moore},
  title      = {Simpler knowledge-based support vector machines},
  booktitle  = {Machine Learning, Proceedings of the Twenty-Third International Conference {(ICML} 2006), Pittsburgh, Pennsylvania, USA, June 25-29, 2006},
  series     = {{ACM} International Conference Proceeding Series},
  volume     = {148},
  pages      = {521--528},
  publisher  = {{ACM}},
  year       = {2006},
  url        = {https://doi.org/10.1145/1143844.1143910},
  doi        = {10.1145/1143844.1143910},
  timestamp  = {Thu, 05 Dec 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/LeSG06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/BurgesRL06,
  author     = {Christopher J. C. Burges and Robert Ragno and Quoc Viet Le},
  editor     = {Bernhard Sch{\"{o}}lkopf and John C. Platt and Thomas Hofmann},
  title      = {Learning to Rank with Nonsmooth Cost Functions},
  booktitle  = {Advances in Neural Information Processing Systems 19, Proceedings of the Twentieth Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 4-7, 2006},
  pages      = {193--200},
  publisher  = {{MIT} Press},
  year       = {2006},
  url        = {https://proceedings.neurips.cc/paper/2006/hash/af44c4c56f385c43f2529f9b1b018f6a-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/BurgesRL06.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Gaussian in the title is brace-protected so that sentence-casing bibliography styles keep its capital letter.
@inproceedings{DBLP:conf/icml/LeSC05,
  author     = {Quoc V. Le and Alexander J. Smola and St{\'{e}}phane Canu},
  editor     = {Luc De Raedt and Stefan Wrobel},
  title      = {Heteroscedastic {Gaussian} process regression},
  booktitle  = {Machine Learning, Proceedings of the Twenty-Second International Conference {(ICML} 2005), Bonn, Germany, August 7-11, 2005},
  series     = {{ACM} International Conference Proceeding Series},
  volume     = {119},
  pages      = {489--496},
  publisher  = {{ACM}},
  year       = {2005},
  url        = {https://doi.org/10.1145/1102351.1102413},
  doi        = {10.1145/1102351.1102413},
  timestamp  = {Wed, 25 Sep 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LeSC05.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/GartnerLBSV05,
  author     = {Thomas G{\"{a}}rtner and Quoc V. Le and Simon Burton and Alexander J. Smola and S. V. N. Vishwanathan},
  title      = {Large-Scale Multiclass Transduction},
  booktitle  = {Advances in Neural Information Processing Systems 18 [Neural Information Processing Systems, {NIPS} 2005, December 5-8, 2005, Vancouver, British Columbia, Canada]},
  pages      = {411--418},
  year       = {2005},
  url        = {https://proceedings.neurips.cc/paper/2005/hash/445e1050156c6ae8c082a8422bb7dfc0-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/GartnerLBSV05.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/vldb/McCannALNVD05,
  author     = {Robert McCann and Bedoor K. AlShebli and Quoc Le and Hoa Nguyen and Long H. Vu and AnHai Doan},
  editor     = {Klemens B{\"{o}}hm and Christian S. Jensen and Laura M. Haas and Martin L. Kersten and Per{-}{\AA}ke Larson and Beng Chin Ooi},
  title      = {Mapping Maintenance for Data Integration Systems},
  booktitle  = {Proceedings of the 31st International Conference on Very Large Data Bases, Trondheim, Norway, August 30 - September 2, 2005},
  pages      = {1018--1030},
  publisher  = {{ACM}},
  year       = {2005},
  url        = {http://www.vldb.org/archives/website/2005/program/paper/fri/p1018-mccann.pdf},
  timestamp  = {Thu, 03 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/vldb/McCannALNVD05.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt-in for them to become active. All settings here will be stored as cookies with your web browser. For more information see our F.A.Q.