BibTeX records: Yoshua Bengio

download as .bib file

@comment{Local correction to the exported record: the booktitle read EAAI 2014, but this is the 2024 symposium, co-located with the AAAI 2024 and IAAI 2024 events named in the same booktitle.}
@inproceedings{DBLP:conf/aaai/000300LB24,
  author       = {Tan, Xu and
                  Qin, Tao and
                  Bian, Jiang and
                  Liu, Tie{-}Yan and
                  Bengio, Yoshua},
  editor       = {Wooldridge, Michael J. and
                  Dy, Jennifer G. and
                  Natarajan, Sriraam},
  title        = {Regeneration Learning: {A} Learning Paradigm for Data Generation},
  booktitle    = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2024, Thirty-Sixth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver,
                  Canada},
  pages        = {22614--22622},
  publisher    = {{AAAI} Press},
  year         = {2024},
  url          = {https://doi.org/10.1609/aaai.v38i20.30271},
  doi          = {10.1609/AAAI.V38I20.30271},
  timestamp    = {Wed, 27 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aaai/000300LB24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2402-01207,
  author       = {Jiralerspong, Thomas and
                  Chen, Xiaoyin and
                  More, Yash and
                  Shah, Vedant and
                  Bengio, Yoshua},
  title        = {Efficient Causal Graph Discovery Using Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2402.01207},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.01207},
  doi          = {10.48550/ARXIV.2402.01207},
  eprinttype   = {arXiv},
  eprint       = {2402.01207},
  timestamp    = {Fri, 09 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-01207.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2402-05098,
  author       = {Sendera, Marcin and
                  Kim, Minsu and
                  Mittal, Sarthak and
                  Lemos, Pablo and
                  Scimeca, Luca and
                  Rector{-}Brooks, Jarrid and
                  Adam, Alexandre and
                  Bengio, Yoshua and
                  Malkin, Nikolay},
  title        = {On diffusion models for amortized inference: Benchmarking and improving
                  stochastic control and sampling},
  journal      = {CoRR},
  volume       = {abs/2402.05098},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.05098},
  doi          = {10.48550/ARXIV.2402.05098},
  eprinttype   = {arXiv},
  eprint       = {2402.05098},
  timestamp    = {Wed, 14 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-05098.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Title: the proper noun Boltzmann is braced so that sentence-casing bibliography styles keep its capital.}
@article{DBLP:journals/corr/abs-2402-06121,
  author       = {Akhound{-}Sadegh, Tara and
                  Rector{-}Brooks, Jarrid and
                  Bose, Avishek Joey and
                  Mittal, Sarthak and
                  Lemos, Pablo and
                  Liu, Cheng{-}Hao and
                  Sendera, Marcin and
                  Ravanbakhsh, Siamak and
                  Gidel, Gauthier and
                  Bengio, Yoshua and
                  Malkin, Nikolay and
                  Tong, Alexander},
  title        = {Iterated Denoising Energy Matching for Sampling from {Boltzmann} Densities},
  journal      = {CoRR},
  volume       = {abs/2402.06121},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.06121},
  doi          = {10.48550/ARXIV.2402.06121},
  eprinttype   = {arXiv},
  eprint       = {2402.06121},
  timestamp    = {Fri, 16 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-06121.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2402-08797,
  author       = {Sastry, Girish and
                  Heim, Lennart and
                  Belfield, Haydn and
                  Anderljung, Markus and
                  Brundage, Miles and
                  Hazell, Julian and
                  O'Keefe, Cullen and
                  Hadfield, Gillian K. and
                  Ngo, Richard and
                  Pilz, Konstantin and
                  Gor, George and
                  Bluemke, Emma and
                  Shoker, Sarah and
                  Egan, Janet and
                  Trager, Robert F. and
                  Avin, Shahar and
                  Weller, Adrian and
                  Bengio, Yoshua and
                  Coyle, Diane},
  title        = {Computing Power and the Governance of Artificial Intelligence},
  journal      = {CoRR},
  volume       = {abs/2402.08797},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.08797},
  doi          = {10.48550/ARXIV.2402.08797},
  eprinttype   = {arXiv},
  eprint       = {2402.08797},
  timestamp    = {Mon, 19 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-08797.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2402-10309,
  author       = {Deleu, Tristan and
                  Nouri, Padideh and
                  Malkin, Nikolay and
                  Precup, Doina and
                  Bengio, Yoshua},
  title        = {Discrete Probabilistic Inference as Control in Multi-path Environments},
  journal      = {CoRR},
  volume       = {abs/2402.10309},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.10309},
  doi          = {10.48550/ARXIV.2402.10309},
  eprinttype   = {arXiv},
  eprint       = {2402.10309},
  timestamp    = {Mon, 26 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-10309.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csur/RolnickDKKLSRMJ23,
  author       = {Rolnick, David and
                  Donti, Priya L. and
                  Kaack, Lynn H. and
                  Kochanski, Kelly and
                  Lacoste, Alexandre and
                  Sankaran, Kris and
                  Ross, Andrew Slavin and
                  Milojevic{-}Dupont, Nikola and
                  Jaques, Natasha and
                  Waldman{-}Brown, Anna and
                  Luccioni, Alexandra Sasha and
                  Maharaj, Tegan and
                  Sherwin, Evan D. and
                  Mukkavilli, S. Karthik and
                  Kording, Konrad P. and
                  Gomes, Carla P. and
                  Ng, Andrew Y. and
                  Hassabis, Demis and
                  Platt, John C. and
                  Creutzig, Felix and
                  Chayes, Jennifer T. and
                  Bengio, Yoshua},
  title        = {Tackling Climate Change with Machine Learning},
  journal      = {{ACM} Comput. Surv.},
  volume       = {55},
  number       = {2},
  pages        = {42:1--42:96},
  year         = {2023},
  url          = {https://doi.org/10.1145/3485128},
  doi          = {10.1145/3485128},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csur/RolnickDKKLSRMJ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ethicsit/KnottPCCLBETTBRB23,
  author       = {Knott, Alistair and
                  Pedreschi, Dino and
                  Chatila, Raja and
                  Chakraborti, Tapabrata and
                  Leavy, Susan and
                  Baeza{-}Yates, Ricardo and
                  Eyers, David M. and
                  Trotman, Andrew and
                  Teal, Paul D. and
                  Biecek, Przemyslaw and
                  Russell, Stuart and
                  Bengio, Yoshua},
  title        = {Generative {AI} models should include detection mechanisms as a condition
                  for public release},
  journal      = {Ethics Inf. Technol.},
  volume       = {25},
  number       = {4},
  pages        = {55},
  year         = {2023},
  url          = {https://doi.org/10.1007/s10676-023-09728-4},
  doi          = {10.1007/S10676-023-09728-4},
  timestamp    = {Sun, 17 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ethicsit/KnottPCCLBETTBRB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/DwivediJL0BB23,
  author       = {Dwivedi, Vijay Prakash and
                  Joshi, Chaitanya K. and
                  Luu, Anh Tuan and
                  Laurent, Thomas and
                  Bengio, Yoshua and
                  Bresson, Xavier},
  title        = {Benchmarking Graph Neural Networks},
  journal      = {J. Mach. Learn. Res.},
  volume       = {24},
  pages        = {43:1--43:48},
  year         = {2023},
  url          = {http://jmlr.org/papers/v24/22-0567.html},
  timestamp    = {Tue, 13 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/DwivediJL0BB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Title: the mixed-case term GFlowNet is braced so that sentence-casing bibliography styles do not lowercase its inner capitals.}
@article{DBLP:journals/jmlr/BengioLDHTB23,
  author       = {Bengio, Yoshua and
                  Lahlou, Salem and
                  Deleu, Tristan and
                  Hu, Edward J. and
                  Tiwari, Mo and
                  Bengio, Emmanuel},
  title        = {{GFlowNet} Foundations},
  journal      = {J. Mach. Learn. Res.},
  volume       = {24},
  pages        = {210:1--210:55},
  year         = {2023},
  url          = {http://jmlr.org/papers/v24/22-0364.html},
  timestamp    = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/BengioLDHTB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Local corrections to the exported record: (1) the journal is spelled out as Nature, since a single-word journal title is not abbreviated; (2) NOTE(review): Van Katwyk is entered as a compound surname, where the export parsed only Katwyk as the surname. Confirm against the published author list.}
@article{DBLP:journals/nature/WangFD0HLCLKDAB23,
  author       = {Wang, Hanchen and
                  Fu, Tianfan and
                  Du, Yuanqi and
                  Gao, Wenhao and
                  Huang, Kexin and
                  Liu, Ziming and
                  Chandak, Payal and
                  Liu, Shengchao and
                  Van Katwyk, Peter and
                  Deac, Andreea and
                  Anandkumar, Anima and
                  Bergen, Karianne and
                  Gomes, Carla P. and
                  Ho, Shirley and
                  Kohli, Pushmeet and
                  Lasenby, Joan and
                  Leskovec, Jure and
                  Liu, Tie{-}Yan and
                  Manrai, Arjun and
                  Marks, Debora S. and
                  Ramsundar, Bharath and
                  Song, Le and
                  Sun, Jimeng and
                  Tang, Jian and
                  Velickovic, Petar and
                  Welling, Max and
                  Zhang, Linfeng and
                  Coley, Connor W. and
                  Bengio, Yoshua and
                  Zitnik, Marinka},
  title        = {Scientific discovery in the age of artificial intelligence},
  journal      = {Nature},
  volume       = {620},
  number       = {7972},
  pages        = {47--60},
  year         = {2023},
  url          = {https://doi.org/10.1038/s41586-023-06221-2},
  doi          = {10.1038/S41586-023-06221-2},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nature/WangFD0HLCLKDAB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Title: the colon is moved outside the braces around DEUP. BibTeX only recognises a colon at brace depth zero when deciding to keep the next word capitalised, so the exported form let sentence-casing styles lowercase Direct.}
@article{DBLP:journals/tmlr/LahlouJNBBRKB23,
  author       = {Lahlou, Salem and
                  Jain, Moksh and
                  Nekoei, Hadi and
                  Butoi, Victor and
                  Bertin, Paul and
                  Rector{-}Brooks, Jarrid and
                  Korablyov, Maksym and
                  Bengio, Yoshua},
  title        = {{DEUP}: Direct Epistemic Uncertainty Prediction},
  journal      = {Trans. Mach. Learn. Res.},
  volume       = {2023},
  year         = {2023},
  url          = {https://openreview.net/forum?id=eGLdVRvvfQ},
  timestamp    = {Thu, 18 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tmlr/LahlouJNBBRKB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/KumarDB23,
  author       = {Kumar, Ramnath and
                  Deleu, Tristan and
                  Bengio, Yoshua},
  editor       = {Williams, Brian and
                  Chen, Yiling and
                  Neville, Jennifer},
  title        = {The Effect of Diversity in Meta-Learning},
  booktitle    = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2023, Thirty-Fifth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February
                  7-14, 2023},
  pages        = {8396--8404},
  publisher    = {{AAAI} Press},
  year         = {2023},
  url          = {https://doi.org/10.1609/aaai.v37i7.26012},
  doi          = {10.1609/AAAI.V37I7.26012},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/KumarDB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Local correction to the exported record: the suffix Jr. is entered in the Last, Jr., First form. In the exported First Last order BibTeX took Jr. itself as the surname. NOTE(review): Tikeng is kept with the given names as in the export; confirm whether it belongs to the surname.}
@inproceedings{DBLP:conf/aaai/LiuLJNMBK23,
  author       = {Liu, Dianbo and
                  Lamb, Alex and
                  Ji, Xu and
                  Notsawo, Jr., Pascal Tikeng and
                  Mozer, Michael and
                  Bengio, Yoshua and
                  Kawaguchi, Kenji},
  editor       = {Williams, Brian and
                  Chen, Yiling and
                  Neville, Jennifer},
  title        = {Adaptive Discrete Communication Bottlenecks with Dynamic Vector Quantization
                  for Heterogeneous Representational Coarseness},
  booktitle    = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2023, Thirty-Fifth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February
                  7-14, 2023},
  pages        = {8825--8833},
  publisher    = {{AAAI} Press},
  year         = {2023},
  url          = {https://doi.org/10.1609/aaai.v37i7.26061},
  doi          = {10.1609/AAAI.V37I7.26061},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LiuLJNMBK23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eacl/PontiSBR23,
  author       = {Ponti, Edoardo Maria and
                  Sordoni, Alessandro and
                  Bengio, Yoshua and
                  Reddy, Siva},
  editor       = {Vlachos, Andreas and
                  Augenstein, Isabelle},
  title        = {Combining Parameter-efficient Modules for Task-level Generalisation},
  booktitle    = {Proceedings of the 17th Conference of the European Chapter of the
                  Association for Computational Linguistics, {EACL} 2023, Dubrovnik,
                  Croatia, May 2-6, 2023},
  pages        = {687--702},
  publisher    = {Association for Computational Linguistics},
  year         = {2023},
  url          = {https://doi.org/10.18653/v1/2023.eacl-main.49},
  doi          = {10.18653/V1/2023.EACL-MAIN.49},
  timestamp    = {Thu, 05 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eacl/PontiSBR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/FengHBA23,
  author       = {Feng, Leo and
                  Hajimirsadeghi, Hossein and
                  Bengio, Yoshua and
                  Ahmed, Mohamed Osama},
  title        = {Latent Bottlenecked Attentive Neural Processes},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=yIxtevizEA},
  timestamp    = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/FengHBA23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/LiuSBMGSMHB23,
  author       = {Liu, Dianbo and
                  Shah, Vedant and
                  Boussif, Oussama and
                  Meo, Cristian and
                  Goyal, Anirudh and
                  Shu, Tianmin and
                  Mozer, Michael Curtis and
                  Heess, Nicolas and
                  Bengio, Yoshua},
  title        = {Stateful Active Facilitator: Coordination and Environmental Heterogeneity
                  in Cooperative Multi-Agent Reinforcement Learning},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=B4maZQLLW0\_},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/LiuSBMGSMHB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Title: the mixed-case term GFlowNets is braced so that sentence-casing bibliography styles do not lowercase its inner capitals.}
@inproceedings{DBLP:conf/iclr/MalkinLDJHEZB23,
  author       = {Malkin, Nikolay and
                  Lahlou, Salem and
                  Deleu, Tristan and
                  Ji, Xu and
                  Hu, Edward J. and
                  Everett, Katie and
                  Zhang, Dinghuai and
                  Bengio, Yoshua},
  title        = {{GFlowNets} and variational inference},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=uKiE0VIluA-},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/MalkinLDJHEZB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/PanZCHB23,
  author       = {Pan, Ling and
                  Zhang, Dinghuai and
                  Courville, Aaron C. and
                  Huang, Longbo and
                  Bengio, Yoshua},
  title        = {Generative Augmented Flow Networks},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=urF\_CBK5XC0},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/PanZCHB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/TengWZB0Y23,
  author       = {Teng, Jiaye and
                  Wen, Chuan and
                  Zhang, Dinghuai and
                  Bengio, Yoshua and
                  Gao, Yang and
                  Yuan, Yang},
  title        = {Predictive Inference with Feature Conformal Prediction},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=0uRm1YmFTu},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/TengWZB0Y23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ZhangCBZ0C23,
  author       = {Zhang, Dinghuai and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Zheng, Qinqing and
                  Zhang, Amy and
                  Chen, Ricky T. Q.},
  title        = {Latent State Marginalization as a Low-cost Approach for Improving
                  Exploration},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=b0UksKFcTOL},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhangCBZ0C23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ZhangCIW0BP23,
  author       = {Zhang, Ruixiang and
                  Che, Tong and
                  Ivanovic, Boris and
                  Wang, Renhao and
                  Pavone, Marco and
                  Bengio, Yoshua and
                  Paull, Liam},
  title        = {Robust and Controllable Object-Centric Learning through Energy-based
                  Models},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=wcNtbEtcGIC},
  timestamp    = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhangCIW0BP23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/AhujaMWB23,
  author       = {Ahuja, Kartik and
                  Mahajan, Divyat and
                  Wang, Yixin and
                  Bengio, Yoshua},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Interventional Causal Representation Learning},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {372--407},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/ahuja23a.html},
  timestamp    = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/AhujaMWB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Title: the mixed-case name FAENet is braced so that sentence-casing bibliography styles do not lowercase its inner capitals.}
@inproceedings{DBLP:conf/icml/DuvalSHMMBR23,
  author       = {Duval, Alexandre and
                  Schmidt, Victor and
                  Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
                  Miret, Santiago and
                  Malliaros, Fragkiskos D. and
                  Bengio, Yoshua and
                  Rolnick, David},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {{FAENet}: Frame Averaging Equivariant {GNN} for Materials Modeling},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {9013--9033},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/duval23a.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/DuvalSHMMBR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Title: the mixed-case name GFlowNet-EM is braced so that sentence-casing bibliography styles do not lowercase its capitals.}
@inproceedings{DBLP:conf/icml/HuMJEGB23,
  author       = {Hu, Edward J. and
                  Malkin, Nikolay and
                  Jain, Moksh and
                  Everett, Katie E. and
                  Graikos, Alexandros and
                  Bengio, Yoshua},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {{GFlowNet-EM} for Learning Compositional Latent Variable Models},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {13528--13549},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/hu23c.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/HuMJEGB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Title: the mixed-case term GFlowNets is braced so that sentence-casing bibliography styles do not lowercase its capitals.}
@inproceedings{DBLP:conf/icml/JainRHRBMB23,
  author       = {Jain, Moksh and
                  Raparthy, Sharath Chandra and
                  Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
                  Rector{-}Brooks, Jarrid and
                  Bengio, Yoshua and
                  Miret, Santiago and
                  Bengio, Emmanuel},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Multi-Objective {GFlowNets}},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {14631--14653},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/jain23a.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/JainRHRBMB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/KabaMZBR23,
  author       = {Kaba, S{\'{e}}kou{-}Oumar and
                  Mondal, Arnab Kumar and
                  Zhang, Yan and
                  Bengio, Yoshua and
                  Ravanbakhsh, Siamak},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Equivariance with Learned Canonicalization Functions},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {15546--15566},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/kaba23a.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KabaMZBR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LachapelleDMMBL23,
  author       = {Lachapelle, S{\'{e}}bastien and
                  Deleu, Tristan and
                  Mahajan, Divyat and
                  Mitliagkas, Ioannis and
                  Bengio, Yoshua and
                  Lacoste{-}Julien, Simon and
                  Bertrand, Quentin},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Synergies between Disentanglement and Sparsity: Generalization and
                  Identifiability in Multi-Task Learning},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {18171--18206},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/lachapelle23a.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LachapelleDMMBL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LahlouDLZVHEBM23,
  author       = {Lahlou, Salem and
                  Deleu, Tristan and
                  Lemos, Pablo and
                  Zhang, Dinghuai and
                  Volokhova, Alexandra and
                  Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
                  Ezzine, L{\'{e}}na N{\'{e}}hale and
                  Bengio, Yoshua and
                  Malkin, Nikolay},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {A theory of continuous generative flow networks},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {18269--18300},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/lahlou23a.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LahlouDLZVHEBM23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Title: the mixed-case name GFlowOut is braced so that sentence-casing bibliography styles do not lowercase its inner capitals.}
@inproceedings{DBLP:conf/icml/LiuJDSLGMEZHJKB23,
  author       = {Liu, Dianbo and
                  Jain, Moksh and
                  Dossou, Bonaventure F. P. and
                  Shen, Qianli and
                  Lahlou, Salem and
                  Goyal, Anirudh and
                  Malkin, Nikolay and
                  Emezue, Chris Chinenye and
                  Zhang, Dinghuai and
                  Hassen, Nadhir and
                  Ji, Xu and
                  Kawaguchi, Kenji and
                  Bengio, Yoshua},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {{GFlowOut}: Dropout with Generative Flow Networks},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {21715--21729},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/liu23r.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LiuJDSLGMEZHJKB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@comment{Title: the mixed-case term GFlowNets is braced so that sentence-casing bibliography styles do not lowercase its capitals.}
@inproceedings{DBLP:conf/icml/MadanRKBJNBBM23,
  author       = {Madan, Kanika and
                  Rector{-}Brooks, Jarrid and
                  Korablyov, Maksym and
                  Bengio, Emmanuel and
                  Jain, Moksh and
                  Nica, Andrei Cristian and
                  Bosc, Tom and
                  Bengio, Yoshua and
                  Malkin, Nikolay},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Learning {GFlowNets} From Partial Episodes For Improved Convergence
                  And Stability},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {23467--23483},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/madan23a.html},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/MadanRKBJNBBM23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 conference paper (PMLR volume 202).
% Same title and authors as the arXiv record DBLP:journals/corr/abs-2302-01687.
% GFlowNets is brace-protected in the title so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/icml/PanMZB23,
  author = {Pan, Ling and
            Malkin, Nikolay and
            Zhang, Dinghuai and
            Bengio, Yoshua},
  editor = {Krause, Andreas and Brunskill, Emma and Cho, Kyunghyun and
            Engelhardt, Barbara and Sabato, Sivan and Scarlett, Jonathan},
  title = {Better Training of {GFlowNets} with Local Credit and Incomplete Trajectories},
  booktitle = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series = {Proceedings of Machine Learning Research},
  volume = {202},
  pages = {26878--26890},
  publisher = {{PMLR}},
  year = {2023},
  url = {https://proceedings.mlr.press/v202/pan23c.html},
  timestamp = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icml/PanMZB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2023 conference paper (PMLR volume 202).
% Same title and authors as the arXiv record DBLP:journals/corr/abs-2302-10866.
@inproceedings{DBLP:conf/icml/PoliMNFDBBER23,
  author = {Poli, Michael and
            Massaroli, Stefano and
            Nguyen, Eric and
            Fu, Daniel Y. and
            Dao, Tri and
            Baccus, Stephen and
            Bengio, Yoshua and
            Ermon, Stefano and
            R{\'{e}}, Christopher},
  editor = {Krause, Andreas and Brunskill, Emma and Cho, Kyunghyun and
            Engelhardt, Barbara and Sabato, Sivan and Scarlett, Jonathan},
  title = {Hyena Hierarchy: Towards Larger Convolutional Language Models},
  booktitle = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series = {Proceedings of Machine Learning Research},
  volume = {202},
  pages = {28043--28078},
  publisher = {{PMLR}},
  year = {2023},
  url = {https://proceedings.mlr.press/v202/poli23a.html},
  timestamp = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icml/PoliMNFDBBER23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2023 conference paper (PMLR volume 202).
@inproceedings{DBLP:conf/icml/TraubleGRMKBS23,
  author = {Tr{\"{a}}uble, Frederik and
            Goyal, Anirudh and
            Rahaman, Nasim and
            Mozer, Michael Curtis and
            Kawaguchi, Kenji and
            Bengio, Yoshua and
            Sch{\"{o}}lkopf, Bernhard},
  editor = {Krause, Andreas and Brunskill, Emma and Cho, Kyunghyun and
            Engelhardt, Barbara and Sabato, Sivan and Scarlett, Jonathan},
  title = {Discrete Key-Value Bottleneck},
  booktitle = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series = {Proceedings of Machine Learning Research},
  volume = {202},
  pages = {34431--34455},
  publisher = {{PMLR}},
  year = {2023},
  url = {https://proceedings.mlr.press/v202/trauble23a.html},
  timestamp = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icml/TraubleGRMKBS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper (no pages or DOI recorded in this entry).
@inproceedings{DBLP:conf/nips/0007YJMABR23,
  author = {Sun, Chen and
            Yang, Wannan and
            Jiralerspong, Thomas and
            Malenfant, Dane and
            Alsbury{-}Nealy, Benjamin and
            Bengio, Yoshua and
            Richards, Blake A.},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {Contrastive Retrospection: honing in on critical steps for rapid learning and generalization in {RL}},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/6357d6d068622c962391081d296bed69-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/0007YJMABR23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper (no pages or DOI recorded in this entry).
% DynGFN, Bayesian and GFlowNets are brace-protected in the title so
% sentence-casing styles keep their capitals.
@inproceedings{DBLP:conf/nips/Atanackovic0WLB23,
  author = {Atanackovic, Lazar and
            Tong, Alexander and
            Wang, Bo and
            Lee, Leo J. and
            Bengio, Yoshua and
            Hartford, Jason S.},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {{DynGFN}: Towards {Bayesian} Inference of Gene Regulatory Networks with {GFlowNets}},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/eb5254c4ee813d05af9c098f2d9c5708-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/Atanackovic0WLB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper (no pages or DOI recorded in this entry).
% The asterisks around day-ahead are literal characters in the recorded title.
@inproceedings{DBLP:conf/nips/BoussifBAMYBB23,
  author = {Boussif, Oussama and
            Boukachab, Ghait and
            Assouline, Dan and
            Massaroli, Stefano and
            Yuan, Tianle and
            Benabbou, Loubna and
            Bengio, Yoshua},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {Improving *day-ahead* Solar Irradiance Time Series Forecasting by Leveraging Spatio-Temporal Context},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/070a57c5ef1e58cc90201b11d369b3c2-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/BoussifBAMYBB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper (no pages or DOI recorded in this entry).
% Same title and authors as the arXiv record DBLP:journals/corr/abs-2305-19366.
% Bayesian is brace-protected in the title so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/nips/DeleuNSMCB23,
  author = {Deleu, Tristan and
            Nishikawa{-}Toomey, Mizu and
            Subramanian, Jithendaraa and
            Malkin, Nikolay and
            Charlin, Laurent and
            Bengio, Yoshua},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {Joint {Bayesian} Inference of Graphical Structure and Parameters with a Single Generative Flow Network},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/639a9a172c044fbb64175b5fad42e9a5-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/DeleuNSMCB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 paper; the URL points to the Datasets and Benchmarks abstract page.
% GEO-Bench and Earth are brace-protected in the title so sentence-casing
% styles keep their capitals.
@inproceedings{DBLP:conf/nips/LacosteLRSKLIDA23,
  author = {Lacoste, Alexandre and
            Lehmann, Nils and
            Rodr{\'{\i}}guez, Pau and
            Sherwin, Evan D. and
            Kerner, Hannah and
            L{\"{u}}tjens, Bj{\"{o}}rn and
            Irvin, Jeremy and
            Dao, David and
            Alemohammad, Hamed and
            Drouin, Alexandre and
            Gunturkun, Mehmet and
            Huang, Gabriel and
            V{\'{a}}zquez, David and
            Newman, Dava and
            Bengio, Yoshua and
            Ermon, Stefano and
            Zhu, Xiaoxiang},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {{GEO-Bench}: Toward Foundation Models for {Earth} Monitoring},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/a0644215d9cff6646fa334dfa5d29c5a-Abstract-Datasets\_and\_Benchmarks.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/LacosteLRSKLIDA23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper (no pages or DOI recorded in this entry).
% Hyena (presumably the model name, as in the Hyena Hierarchy entries of this
% file) is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/nips/MassaroliPFKPRT23,
  author = {Massaroli, Stefano and
            Poli, Michael and
            Fu, Daniel Y. and
            Kumbong, Hermann and
            Parnichkun, Rom N. and
            Romero, David W. and
            Timalsina, Aman and
            McIntyre, Quinn and
            Chen, Beidi and
            Rudra, Atri and
            Zhang, Ce and
            R{\'{e}}, Christopher and
            Ermon, Stefano and
            Bengio, Yoshua},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {Laughing {Hyena} Distillery: Extracting Compact Recurrences From Convolutions},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/371355cd42caaf83412c3fbef4688979-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/MassaroliPFKPRT23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper (no pages or DOI recorded in this entry).
% Same title and authors as the arXiv record DBLP:journals/corr/abs-2302-10503.
@inproceedings{DBLP:conf/nips/NguyenMMNALB23,
  author = {Nguyen, Trang and
            Mansouri, Amin and
            Madan, Kanika and
            Nguyen, Khuong and
            Ahuja, Kartik and
            Liu, Dianbo and
            Bengio, Yoshua},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {Reusable Slotwise Mechanisms},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/49ff6951ef47bc9bab276a31a965528e-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/NguyenMMNALB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper (no pages or DOI recorded in this entry).
% HyenaDNA is brace-protected in the title so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/nips/NguyenPFTWBMPRB23,
  author = {Nguyen, Eric and
            Poli, Michael and
            Faizi, Marjan and
            Thomas, Armin W. and
            Wornow, Michael and
            Birch{-}Sykes, Callum and
            Massaroli, Stefano and
            Patel, Aman and
            Rabideau, Clayton M. and
            Bengio, Yoshua and
            Ermon, Stefano and
            R{\'{e}}, Christopher and
            Baccus, Stephen},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {{HyenaDNA}: Long-Range Genomic Sequence Modeling at Single Nucleotide Resolution},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/86ab6927ee4ae9bde4247793c46797c7-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/NguyenPFTWBMPRB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 paper; the URL points to the Datasets and Benchmarks abstract page.
% SatBird is brace-protected in the title so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/nips/TengEABALR23,
  author = {Teng, M{\'{e}}lisande and
            Elmustafa, Amna and
            Akera, Benjamin and
            Bengio, Yoshua and
            Abdelwahed, Hager Radi and
            Larochelle, Hugo and
            Rolnick, David},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {{SatBird}: a Dataset for Bird Species Distribution Modeling using Remote Sensing and Citizen Science Data},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/ef7653bbc4655305efb89a32362e332a-Abstract-Datasets\_and\_Benchmarks.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/TengEABALR23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper (no pages or DOI recorded in this entry).
% Same authors as the arXiv record DBLP:journals/corr/abs-2305-17010, whose
% title additionally contains the word Optimization.
% GFlowNets is brace-protected in the title so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/nips/ZhangDMCBP23,
  author = {Zhang, Dinghuai and
            Dai, Hanjun and
            Malkin, Nikolay and
            Courville, Aaron C. and
            Bengio, Yoshua and
            Pan, Ling},
  editor = {Oh, Alice and Naumann, Tristan and Globerson, Amir and
            Saenko, Kate and Hardt, Moritz and Levine, Sergey},
  title = {Let the Flows Tell: Solving Graph Combinatorial Problems with {GFlowNets}},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year = {2023},
  url = {http://papers.nips.cc/paper\_files/paper/2023/hash/27571b74d6cd650b8eb6cf1837953ae8-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/nips/ZhangDMCBP23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% UAI 2023 conference paper (PMLR volume 216).
% Same title and authors as the arXiv record DBLP:journals/corr/abs-2302-09465.
@inproceedings{DBLP:conf/uai/PanZJHB23,
  author = {Pan, Ling and
            Zhang, Dinghuai and
            Jain, Moksh and
            Huang, Longbo and
            Bengio, Yoshua},
  editor = {Evans, Robin J. and Shpitser, Ilya},
  title = {Stochastic Generative Flow Networks},
  booktitle = {Uncertainty in Artificial Intelligence, {UAI} 2023, July 31 - 4 August 2023, Pittsburgh, PA, {USA}},
  series = {Proceedings of Machine Learning Research},
  volume = {216},
  pages = {1628--1638},
  publisher = {{PMLR}},
  year = {2023},
  url = {https://proceedings.mlr.press/v216/pan23a.html},
  timestamp = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl = {https://dblp.org/rec/conf/uai/PanZJHB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% UAI 2023 conference paper (PMLR volume 216).
% MixupE and Mixup are brace-protected in the title so sentence-casing styles
% keep their capitals.
@inproceedings{DBLP:conf/uai/ZouVMTPKBSK23,
  author = {Zou, Yingtian and
            Verma, Vikas and
            Mittal, Sarthak and
            Tang, Wai Hoh and
            Pham, Hieu and
            Kannala, Juho and
            Bengio, Yoshua and
            Solin, Arno and
            Kawaguchi, Kenji},
  editor = {Evans, Robin J. and Shpitser, Ilya},
  title = {{MixupE}: Understanding and improving {Mixup} from directional derivative perspective},
  booktitle = {Uncertainty in Artificial Intelligence, {UAI} 2023, July 31 - 4 August 2023, Pittsburgh, PA, {USA}},
  series = {Proceedings of Machine Learning Research},
  volume = {216},
  pages = {2597--2607},
  publisher = {{PMLR}},
  year = {2023},
  url = {https://proceedings.mlr.press/v216/zou23a.html},
  timestamp = {Mon, 15 Jan 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/uai/ZouVMTPKBSK23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2301.08846.
% Same title and authors as the AAAI 2024 entry DBLP:conf/aaai/000300LB24.
@article{DBLP:journals/corr/abs-2301-08846,
  author = {Tan, Xu and
            Qin, Tao and
            Bian, Jiang and
            Liu, Tie{-}Yan and
            Bengio, Yoshua},
  title = {Regeneration Learning: {A} Learning Paradigm for Data Generation},
  journal = {CoRR},
  volume = {abs/2301.08846},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2301.08846},
  doi = {10.48550/ARXIV.2301.08846},
  eprinttype = {arXiv},
  eprint = {2301.08846},
  timestamp = {Mon, 29 Jan 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2301-08846.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2301.11790.
@article{DBLP:journals/corr/abs-2301-11790,
  author = {Aithal, Sumukh K. and
            Goyal, Anirudh and
            Lamb, Alex and
            Bengio, Yoshua and
            Mozer, Michael},
  title = {Leveraging the Third Dimension in Contrastive Learning},
  journal = {CoRR},
  volume = {abs/2301.11790},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2301.11790},
  doi = {10.48550/ARXIV.2301.11790},
  eprinttype = {arXiv},
  eprint = {2301.11790},
  timestamp = {Tue, 31 Jan 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2301-11790.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2301.12594.
@article{DBLP:journals/corr/abs-2301-12594,
  author = {Lahlou, Salem and
            Deleu, Tristan and
            Lemos, Pablo and
            Zhang, Dinghuai and
            Volokhova, Alexandra and
            Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
            Ezzine, L{\'{e}}na N{\'{e}}hale and
            Bengio, Yoshua and
            Malkin, Nikolay},
  title = {A theory of continuous generative flow networks},
  journal = {CoRR},
  volume = {abs/2301.12594},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2301.12594},
  doi = {10.48550/ARXIV.2301.12594},
  eprinttype = {arXiv},
  eprint = {2301.12594},
  timestamp = {Wed, 01 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2301-12594.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.00482.
@article{DBLP:journals/corr/abs-2302-00482,
  author = {Tong, Alexander and
            Malkin, Nikolay and
            Huguet, Guillaume and
            Zhang, Yanlei and
            Rector{-}Brooks, Jarrid and
            Fatras, Kilian and
            Wolf, Guy and
            Bengio, Yoshua},
  title = {Conditional Flow Matching: Simulation-Free Dynamic Optimal Transport},
  journal = {CoRR},
  volume = {abs/2302.00482},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.00482},
  doi = {10.48550/ARXIV.2302.00482},
  eprinttype = {arXiv},
  eprint = {2302.00482},
  timestamp = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-00482.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.00615.
% GFlowNets and AI-Driven are brace-protected in the title so sentence-casing
% styles keep their capitals.
@article{DBLP:journals/corr/abs-2302-00615,
  author = {Jain, Moksh and
            Deleu, Tristan and
            Hartford, Jason S. and
            Liu, Cheng{-}Hao and
            Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
            Bengio, Yoshua},
  title = {{GFlowNets} for {AI-Driven} Scientific Discovery},
  journal = {CoRR},
  volume = {abs/2302.00615},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.00615},
  doi = {10.48550/ARXIV.2302.00615},
  eprinttype = {arXiv},
  eprint = {2302.00615},
  timestamp = {Thu, 04 May 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-00615.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.01687.
% Same title and authors as the ICML 2023 entry DBLP:conf/icml/PanMZB23.
% GFlowNets is brace-protected in the title so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2302-01687,
  author = {Pan, Ling and
            Malkin, Nikolay and
            Zhang, Dinghuai and
            Bengio, Yoshua},
  title = {Better Training of {GFlowNets} with Local Credit and Incomplete Trajectories},
  journal = {CoRR},
  volume = {abs/2302.01687},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.01687},
  doi = {10.48550/ARXIV.2302.01687},
  eprinttype = {arXiv},
  eprint = {2302.01687},
  timestamp = {Thu, 09 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-01687.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.04178.
% Same six authors, in a different order, as the NeurIPS 2023 entry
% DBLP:conf/nips/Atanackovic0WLB23; the two titles differ.
% DynGFN and Bayesian are brace-protected in the title so sentence-casing
% styles keep their capitals.
@article{DBLP:journals/corr/abs-2302-04178,
  author = {Atanackovic, Lazar and
            Tong, Alexander and
            Hartford, Jason S. and
            Lee, Leo J. and
            Wang, Bo and
            Bengio, Yoshua},
  title = {{DynGFN}: {Bayesian} Dynamic Causal Discovery using Generative Flow Networks},
  journal = {CoRR},
  volume = {abs/2302.04178},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.04178},
  doi = {10.48550/ARXIV.2302.04178},
  eprinttype = {arXiv},
  eprint = {2302.04178},
  timestamp = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-04178.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.05793.
% GFlowNets is brace-protected in the title so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2302-05793,
  author = {Zhang, Dinghuai and
            Pan, Ling and
            Chen, Ricky T. Q. and
            Courville, Aaron C. and
            Bengio, Yoshua},
  title = {Distributional {GFlowNets} with Quantile Flows},
  journal = {CoRR},
  volume = {abs/2302.05793},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.05793},
  doi = {10.48550/ARXIV.2302.05793},
  eprinttype = {arXiv},
  eprint = {2302.05793},
  timestamp = {Sun, 19 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-05793.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.06403.
@article{DBLP:journals/corr/abs-2302-06403,
  author = {Ji, Xu and
            Elmoznino, Eric and
            Deane, George and
            Constant, Axel and
            Dumas, Guillaume and
            Lajoie, Guillaume and
            Simon, Jonathan and
            Bengio, Yoshua},
  title = {Sources of Richness and Ineffability for Phenomenally Conscious States},
  journal = {CoRR},
  volume = {abs/2302.06403},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.06403},
  doi = {10.48550/ARXIV.2302.06403},
  eprinttype = {arXiv},
  eprint = {2302.06403},
  timestamp = {Mon, 20 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-06403.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.06576.
% GFlowNet-EM is brace-protected in the title so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2302-06576,
  author = {Hu, Edward J. and
            Malkin, Nikolay and
            Jain, Moksh and
            Everett, Katie and
            Graikos, Alexandros and
            Bengio, Yoshua},
  title = {{GFlowNet-EM} for learning compositional latent variable models},
  journal = {CoRR},
  volume = {abs/2302.06576},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.06576},
  doi = {10.48550/ARXIV.2302.06576},
  eprinttype = {arXiv},
  eprint = {2302.06576},
  timestamp = {Mon, 20 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-06576.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.09465.
% Same title and authors as the UAI 2023 entry DBLP:conf/uai/PanZJHB23.
@article{DBLP:journals/corr/abs-2302-09465,
  author = {Pan, Ling and
            Zhang, Dinghuai and
            Jain, Moksh and
            Huang, Longbo and
            Bengio, Yoshua},
  title = {Stochastic Generative Flow Networks},
  journal = {CoRR},
  volume = {abs/2302.09465},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.09465},
  doi = {10.48550/ARXIV.2302.09465},
  eprinttype = {arXiv},
  eprint = {2302.09465},
  timestamp = {Thu, 23 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-09465.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.10503.
% Same title and authors as the NeurIPS 2023 entry DBLP:conf/nips/NguyenMMNALB23.
@article{DBLP:journals/corr/abs-2302-10503,
  author = {Nguyen, Trang and
            Mansouri, Amin and
            Madan, Kanika and
            Nguyen, Khuong and
            Ahuja, Kartik and
            Liu, Dianbo and
            Bengio, Yoshua},
  title = {Reusable Slotwise Mechanisms},
  journal = {CoRR},
  volume = {abs/2302.10503},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.10503},
  doi = {10.48550/ARXIV.2302.10503},
  eprinttype = {arXiv},
  eprint = {2302.10503},
  timestamp = {Fri, 24 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-10503.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2302.10866.
% Same title and authors as the ICML 2023 entry DBLP:conf/icml/PoliMNFDBBER23.
@article{DBLP:journals/corr/abs-2302-10866,
  author = {Poli, Michael and
            Massaroli, Stefano and
            Nguyen, Eric and
            Fu, Daniel Y. and
            Dao, Tri and
            Baccus, Stephen and
            Bengio, Yoshua and
            Ermon, Stefano and
            R{\'{e}}, Christopher},
  title = {Hyena Hierarchy: Towards Larger Convolutional Language Models},
  journal = {CoRR},
  volume = {abs/2302.10866},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2302.10866},
  doi = {10.48550/ARXIV.2302.10866},
  eprinttype = {arXiv},
  eprint = {2302.10866},
  timestamp = {Fri, 24 Feb 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-2302-10866.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2305.05577.
% FAENet is brace-protected in the title (GNN already was) so sentence-casing
% styles keep its capitals.
@article{DBLP:journals/corr/abs-2305-05577,
  author = {Duval, Alexandre and
            Schmidt, Victor and
            Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
            Miret, Santiago and
            Malliaros, Fragkiskos D. and
            Bengio, Yoshua and
            Rolnick, David},
  title = {{FAENet}: Frame Averaging Equivariant {GNN} for Materials Modeling},
  journal = {CoRR},
  volume = {abs/2305.05577},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2305.05577},
  doi = {10.48550/ARXIV.2305.05577},
  eprinttype = {arXiv},
  eprint = {2305.05577},
  timestamp = {Mon, 15 May 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2305-05577.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2305.14567.
@article{DBLP:journals/corr/abs-2305-14567,
  author = {Feng, Leo and
            Tung, Frederick and
            Hajimirsadeghi, Hossein and
            Bengio, Yoshua and
            Ahmed, Mohamed Osama},
  title = {Constant Memory Attentive Neural Processes},
  journal = {CoRR},
  volume = {abs/2305.14567},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2305.14567},
  doi = {10.48550/ARXIV.2305.14567},
  eprinttype = {arXiv},
  eprint = {2305.14567},
  timestamp = {Tue, 06 Jun 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2305-14567.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv (CoRR) record 2305.15324.
@article{DBLP:journals/corr/abs-2305-15324,
  author = {Shevlane, Toby and
            Farquhar, Sebastian and
            Garfinkel, Ben and
            Phuong, Mary and
            Whittlestone, Jess and
            Leung, Jade and
            Kokotajlo, Daniel and
            Marchal, Nahema and
            Anderljung, Markus and
            Kolt, Noam and
            Ho, Lewis and
            Siddarth, Divya and
            Avin, Shahar and
            Hawkins, Will and
            Kim, Been and
            Gabriel, Iason and
            Bolina, Vijay and
            Clark, Jack and
            Bengio, Yoshua and
            Christiano, Paul F. and
            Dafoe, Allan},
  title = {Model evaluation for extreme risks},
  journal = {CoRR},
  volume = {abs/2305.15324},
  year = {2023},
  url = {https://doi.org/10.48550/arXiv.2305.15324},
  doi = {10.48550/ARXIV.2305.15324},
  eprinttype = {arXiv},
  eprint = {2305.15324},
  timestamp = {Tue, 06 Jun 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-2305-15324.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-17010,
  author     = {Dinghuai Zhang and
                Hanjun Dai and
                Nikolay Malkin and
                Aaron C. Courville and
                Yoshua Bengio and
                Ling Pan},
  title      = {Let the Flows Tell: Solving Graph Combinatorial Optimization Problems
                with {GFlowNets}},
  journal    = {CoRR},
  volume     = {abs/2305.17010},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.17010},
  doi        = {10.48550/ARXIV.2305.17010},
  eprinttype = {arXiv},
  eprint     = {2305.17010},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-17010.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-17375,
  author     = {Dianbo Liu and
                Samuele Bolotta and
                He Zhu and
                Yoshua Bengio and
                Guillaume Dumas},
  title      = {Attention Schema in Neural Agents},
  journal    = {CoRR},
  volume     = {abs/2305.17375},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.17375},
  doi        = {10.48550/ARXIV.2305.17375},
  eprinttype = {arXiv},
  eprint     = {2305.17375},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-17375.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-19366,
  author     = {Tristan Deleu and
                Mizu Nishikawa{-}Toomey and
                Jithendaraa Subramanian and
                Nikolay Malkin and
                Laurent Charlin and
                Yoshua Bengio},
  title      = {Joint {Bayesian} Inference of Graphical Structure and Parameters with
                a Single Generative Flow Network},
  journal    = {CoRR},
  volume     = {abs/2305.19366},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.19366},
  doi        = {10.48550/ARXIV.2305.19366},
  eprinttype = {arXiv},
  eprint     = {2305.19366},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-19366.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2305-19550,
  author     = {Ayush Chakravarthy and
                Trang Nguyen and
                Anirudh Goyal and
                Yoshua Bengio and
                Michael C. Mozer},
  title      = {Spotlight Attention: Robust Object-Centric Learning With a Spatial
                Locality Prior},
  journal    = {CoRR},
  volume     = {abs/2305.19550},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.19550},
  doi        = {10.48550/ARXIV.2305.19550},
  eprinttype = {arXiv},
  eprint     = {2305.19550},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-19550.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-01112,
  author     = {Oussama Boussif and
                Ghait Boukachab and
                Dan Assouline and
                Stefano Massaroli and
                Tianle Yuan and
                Loubna Benabbou and
                Yoshua Bengio},
  title      = {What if We Enrich day-ahead Solar Irradiance Time Series Forecasting
                with Spatio-Temporal Context?},
  journal    = {CoRR},
  volume     = {abs/2306.01112},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.01112},
  doi        = {10.48550/ARXIV.2306.01112},
  eprinttype = {arXiv},
  eprint     = {2306.01112},
  timestamp  = {Mon, 12 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-01112.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-02204,
  author     = {Aniket Didolkar and
                Anirudh Goyal and
                Yoshua Bengio},
  title      = {Cycle Consistency Driven Object Discovery},
  journal    = {CoRR},
  volume     = {abs/2306.02204},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.02204},
  doi        = {10.48550/ARXIV.2306.02204},
  eprinttype = {arXiv},
  eprint     = {2306.02204},
  timestamp  = {Mon, 12 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-02204.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-03831,
  author     = {Alexandre Lacoste and
                Nils Lehmann and
                Pau Rodr{\'{\i}}guez and
                Evan David Sherwin and
                Hannah Kerner and
                Bj{\"{o}}rn L{\"{u}}tjens and
                Jeremy Andrew Irvin and
                David Dao and
                Hamed Alemohammad and
                Alexandre Drouin and
                Mehmet Gunturkun and
                Gabriel Huang and
                David V{\'{a}}zquez and
                Dava Newman and
                Yoshua Bengio and
                Stefano Ermon and
                Xiao Xiang Zhu},
  title      = {{GEO-Bench}: Toward Foundation Models for {Earth} Monitoring},
  journal    = {CoRR},
  volume     = {abs/2306.03831},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.03831},
  doi        = {10.48550/ARXIV.2306.03831},
  eprinttype = {arXiv},
  eprint     = {2306.03831},
  timestamp  = {Tue, 13 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-03831.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-11715,
  author     = {Alex Hern{\'{a}}ndez{-}Garc{\'{\i}}a and
                Nikita Saxena and
                Moksh Jain and
                Cheng{-}Hao Liu and
                Yoshua Bengio},
  title      = {Multi-Fidelity Active Learning with {GFlowNets}},
  journal    = {CoRR},
  volume     = {abs/2306.11715},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.11715},
  doi        = {10.48550/ARXIV.2306.11715},
  eprinttype = {arXiv},
  eprint     = {2306.11715},
  timestamp  = {Sun, 25 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-11715.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-12599,
  author     = {Leo Feng and
                Frederick Tung and
                Hossein Hajimirsadeghi and
                Yoshua Bengio and
                Mohamed Osama Ahmed},
  title      = {Constant Memory Attention Block},
  journal    = {CoRR},
  volume     = {abs/2306.12599},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.12599},
  doi        = {10.48550/ARXIV.2306.12599},
  eprinttype = {arXiv},
  eprint     = {2306.12599},
  timestamp  = {Tue, 27 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-12599.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-15058,
  author     = {Shreshth A. Malik and
                Salem Lahlou and
                Andrew Jesson and
                Moksh Jain and
                Nikolay Malkin and
                Tristan Deleu and
                Yoshua Bengio and
                Yarin Gal},
  title      = {{BatchGFN}: Generative Flow Networks for Batch Active Learning},
  journal    = {CoRR},
  volume     = {abs/2306.15058},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.15058},
  doi        = {10.48550/ARXIV.2306.15058},
  eprinttype = {arXiv},
  eprint     = {2306.15058},
  timestamp  = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-15058.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-15794,
  author     = {Eric Nguyen and
                Michael Poli and
                Marjan Faizi and
                Armin W. Thomas and
                Callum Birch{-}Sykes and
                Michael Wornow and
                Aman Patel and
                Clayton M. Rabideau and
                Stefano Massaroli and
                Yoshua Bengio and
                Stefano Ermon and
                Stephen A. Baccus and
                Christopher R{\'{e}}},
  title      = {{HyenaDNA}: Long-Range Genomic Sequence Modeling at Single Nucleotide
                Resolution},
  journal    = {CoRR},
  volume     = {abs/2306.15794},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.15794},
  doi        = {10.48550/ARXIV.2306.15794},
  eprinttype = {arXiv},
  eprint     = {2306.15794},
  timestamp  = {Fri, 30 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-15794.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2306-17693,
  author     = {Jarrid Rector{-}Brooks and
                Kanika Madan and
                Moksh Jain and
                Maksym Korablyov and
                Cheng{-}Hao Liu and
                Sarath Chandar and
                Nikolay Malkin and
                Yoshua Bengio},
  title      = {{Thompson} sampling for improved exploration in {GFlowNets}},
  journal    = {CoRR},
  volume     = {abs/2306.17693},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.17693},
  doi        = {10.48550/ARXIV.2306.17693},
  eprinttype = {arXiv},
  eprint     = {2306.17693},
  timestamp  = {Mon, 03 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-17693.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-01422,
  author     = {Tristan Deleu and
                Yoshua Bengio},
  title      = {Generative Flow Networks: a {Markov} Chain Perspective},
  journal    = {CoRR},
  volume     = {abs/2307.01422},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.01422},
  doi        = {10.48550/ARXIV.2307.01422},
  eprinttype = {arXiv},
  eprint     = {2307.01422},
  timestamp  = {Mon, 10 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-01422.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-03672,
  author     = {Alexander Tong and
                Nikolay Malkin and
                Kilian Fatras and
                Lazar Atanackovic and
                Yanlei Zhang and
                Guillaume Huguet and
                Guy Wolf and
                Yoshua Bengio},
  title      = {Simulation-free {Schr{\"{o}}dinger} bridges via score and flow
                matching},
  journal    = {CoRR},
  volume     = {abs/2307.03672},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.03672},
  doi        = {10.48550/ARXIV.2307.03672},
  eprinttype = {arXiv},
  eprint     = {2307.03672},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-03672.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-04699,
  author     = {Lewis Ho and
                Joslyn Barnhart and
                Robert Trager and
                Yoshua Bengio and
                Miles Brundage and
                Allison Carnegie and
                Rumman Chowdhury and
                Allan Dafoe and
                Gillian K. Hadfield and
                Margaret Levi and
                Duncan Snidal},
  title      = {International Institutions for Advanced {AI}},
  journal    = {CoRR},
  volume     = {abs/2307.04699},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.04699},
  doi        = {10.48550/ARXIV.2307.04699},
  eprinttype = {arXiv},
  eprint     = {2307.04699},
  timestamp  = {Mon, 24 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-04699.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-04988,
  author     = {Chris Chinenye Emezue and
                Alexandre Drouin and
                Tristan Deleu and
                Stefan Bauer and
                Yoshua Bengio},
  title      = {Benchmarking {Bayesian} Causal Discovery Methods for Downstream Treatment
                Effect Estimation},
  journal    = {CoRR},
  volume     = {abs/2307.04988},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.04988},
  doi        = {10.48550/ARXIV.2307.04988},
  eprinttype = {arXiv},
  eprint     = {2307.04988},
  timestamp  = {Mon, 24 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-04988.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2307-06951,
  author     = {Yoshua Bengio and
                Prateek Gupta and
                Lu Li and
                Soham Phade and
                Sunil Srinivasa and
                Andrew Williams and
                Tianyu Zhang and
                Yang Zhang and
                Stephan Zheng},
  title      = {{AI} For Global Climate Cooperation 2023 Competition Proceedings},
  journal    = {CoRR},
  volume     = {abs/2307.06951},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.06951},
  doi        = {10.48550/ARXIV.2307.06951},
  eprinttype = {arXiv},
  eprint     = {2307.06951},
  timestamp  = {Mon, 24 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-06951.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2308-08708,
  author     = {Patrick Butlin and
                Robert Long and
                Eric Elmoznino and
                Yoshua Bengio and
                Jonathan Birch and
                Axel Constant and
                George Deane and
                Stephen M. Fleming and
                Chris Frith and
                Xu Ji and
                Ryota Kanai and
                Colin Klein and
                Grace Lindsay and
                Matthias Michel and
                Liad Mudrik and
                Megan A. K. Peters and
                Eric Schwitzgebel and
                Jonathan Simon and
                Rufin VanRullen},
  title      = {Consciousness in Artificial Intelligence: Insights from the Science
                of Consciousness},
  journal    = {CoRR},
  volume     = {abs/2308.08708},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2308.08708},
  doi        = {10.48550/ARXIV.2308.08708},
  eprinttype = {arXiv},
  eprint     = {2308.08708},
  timestamp  = {Fri, 25 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2308-08708.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2309-17388,
  author     = {Leo Feng and
                Frederick Tung and
                Hossein Hajimirsadeghi and
                Yoshua Bengio and
                Mohamed Osama Ahmed},
  title      = {Tree Cross Attention},
  journal    = {CoRR},
  volume     = {abs/2309.17388},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.17388},
  doi        = {10.48550/ARXIV.2309.17388},
  eprinttype = {arXiv},
  eprint     = {2309.17388},
  timestamp  = {Tue, 17 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-17388.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-00229,
  author     = {Mingde Zhao and
                Safa Alver and
                Harm van Seijen and
                Romain Laroche and
                Doina Precup and
                Yoshua Bengio},
  title      = {Combining Spatial and Temporal Abstraction in Planning for Better
                Generalization},
  journal    = {CoRR},
  volume     = {abs/2310.00229},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.00229},
  doi        = {10.48550/ARXIV.2310.00229},
  eprinttype = {arXiv},
  eprint     = {2310.00229},
  timestamp  = {Wed, 18 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-00229.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-01807,
  author     = {Andrew Nam and
                Eric Elmoznino and
                Nikolay Malkin and
                Chen Sun and
                Yoshua Bengio and
                Guillaume Lajoie},
  title      = {Discrete, compositional, and symbolic representations through attractor
                dynamics},
  journal    = {CoRR},
  volume     = {abs/2310.01807},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.01807},
  doi        = {10.48550/ARXIV.2310.01807},
  eprinttype = {arXiv},
  eprint     = {2310.01807},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-01807.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-02230,
  author     = {Luca Scimeca and
                Alexander Rubinstein and
                Armand Mihai Nicolicioiu and
                Damien Teney and
                Yoshua Bengio},
  title      = {Leveraging Diffusion Disentangled Representations to Mitigate Shortcuts
                in Underspecified Visual Tasks},
  journal    = {CoRR},
  volume     = {abs/2310.02230},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02230},
  doi        = {10.48550/ARXIV.2310.02230},
  eprinttype = {arXiv},
  eprint     = {2310.02230},
  timestamp  = {Mon, 06 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02230.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-02423,
  author     = {Jean{-}Pierre Falet and
                Hae Beom Lee and
                Nikolay Malkin and
                Chen Sun and
                Dragos Secrieru and
                Dinghuai Zhang and
                Guillaume Lajoie and
                Yoshua Bengio},
  title      = {{Delta-AI}: Local objectives for amortized inference in sparse graphical
                models},
  journal    = {CoRR},
  volume     = {abs/2310.02423},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02423},
  doi        = {10.48550/ARXIV.2310.02423},
  eprinttype = {arXiv},
  eprint     = {2310.02423},
  timestamp  = {Fri, 20 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02423.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-02679,
  author     = {Dinghuai Zhang and
                Ricky Tian Qi Chen and
                Cheng{-}Hao Liu and
                Aaron C. Courville and
                Yoshua Bengio},
  title      = {Diffusion Generative Flow Samplers: Improving learning signals through
                partial trajectory optimization},
  journal    = {CoRR},
  volume     = {abs/2310.02679},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02679},
  doi        = {10.48550/ARXIV.2310.02679},
  eprinttype = {arXiv},
  eprint     = {2310.02679},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02679.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-02710,
  author     = {Minsu Kim and
                Taeyoung Yun and
                Emmanuel Bengio and
                Dinghuai Zhang and
                Yoshua Bengio and
                Sungsoo Ahn and
                Jinkyoo Park},
  title      = {Local Search {GFlowNets}},
  journal    = {CoRR},
  volume     = {abs/2310.02710},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02710},
  doi        = {10.48550/ARXIV.2310.02710},
  eprinttype = {arXiv},
  eprint     = {2310.02710},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02710.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-02779,
  author     = {Marco Jiralerspong and
                Bilun Sun and
                Danilo Vucetic and
                Tianyu Zhang and
                Yoshua Bengio and
                Gauthier Gidel and
                Nikolay Malkin},
  title      = {Expected flow networks in stochastic environments and two-player zero-sum
                games},
  journal    = {CoRR},
  volume     = {abs/2310.02779},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02779},
  doi        = {10.48550/ARXIV.2310.02779},
  eprinttype = {arXiv},
  eprint     = {2310.02779},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02779.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-02823,
  author     = {Minsu Kim and
                Joohwan Ko and
                Dinghuai Zhang and
                Ling Pan and
                Taeyoung Yun and
                Woochang Kim and
                Jinkyoo Park and
                Yoshua Bengio},
  title      = {Learning to Scale Logits for Temperature-Conditional {GFlowNets}},
  journal    = {CoRR},
  volume     = {abs/2310.02823},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.02823},
  doi        = {10.48550/ARXIV.2310.02823},
  eprinttype = {arXiv},
  eprint     = {2310.02823},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-02823.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-03419,
  author     = {Ling Pan and
                Moksh Jain and
                Kanika Madan and
                Yoshua Bengio},
  title      = {Pre-Training and Fine-Tuning Generative Flow Networks},
  journal    = {CoRR},
  volume     = {abs/2310.03419},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.03419},
  doi        = {10.48550/ARXIV.2310.03419},
  eprinttype = {arXiv},
  eprint     = {2310.03419},
  timestamp  = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-03419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-03579,
  author     = {Trang Nguyen and
                Alexander Tong and
                Kanika Madan and
                Yoshua Bengio and
                Dianbo Liu},
  title      = {Causal Inference in Gene Regulatory Networks with {GFlowNet}: Towards
                Scalability in Large Systems},
  journal    = {CoRR},
  volume     = {abs/2310.03579},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.03579},
  doi        = {10.48550/ARXIV.2310.03579},
  eprinttype = {arXiv},
  eprint     = {2310.03579},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-03579.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-04363,
  author     = {Edward J. Hu and
                Moksh Jain and
                Eric Elmoznino and
                Younesse Kaddar and
                Guillaume Lajoie and
                Yoshua Bengio and
                Nikolay Malkin},
  title      = {Amortizing intractable inference in large language models},
  journal    = {CoRR},
  volume     = {abs/2310.04363},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.04363},
  doi        = {10.48550/ARXIV.2310.04363},
  eprinttype = {arXiv},
  eprint     = {2310.04363},
  timestamp  = {Fri, 20 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-04363.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-04925,
  author     = {Alex Hern{\'{a}}ndez{-}Garc{\'{\i}}a and
                Alexandre Duval and
                Alexandra Volokhova and
                Yoshua Bengio and
                Divya Sharma and
                Pierre Luc Carrier and
                Michal Koziarski and
                Victor Schmidt},
  title      = {{Crystal-GFN}: sampling crystals with desirable properties and constraints},
  journal    = {CoRR},
  volume     = {abs/2310.04925},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.04925},
  doi        = {10.48550/ARXIV.2310.04925},
  eprinttype = {arXiv},
  eprint     = {2310.04925},
  timestamp  = {Mon, 23 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-04925.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-06682,
  author     = {Alvaro Carbonero and
                Alexandre Duval and
                Victor Schmidt and
                Santiago Miret and
                Alex Hern{\'{a}}ndez{-}Garc{\'{\i}}a and
                Yoshua Bengio and
                David Rolnick},
  title      = {On the importance of catalyst-adsorbate {3D} interactions for relaxed
                energy predictions},
  journal    = {CoRR},
  volume     = {abs/2310.06682},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.06682},
  doi        = {10.48550/ARXIV.2310.06682},
  eprinttype = {arXiv},
  eprint     = {2310.06682},
  timestamp  = {Tue, 24 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-06682.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-08338,
  author     = {Charles C. Onu and
                Samantha Latremouille and
                Arsenii Gorin and
                Junhao Wang and
                Uchenna Ekwochi and
                Peter O. Ubuane and
                Omolara A. Kehinde and
                Muhammad A. Salisu and
                Datonye Briggs and
                Yoshua Bengio and
                Doina Precup},
  title      = {A cry for help: Early detection of brain injury in newborns},
  journal    = {CoRR},
  volume     = {abs/2310.08338},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.08338},
  doi        = {10.48550/ARXIV.2310.08338},
  eprinttype = {arXiv},
  eprint     = {2310.08338},
  timestamp  = {Thu, 26 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-08338.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-08774,
  author     = {Mingyang Zhou and
                Zichao Yan and
                Elliot Layne and
                Nikolay Malkin and
                Dinghuai Zhang and
                Moksh Jain and
                Mathieu Blanchette and
                Yoshua Bengio},
  title      = {{PhyloGFN}: Phylogenetic inference with generative flow networks},
  journal    = {CoRR},
  volume     = {abs/2310.08774},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.08774},
  doi        = {10.48550/ARXIV.2310.08774},
  eprinttype = {arXiv},
  eprint     = {2310.08774},
  timestamp  = {Thu, 26 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-08774.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-14782,
  author     = {Alexandra Volokhova and
                Michal Koziarski and
                Alex Hern{\'{a}}ndez{-}Garc{\'{\i}}a and
                Cheng{-}Hao Liu and
                Santiago Miret and
                Pablo Lemos and
                Luca A. Thiede and
                Zichao Yan and
                Al{\'{a}}n Aspuru{-}Guzik and
                Yoshua Bengio},
  title      = {Towards equilibrium molecular conformation generation with {GFlowNets}},
  journal    = {CoRR},
  volume     = {abs/2310.14782},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.14782},
  doi        = {10.48550/ARXIV.2310.14782},
  eprinttype = {arXiv},
  eprint     = {2310.14782},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-14782.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-14935,
  author     = {Alejandro Tejada{-}Lapuerta and
                Paul Bertin and
                Stefan Bauer and
                Hananeh Aliee and
                Yoshua Bengio and
                Fabian J. Theis},
  title      = {Causal machine learning for single-cell genomics},
  journal    = {CoRR},
  volume     = {abs/2310.14935},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.14935},
  doi        = {10.48550/ARXIV.2310.14935},
  eprinttype = {arXiv},
  eprint     = {2310.14935},
  timestamp  = {Mon, 30 Oct 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-14935.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-17688,
  author     = {Yoshua Bengio and
                Geoffrey E. Hinton and
                Andrew Yao and
                Dawn Song and
                Pieter Abbeel and
                Yuval Noah Harari and
                Ya{-}Qin Zhang and
                Lan Xue and
                Shai Shalev{-}Shwartz and
                Gillian K. Hadfield and
                Jeff Clune and
                Tegan Maharaj and
                Frank Hutter and
                Atilim G{\"{u}}nes Baydin and
                Sheila A. McIlraith and
                Qiqi Gao and
                Ashwin Acharya and
                David Krueger and
                Anca D. Dragan and
                Philip H. S. Torr and
                Stuart Russell and
                Daniel Kahneman and
                Jan Brauner and
                S{\"{o}}ren Mindermann},
  title      = {Managing {AI} Risks in an Era of Rapid Progress},
  journal    = {CoRR},
  volume     = {abs/2310.17688},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.17688},
  doi        = {10.48550/ARXIV.2310.17688},
  eprinttype = {arXiv},
  eprint     = {2310.17688},
  timestamp  = {Mon, 04 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-17688.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-18780,
  author       = {Massaroli, Stefano and
                  Poli, Michael and
                  Fu, Daniel Y. and
                  Kumbong, Hermann and
                  Parnichkun, Rom N. and
                  Timalsina, Aman and
                  Romero, David W. and
                  McIntyre, Quinn and
                  Chen, Beidi and
                  Rudra, Atri and
                  Zhang, Ce and
                  R{\'{e}}, Christopher and
                  Ermon, Stefano and
                  Bengio, Yoshua},
  title        = {{Laughing Hyena Distillery}: Extracting Compact Recurrences From Convolutions},
  journal      = {CoRR},
  volume       = {abs/2310.18780},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.18780},
  doi          = {10.48550/ARXIV.2310.18780},
  eprinttype   = {arXiv},
  eprint       = {2310.18780},
  timestamp    = {Wed, 20 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-18780.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-18807,
  author       = {Assouel, Rim and
                  Rodr{\'{\i}}guez, Pau and
                  Taslakian, Perouz and
                  V{\'{a}}zquez, David and
                  Bengio, Yoshua},
  title        = {{OC-NMN}: Object-centric Compositional Neural Module Network for Generative
                  Visual Analogical Reasoning},
  journal      = {CoRR},
  volume       = {abs/2310.18807},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.18807},
  doi          = {10.48550/ARXIV.2310.18807},
  eprinttype   = {arXiv},
  eprint       = {2310.18807},
  timestamp    = {Thu, 02 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-18807.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2310-19054,
  author       = {Mansouri, Amin and
                  Hartford, Jason S. and
                  Zhang, Yan and
                  Bengio, Yoshua},
  title        = {Object-centric architectures enable efficient causal representation
                  learning},
  journal      = {CoRR},
  volume       = {abs/2310.19054},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.19054},
  doi          = {10.48550/ARXIV.2310.19054},
  eprinttype   = {arXiv},
  eprint       = {2310.19054},
  timestamp    = {Thu, 02 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-19054.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2311-00936,
  author       = {Teng, M{\'{e}}lisande and
                  Elmustafa, Amna and
                  Akera, Benjamin and
                  Bengio, Yoshua and
                  Abdelwahed, Hager Radi and
                  Larochelle, Hugo and
                  Rolnick, David},
  title        = {{SatBird}: Bird Species Distribution Modeling with Remote Sensing and
                  Citizen Science Data},
  journal      = {CoRR},
  volume       = {abs/2311.00936},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.00936},
  doi          = {10.48550/ARXIV.2311.00936},
  eprinttype   = {arXiv},
  eprint       = {2311.00936},
  timestamp    = {Tue, 07 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-00936.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2311-15268,
  author       = {Shah, Vedant and
                  Tr{\"{a}}uble, Frederik and
                  Malik, Ashish and
                  Larochelle, Hugo and
                  Mozer, Michael and
                  Arora, Sanjeev and
                  Bengio, Yoshua and
                  Goyal, Anirudh},
  title        = {Unlearning via Sparse Representations},
  journal      = {CoRR},
  volume       = {abs/2311.15268},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.15268},
  doi          = {10.48550/ARXIV.2311.15268},
  eprinttype   = {arXiv},
  eprint       = {2311.15268},
  timestamp    = {Fri, 01 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-15268.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2311-16176,
  author       = {Scimeca, Luca and
                  Rubinstein, Alexander and
                  Teney, Damien and
                  Oh, Seong Joon and
                  Nicolicioiu, Armand Mihai and
                  Bengio, Yoshua},
  title        = {Shortcut Bias Mitigation via Ensemble Diversity Using Diffusion Probabilistic
                  Models},
  journal      = {CoRR},
  volume       = {abs/2311.16176},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.16176},
  doi          = {10.48550/ARXIV.2311.16176},
  eprinttype   = {arXiv},
  eprint       = {2311.16176},
  timestamp    = {Mon, 04 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-16176.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2312-03911,
  author       = {Lemos, Pablo and
                  Malkin, Nikolay and
                  Handley, Will and
                  Bengio, Yoshua and
                  Hezaveh, Yashar and
                  Perreault Levasseur, Laurence},
  title        = {Improving Gradient-guided Nested Sampling for Posterior Inference},
  journal      = {CoRR},
  volume       = {abs/2312.03911},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.03911},
  doi          = {10.48550/ARXIV.2312.03911},
  eprinttype   = {arXiv},
  eprint       = {2312.03911},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-03911.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2312-07511,
  author       = {Duval, Alexandre and
                  Mathis, Simon V. and
                  Joshi, Chaitanya K. and
                  Schmidt, Victor and
                  Miret, Santiago and
                  Malliaros, Fragkiskos D. and
                  Cohen, Taco and
                  Li{\`{o}}, Pietro and
                  Bengio, Yoshua and
                  Bronstein, Michael M.},
  title        = {A Hitchhiker's Guide to Geometric {GNNs} for {3D} Atomic Systems},
  journal      = {CoRR},
  volume       = {abs/2312.07511},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.07511},
  doi          = {10.48550/ARXIV.2312.07511},
  eprinttype   = {arXiv},
  eprint       = {2312.07511},
  timestamp    = {Thu, 04 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-07511.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/informs/LarsenLBFLL22,
  author       = {Larsen, Eric and
                  Lachapelle, S{\'{e}}bastien and
                  Bengio, Yoshua and
                  Frejinger, Emma and
                  Lacoste{-}Julien, Simon and
                  Lodi, Andrea},
  title        = {Predicting Tactical Solutions to Operational Planning Problems Under
                  Imperfect Information},
  journal      = {{INFORMS} J. Comput.},
  volume       = {34},
  number       = {1},
  pages        = {227--242},
  year         = {2022},
  url          = {https://doi.org/10.1287/ijoc.2021.1091},
  doi          = {10.1287/IJOC.2021.1091},
  timestamp    = {Wed, 27 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/informs/LarsenLBFLL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jcisd/LiuKJWBS22,
  author       = {Liu, Cheng{-}Hao and
                  Korablyov, Maksym and
                  Jastrzebski, Stanislaw and
                  Wlodarczyk{-}Pruszynski, Pawel and
                  Bengio, Yoshua and
                  Segler, Marwin H. S.},
  title        = {{RetroGNN}: Fast Estimation of Synthesizability for Virtual Screening
                  and De Novo Design by Learning from Slow Retrosynthesis Software},
  journal      = {J. Chem. Inf. Model.},
  volume       = {62},
  number       = {10},
  pages        = {2293--2300},
  year         = {2022},
  url          = {https://doi.org/10.1021/acs.jcim.1c01476},
  doi          = {10.1021/ACS.JCIM.1C01476},
  timestamp    = {Mon, 13 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jcisd/LiuKJWBS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/VermaKLKSBL22,
  author       = {Verma, Vikas and
                  Kawaguchi, Kenji and
                  Lamb, Alex and
                  Kannala, Juho and
                  Solin, Arno and
                  Bengio, Yoshua and
                  Lopez{-}Paz, David},
  title        = {Interpolation consistency training for semi-supervised learning},
  journal      = {Neural Networks},
  volume       = {145},
  pages        = {90--106},
  year         = {2022},
  url          = {https://doi.org/10.1016/j.neunet.2021.10.008},
  doi          = {10.1016/J.NEUNET.2021.10.008},
  timestamp    = {Fri, 13 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nn/VermaKLKSBL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/LambVKMKKB22,
  author       = {Lamb, Alex and
                  Verma, Vikas and
                  Kawaguchi, Kenji and
                  Matyasko, Alexander and
                  Khosla, Savya and
                  Kannala, Juho and
                  Bengio, Yoshua},
  title        = {Interpolated Adversarial Training: Achieving robust neural networks
                  without sacrificing too much accuracy},
  journal      = {Neural Networks},
  volume       = {154},
  pages        = {218--233},
  year         = {2022},
  url          = {https://doi.org/10.1016/j.neunet.2022.07.012},
  doi          = {10.1016/J.NEUNET.2022.07.012},
  timestamp    = {Mon, 24 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nn/LambVKMKKB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tmlr/GuptaKCGLBK22,
  author       = {Gupta, Prateek and
                  Khalil, Elias Boutros and
                  Ch{\'{e}}telat, Didier and
                  Gasse, Maxime and
                  Lodi, Andrea and
                  Bengio, Yoshua and
                  Kumar, M. Pawan},
  title        = {Lookback for Learning to Branch},
  journal      = {Trans. Mach. Learn. Res.},
  volume       = {2022},
  year         = {2022},
  url          = {https://openreview.net/forum?id=EQpGkw5rvL},
  timestamp    = {Fri, 19 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tmlr/GuptaKCGLBK22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnn/LaoJHB22,
  author       = {Lao, Qicheng and
                  Jiang, Xiang and
                  Havaei, Mohammad and
                  Bengio, Yoshua},
  title        = {A Two-Stream Continual Learning System With Variational Domain-Agnostic
                  Feature Replay},
  journal      = {{IEEE} Trans. Neural Networks Learn. Syst.},
  volume       = {33},
  number       = {9},
  pages        = {4466--4478},
  year         = {2022},
  url          = {https://doi.org/10.1109/TNNLS.2021.3057453},
  doi          = {10.1109/TNNLS.2021.3057453},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tnn/LaoJHB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/bigdataconf/ZhangZCBL22,
  author       = {Zhang, Tianyi and
                  Zhang, Shirui and
                  Chen, Ziwei and
                  Bengio, Yoshua and
                  Liu, Dianbo},
  editor       = {Tsumoto, Shusaku and
                  Ohsawa, Yukio and
                  Chen, Lei and
                  {Van den Poel}, Dirk and
                  Hu, Xiaohua and
                  Motomura, Yoichi and
                  Takagi, Takuya and
                  Wu, Lingfei and
                  Xie, Ying and
                  Abe, Akihiro and
                  Raghavan, Vijay},
  title        = {{PMFL}: Partial Meta-Federated Learning for heterogeneous tasks and
                  its applications on real-world medical records},
  booktitle    = {{IEEE} International Conference on Big Data, Big Data 2022, Osaka,
                  Japan, December 17-20, 2022},
  pages        = {4453--4462},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/BigData55660.2022.10020281},
  doi          = {10.1109/BIGDATA55660.2022.10020281},
  timestamp    = {Fri, 18 Aug 2023 17:39:03 +0200},
  biburl       = {https://dblp.org/rec/conf/bigdataconf/ZhangZCBL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/clear2/AssouelCCBB22,
  author       = {Assouel, Rim and
                  Castrej{\'{o}}n, Llu{\'{\i}}s and
                  Courville, Aaron C. and
                  Ballas, Nicolas and
                  Bengio, Yoshua},
  editor       = {Sch{\"{o}}lkopf, Bernhard and
                  Uhler, Caroline and
                  Zhang, Kun},
  title        = {{VIM}: Variational Independent Modules for Video Prediction},
  booktitle    = {1st Conference on Causal Learning and Reasoning, CLeaR 2022, Sequoia
                  Conference Center, Eureka, CA, USA, 11-13 April, 2022},
  series       = {Proceedings of Machine Learning Research},
  volume       = {177},
  pages        = {70--89},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v177/assouel22a.html},
  timestamp    = {Wed, 06 Jul 2022 16:57:27 +0200},
  biburl       = {https://dblp.org/rec/conf/clear2/AssouelCCBB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/AhujaHB22,
  author       = {Ahuja, Kartik and
                  Hartford, Jason S. and
                  Bengio, Yoshua},
  title        = {Properties from mechanisms: an equivariance perspective on identifiable
                  representation learning},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=g5ynW-jMq4M},
  timestamp    = {Thu, 04 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/AhujaHB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/DeleuKFKBLB22,
  author       = {Deleu, Tristan and
                  Kanaa, David and
                  Feng, Leo and
                  Kerg, Giancarlo and
                  Bengio, Yoshua and
                  Lajoie, Guillaume and
                  Bacon, Pierre{-}Luc},
  title        = {Continuous-Time Meta-Learning with Forward Mode Differentiation},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=57PipS27Km},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/DeleuKFKBLB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/DwivediL0BB22,
  author       = {Dwivedi, Vijay Prakash and
                  Luu, Anh Tuan and
                  Laurent, Thomas and
                  Bengio, Yoshua and
                  Bresson, Xavier},
  title        = {Graph Neural Networks with Learnable Structural and Positional Representations},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=wTTjnvGphYj},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/DwivediL0BB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/GoyalDLBKRBBMB22,
  author       = {Goyal, Anirudh and
                  Didolkar, Aniket Rajiv and
                  Lamb, Alex and
                  Badola, Kartikeya and
                  Ke, Nan Rosemary and
                  Rahaman, Nasim and
                  Binas, Jonathan and
                  Blundell, Charles and
                  Mozer, Michael Curtis and
                  Bengio, Yoshua},
  title        = {Coordination Among Neural Modules Through a Shared Global Workspace},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=XzTtHjgPDsT},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/GoyalDLBKRBBMB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/MittalRRBL22,
  author       = {Mittal, Sarthak and
                  Raparthy, Sharath Chandra and
                  Rish, Irina and
                  Bengio, Yoshua and
                  Lajoie, Guillaume},
  title        = {Compositional Attention: Disentangling Search and Retrieval},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=IwJPj2MBcIa},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/MittalRRBL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/MorrisonKKSCB22,
  author       = {Morrison, Max and
                  Kumar, Rithesh and
                  Kumar, Kundan and
                  Seetharaman, Prem and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {Chunked Autoregressive {GAN} for Conditional Waveform Synthesis},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=v3aeIsY\_vVX},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/MorrisonKKSCB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/SchmidtLTZRRCJV22,
  author       = {Schmidt, Victor and
                  Luccioni, Alexandra and
                  Teng, M{\'{e}}lisande and
                  Zhang, Tianyu and
                  Reynaud, Alexia and
                  Raghupathi, Sunand and
                  Cosne, Gautier and
                  Juraver, Adrien and
                  Vardanyan, Vahe and
                  Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
                  Bengio, Yoshua},
  title        = {{ClimateGAN}: Raising Climate Change Awareness by Generating Images
                  of Floods},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=EZNOb\_uNpJk},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/SchmidtLTZRRCJV22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ZhangFBC22,
  author       = {Zhang, Dinghuai and
                  Fu, Jie and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  title        = {Unifying Likelihood-free Inference with Black-box Optimization and
                  Beyond},
  booktitle    = {The Tenth International Conference on Learning Representations, {ICLR}
                  2022, Virtual Event, April 25-29, 2022},
  publisher    = {OpenReview.net},
  year         = {2022},
  url          = {https://openreview.net/forum?id=1HxTO6CTkz},
  timestamp    = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhangFBC22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ErnoultNMSBRRB22,
  author       = {Ernoult, Maxence and
                  Normandin, Fabrice and
                  Moudgil, Abhinav and
                  Spinney, Sean and
                  Belilovsky, Eugene and
                  Rish, Irina and
                  Richards, Blake A. and
                  Bengio, Yoshua},
  editor       = {Chaudhuri, Kamalika and
                  Jegelka, Stefanie and
                  Song, Le and
                  Szepesv{\'{a}}ri, Csaba and
                  Niu, Gang and
                  Sabato, Sivan},
  title        = {Towards Scaling Difference Target Propagation by Learning Backprop
                  Targets},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022, 17-23 July
                  2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {5968--5987},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/ernoult22a.html},
  timestamp    = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ErnoultNMSBRRB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/JainBHRDEFZKZSD22,
  author       = {Jain, Moksh and
                  Bengio, Emmanuel and
                  Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
                  Rector{-}Brooks, Jarrid and
                  Dossou, Bonaventure F. P. and
                  Ekbote, Chanakya Ajit and
                  Fu, Jie and
                  Zhang, Tianyu and
                  Kilgour, Michael and
                  Zhang, Dinghuai and
                  Simine, Lena and
                  Das, Payel and
                  Bengio, Yoshua},
  editor       = {Chaudhuri, Kamalika and
                  Jegelka, Stefanie and
                  Song, Le and
                  Szepesv{\'{a}}ri, Csaba and
                  Niu, Gang and
                  Sabato, Sivan},
  title        = {Biological Sequence Design with {GFlowNets}},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022, 17-23 July
                  2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {9786--9801},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/jain22a.html},
  timestamp    = {Tue, 12 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/JainBHRDEFZKZSD22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/PezeshkiMBL22,
  author       = {Pezeshki, Mohammad and
                  Mitra, Amartya and
                  Bengio, Yoshua and
                  Lajoie, Guillaume},
  editor       = {Chaudhuri, Kamalika and
                  Jegelka, Stefanie and
                  Song, Le and
                  Szepesv{\'{a}}ri, Csaba and
                  Niu, Gang and
                  Sabato, Sivan},
  title        = {Multi-scale Feature Learning Dynamics: Insights for Double Descent},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022, 17-23 July
                  2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {17669--17690},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/pezeshki22a.html},
  timestamp    = {Tue, 12 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/PezeshkiMBL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ZhangMLVCB22,
  author       = {Zhang, Dinghuai and
                  Malkin, Nikolay and
                  Liu, Zhen and
                  Volokhova, Alexandra and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  editor       = {Chaudhuri, Kamalika and
                  Jegelka, Stefanie and
                  Song, Le and
                  Szepesv{\'{a}}ri, Csaba and
                  Niu, Gang and
                  Sabato, Sivan},
  title        = {Generative Flow Networks for Discrete Probabilistic Modeling},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022, 17-23 July
                  2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {26412--26428},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/zhang22v.html},
  timestamp    = {Mon, 06 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/ZhangMLVCB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ZhangZCBRS22,
  author       = {Zhang, Dinghuai and
                  Zhang, Hongyang and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Ravikumar, Pradeep and
                  Suggala, Arun Sai},
  editor       = {Chaudhuri, Kamalika and
                  Jegelka, Stefanie and
                  Song, Le and
                  Szepesv{\'{a}}ri, Csaba and
                  Niu, Gang and
                  Sabato, Sivan},
  title        = {Building Robust Ensembles via Margin Boosting},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022, 17-23 July
                  2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {26669--26692},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/zhang22aj.html},
  timestamp    = {Thu, 25 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ZhangZCBRS22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/AhujaHB22,
  author       = {Ahuja, Kartik and
                  Hartford, Jason S. and
                  Bengio, Yoshua},
  editor       = {Koyejo, Sanmi and
                  Mohamed, Shakir and
                  Agarwal, Alekh and
                  Belgrave, Danielle and
                  Cho, Kyunghyun and
                  Oh, Alice},
  title        = {Weakly Supervised Representation Learning with Sparse Perturbations},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/63d3bae2c1f525745003f679e45bcf7b-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/AhujaHB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BoussifBBA22,
  author       = {Boussif, Oussama and
                  Bengio, Yoshua and
                  Benabbou, Loubna and
                  Assouline, Dan},
  editor       = {Koyejo, Sanmi and
                  Mohamed, Shakir and
                  Agarwal, Alekh and
                  Belgrave, Danielle and
                  Cho, Kyunghyun and
                  Oh, Alice},
  title        = {{MAgNet}: Mesh Agnostic Neural {PDE} Solver},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/cf4c7ee0734cdfe09a099cf6cd7b117a-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BoussifBBA22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DidolkarGGGLKB22,
  author       = {Didolkar, Aniket and
                  Gupta, Kshitij and
                  Goyal, Anirudh and
                  Gundavarapu, Nitesh B. and
                  Lamb, Alex and
                  Ke, Nan Rosemary and
                  Bengio, Yoshua},
  editor       = {Koyejo, Sanmi and
                  Mohamed, Shakir and
                  Agarwal, Alekh and
                  Belgrave, Danielle and
                  Cho, Kyunghyun and
                  Oh, Alice},
  title        = {Temporal Latent Bottleneck: Synthesis of Fast and Slow Processing
                  Mechanisms in Sequence Learning},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/4446b84fdf15b17c091582e4b86f8a05-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DidolkarGGGLKB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/Gallego-PosadaR22,
  author       = {Gallego{-}Posada, Jose and
                  Ramirez, Juan and
                  Erraqabi, Akram and
                  Bengio, Yoshua and
                  Lacoste{-}Julien, Simon},
  editor       = {Koyejo, Sanmi and
                  Mohamed, Shakir and
                  Agarwal, Alekh and
                  Belgrave, Danielle and
                  Cho, Kyunghyun and
                  Oh, Alice},
  title        = {Controlled Sparsity via Constrained Optimization or: How {I} Learned
                  to Stop Tuning Penalties and Love Constraints},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/089b592cccfafdca8e0178e85b609f19-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/Gallego-PosadaR22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/IslamZGLKLLBC22,
  author       = {Riashat Islam and
                  Hongyu Zang and
                  Anirudh Goyal and
                  Alex M. Lamb and
                  Kenji Kawaguchi and
                  Xin Li and
                  Romain Laroche and
                  Yoshua Bengio and
                  Remi Tachet des Combes},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Discrete Compositional Representations as an Abstraction for Goal
                  Conditioned Reinforcement Learning},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, {NeurIPS} 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/18ddfb199d71a8a24f83abc1ced077b7-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/IslamZGLKLLBC22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/MalkinJBSB22,
  author       = {Nikolay Malkin and
                  Moksh Jain and
                  Emmanuel Bengio and
                  Chen Sun and
                  Yoshua Bengio},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Trajectory balance: Improved credit assignment in {GFlowNets}},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, {NeurIPS} 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/27b51baca8377a0cf109f6ecc15a0f70-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/MalkinJBSB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/MittalBL22,
  author       = {Sarthak Mittal and
                  Yoshua Bengio and
                  Guillaume Lajoie},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Is a Modular Architecture Enough?},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, {NeurIPS} 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/b8d1d741f137d9b6ac4f3c1683791e4a-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/MittalBL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/WeissRLPBSLB22,
  author       = {Martin Weiss and
                  Nasim Rahaman and
                  Francesco Locatello and
                  Chris Pal and
                  Yoshua Bengio and
                  Bernhard Sch{\"{o}}lkopf and
                  Li Erran Li and
                  Nicolas Ballas},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Neural Attentive Circuits},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, {NeurIPS} 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/32f227c41a0b4e36f65bebb4aeda94a2-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/WeissRLPBSLB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/uai/DeleuGERLBB22,
  author       = {Deleu, Tristan and
                  G{\'{o}}is, Ant{\'{o}}nio and
                  Emezue, Chris and
                  Rankawat, Mansi and
                  Lacoste{-}Julien, Simon and
                  Bauer, Stefan and
                  Bengio, Yoshua},
  editor       = {Cussens, James and
                  Zhang, Kun},
  title        = {Bayesian structure learning with generative flow networks},
  booktitle    = {Uncertainty in Artificial Intelligence, Proceedings of the Thirty-Eighth
                  Conference on Uncertainty in Artificial Intelligence, {UAI} 2022,
                  1-5 August 2022, Eindhoven, The Netherlands},
  series       = {Proceedings of Machine Learning Research},
  volume       = {180},
  pages        = {518--528},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v180/deleu22a.html},
  timestamp    = {Sat, 15 Oct 2022 12:08:13 +0200},
  biburl       = {https://dblp.org/rec/conf/uai/DeleuGERLBB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/uai/ErraqabiMZSLDB22,
  author       = {Akram Erraqabi and
                  Marlos C. Machado and
                  Mingde Zhao and
                  Sainbayar Sukhbaatar and
                  Alessandro Lazaric and
                  Ludovic Denoyer and
                  Yoshua Bengio},
  editor       = {James Cussens and
                  Kun Zhang},
  title        = {Temporal abstractions-augmented temporally contrastive learning: An
                  alternative to the {Laplacian} in {RL}},
  booktitle    = {Uncertainty in Artificial Intelligence, Proceedings of the Thirty-Eighth
                  Conference on Uncertainty in Artificial Intelligence, {UAI} 2022,
                  1-5 August 2022, Eindhoven, The Netherlands},
  series       = {Proceedings of Machine Learning Research},
  volume       = {180},
  pages        = {641--651},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v180/erraqabi22a.html},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/uai/ErraqabiMZSLDB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-11775,
  author       = {Ramnath Kumar and
                  Tristan Deleu and
                  Yoshua Bengio},
  title        = {The Effect of Diversity in Meta-Learning},
  journal      = {CoRR},
  volume       = {abs/2201.11775},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.11775},
  doi          = {10.48550/ARXIV.2201.11775},
  eprinttype   = {arXiv},
  eprint       = {2201.11775},
  timestamp    = {Wed, 02 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-11775.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-11783,
  author       = {Ramnath Kumar and
                  Tristan Deleu and
                  Yoshua Bengio},
  title        = {Rethinking Learning Dynamics in {RL} using Adversarial Networks},
  journal      = {CoRR},
  volume       = {abs/2201.11783},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.11783},
  doi          = {10.48550/ARXIV.2201.11783},
  eprinttype   = {arXiv},
  eprint       = {2201.11783},
  timestamp    = {Wed, 02 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-11783.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-13259,
  author       = {Nikolay Malkin and
                  Moksh Jain and
                  Emmanuel Bengio and
                  Chen Sun and
                  Yoshua Bengio},
  title        = {Trajectory Balance: Improved Credit Assignment in {GFlowNets}},
  journal      = {CoRR},
  volume       = {abs/2201.13259},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.13259},
  doi          = {10.48550/ARXIV.2201.13259},
  eprinttype   = {arXiv},
  eprint       = {2201.13259},
  timestamp    = {Tue, 09 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-13259.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-13415,
  author       = {Maxence Ernoult and
                  Fabrice Normandin and
                  Abhinav Moudgil and
                  Sean Spinney and
                  Eugene Belilovsky and
                  Irina Rish and
                  Blake A. Richards and
                  Yoshua Bengio},
  title        = {Towards Scaling Difference Target Propagation by Learning Backprop
                  Targets},
  journal      = {CoRR},
  volume       = {abs/2201.13415},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.13415},
  doi          = {10.48550/ARXIV.2201.13415},
  eprinttype   = {arXiv},
  eprint       = {2201.13415},
  timestamp    = {Thu, 17 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-13415.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2202-01334,
  author       = {Dianbo Liu and
                  Alex Lamb and
                  Xu Ji and
                  Pascal Notsawo and
                  Michael Mozer and
                  Yoshua Bengio and
                  Kenji Kawaguchi},
  title        = {Adaptive Discrete Communication Bottlenecks with Dynamic Vector Quantization},
  journal      = {CoRR},
  volume       = {abs/2202.01334},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.01334},
  doi          = {10.48550/ARXIV.2202.01334},
  eprinttype   = {arXiv},
  eprint       = {2202.01334},
  timestamp    = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-01334.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2202-01361,
  author       = {Dinghuai Zhang and
                  Nikolay Malkin and
                  Zhen Liu and
                  Alexandra Volokhova and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Generative Flow Networks for Discrete Probabilistic Modeling},
  journal      = {CoRR},
  volume       = {abs/2202.01361},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.01361},
  doi          = {10.48550/ARXIV.2202.01361},
  eprinttype   = {arXiv},
  eprint       = {2202.01361},
  timestamp    = {Mon, 06 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-01361.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2202-04202,
  author       = {Paul Bertin and
                  Jarrid Rector{-}Brooks and
                  Deepak Sharma and
                  Thomas Gaudelet and
                  Andrew Anighoro and
                  Torsten Gross and
                  Francisco Martinez{-}Pena and
                  Eileen L. Tang and
                  Suraj M. S and
                  Cristian Regep and
                  Jeremy B. R. Hayter and
                  Maksym Korablyov and
                  Nicholas Valiante and
                  Almer van der Sloot and
                  Mike Tyers and
                  Charles Roberts and
                  Michael M. Bronstein and
                  Luke L. Lairson and
                  Jake P. Taylor{-}King and
                  Yoshua Bengio},
  title        = {{RECOVER:} sequential model optimization platform for combination
                  drug repurposing identifies novel synergistic compounds in vitro},
  journal      = {CoRR},
  volume       = {abs/2202.04202},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.04202},
  doi          = {10.48550/ARXIV.2202.04202},
  eprinttype   = {arXiv},
  eprint       = {2202.04202},
  timestamp    = {Tue, 01 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-04202.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2202-13903,
  author       = {Tristan Deleu and
                  Ant{\'{o}}nio G{\'{o}}is and
                  Chris Emezue and
                  Mansi Rankawat and
                  Simon Lacoste{-}Julien and
                  Stefan Bauer and
                  Yoshua Bengio},
  title        = {Bayesian Structure Learning with Generative Flow Networks},
  journal      = {CoRR},
  volume       = {abs/2202.13903},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.13903},
  doi          = {10.48550/ARXIV.2202.13903},
  eprinttype   = {arXiv},
  eprint       = {2202.13903},
  timestamp    = {Thu, 03 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-13903.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-01443,
  author       = {Deleu, Tristan and
                  Kanaa, David and
                  Feng, Leo and
                  Kerg, Giancarlo and
                  Bengio, Yoshua and
                  Lajoie, Guillaume and
                  Bacon, Pierre{-}Luc},
  title        = {Continuous-Time Meta-Learning with Forward Mode Differentiation},
  journal      = {CoRR},
  volume       = {abs/2203.01443},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.01443},
  doi          = {10.48550/ARXIV.2203.01443},
  eprinttype   = {arXiv},
  eprint       = {2203.01443},
  timestamp    = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-01443.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-03724,
  author       = {St{-}Hilaire, Fran{\c{c}}ois and
                  Vu, Dung Do and
                  Frau, Antoine and
                  Burns, Nathan and
                  Faraji, Farid and
                  Potochny, Joseph and
                  Robert, Stephane and
                  Roussel, Arnaud and
                  Zheng, Selene and
                  Glazier, Taylor and
                  Romano, Junfel Vincent and
                  Belfer, Robert and
                  Shayan, Muhammad and
                  Smofsky, Ariella and
                  Delarosbil, Tommy and
                  Ahn, Seulmin and
                  Eden{-}Walker, Simon and
                  Sony, Kritika and
                  Ching, Ansona Onyi and
                  Elkins, Sabina and
                  Stepanyan, Anush and
                  Matajova, Adela and
                  Chen, Victor and
                  Sahraei, Hossein and
                  Larson, Robert and
                  Markova, Nadia and
                  Barkett, Andrew and
                  Charlin, Laurent and
                  Bengio, Yoshua and
                  Serban, Iulian Vlad and
                  Kochmar, Ekaterina},
  title        = {A New Era: Intelligent Tutoring Systems Will Transform Online Learning
                  for Millions},
  journal      = {CoRR},
  volume       = {abs/2203.03724},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.03724},
  doi          = {10.48550/ARXIV.2203.03724},
  eprinttype   = {arXiv},
  eprint       = {2203.03724},
  timestamp    = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-03724.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-04115,
  author       = {Moksh Jain and
                  Emmanuel Bengio and
                  Alex Hern{\'{a}}ndez{-}Garc{\'{\i}}a and
                  Jarrid Rector{-}Brooks and
                  Bonaventure F. P. Dossou and
                  Chanakya Ekbote and
                  Jie Fu and
                  Tianyu Zhang and
                  Michael Kilgour and
                  Dinghuai Zhang and
                  Lena Simine and
                  Payel Das and
                  Yoshua Bengio},
  title        = {Biological Sequence Design with {GFlowNets}},
  journal      = {CoRR},
  volume       = {abs/2203.04115},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.04115},
  doi          = {10.48550/ARXIV.2203.04115},
  eprinttype   = {arXiv},
  eprint       = {2203.04115},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-04115.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2203-11369,
  author       = {Akram Erraqabi and
                  Marlos C. Machado and
                  Mingde Zhao and
                  Sainbayar Sukhbaatar and
                  Alessandro Lazaric and
                  Ludovic Denoyer and
                  Yoshua Bengio},
  title        = {Temporal Abstractions-Augmented Temporally Contrastive Learning: An
                  Alternative to the {Laplacian} in {RL}},
  journal      = {CoRR},
  volume       = {abs/2203.11369},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2203.11369},
  doi          = {10.48550/ARXIV.2203.11369},
  eprinttype   = {arXiv},
  eprint       = {2203.11369},
  timestamp    = {Tue, 29 Mar 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2203-11369.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2205-00666,
  author       = {Yoshua Bengio and
                  Prateek Gupta and
                  Dylan R. Radovic and
                  Maarten Scholl and
                  Andrew Williams and
                  Christian Schr{\"{o}}der de Witt and
                  Tianyu Zhang and
                  Yang Zhang},
  title        = {{(Private)}-Retroactive Carbon Pricing {[(P)ReCaP]}: {A} Market-based
                  Approach for Climate Finance and Risk Assessment},
  journal      = {CoRR},
  volume       = {abs/2205.00666},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.00666},
  doi          = {10.48550/ARXIV.2205.00666},
  eprinttype   = {arXiv},
  eprint       = {2205.00666},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-00666.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2205-03027,
  author       = {Yoo, Sanghyun and
                  Song, Inchul and
                  Bengio, Yoshua},
  title        = {A Highly Adaptive Acoustic Model for Accurate Multi-Dialect Speech
                  Recognition},
  journal      = {CoRR},
  volume       = {abs/2205.03027},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.03027},
  doi          = {10.48550/ARXIV.2205.03027},
  eprinttype   = {arXiv},
  eprint       = {2205.03027},
  timestamp    = {Wed, 11 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-03027.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2205-09305,
  author       = {Mike He Zhu and
                  L{\'{e}}na N{\'{e}}hale Ezzine and
                  Dianbo Liu and
                  Yoshua Bengio},
  title        = {{FedILC}: Weighted Geometric Mean and Invariant Gradient Covariance
                  for Federated Learning on Non-{IID} Data},
  journal      = {CoRR},
  volume       = {abs/2205.09305},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.09305},
  doi          = {10.48550/ARXIV.2205.09305},
  eprinttype   = {arXiv},
  eprint       = {2205.09305},
  timestamp    = {Mon, 23 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-09305.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2205-10607,
  author       = {Liu, Dianbo and
                  Shah, Vedant and
                  Boussif, Oussama and
                  Meo, Cristian and
                  Goyal, Anirudh and
                  Shu, Tianmin and
                  Mozer, Michael and
                  Heess, Nicolas and
                  Bengio, Yoshua},
  title        = {Coordinating Policies Among Multiple Agents via an Intelligent Communication
                  Channel},
  journal      = {CoRR},
  volume       = {abs/2205.10607},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.10607},
  doi          = {10.48550/ARXIV.2205.10607},
  eprinttype   = {arXiv},
  eprint       = {2205.10607},
  timestamp    = {Mon, 30 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-10607.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2205-11101,
  author       = {Gupta, Sharut and
                  Ahuja, Kartik and
                  Havaei, Mohammad and
                  Chatterjee, Niladri and
                  Bengio, Yoshua},
  title        = {{FL} Games: {A} federated learning framework for distribution shifts},
  journal      = {CoRR},
  volume       = {abs/2205.11101},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.11101},
  doi          = {10.48550/ARXIV.2205.11101},
  eprinttype   = {arXiv},
  eprint       = {2205.11101},
  timestamp    = {Mon, 30 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-11101.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2205-14794,
  author       = {Didolkar, Aniket and
                  Gupta, Kshitij and
                  Goyal, Anirudh and
                  Lamb, Alex and
                  Ke, Nan Rosemary and
                  Bengio, Yoshua},
  title        = {Temporal Latent Bottleneck: Synthesis of Fast and Slow Processing
                  Mechanisms in Sequence Learning},
  journal      = {CoRR},
  volume       = {abs/2205.14794},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.14794},
  doi          = {10.48550/ARXIV.2205.14794},
  eprinttype   = {arXiv},
  eprint       = {2205.14794},
  timestamp    = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-14794.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2205-15021,
  author       = {Scellier, Benjamin and
                  Mishra, Siddhartha and
                  Bengio, Yoshua and
                  Ollivier, Yann},
  title        = {Agnostic Physics-Driven Deep Learning},
  journal      = {CoRR},
  volume       = {abs/2205.15021},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2205.15021},
  doi          = {10.48550/ARXIV.2205.15021},
  eprinttype   = {arXiv},
  eprint       = {2205.15021},
  timestamp    = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2205-15021.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-01101,
  author       = {Ahuja, Kartik and
                  Hartford, Jason S. and
                  Bengio, Yoshua},
  title        = {Weakly Supervised Representation Learning with Sparse Perturbations},
  journal      = {CoRR},
  volume       = {abs/2206.01101},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.01101},
  doi          = {10.48550/ARXIV.2206.01101},
  eprinttype   = {arXiv},
  eprint       = {2206.01101},
  timestamp    = {Thu, 04 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-01101.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-02713,
  author       = {Mittal, Sarthak and
                  Bengio, Yoshua and
                  Lajoie, Guillaume},
  title        = {Is a Modular Architecture Enough?},
  journal      = {CoRR},
  volume       = {abs/2206.02713},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.02713},
  doi          = {10.48550/ARXIV.2206.02713},
  eprinttype   = {arXiv},
  eprint       = {2206.02713},
  timestamp    = {Tue, 14 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-02713.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-03362,
  author       = {Zhang, Dinghuai and
                  Zhang, Hongyang and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Ravikumar, Pradeep and
                  Suggala, Arun Sai},
  title        = {Building Robust Ensembles via Margin Boosting},
  journal      = {CoRR},
  volume       = {abs/2206.03362},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.03362},
  doi          = {10.48550/ARXIV.2206.03362},
  eprinttype   = {arXiv},
  eprint       = {2206.03362},
  timestamp    = {Thu, 25 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-03362.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-04620,
  author       = {Scherrer, Nino and
                  Goyal, Anirudh and
                  Bauer, Stefan and
                  Bengio, Yoshua and
                  Ke, Nan Rosemary},
  title        = {On the Generalization and Adaption Performance of Causal Models},
  journal      = {CoRR},
  volume       = {abs/2206.04620},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.04620},
  doi          = {10.48550/ARXIV.2206.04620},
  eprinttype   = {arXiv},
  eprint       = {2206.04620},
  timestamp    = {Wed, 15 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-04620.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-05056,
  author       = {Kerg, Giancarlo and
                  Mittal, Sarthak and
                  Rolnick, David and
                  Bengio, Yoshua and
                  Richards, Blake A. and
                  Lajoie, Guillaume},
  title        = {On Neural Architecture Inductive Biases for Relational Tasks},
  journal      = {CoRR},
  volume       = {abs/2206.05056},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.05056},
  doi          = {10.48550/ARXIV.2206.05056},
  eprinttype   = {arXiv},
  eprint       = {2206.05056},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-05056.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-12840,
  author       = {Wang, Yezhen and
                  Che, Tong and
                  Li, Bo and
                  Song, Kaitao and
                  Pei, Hengzhi and
                  Bengio, Yoshua and
                  Li, Dongsheng},
  title        = {Your Autoregressive Generative Model Can be Better If You Treat It
                  as an Energy-Based One},
  journal      = {CoRR},
  volume       = {abs/2206.12840},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.12840},
  doi          = {10.48550/ARXIV.2206.12840},
  eprinttype   = {arXiv},
  eprint       = {2206.12840},
  timestamp    = {Sun, 19 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-12840.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2206-14987,
  author       = {Gupta, Prateek and
                  Khalil, Elias B. and
                  Ch{\'{e}}telat, Didier and
                  Gasse, Maxime and
                  Bengio, Yoshua and
                  Lodi, Andrea and
                  Kumar, M. Pawan},
  title        = {Lookback for Learning to Branch},
  journal      = {CoRR},
  volume       = {abs/2206.14987},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2206.14987},
  doi          = {10.48550/ARXIV.2206.14987},
  eprinttype   = {arXiv},
  eprint       = {2206.14987},
  timestamp    = {Mon, 04 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2206-14987.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2207-11240,
  author       = {Tr{\"{a}}uble, Frederik and
                  Goyal, Anirudh and
                  Rahaman, Nasim and
                  Mozer, Michael and
                  Kawaguchi, Kenji and
                  Bengio, Yoshua and
                  Sch{\"{o}}lkopf, Bernhard},
  title        = {Discrete Key-Value Bottleneck},
  journal      = {CoRR},
  volume       = {abs/2207.11240},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.11240},
  doi          = {10.48550/ARXIV.2207.11240},
  eprinttype   = {arXiv},
  eprint       = {2207.11240},
  timestamp    = {Mon, 25 Jul 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-11240.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2208-04425,
  author       = {Gallego{-}Posada, Jose and
                  Ramirez, Juan and
                  Erraqabi, Akram and
                  Bengio, Yoshua and
                  Lacoste{-}Julien, Simon},
  title        = {Controlled Sparsity via Constrained Optimization or: How {I} Learned
                  to Stop Tuning Penalties and Love Constraints},
  journal      = {CoRR},
  volume       = {abs/2208.04425},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.04425},
  doi          = {10.48550/ARXIV.2208.04425},
  eprinttype   = {arXiv},
  eprint       = {2208.04425},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-04425.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2208-05341,
  author       = {Moussa, Siba and
                  Kilgour, Michael and
                  Jans, Clara and
                  Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
                  Cuperlovic{-}Culf, Miroslava and
                  Bengio, Yoshua and
                  Simine, Lena},
  title        = {Diversifying Design of Nucleic Acid Aptamers Using Unsupervised Machine
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2208.05341},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.05341},
  doi          = {10.48550/ARXIV.2208.05341},
  eprinttype   = {arXiv},
  eprint       = {2208.05341},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-05341.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2208.07004 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2208-07004,
  author     = {Tianyu Zhang
                and Andrew Williams
                and Soham Phade
                and Sunil Srinivasa
                and Yang Zhang
                and Prateek Gupta
                and Yoshua Bengio
                and Stephan Zheng},
  title      = {{AI} for Global Climate Cooperation:
                Modeling Global Climate Negotiations, Agreements,
                and Long-Term Cooperation in {RICE-N}},
  journal    = {CoRR},
  volume     = {abs/2208.07004},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2208.07004},
  doi        = {10.48550/ARXIV.2208.07004},
  eprinttype = {arXiv},
  eprint     = {2208.07004},
  timestamp  = {Wed, 17 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2208-07004.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.02606. The mixed-case term GFlowNets is brace-protected
% so that sentence-casing bibliography styles keep its capitalization.
@article{DBLP:journals/corr/abs-2209-02606,
  author       = {Dinghuai Zhang and
                  Ricky T. Q. Chen and
                  Nikolay Malkin and
                  Yoshua Bengio},
  title        = {Unifying Generative Models with {GFlowNets}},
  journal      = {CoRR},
  volume       = {abs/2209.02606},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.02606},
  doi          = {10.48550/ARXIV.2209.02606},
  eprinttype    = {arXiv},
  eprint       = {2209.02606},
  timestamp    = {Mon, 26 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-02606.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.06259. The proper adjective Bayesian is brace-protected
% so that sentence-casing bibliography styles do not lowercase it.
@article{DBLP:journals/corr/abs-2209-06259,
  author       = {Leo Feng and
                  Padideh Nouri and
                  Aneri Muni and
                  Yoshua Bengio and
                  Pierre{-}Luc Bacon},
  title        = {Designing Biological Sequences via Meta-Reinforcement Learning and
                  {Bayesian} Optimization},
  journal      = {CoRR},
  volume       = {abs/2209.06259},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.06259},
  doi          = {10.48550/ARXIV.2209.06259},
  eprinttype    = {arXiv},
  eprint       = {2209.06259},
  timestamp    = {Tue, 27 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-06259.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.11924 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2209-11924,
  author     = {Kartik Ahuja
                and Yixin Wang
                and Divyat Mahajan
                and Yoshua Bengio},
  title      = {Interventional Causal Representation Learning},
  journal    = {CoRR},
  volume     = {abs/2209.11924},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.11924},
  doi        = {10.48550/ARXIV.2209.11924},
  eprinttype = {arXiv},
  eprint     = {2209.11924},
  timestamp  = {Thu, 06 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-11924.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.12782. The mixed-case term GFlowNets is brace-protected
% so that sentence-casing bibliography styles keep its capitalization.
@article{DBLP:journals/corr/abs-2209-12782,
  author       = {Kanika Madan and
                  Jarrid Rector{-}Brooks and
                  Maksym Korablyov and
                  Emmanuel Bengio and
                  Moksh Jain and
                  Andrei Cristian Nica and
                  Tom Bosc and
                  Yoshua Bengio and
                  Nikolay Malkin},
  title        = {Learning {GFlowNets} from partial episodes for improved convergence
                  and stability},
  journal      = {CoRR},
  volume       = {abs/2209.12782},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.12782},
  doi          = {10.48550/ARXIV.2209.12782},
  eprinttype    = {arXiv},
  eprint       = {2209.12782},
  timestamp    = {Wed, 16 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-12782.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2209.13518 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2209-13518,
  author     = {Bonaventure F. P. Dossou
                and Dianbo Liu
                and Xu Ji
                and Moksh Jain
                and Almer M. van der Sloot
                and Roger Palou
                and Michael Tyers
                and Yoshua Bengio},
  title      = {Graph-Based Active Machine Learning Method for Diverse and Novel
                Antimicrobial Peptides Generation and Selection},
  journal    = {CoRR},
  volume     = {abs/2209.13518},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2209.13518},
  doi        = {10.48550/ARXIV.2209.13518},
  eprinttype = {arXiv},
  eprint     = {2209.13518},
  timestamp  = {Thu, 06 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2209-13518.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.00173 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2210-00173,
  author     = {Jiaye Teng
                and Chuan Wen
                and Dinghuai Zhang
                and Yoshua Bengio
                and Yang Gao
                and Yang Yuan},
  title      = {Predictive Inference with Feature Conformal Prediction},
  journal    = {CoRR},
  volume     = {abs/2210.00173},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.00173},
  doi        = {10.48550/ARXIV.2210.00173},
  eprinttype = {arXiv},
  eprint     = {2210.00173},
  timestamp  = {Fri, 07 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-00173.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.00580. The mixed-case term GFlowNets is brace-protected;
% without braces a sentence-casing style keeps only the leading G capitalized.
@article{DBLP:journals/corr/abs-2210-00580,
  author       = {Nikolay Malkin and
                  Salem Lahlou and
                  Tristan Deleu and
                  Xu Ji and
                  Edward J. Hu and
                  Katie Everett and
                  Dinghuai Zhang and
                  Yoshua Bengio},
  title        = {{GFlowNets} and variational inference},
  journal      = {CoRR},
  volume       = {abs/2210.00580},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.00580},
  doi          = {10.48550/ARXIV.2210.00580},
  eprinttype    = {arXiv},
  eprint       = {2210.00580},
  timestamp    = {Fri, 07 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-00580.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.00999 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2210-00999,
  author     = {Dinghuai Zhang
                and Aaron C. Courville
                and Yoshua Bengio
                and Qinqing Zheng
                and Amy Zhang
                and Ricky T. Q. Chen},
  title      = {Latent State Marginalization as a Low-cost Approach
                for Improving Exploration},
  journal    = {CoRR},
  volume     = {abs/2210.00999},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.00999},
  doi        = {10.48550/ARXIV.2210.00999},
  eprinttype = {arXiv},
  eprint     = {2210.00999},
  timestamp  = {Fri, 07 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-00999.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.03022 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2210-03022,
  author     = {Dianbo Liu
                and Vedant Shah
                and Oussama Boussif
                and Cristian Meo
                and Anirudh Goyal
                and Tianmin Shu
                and Michael Mozer
                and Nicolas Heess
                and Yoshua Bengio},
  title      = {Stateful active facilitator:
                Coordination and Environmental Heterogeneity
                in Cooperative Multi-Agent Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2210.03022},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.03022},
  doi        = {10.48550/ARXIV.2210.03022},
  eprinttype = {arXiv},
  eprint     = {2210.03022},
  timestamp  = {Fri, 07 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-03022.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.03308 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2210-03308,
  author     = {Ling Pan
                and Dinghuai Zhang
                and Aaron C. Courville
                and Longbo Huang
                and Yoshua Bengio},
  title      = {Generative Augmented Flow Networks},
  journal    = {CoRR},
  volume     = {abs/2210.03308},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.03308},
  doi        = {10.48550/ARXIV.2210.03308},
  eprinttype = {arXiv},
  eprint     = {2210.03308},
  timestamp  = {Wed, 12 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-03308.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.05495. The mixed-case model name MAgNet is brace-protected
% so that sentence-casing bibliography styles do not flatten it.
@article{DBLP:journals/corr/abs-2210-05495,
  author       = {Oussama Boussif and
                  Dan Assouline and
                  Loubna Benabbou and
                  Yoshua Bengio},
  title        = {{MAgNet}: Mesh Agnostic Neural {PDE} Solver},
  journal      = {CoRR},
  volume       = {abs/2210.05495},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.05495},
  doi          = {10.48550/ARXIV.2210.05495},
  eprinttype    = {arXiv},
  eprint       = {2210.05495},
  timestamp    = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-05495.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.05519 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2210-05519,
  author     = {Ruixiang Zhang
                and Tong Che
                and Boris Ivanovic
                and Renhao Wang
                and Marco Pavone
                and Yoshua Bengio
                and Liam Paull},
  title      = {Robust and Controllable Object-Centric Learning
                through Energy-based Models},
  journal    = {CoRR},
  volume     = {abs/2210.05519},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.05519},
  doi        = {10.48550/ARXIV.2210.05519},
  eprinttype = {arXiv},
  eprint     = {2210.05519},
  timestamp  = {Mon, 19 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-05519.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.05845. The mixed-case method name ConSpec is brace-protected
% so that sentence-casing bibliography styles keep its capitalization.
@article{DBLP:journals/corr/abs-2210-05845,
  author       = {Chen Sun and
                  Wannan Yang and
                  Benjamin Alsbury{-}Nealy and
                  Yoshua Bengio and
                  Blake A. Richards},
  title        = {Contrastive introspection ({ConSpec}) to rapidly identify invariant
                  steps for success},
  journal      = {CoRR},
  volume       = {abs/2210.05845},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.05845},
  doi          = {10.48550/ARXIV.2210.05845},
  eprinttype    = {arXiv},
  eprint       = {2210.05845},
  timestamp    = {Tue, 09 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-05845.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.08031 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2210-08031,
  author     = {Nasim Rahaman
                and Martin Weiss
                and Francesco Locatello
                and Chris Pal
                and Yoshua Bengio
                and Bernhard Sch{\"{o}}lkopf
                and Li Erran Li
                and Nicolas Ballas},
  title      = {Neural Attentive Circuits},
  journal    = {CoRR},
  volume     = {abs/2210.08031},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.08031},
  doi        = {10.48550/ARXIV.2210.08031},
  eprinttype = {arXiv},
  eprint     = {2210.08031},
  timestamp  = {Mon, 24 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-08031.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.08340. The coined term NeuroAI is brace-protected
% so that sentence-casing bibliography styles keep its capitalization.
@article{DBLP:journals/corr/abs-2210-08340,
  author       = {Anthony Zador and
                  Blake A. Richards and
                  Bence {\"{O}}lveczky and
                  Sean Escola and
                  Yoshua Bengio and
                  Kwabena Boahen and
                  Matthew M. Botvinick and
                  Dmitri B. Chklovskii and
                  Anne Churchland and
                  Claudia Clopath and
                  James DiCarlo and
                  Surya Ganguli and
                  Jeff Hawkins and
                  Konrad P. K{\"{o}}rding and
                  Alexei A. Koulakov and
                  Yann LeCun and
                  Timothy P. Lillicrap and
                  Adam H. Marblestone and
                  Bruno A. Olshausen and
                  Alexandre Pouget and
                  Cristina Savin and
                  Terrence J. Sejnowski and
                  Eero P. Simoncelli and
                  Sara A. Solla and
                  David Sussillo and
                  Andreas S. Tolias and
                  Doris Tsao},
  title        = {Toward Next-Generation Artificial Intelligence: Catalyzing the {NeuroAI}
                  Revolution},
  journal      = {CoRR},
  volume       = {abs/2210.08340},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.08340},
  doi          = {10.48550/ARXIV.2210.08340},
  eprinttype    = {arXiv},
  eprint       = {2210.08340},
  timestamp    = {Wed, 19 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-08340.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.12765. The mixed-case term GFlowNets is brace-protected
% so that sentence-casing bibliography styles keep its capitalization.
@article{DBLP:journals/corr/abs-2210-12765,
  author       = {Moksh Jain and
                  Sharath Chandra Raparthy and
                  Alex Hern{\'{a}}ndez{-}Garc{\'{\i}}a and
                  Jarrid Rector{-}Brooks and
                  Yoshua Bengio and
                  Santiago Miret and
                  Emmanuel Bengio},
  title        = {Multi-Objective {GFlowNets}},
  journal      = {CoRR},
  volume       = {abs/2210.12765},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.12765},
  doi          = {10.48550/ARXIV.2210.12765},
  eprinttype    = {arXiv},
  eprint       = {2210.12765},
  timestamp    = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-12765.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.12928. The mixed-case method name GFlowOut is brace-protected
% so that sentence-casing bibliography styles keep its capitalization.
@article{DBLP:journals/corr/abs-2210-12928,
  author       = {Dianbo Liu and
                  Moksh Jain and
                  Bonaventure Dossou and
                  Qianli Shen and
                  Salem Lahlou and
                  Anirudh Goyal and
                  Nikolay Malkin and
                  Chris Emezue and
                  Dinghuai Zhang and
                  Nadhir Hassen and
                  Xu Ji and
                  Kenji Kawaguchi and
                  Yoshua Bengio},
  title        = {{GFlowOut}: Dropout with Generative Flow Networks},
  journal      = {CoRR},
  volume       = {abs/2210.12928},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.12928},
  doi          = {10.48550/ARXIV.2210.12928},
  eprinttype    = {arXiv},
  eprint       = {2210.12928},
  timestamp    = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-12928.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.00184 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2211-00184,
  author     = {Sharut Gupta
                and Kartik Ahuja
                and Mohammad Havaei
                and Niladri Chatterjee
                and Yoshua Bengio},
  title      = {{FL} Games: {A} Federated Learning Framework for Distribution Shifts},
  journal    = {CoRR},
  volume     = {abs/2211.00184},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.00184},
  doi        = {10.48550/ARXIV.2211.00184},
  eprinttype = {arXiv},
  eprint     = {2211.00184},
  timestamp  = {Fri, 04 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-00184.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.00247. The last author's compound surname
% Tachet des Combes is braced as one unit; unbraced, BibTeX reads the
% lowercase word des as a von particle and takes only Combes as the surname.
@article{DBLP:journals/corr/abs-2211-00247,
  author       = {Riashat Islam and
                  Hongyu Zang and
                  Anirudh Goyal and
                  Alex Lamb and
                  Kenji Kawaguchi and
                  Xin Li and
                  Romain Laroche and
                  Yoshua Bengio and
                  Remi {Tachet des Combes}},
  title        = {Discrete Factorial Representations as an Abstraction for Goal Conditioned
                  Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2211.00247},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.00247},
  doi          = {10.48550/ARXIV.2211.00247},
  eprinttype    = {arXiv},
  eprint       = {2211.00247},
  timestamp    = {Thu, 04 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-00247.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.00568. The mixed-case term GFlowNets is brace-protected
% so that sentence-casing bibliography styles keep its capitalization.
@article{DBLP:journals/corr/abs-2211-00568,
  author       = {Chanakya Ekbote and
                  Moksh Jain and
                  Payel Das and
                  Yoshua Bengio},
  title        = {Consistent Training via Energy-Based {GFlowNets} for Modeling Discrete
                  Joint Distributions},
  journal      = {CoRR},
  volume       = {abs/2211.00568},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.00568},
  doi          = {10.48550/ARXIV.2211.00568},
  eprinttype    = {arXiv},
  eprint       = {2211.00568},
  timestamp    = {Fri, 04 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-00568.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.02348 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2211-02348,
  author     = {Nasim Rahaman
                and Martin Weiss
                and Frederik Tr{\"{a}}uble
                and Francesco Locatello
                and Alexandre Lacoste
                and Yoshua Bengio
                and Chris Pal
                and Li Erran Li
                and Bernhard Sch{\"{o}}lkopf},
  title      = {A General Purpose Neural Architecture for Geospatial Systems},
  journal    = {CoRR},
  volume     = {abs/2211.02348},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.02348},
  doi        = {10.48550/ARXIV.2211.02348},
  eprinttype = {arXiv},
  eprint     = {2211.02348},
  timestamp  = {Wed, 09 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-02348.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.02763. Bayesian, GFlowNets and Bayes are brace-protected
% so that sentence-casing bibliography styles keep their capitalization.
@article{DBLP:journals/corr/abs-2211-02763,
  author       = {Mizu Nishikawa{-}Toomey and
                  Tristan Deleu and
                  Jithendaraa Subramanian and
                  Yoshua Bengio and
                  Laurent Charlin},
  title        = {{Bayesian} learning of Causal Structure and Mechanisms with {GFlowNets}
                  and Variational {Bayes}},
  journal      = {CoRR},
  volume       = {abs/2211.02763},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.02763},
  doi          = {10.48550/ARXIV.2211.02763},
  eprinttype    = {arXiv},
  eprint       = {2211.02763},
  timestamp    = {Wed, 09 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-02763.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.03812. The compound surname Perreault Levasseur is
% braced as one unit; unbraced, BibTeX treats Perreault as a given name
% and sorts and abbreviates the author under Levasseur alone.
@article{DBLP:journals/corr/abs-2211-03812,
  author       = {Alexandre Adam and
                  Adam Coogan and
                  Nikolay Malkin and
                  Ronan Legin and
                  Laurence {Perreault Levasseur} and
                  Yashar Hezaveh and
                  Yoshua Bengio},
  title        = {Posterior samples of source galaxies in strong gravitational lenses
                  with score-based priors},
  journal      = {CoRR},
  volume       = {abs/2211.03812},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.03812},
  doi          = {10.48550/ARXIV.2211.03812},
  eprinttype    = {arXiv},
  eprint       = {2211.03812},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-03812.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.06489 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2211-06489,
  author     = {S{\'{e}}kou{-}Oumar Kaba
                and Arnab Kumar Mondal
                and Yan Zhang
                and Yoshua Bengio
                and Siamak Ravanbakhsh},
  title      = {Equivariance with Learned Canonicalization Functions},
  journal    = {CoRR},
  volume     = {abs/2211.06489},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.06489},
  doi        = {10.48550/ARXIV.2211.06489},
  eprinttype = {arXiv},
  eprint     = {2211.06489},
  timestamp  = {Tue, 15 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-06489.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.08458 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2211-08458,
  author     = {Leo Feng
                and Hossein Hajimirsadeghi
                and Yoshua Bengio
                and Mohamed Osama Ahmed},
  title      = {Latent Bottlenecked Attentive Neural Processes},
  journal    = {CoRR},
  volume     = {abs/2211.08458},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.08458},
  doi        = {10.48550/ARXIV.2211.08458},
  eprinttype = {arXiv},
  eprint     = {2211.08458},
  timestamp  = {Wed, 23 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-08458.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.12020. The mixed-case name PhAST and the acronym GNNs are
% brace-protected so that sentence-casing bibliography styles keep them intact.
@article{DBLP:journals/corr/abs-2211-12020,
  author       = {Alexandre Duval and
                  Victor Schmidt and
                  Santiago Miret and
                  Yoshua Bengio and
                  Alex Hern{\'{a}}ndez{-}Garc{\'{\i}}a and
                  David Rolnick},
  title        = {{PhAST}: Physics-Aware, Scalable, and Task-specific {GNNs} for Accelerated
                  Catalyst Design},
  journal      = {CoRR},
  volume       = {abs/2211.12020},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.12020},
  doi          = {10.48550/ARXIV.2211.12020},
  eprinttype    = {arXiv},
  eprint       = {2211.12020},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-12020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.14666 (CoRR, 2022); record exported from DBLP.
@article{DBLP:journals/corr/abs-2211-14666,
  author     = {S{\'{e}}bastien Lachapelle
                and Tristan Deleu
                and Divyat Mahajan
                and Ioannis Mitliagkas
                and Yoshua Bengio
                and Simon Lacoste{-}Julien
                and Quentin Bertrand},
  title      = {Synergies Between Disentanglement and Sparsity:
                a Multi-Task Learning Perspective},
  journal    = {CoRR},
  volume     = {abs/2211.14666},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.14666},
  doi        = {10.48550/ARXIV.2211.14666},
  eprinttype = {arXiv},
  eprint     = {2211.14666},
  timestamp  = {Tue, 29 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-14666.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.13381. The mixed-case method name MixupE is brace-protected
% so that sentence-casing bibliography styles do not drop the trailing capital E.
@article{DBLP:journals/corr/abs-2212-13381,
  author       = {Vikas Verma and
                  Sarthak Mittal and
                  Wai Hoh Tang and
                  Hieu Pham and
                  Juho Kannala and
                  Yoshua Bengio and
                  Arno Solin and
                  Kenji Kawaguchi},
  title        = {{MixupE}: Understanding and Improving Mixup from Directional Derivative
                  Perspective},
  journal      = {CoRR},
  volume       = {abs/2212.13381},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.13381},
  doi          = {10.48550/ARXIV.2212.13381},
  eprinttype    = {arXiv},
  eprint       = {2212.13381},
  timestamp    = {Mon, 15 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-13381.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Commun. ACM 64(7), 2021; record exported from DBLP.
@article{DBLP:journals/cacm/BengioLH21,
  author     = {Yoshua Bengio
                and Yann LeCun
                and Geoffrey E. Hinton},
  title      = {Deep learning for {AI}},
  journal    = {Commun. {ACM}},
  volume     = {64},
  number     = {7},
  pages      = {58--65},
  year       = {2021},
  url        = {https://doi.org/10.1145/3448250},
  doi        = {10.1145/3448250},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/cacm/BengioLH21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE Computer Graphics and Applications 41(1), 2021; record exported from DBLP.
@article{DBLP:journals/cga/LuccioniSVBR21,
  author     = {Alexandra Luccioni
                and Victor Schmidt
                and Vahe Vardanyan
                and Yoshua Bengio
                and Theresa{-}Marie Rhyne},
  title      = {Using Artificial Intelligence to Visualize
                the Impacts of Climate Change},
  journal    = {{IEEE} Computer Graphics and Applications},
  volume     = {41},
  number     = {1},
  pages      = {8--14},
  year       = {2021},
  url        = {https://doi.org/10.1109/MCG.2020.3025425},
  doi        = {10.1109/MCG.2020.3025425},
  timestamp  = {Wed, 27 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/cga/LuccioniSVBR21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Eur. J. Oper. Res. 290(2), 2021; record exported from DBLP.
@article{DBLP:journals/eor/BengioLP21,
  author     = {Yoshua Bengio
                and Andrea Lodi
                and Antoine Prouvost},
  title      = {Machine learning for combinatorial optimization:
                {A} methodological tour d'horizon},
  journal    = {Eur. J. Oper. Res.},
  volume     = {290},
  number     = {2},
  pages      = {405--421},
  year       = {2021},
  url        = {https://doi.org/10.1016/j.ejor.2020.07.063},
  doi        = {10.1016/J.EJOR.2020.07.063},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/eor/BengioLP21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. Am. Medical Informatics Assoc. 28(1), 2021.
% The given name Jean-Francois is written with an escaped c-cedilla,
% matching the LaTeX accent escapes used by the other records in this file.
@article{DBLP:journals/jamia/BengioIJJPRSY21,
  author       = {Yoshua Bengio and
                  Daphne Ippolito and
                  Richard Janda and
                  Max Jarvie and
                  Benjamin Prud'homme and
                  Jean{-}Fran{\c{c}}ois Rousseau and
                  Abhinav Sharma and
                  Yun William Yu},
  title        = {Inherent privacy limitations of decentralized contact tracing apps},
  journal      = {J. Am. Medical Informatics Assoc.},
  volume       = {28},
  number       = {1},
  pages        = {193--195},
  year         = {2021},
  url          = {https://doi.org/10.1093/jamia/ocaa153},
  doi          = {10.1093/JAMIA/OCAA153},
  timestamp    = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jamia/BengioIJJPRSY21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Proc. IEEE 109(5), 2021; record exported from DBLP.
@article{DBLP:journals/pieee/ScholkopfLBKKGB21,
  author     = {Bernhard Sch{\"{o}}lkopf
                and Francesco Locatello
                and Stefan Bauer
                and Nan Rosemary Ke
                and Nal Kalchbrenner
                and Anirudh Goyal
                and Yoshua Bengio},
  title      = {Toward Causal Representation Learning},
  journal    = {Proc. {IEEE}},
  volume     = {109},
  number     = {5},
  pages      = {612--634},
  year       = {2021},
  url        = {https://doi.org/10.1109/JPROC.2021.3058954},
  doi        = {10.1109/JPROC.2021.3058954},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/pieee/ScholkopfLBKKGB21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, PLoS Comput. Biol. 17(10), 2021.
% PLOS articles have no page range; the pages field carries the article
% e-locator, which PLOS forms from the numeric suffix of the DOI.
% NOTE(review): e-locator derived from the DOI, confirm against the publisher page.
@article{DBLP:journals/ploscb/DaoudaDFBPCBHTM21,
  author       = {Tariq Daouda and
                  Maude Dumont{-}Lagac{\'{e}} and
                  Albert Feghaly and
                  Yahya Benslimane and
                  R{\'{e}}becca Panes and
                  Mathieu Courcelles and
                  Mohamed Benhammadi and
                  Lea Harrington and
                  Pierre Thibault and
                  Fran{\c{c}}ois Major and
                  Yoshua Bengio and
                  Etienne Gagnon and
                  S{\'{e}}bastien Lemieux and
                  Claude Perreault},
  title        = {{CAMAP:} Artificial neural networks unveil the role of codon arrangement
                  in modulating {MHC-I} peptides presentation},
  journal      = {PLoS Comput. Biol.},
  volume       = {17},
  number       = {10},
  pages        = {e1009482},
  year         = {2021},
  url          = {https://doi.org/10.1371/journal.pcbi.1009482},
  doi          = {10.1371/JOURNAL.PCBI.1009482},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ploscb/DaoudaDFBPCBHTM21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2021 proceedings (AAAI Press); record exported from DBLP.
@inproceedings{DBLP:conf/aaai/SylvainZBH021,
  author     = {Tristan Sylvain
                and Pengchuan Zhang
                and Yoshua Bengio
                and R. Devon Hjelm
                and Shikhar Sharma},
  title      = {Object-Centric Image Generation from Layouts},
  booktitle  = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021,
                Thirty-Third Conference on Innovative Applications of Artificial
                Intelligence, {IAAI} 2021,
                The Eleventh Symposium on Educational Advances in Artificial
                Intelligence, {EAAI} 2021,
                Virtual Event, February 2-9, 2021},
  pages      = {2647--2655},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://doi.org/10.1609/aaai.v35i3.16368},
  doi        = {10.1609/AAAI.V35I3.16368},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/SylvainZBH021.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, AAAI 2021 proceedings (AAAI Press); record exported from DBLP.
@inproceedings{DBLP:conf/aaai/ZarpellonJ0B21,
  author     = {Giulia Zarpellon
                and Jason Jo
                and Andrea Lodi
                and Yoshua Bengio},
  title      = {Parameterizing Branch-and-Bound Search Trees to Learn Branching Policies},
  booktitle  = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021,
                Thirty-Third Conference on Innovative Applications of Artificial
                Intelligence, {IAAI} 2021,
                The Eleventh Symposium on Educational Advances in Artificial
                Intelligence, {EAAI} 2021,
                Virtual Event, February 2-9, 2021},
  pages      = {3931--3939},
  publisher  = {{AAAI} Press},
  year       = {2021},
  url        = {https://doi.org/10.1609/aaai.v35i5.16512},
  doi        = {10.1609/AAAI.V35I5.16512},
  timestamp  = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/ZarpellonJ0B21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/Che0LGZXB21,
  author = {Tong Che and Xiaofeng Liu and Site Li and Yubin Ge and Ruixiang Zhang and
    Caiming Xiong and Yoshua Bengio},
  title = {Deep Verifier Networks: Verification of Deep Discriminative Models with Deep
    Generative Models},
  booktitle = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021,
    Thirty-Third Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2021,
    The Eleventh Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2021,
    Virtual Event, February 2-9, 2021},
  year = {2021},
  pages = {7002--7010},
  publisher = {{AAAI} Press},
  doi = {10.1609/AAAI.V35I8.16862},
  url = {https://doi.org/10.1609/aaai.v35i8.16862},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/Che0LGZXB21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/KimKB21,
  author = {Taesup Kim and Sungwoong Kim and Yoshua Bengio},
  title = {Visual Concept Reasoning Networks},
  booktitle = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021,
    Thirty-Third Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2021,
    The Eleventh Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2021,
    Virtual Event, February 2-9, 2021},
  year = {2021},
  pages = {8172--8180},
  publisher = {{AAAI} Press},
  doi = {10.1609/AAAI.V35I9.16995},
  url = {https://doi.org/10.1609/aaai.v35i9.16995},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/KimKB21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/OreshkinCCB21,
  author = {Boris N. Oreshkin and Dmitri Carpov and Nicolas Chapados and Yoshua Bengio},
  title = {Meta-Learning Framework with Applications to Zero-Shot Time-Series Forecasting},
  booktitle = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI} 2021,
    Thirty-Third Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2021,
    The Eleventh Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2021,
    Virtual Event, February 2-9, 2021},
  year = {2021},
  pages = {9242--9250},
  publisher = {{AAAI} Press},
  doi = {10.1609/AAAI.V35I10.17115},
  url = {https://doi.org/10.1609/aaai.v35i10.17115},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/OreshkinCCB21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/VermaQKLBKT21,
  author       = {Vikas Verma and
                  Meng Qu and
                  Kenji Kawaguchi and
                  Alex Lamb and
                  Yoshua Bengio and
                  Juho Kannala and
                  Jian Tang},
  title        = {{GraphMix}: Improved Training of {GNNs} for Semi-Supervised Learning},
  booktitle    = {Thirty-Fifth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2021, Thirty-Third Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2021, The Eleventh Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2021, Virtual Event, February 2-9,
                  2021},
  pages        = {10024--10032},
  publisher    = {{AAAI} Press},
  year         = {2021},
  url          = {https://doi.org/10.1609/aaai.v35i11.17203},
  doi          = {10.1609/AAAI.V35I11.17203},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/VermaQKLBKT21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aied/St-HilaireBBSSV21,
  author = {Fran{\c{c}}ois St{-}Hilaire and Nathan Burns and Robert Belfer and
    Muhammad Shayan and Ariella Smofsky and Dung Do Vu and Antoine Frau and
    Joseph Potochny and Farid Faraji and Vincent Pavero and Neroli Ko and
    Ansona Onyi Ching and Sabina Elkins and Anush Stepanyan and Adela Matajova and
    Laurent Charlin and Yoshua Bengio and Iulian Vlad Serban and Ekaterina Kochmar},
  editor = {Ido Roll and Danielle S. McNamara and Sergey A. Sosnovsky and Rose Luckin and
    Vania Dimitrova},
  title = {A Comparative Study of Learning Outcomes for Online Learning Platforms},
  booktitle = {Artificial Intelligence in Education - 22nd International Conference,
    {AIED} 2021, Utrecht, The Netherlands, June 14-18, 2021, Proceedings, Part {II}},
  series = {Lecture Notes in Computer Science},
  volume = {12749},
  year = {2021},
  pages = {331--337},
  publisher = {Springer},
  doi = {10.1007/978-3-030-78270-2\_59},
  url = {https://doi.org/10.1007/978-3-030-78270-2\_59},
  timestamp = {Mon, 14 Jun 2021 12:18:46 +0200},
  biburl = {https://dblp.org/rec/conf/aied/St-HilaireBBSSV21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/PriolBBL21,
  author       = {Le Priol, R{\'{e}}mi and
                  Reza Babanezhad and
                  Yoshua Bengio and
                  Simon Lacoste{-}Julien},
  editor       = {Arindam Banerjee and
                  Kenji Fukumizu},
  title        = {An Analysis of the Adaptation Speed of Causal Models},
  booktitle    = {The 24th International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2021, April 13-15, 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {130},
  pages        = {775--783},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {https://proceedings.mlr.press/v130/le-priol21a.html},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/aistats/PriolBBL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/LambGSMBB21,
  author       = {Alex Lamb and
                  Anirudh Goyal and
                  Agnieszka Slowik and
                  Michael Mozer and
                  Philippe Beaudoin and
                  Yoshua Bengio},
  editor       = {Arindam Banerjee and
                  Kenji Fukumizu},
  title        = {Neural Function Modules with Sparse Arguments: {A} Dynamic Approach
                  to Integrating Information across Layers},
  booktitle    = {The 24th International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2021, April 13-15, 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {130},
  pages        = {919--927},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {https://proceedings.mlr.press/v130/lamb21a.html},
  timestamp    = {Wed, 14 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aistats/LambGSMBB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SylvainDBDLHB21,
  author = {Tristan Sylvain and Francis Dutil and Tess Berthier and Lisa Di{-}Jorio and
    Margaux Luck and R. Devon Hjelm and Yoshua Bengio},
  title = {{CMIM:} Cross-Modal Information Maximization For Medical Imaging},
  booktitle = {{IEEE} International Conference on Acoustics, Speech and Signal
    Processing, {ICASSP} 2021, Toronto, ON, Canada, June 6-11, 2021},
  year = {2021},
  pages = {1190--1194},
  publisher = {{IEEE}},
  doi = {10.1109/ICASSP39728.2021.9414132},
  url = {https://doi.org/10.1109/ICASSP39728.2021.9414132},
  timestamp = {Thu, 08 Jul 2021 17:12:48 +0200},
  biburl = {https://dblp.org/rec/conf/icassp/SylvainDBDLHB21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccv/ChengZJFPWSOLLB21,
  author       = {Yuwei Cheng and
                  Jiannan Zhu and
                  Mengxin Jiang and
                  Jie Fu and
                  Changsong Pang and
                  Peidong Wang and
                  Kris Sankaran and
                  Olawale Onabola and
                  Yimin Liu and
                  Dianbo Liu and
                  Yoshua Bengio},
  title        = {{FloW}: {A} Dataset and Benchmark for Floating Waste Detection in Inland
                  Waters},
  booktitle    = {2021 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                  2021, Montreal, QC, Canada, October 10-17, 2021},
  pages        = {10933--10942},
  publisher    = {{IEEE}},
  year         = {2021},
  url          = {https://doi.org/10.1109/ICCV48922.2021.01077},
  doi          = {10.1109/ICCV48922.2021.01077},
  timestamp    = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/ChengZJFPWSOLLB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/AhmedBSC21,
  author = {Faruk Ahmed and Yoshua Bengio and Harm van Seijen and Aaron C. Courville},
  title = {Systematic generalisation with group invariant predictions},
  booktitle = {9th International Conference on Learning Representations, {ICLR} 2021,
    Virtual Event, Austria, May 3-7, 2021},
  year = {2021},
  publisher = {OpenReview.net},
  url = {https://openreview.net/forum?id=b9PoimzZFJ},
  timestamp = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/AhmedBSC21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/AhmedTGNWBSB21,
  author       = {Ossama Ahmed and
                  Frederik Tr{\"{a}}uble and
                  Anirudh Goyal and
                  Alexander Neitz and
                  Manuel Wuthrich and
                  Yoshua Bengio and
                  Bernhard Sch{\"{o}}lkopf and
                  Stefan Bauer},
  title        = {{CausalWorld}: {A} Robotic Manipulation Benchmark for Causal Structure
                  and Transfer Learning},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=SK7A5pdrgov},
  timestamp    = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/AhmedTGNWBSB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/BengioGMRWDMQSS21,
  author = {Yoshua Bengio and Prateek Gupta and Tegan Maharaj and Nasim Rahaman and
    Martin Weiss and Tristan Deleu and Eilif Benjamin M{\"{u}}ller and Meng Qu and
    Victor Schmidt and Pierre{-}Luc St{-}Charles and Hannah Alsdurf and
    Olexa Bilaniuk and David L. Buckeridge and Ga{\'{e}}tan Marceau{-}Caron and
    Pierre Luc Carrier and Joumana Ghosn and Satya Ortiz{-}Gagne and
    Christopher J. Pal and Irina Rish and Bernhard Sch{\"{o}}lkopf and
    Abhinav Sharma and Jian Tang and Andrew Williams},
  title = {Predicting Infectiousness for Proactive Contact Tracing},
  booktitle = {9th International Conference on Learning Representations, {ICLR} 2021,
    Virtual Event, Austria, May 3-7, 2021},
  year = {2021},
  publisher = {OpenReview.net},
  url = {https://openreview.net/forum?id=lVgB2FUbzuQ},
  timestamp = {Tue, 26 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/BengioGMRWDMQSS21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/GoyalLGBBLBM21,
  author = {Anirudh Goyal and Alex Lamb and Phanideep Gampa and Philippe Beaudoin and
    Charles Blundell and Sergey Levine and Yoshua Bengio and Michael Curtis Mozer},
  title = {Factorizing Declarative and Procedural Knowledge in Structured, Dynamical
    Environments},
  booktitle = {9th International Conference on Learning Representations, {ICLR} 2021,
    Virtual Event, Austria, May 3-7, 2021},
  year = {2021},
  publisher = {OpenReview.net},
  url = {https://openreview.net/forum?id=VVdmjgu7pKM},
  timestamp = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/GoyalLGBBLBM21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/GoyalLHSLBS21,
  author = {Anirudh Goyal and Alex Lamb and Jordan Hoffmann and Shagun Sodhani and
    Sergey Levine and Yoshua Bengio and Bernhard Sch{\"{o}}lkopf},
  title = {Recurrent Independent Mechanisms},
  booktitle = {9th International Conference on Learning Representations, {ICLR} 2021,
    Virtual Event, Austria, May 3-7, 2021},
  year = {2021},
  publisher = {OpenReview.net},
  url = {https://openreview.net/forum?id=mLcmdlEUxy-},
  timestamp = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/GoyalLHSLBS21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/MadanKGSB21,
  author = {Kanika Madan and Nan Rosemary Ke and Anirudh Goyal and
    Bernhard Sch{\"{o}}lkopf and Yoshua Bengio},
  title = {Fast And Slow Learning Of Recurrent Independent Mechanisms},
  booktitle = {9th International Conference on Learning Representations, {ICLR} 2021,
    Virtual Event, Austria, May 3-7, 2021},
  year = {2021},
  publisher = {OpenReview.net},
  url = {https://openreview.net/forum?id=Lc28QAB4ypz},
  timestamp = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/MadanKGSB21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/QuCXBT21,
  author       = {Meng Qu and
                  Junkun Chen and
                  Louis{-}Pascal A. C. Xhonneux and
                  Yoshua Bengio and
                  Jian Tang},
  title        = {{RNNLogic}: Learning Logic Rules for Reasoning on Knowledge Graphs},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=tGZu6DlbreV},
  timestamp    = {Tue, 10 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/QuCXBT21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/RahamanGGWBSBS21,
  author = {Nasim Rahaman and Anirudh Goyal and Muhammad Waleed Gondal and
    Manuel Wuthrich and Stefan Bauer and Yash Sharma and Yoshua Bengio and
    Bernhard Sch{\"{o}}lkopf},
  title = {Spatially Structured Recurrent Modules},
  booktitle = {9th International Conference on Learning Representations, {ICLR} 2021,
    Virtual Event, Austria, May 3-7, 2021},
  year = {2021},
  publisher = {OpenReview.net},
  url = {https://openreview.net/forum?id=5l9zj5G7vDY},
  timestamp = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/iclr/RahamanGGWBSBS21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/VivianoSDBC21,
  author = {Joseph D. Viviano and Becks Simpson and Francis Dutil and Yoshua Bengio and
    Joseph Paul Cohen},
  title = {Saliency is a Possible Red Herring When Diagnosing Poor Generalization},
  booktitle = {9th International Conference on Learning Representations, {ICLR} 2021,
    Virtual Event, Austria, May 3-7, 2021},
  year = {2021},
  publisher = {OpenReview.net},
  url = {https://openreview.net/forum?id=c9-WeM-ceB},
  timestamp = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/VivianoSDBC21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/XuLBPT21,
  author = {Minkai Xu and Shitong Luo and Yoshua Bengio and Jian Peng and Jian Tang},
  title = {Learning Neural Generative Dynamics for Molecular Conformation Generation},
  booktitle = {9th International Conference on Learning Representations, {ICLR} 2021,
    Virtual Event, Austria, May 3-7, 2021},
  year = {2021},
  publisher = {OpenReview.net},
  url = {https://openreview.net/forum?id=pAbm1qfheGk},
  timestamp = {Wed, 30 Mar 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/XuLBPT21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/XuWLSBGT21,
  author       = {Minkai Xu and
                  Wujie Wang and
                  Shitong Luo and
                  Chence Shi and
                  Yoshua Bengio and
                  Rafael G{\'{o}}mez{-}Bombarelli and
                  Jian Tang},
  editor       = {Marina Meila and
                  Tong Zhang},
  title        = {An End-to-End Framework for Molecular Conformation Generation via
                  Bilevel Programming},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {11537--11547},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {https://proceedings.mlr.press/v139/xu21f.html},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/XuWLSBGT21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnn/ZolnaSBHCBB21,
  author = {Konrad Zolna and Chitwan Saharia and L{\'{e}}onard Boussioux and
    David Yu{-}Tung Hui and Maxime Chevalier{-}Boisvert and Dzmitry Bahdanau and
    Yoshua Bengio},
  title = {Combating False Negatives in Adversarial Imitation Learning},
  booktitle = {International Joint Conference on Neural Networks, {IJCNN} 2021,
    Shenzhen, China, July 18-22, 2021},
  year = {2021},
  pages = {1--9},
  publisher = {{IEEE}},
  doi = {10.1109/IJCNN52387.2021.9534032},
  url = {https://doi.org/10.1109/IJCNN52387.2021.9534032},
  timestamp = {Wed, 29 Sep 2021 17:00:55 +0200},
  biburl = {https://dblp.org/rec/conf/ijcnn/ZolnaSBHCBB21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ltedi/OnabolaMXAIXLB21,
  author       = {Olawale Onabola and
                  Zhuang Ma and
                  Yang Xie and
                  Benjamin Akera and
                  Abdulrahman Ibraheem and
                  Jia Xue and
                  Dianbo Liu and
                  Yoshua Bengio},
  editor       = {Bharathi Raja Chakravarthi and
                  John P. McCrae and
                  Manel Zarrouk and
                  Rajeev K. Bali and
                  Paul Buitelaar},
  title        = {{hBERT} + {BiasCorp} - Fighting Racism on the Web},
  booktitle    = {Proceedings of the First Workshop on Language Technology for Equality,
                  Diversity and Inclusion, {LT-EDI@EACL} 2021, Online, April 19, 2021},
  pages        = {26--33},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://aclanthology.org/2021.ltedi-1.4/},
  timestamp    = {Mon, 01 Aug 2022 12:40:03 +0200},
  biburl       = {https://dblp.org/rec/conf/ltedi/OnabolaMXAIXLB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/KeDMGLBRMBP21,
  author       = {Nan Rosemary Ke and
                  Aniket Didolkar and
                  Sarthak Mittal and
                  Anirudh Goyal and
                  Guillaume Lajoie and
                  Stefan Bauer and
                  Danilo Jimenez Rezende and
                  Michael Mozer and
                  Yoshua Bengio and
                  Chris Pal},
  editor       = {Joaquin Vanschoren and
                  Sai{-}Kit Yeung},
  title        = {Systematic Evaluation of Causal Discovery in Visual Model Based Reinforcement
                  Learning},
  booktitle    = {Proceedings of the Neural Information Processing Systems Track on
                  Datasets and Benchmarks 1, {NeurIPS} Datasets and Benchmarks 2021, December
                  2021, virtual},
  year         = {2021},
  url          = {https://datasets-benchmarks-proceedings.neurips.cc/paper/2021/hash/8f121ce07d74717e0b1f21d122e04521-Abstract-round2.html},
  timestamp    = {Thu, 05 May 2022 16:30:03 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/KeDMGLBRMBP21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/PezeshkiKBCPL21,
  author       = {Mohammad Pezeshki and
                  S{\'{e}}kou{-}Oumar Kaba and
                  Yoshua Bengio and
                  Aaron C. Courville and
                  Doina Precup and
                  Guillaume Lajoie},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Gradient Starvation: {A} Learning Proclivity in Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, {NeurIPS} 2021, December
                  6-14, 2021, virtual},
  pages        = {1256--1272},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/0987b8b338d6c90bbedd8631bc499221-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/PezeshkiKBCPL21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ZhaoLLZPB21,
  author       = {Mingde Zhao and
                  Zhen Liu and
                  Sitao Luan and
                  Shuyuan Zhang and
                  Doina Precup and
                  Yoshua Bengio},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {A Consciousness-Inspired Planning Agent for Model-Based Reinforcement
                  Learning},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, {NeurIPS} 2021, December
                  6-14, 2021, virtual},
  pages        = {1569--1581},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/0c215f194276000be6a6df6528067151-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/ZhaoLLZPB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LiuLKGSMB21,
  author       = {Dianbo Liu and
                  Alex Lamb and
                  Kenji Kawaguchi and
                  Anirudh Goyal and
                  Chen Sun and
                  Michael C. Mozer and
                  Yoshua Bengio},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Discrete-Valued Neural Communication},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, {NeurIPS} 2021, December
                  6-14, 2021, virtual},
  pages        = {2109--2121},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/10907813b97e249163587e6246612e21-Abstract.html},
  timestamp    = {Tue, 09 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/LiuLKGSMB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/AhujaCZGBMR21,
  author       = {Kartik Ahuja and
                  Ethan Caballero and
                  Dinghuai Zhang and
                  Jean{-}Christophe Gagnon{-}Audet and
                  Yoshua Bengio and
                  Ioannis Mitliagkas and
                  Irina Rish},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Invariance Principle Meets Information Bottleneck for Out-of-Distribution
                  Generalization},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, {NeurIPS} 2021, December
                  6-14, 2021, virtual},
  pages        = {3438--3450},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/1c336b8080f82bcc2cd2499b4c57261d-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/AhujaCZGBMR21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/XiaLBB21,
  author       = {Kevin Xia and
                  Kai{-}Zhan Lee and
                  Yoshua Bengio and
                  Elias Bareinboim},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {The Causal-Neural Connection: Expressiveness, Learnability, and Inference},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, {NeurIPS} 2021, December
                  6-14, 2021, virtual},
  pages        = {10823--10836},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/5989add1703e4b0480f75e2390739f34-Abstract.html},
  timestamp    = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/XiaLBB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/RahamanGJGBLS21,
  author       = {Nasim Rahaman and
                  Muhammad Waleed Gondal and
                  Shruti Joshi and
                  Peter V. Gehler and
                  Yoshua Bengio and
                  Francesco Locatello and
                  Bernhard Sch{\"{o}}lkopf},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Dynamic Inference with Neural Interpreters},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, {NeurIPS} 2021, December
                  6-14, 2021, virtual},
  pages        = {10985--10998},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/5b4e9aa703d0bfa11041debaa2d1b633-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/RahamanGJGBLS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DidolkarGKBBHMB21,
  author       = {Aniket Didolkar and
                  Anirudh Goyal and
                  Nan Rosemary Ke and
                  Charles Blundell and
                  Philippe Beaudoin and
                  Nicolas Heess and
                  Michael Mozer and
                  Yoshua Bengio},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Neural Production Systems},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, {NeurIPS} 2021, December
                  6-14, 2021, virtual},
  pages        = {25673--25687},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/d785bf9067f8af9e078b93cf26de2b54-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/DidolkarGKBBHMB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioJKPB21,
  author       = {Emmanuel Bengio and
                  Moksh Jain and
                  Maksym Korablyov and
                  Doina Precup and
                  Yoshua Bengio},
  editor       = {Marc'Aurelio Ranzato and
                  Alina Beygelzimer and
                  Yann N. Dauphin and
                  Percy Liang and
                  Jennifer Wortman Vaughan},
  title        = {Flow Network based Generative Models for Non-Iterative Diverse Candidate
                  Generation},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, {NeurIPS} 2021, December
                  6-14, 2021, virtual},
  pages        = {27381--27394},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/e614f646836aaed9f89ce58e837e2310-Abstract.html},
  timestamp    = {Tue, 03 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BengioJKPB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SPACA 2021 paper (PMLR volume 146).
% "Wasserstein" is braced so sentence-casing styles do not lowercase the proper noun.
@inproceedings{DBLP:conf/spaca/SylvainLCC0B21,
  author     = {Sylvain, Tristan and
                Luck, Margaux and
                Cohen, Joseph Paul and
                Cardinal, H{\'{e}}lo{\"{\i}}se and
                Lodi, Andrea and
                Bengio, Yoshua},
  editor     = {Greiner, Russell and
                Kumar, Neeraj and
                Gerds, Thomas Alexander and
                van der Schaar, Mihaela},
  title      = {Exploring the {Wasserstein} metric for time-to-event analysis},
  booktitle  = {Proceedings of {AAAI} Symposium on Survival Prediction -
                Algorithms, Challenges and Applications, {SPACA} 2021,
                Stanford University, Palo Alto, CA, USA, March 22-24, 2021},
  series     = {Proceedings of Machine Learning Research},
  volume     = {146},
  pages      = {194--206},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {https://proceedings.mlr.press/v146/sylvain21a.html},
  timestamp  = {Fri, 15 Jul 2022 14:51:04 +0200},
  biburl     = {https://dblp.org/rec/conf/spaca/SylvainLCC0B21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2101.05536.
% "ConvNets" is braced so sentence-casing styles keep its internal capital.
@article{DBLP:journals/corr/abs-2101-05536,
  author     = {Laborieux, Axel and
                Ernoult, Maxence and
                Scellier, Benjamin and
                Bengio, Yoshua and
                Grollier, Julie and
                Querlioz, Damien},
  title      = {Scaling Equilibrium Propagation to Deep {ConvNets} by Drastically Reducing its Gradient Estimator Bias},
  journal    = {CoRR},
  volume     = {abs/2101.05536},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2101.05536},
  url        = {https://arxiv.org/abs/2101.05536},
  timestamp  = {Fri, 22 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2101-05536.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2102.03869.
@article{DBLP:journals/corr/abs-2102-03869,
  author     = {Deleu, Tristan and
                Bengio, Yoshua},
  title      = {Structured Sparsity Inducing Adaptive Optimizers for Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2102.03869},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2102.03869},
  url        = {https://arxiv.org/abs/2102.03869},
  timestamp  = {Wed, 10 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-03869.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2102.08501.
@article{DBLP:journals/corr/abs-2102-08501,
  author     = {Jain, Moksh and
                Lahlou, Salem and
                Nekoei, Hadi and
                Butoi, Victor and
                Bertin, Paul and
                Rector{-}Brooks, Jarrid and
                Korablyov, Maksym and
                Bengio, Yoshua},
  title      = {{DEUP:} Direct Epistemic Uncertainty Prediction},
  journal    = {CoRR},
  volume     = {abs/2102.08501},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2102.08501},
  url        = {https://arxiv.org/abs/2102.08501},
  timestamp  = {Fri, 19 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-08501.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2102.10240.
@article{DBLP:journals/corr/abs-2102-10240,
  author     = {Xu, Minkai and
                Luo, Shitong and
                Bengio, Yoshua and
                Peng, Jian and
                Tang, Jian},
  title      = {Learning Neural Generative Dynamics for Molecular Conformation Generation},
  journal    = {CoRR},
  volume     = {abs/2102.10240},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2102.10240},
  url        = {https://arxiv.org/abs/2102.10240},
  timestamp  = {Wed, 30 Mar 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-10240.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2102.11107.
@article{DBLP:journals/corr/abs-2102-11107,
  author     = {Sch{\"{o}}lkopf, Bernhard and
                Locatello, Francesco and
                Bauer, Stefan and
                Ke, Nan Rosemary and
                Kalchbrenner, Nal and
                Goyal, Anirudh and
                Bengio, Yoshua},
  title      = {Towards Causal Representation Learning},
  journal    = {CoRR},
  volume     = {abs/2102.11107},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2102.11107},
  url        = {https://arxiv.org/abs/2102.11107},
  timestamp  = {Wed, 24 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-11107.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2103.00336.
@article{DBLP:journals/corr/abs-2103-00336,
  author     = {Lamb, Alex and
                He, Di and
                Goyal, Anirudh and
                Ke, Guolin and
                Liao, Chien{-}Feng and
                Ravanelli, Mirco and
                Bengio, Yoshua},
  title      = {Transformers with Competitive Ensembles of Independent Mechanisms},
  journal    = {CoRR},
  volume     = {abs/2103.00336},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2103.00336},
  url        = {https://arxiv.org/abs/2103.00336},
  timestamp  = {Tue, 14 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-00336.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2103.01197.
@article{DBLP:journals/corr/abs-2103-01197,
  author     = {Goyal, Anirudh and
                Didolkar, Aniket and
                Lamb, Alex and
                Badola, Kartikeya and
                Ke, Nan Rosemary and
                Rahaman, Nasim and
                Binas, Jonathan and
                Blundell, Charles and
                Mozer, Michael and
                Bengio, Yoshua},
  title      = {Coordination Among Neural Modules Through a Shared Global Workspace},
  journal    = {CoRR},
  volume     = {abs/2103.01197},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2103.01197},
  url        = {https://arxiv.org/abs/2103.01197},
  timestamp  = {Thu, 04 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-01197.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2103.01937.
@article{DBLP:journals/corr/abs-2103-01937,
  author     = {Goyal, Anirudh and
                Didolkar, Aniket and
                Ke, Nan Rosemary and
                Blundell, Charles and
                Beaudoin, Philippe and
                Heess, Nicolas and
                Mozer, Michael and
                Bengio, Yoshua},
  title      = {Neural Production Systems},
  journal    = {CoRR},
  volume     = {abs/2103.01937},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2103.01937},
  url        = {https://arxiv.org/abs/2103.01937},
  timestamp  = {Thu, 04 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-01937.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2104.02242.
% "hBert" and "BiasCorp" are braced so sentence-casing styles keep their mixed case.
@article{DBLP:journals/corr/abs-2104-02242,
  author     = {Onabola, Olawale and
                Ma, Zhuang and
                Xie, Yang and
                Akera, Benjamin and
                Ibraheem, Abdulrahman and
                Xue, Jia and
                Liu, Dianbo and
                Bengio, Yoshua},
  title      = {{hBert} + {BiasCorp} - Fighting Racism on the Web},
  journal    = {CoRR},
  volume     = {abs/2104.02242},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2104.02242},
  url        = {https://arxiv.org/abs/2104.02242},
  timestamp  = {Mon, 12 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-02242.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2104.07763.
@article{DBLP:journals/corr/abs-2104-07763,
  author     = {St{-}Hilaire, Fran{\c{c}}ois and
                Burns, Nathan and
                Belfer, Robert and
                Shayan, Muhammad and
                Smofsky, Ariella and
                Vu, Dung Do and
                Frau, Antoine and
                Potochny, Joseph and
                Faraji, Farid and
                Pavero, Vincent and
                Ko, Neroli and
                Ching, Ansona Onyi and
                Elkins, Sabina and
                Stepanyan, Anush and
                Matajova, Adela and
                Charlin, Laurent and
                Bengio, Yoshua and
                Serban, Iulian Vlad and
                Kochmar, Ekaterina},
  title      = {Comparative Study of Learning Outcomes for Online Learning Platforms},
  journal    = {CoRR},
  volume     = {abs/2104.07763},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2104.07763},
  url        = {https://arxiv.org/abs/2104.07763},
  timestamp  = {Mon, 19 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-07763.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2105.07246.
@article{DBLP:journals/corr/abs-2105-07246,
  author     = {Xu, Minkai and
                Wang, Wujie and
                Luo, Shitong and
                Shi, Chence and
                Bengio, Yoshua and
                G{\'{o}}mez{-}Bombarelli, Rafael and
                Tang, Jian},
  title      = {An End-to-End Framework for Molecular Conformation Generation via Bilevel Programming},
  journal    = {CoRR},
  volume     = {abs/2105.07246},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2105.07246},
  url        = {https://arxiv.org/abs/2105.07246},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-07246.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2105.08710.
@article{DBLP:journals/corr/abs-2105-08710,
  author     = {Madan, Kanika and
                Ke, Nan Rosemary and
                Goyal, Anirudh and
                Sch{\"{o}}lkopf, Bernhard and
                Bengio, Yoshua},
  title      = {Fast and Slow Learning of Recurrent Independent Mechanisms},
  journal    = {CoRR},
  volume     = {abs/2105.08710},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2105.08710},
  url        = {https://arxiv.org/abs/2105.08710},
  timestamp  = {Mon, 31 May 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-08710.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2106.02097.
@article{DBLP:journals/corr/abs-2106-02097,
  author     = {Zhao, Mingde and
                Liu, Zhen and
                Luan, Sitao and
                Zhang, Shuyuan and
                Precup, Doina and
                Bengio, Yoshua},
  title      = {A Consciousness-Inspired Planning Agent for Model-Based Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2106.02097},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2106.02097},
  url        = {https://arxiv.org/abs/2106.02097},
  timestamp  = {Mon, 06 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-02097.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2106.04399.
@article{DBLP:journals/corr/abs-2106-04399,
  author     = {Bengio, Emmanuel and
                Jain, Moksh and
                Korablyov, Maksym and
                Precup, Doina and
                Bengio, Yoshua},
  title      = {Flow Network based Generative Models for Non-Iterative Diverse Candidate Generation},
  journal    = {CoRR},
  volume     = {abs/2106.04399},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2106.04399},
  url        = {https://arxiv.org/abs/2106.04399},
  timestamp  = {Fri, 11 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-04399.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2106.04624.
% "SpeechBrain" is braced so sentence-casing styles keep its internal capital.
% "De Mori, Renato" is written in comma form so the two-word surname is not
% split ("Renato De Mori" parses as first "Renato De", last "Mori").
@article{DBLP:journals/corr/abs-2106-04624,
  author     = {Ravanelli, Mirco and
                Parcollet, Titouan and
                Plantinga, Peter and
                Rouhe, Aku and
                Cornell, Samuele and
                Lugosch, Loren and
                Subakan, Cem and
                Dawalatabad, Nauman and
                Heba, Abdelwahab and
                Zhong, Jianyuan and
                Chou, Ju{-}Chieh and
                Yeh, Sung{-}Lin and
                Fu, Szu{-}Wei and
                Liao, Chien{-}Feng and
                Rastorgueva, Elena and
                Grondin, Fran{\c{c}}ois and
                Aris, William and
                Na, Hwidong and
                Gao, Yan and
                De Mori, Renato and
                Bengio, Yoshua},
  title      = {{SpeechBrain}: {A} General-Purpose Speech Toolkit},
  journal    = {CoRR},
  volume     = {abs/2106.04624},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2106.04624},
  url        = {https://arxiv.org/abs/2106.04624},
  timestamp  = {Wed, 16 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-04624.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2106.06607.
@article{DBLP:journals/corr/abs-2106-06607,
  author     = {Ahuja, Kartik and
                Caballero, Ethan and
                Zhang, Dinghuai and
                Bengio, Yoshua and
                Mitliagkas, Ioannis and
                Rish, Irina},
  title      = {Invariance Principle Meets Information Bottleneck for Out-of-Distribution Generalization},
  journal    = {CoRR},
  volume     = {abs/2106.06607},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2106.06607},
  url        = {https://arxiv.org/abs/2106.06607},
  timestamp  = {Tue, 15 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-06607.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2106.07635.
% "Bayesian" is braced so sentence-casing styles do not lowercase the proper adjective.
@article{DBLP:journals/corr/abs-2106-07635,
  author     = {Annadani, Yashas and
                Rothfuss, Jonas and
                Lacoste, Alexandre and
                Scherrer, Nino and
                Goyal, Anirudh and
                Bengio, Yoshua and
                Bauer, Stefan},
  title      = {Variational Causal Networks: Approximate {Bayesian} Inference over Causal Structures},
  journal    = {CoRR},
  volume     = {abs/2106.07635},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2106.07635},
  url        = {https://arxiv.org/abs/2106.07635},
  timestamp  = {Wed, 16 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-07635.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2106.08365.
@article{DBLP:journals/corr/abs-2106-08365,
  author     = {Ji, Xu and
                Pascanu, Razvan and
                Hjelm, R. Devon and
                Vedaldi, Andrea and
                Lakshminarayanan, Balaji and
                Bengio, Yoshua},
  title      = {Predicting Unreliable Predictions by Shattering a Neural Network},
  journal    = {CoRR},
  volume     = {abs/2106.08365},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2106.08365},
  url        = {https://arxiv.org/abs/2106.08365},
  timestamp  = {Tue, 29 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-08365.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2107.00793.
@article{DBLP:journals/corr/abs-2107-00793,
  author     = {Xia, Kevin and
                Lee, Kai{-}Zhan and
                Bengio, Yoshua and
                Bareinboim, Elias},
  title      = {The Causal-Neural Connection: Expressiveness, Learnability, and Inference},
  journal    = {CoRR},
  volume     = {abs/2107.00793},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2107.00793},
  url        = {https://arxiv.org/abs/2107.00793},
  timestamp  = {Thu, 22 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-00793.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2107.00848.
@article{DBLP:journals/corr/abs-2107-00848,
  author     = {Ke, Nan Rosemary and
                Didolkar, Aniket and
                Mittal, Sarthak and
                Goyal, Anirudh and
                Lajoie, Guillaume and
                Bauer, Stefan and
                Rezende, Danilo J. and
                Bengio, Yoshua and
                Mozer, Michael and
                Pal, Christopher J.},
  title      = {Systematic Evaluation of Causal Discovery in Visual Model Based Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2107.00848},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2107.00848},
  url        = {https://arxiv.org/abs/2107.00848},
  timestamp  = {Wed, 07 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-00848.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2107.02367.
@article{DBLP:journals/corr/abs-2107-02367,
  author     = {Liu, Dianbo and
                Lamb, Alex and
                Kawaguchi, Kenji and
                Goyal, Anirudh and
                Sun, Chen and
                Mozer, Michael Curtis and
                Bengio, Yoshua},
  title      = {Discrete-Valued Neural Communication},
  journal    = {CoRR},
  volume     = {abs/2107.02367},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2107.02367},
  url        = {https://arxiv.org/abs/2107.02367},
  timestamp  = {Tue, 09 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-02367.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2109.02429.
@article{DBLP:journals/corr/abs-2109-02429,
  author     = {Scherrer, Nino and
                Bilaniuk, Olexa and
                Annadani, Yashas and
                Goyal, Anirudh and
                Schwab, Patrick and
                Sch{\"{o}}lkopf, Bernhard and
                Mozer, Michael C. and
                Bengio, Yoshua and
                Bauer, Stefan and
                Ke, Nan Rosemary},
  title      = {Learning Neural Causal Models with Active Interventions},
  journal    = {CoRR},
  volume     = {abs/2109.02429},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2109.02429},
  url        = {https://arxiv.org/abs/2109.02429},
  timestamp  = {Wed, 22 Sep 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-02429.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2110.02871.
% "ClimateGAN" is braced so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2110-02871,
  author     = {Schmidt, Victor and
                Luccioni, Alexandra Sasha and
                Teng, M{\'{e}}lisande and
                Zhang, Tianyu and
                Reynaud, Alexia and
                Raghupathi, Sunand and
                Cosne, Gautier and
                Juraver, Adrien and
                Vardanyan, Vahe and
                Hern{\'{a}}ndez{-}Garc{\'{\i}}a, Alex and
                Bengio, Yoshua},
  title      = {{ClimateGAN}: Raising Climate Change Awareness by Generating Images of Floods},
  journal    = {CoRR},
  volume     = {abs/2110.02871},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.02871},
  url        = {https://arxiv.org/abs/2110.02871},
  timestamp  = {Thu, 21 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-02871.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2110.03372.
@article{DBLP:journals/corr/abs-2110-03372,
  author     = {Zhang, Dinghuai and
                Fu, Jie and
                Bengio, Yoshua and
                Courville, Aaron C.},
  title      = {Unifying Likelihood-free Inference with Black-box Sequence Design and Beyond},
  journal    = {CoRR},
  volume     = {abs/2110.03372},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.03372},
  url        = {https://arxiv.org/abs/2110.03372},
  timestamp  = {Mon, 25 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-03372.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2110.06399.
@article{DBLP:journals/corr/abs-2110-06399,
  author     = {Rahaman, Nasim and
                Gondal, Muhammad Waleed and
                Joshi, Shruti and
                Gehler, Peter V. and
                Bengio, Yoshua and
                Locatello, Francesco and
                Sch{\"{o}}lkopf, Bernhard},
  title      = {Dynamic Inference with Neural Interpreters},
  journal    = {CoRR},
  volume     = {abs/2110.06399},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.06399},
  url        = {https://arxiv.org/abs/2110.06399},
  timestamp  = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-06399.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2110.07875.
@article{DBLP:journals/corr/abs-2110-07875,
  author     = {Dwivedi, Vijay Prakash and
                Luu, Anh Tuan and
                Laurent, Thomas and
                Bengio, Yoshua and
                Bresson, Xavier},
  title      = {Graph Neural Networks with Learnable Structural and Positional Representations},
  journal    = {CoRR},
  volume     = {abs/2110.07875},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.07875},
  url        = {https://arxiv.org/abs/2110.07875},
  timestamp  = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-07875.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2110.09419.
@article{DBLP:journals/corr/abs-2110-09419,
  author     = {Mittal, Sarthak and
                Raparthy, Sharath Chandra and
                Rish, Irina and
                Bengio, Yoshua and
                Lajoie, Guillaume},
  title      = {Compositional Attention: Disentangling Search and Retrieval},
  journal    = {CoRR},
  volume     = {abs/2110.09419},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.09419},
  url        = {https://arxiv.org/abs/2110.09419},
  timestamp  = {Mon, 25 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-09419.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2110.10139.
@article{DBLP:journals/corr/abs-2110-10139,
  author     = {Morrison, Max and
                Kumar, Rithesh and
                Kumar, Kundan and
                Seetharaman, Prem and
                Courville, Aaron C. and
                Bengio, Yoshua},
  title      = {Chunked Autoregressive {GAN} for Conditional Waveform Synthesis},
  journal    = {CoRR},
  volume     = {abs/2110.10139},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.10139},
  url        = {https://arxiv.org/abs/2110.10139},
  timestamp  = {Mon, 25 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-10139.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2110.15245.
@article{DBLP:journals/corr/abs-2110-15245,
  author     = {Roy, Nicholas and
                Posner, Ingmar and
                Barfoot, Tim D. and
                Beaudoin, Philippe and
                Bengio, Yoshua and
                Bohg, Jeannette and
                Brock, Oliver and
                Depatie, Isabelle and
                Fox, Dieter and
                Koditschek, Daniel E. and
                Lozano{-}P{\'{e}}rez, Tom{\'{a}}s and
                Mansinghka, Vikash and
                Pal, Christopher J. and
                Richards, Blake A. and
                Sadigh, Dorsa and
                Schaal, Stefan and
                Sukhatme, Gaurav S. and
                Th{\'{e}}rien, Denis and
                Toussaint, Marc and
                van de Panne, Michiel},
  title      = {From Machine Learning to Robotics: Challenges and Opportunities for Embodied Intelligence},
  journal    = {CoRR},
  volume     = {abs/2110.15245},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.15245},
  url        = {https://arxiv.org/abs/2110.15245},
  timestamp  = {Wed, 20 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-15245.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2110.15796.
@article{DBLP:journals/corr/abs-2110-15796,
  author     = {Ahuja, Kartik and
                Hartford, Jason S. and
                Bengio, Yoshua},
  title      = {Properties from Mechanisms: An Equivariance Perspective on Identifiable Representation Learning},
  journal    = {CoRR},
  volume     = {abs/2110.15796},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.15796},
  url        = {https://arxiv.org/abs/2110.15796},
  timestamp  = {Thu, 04 May 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-15796.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2111.09266.
% "GFlowNet" is braced so sentence-casing styles keep its internal capitals.
@article{DBLP:journals/corr/abs-2111-09266,
  author     = {Bengio, Yoshua and
                Deleu, Tristan and
                Hu, Edward J. and
                Lahlou, Salem and
                Tiwari, Mo and
                Bengio, Emmanuel},
  title      = {{GFlowNet} Foundations},
  journal    = {CoRR},
  volume     = {abs/2111.09266},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2111.09266},
  url        = {https://arxiv.org/abs/2111.09266},
  timestamp  = {Mon, 22 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-09266.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2112.03215.
@article{DBLP:journals/corr/abs-2112-03215,
  author     = {Pezeshki, Mohammad and
                Mitra, Amartya and
                Bengio, Yoshua and
                Lajoie, Guillaume},
  title      = {Multi-scale Feature Learning Dynamics: Insights for Double Descent},
  journal    = {CoRR},
  volume     = {abs/2112.03215},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2112.03215},
  url        = {https://arxiv.org/abs/2112.03215},
  timestamp  = {Wed, 08 Dec 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2112-03215.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv preprint 2112.13734.
% "X-ray" is braced so sentence-casing styles keep the capital X.
@article{DBLP:journals/corr/abs-2112-13734,
  author     = {Tetteh, Enoch and
                Viviano, Joseph D. and
                Bengio, Yoshua and
                Krueger, David and
                Cohen, Joseph Paul},
  title      = {Multi-Domain Balanced Sampling Improves Out-of-Distribution Generalization of Chest {X-ray} Pathology Prediction Models},
  journal    = {CoRR},
  volume     = {abs/2112.13734},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2112.13734},
  url        = {https://arxiv.org/abs/2112.13734},
  timestamp  = {Tue, 04 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2112-13734.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Access, volume 8 (2020).
@article{DBLP:journals/access/YooSBK20,
  author     = {Yoo, ByungIn and
                Sylvain, Tristan and
                Bengio, Yoshua and
                Kim, Junmo},
  title      = {Joint Learning of Generative Translator and Classifier for Visually Similar Classes},
  journal    = {{IEEE} Access},
  volume     = {8},
  pages      = {219160--219173},
  year       = {2020},
  doi        = {10.1109/ACCESS.2020.3042302},
  url        = {https://doi.org/10.1109/ACCESS.2020.3042302},
  timestamp  = {Mon, 04 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/access/YooSBK20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Bioinform., volume 36, Supplement-1 (2020).
@article{DBLP:journals/bioinformatics/TrofimovCBPL20,
  author     = {Trofimov, Assya and
                Cohen, Joseph Paul and
                Bengio, Yoshua and
                Perreault, Claude and
                Lemieux, S{\'{e}}bastien},
  title      = {Factorized embeddings learns rich and biologically meaningful embedding spaces using factorized tensor decomposition},
  journal    = {Bioinform.},
  volume     = {36},
  number     = {Supplement-1},
  pages      = {i417--i426},
  year       = {2020},
  doi        = {10.1093/BIOINFORMATICS/BTAA488},
  url        = {https://doi.org/10.1093/bioinformatics/btaa488},
  timestamp  = {Fri, 25 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/bioinformatics/TrofimovCBPL20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Commun. ACM, volume 63, number 11 (2020).
@article{DBLP:journals/cacm/GoodfellowPMXWO20,
  author     = {Goodfellow, Ian J. and
                Pouget{-}Abadie, Jean and
                Mirza, Mehdi and
                Xu, Bing and
                Warde{-}Farley, David and
                Ozair, Sherjil and
                Courville, Aaron C. and
                Bengio, Yoshua},
  title      = {Generative adversarial networks},
  journal    = {Commun. {ACM}},
  volume     = {63},
  number     = {11},
  pages      = {139--144},
  year       = {2020},
  doi        = {10.1145/3422622},
  url        = {https://doi.org/10.1145/3422622},
  timestamp  = {Wed, 11 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/cacm/GoodfellowPMXWO20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: J. Artif. Intell. Res., volume 69 (2020).
@article{DBLP:journals/jair/SerbanSPPB20,
  author     = {Serban, Iulian Vlad and
                Sankar, Chinnadhurai and
                Pieper, Michael and
                Pineau, Joelle and
                Bengio, Yoshua},
  title      = {The Bottleneck Simulator: {A} Model-Based Deep Reinforcement Learning Approach},
  journal    = {J. Artif. Intell. Res.},
  volume     = {69},
  pages      = {571--612},
  year       = {2020},
  doi        = {10.1613/JAIR.1.12463},
  url        = {https://doi.org/10.1613/jair.1.12463},
  timestamp  = {Fri, 06 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jair/SerbanSPPB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Mach. Learn. Sci. Technol., volume 1, number 2 (2020).
% The pages field holds an article number, not a page range; the leading
% zero is restored (025005) because it is part of the identifier.
% NOTE(review): confirm 025005 against the publisher page for the DOI below.
@article{DBLP:journals/mlst/ZhouLCBB20,
  author     = {Zhou, Sharon and
                Luccioni, Alexandra and
                Cosne, Gautier and
                Bernstein, Michael S. and
                Bengio, Yoshua},
  title      = {Establishing an evaluation metric to quantify climate change image realism},
  journal    = {Mach. Learn. Sci. Technol.},
  volume     = {1},
  number     = {2},
  pages      = {025005},
  year       = {2020},
  doi        = {10.1088/2632-2153/AB7657},
  url        = {https://doi.org/10.1088/2632-2153/ab7657},
  timestamp  = {Thu, 12 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/mlst/ZhouLCBB20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Neural Comput., volume 32, issue 1 (2020), pages 1--35.
% The underscores in `url` and `doi` are escaped for classic BibTeX.
@article{DBLP:journals/neco/SodhaniCB20,
  author       = {Sodhani, Shagun and
                  Chandar, Sarath and
                  Bengio, Yoshua},
  title        = {Toward Training Recurrent Neural Networks for Lifelong Learning},
  journal      = {Neural Comput.},
  volume       = {32},
  number       = {1},
  pages        = {1--35},
  year         = {2020},
  url          = {https://doi.org/10.1162/neco\_a\_01246},
  doi          = {10.1162/NECO\_A\_01246},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/SodhaniCB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Magazine commentary: IEEE Technol. Soc. Mag., volume 39, issue 1 (2020).
@article{DBLP:journals/tasm/LuccioniB20,
  author       = {Luccioni, Alexandra and
                  Bengio, Yoshua},
  title        = {On the Morality of Artificial Intelligence [Commentary]},
  journal      = {{IEEE} Technol. Soc. Mag.},
  volume       = {39},
  number       = {1},
  pages        = {16--25},
  year         = {2020},
  url          = {https://doi.org/10.1109/MTS.2020.2967486},
  doi          = {10.1109/MTS.2020.2967486},
  timestamp    = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tasm/LuccioniB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2020 student abstract (pages 13999--14000). An arXiv record with the
% same author list and base title is stored in this file under the key
% DBLP:journals/corr/abs-2002-00412.
@inproceedings{DBLP:conf/aaai/ZolnaSBHCBB20,
  author       = {Zolna, Konrad and
                  Saharia, Chitwan and
                  Boussioux, L{\'{e}}onard and
                  Hui, David Yu{-}Tung and
                  Chevalier{-}Boisvert, Maxime and
                  Bahdanau, Dzmitry and
                  Bengio, Yoshua},
  title        = {Combating False Negatives in Adversarial Imitation Learning (Student
                  Abstract)},
  booktitle    = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2020, The Thirty-Second Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA,
                  February 7-12, 2020},
  pages        = {13999--14000},
  publisher    = {{AAAI} Press},
  year         = {2020},
  url          = {https://doi.org/10.1609/aaai.v34i10.7272},
  doi          = {10.1609/AAAI.V34I10.7272},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/ZolnaSBHCBB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2020 Student Research Workshop paper (pages 313--327).
@inproceedings{DBLP:conf/acl/RussinJOB20,
  author       = {Russin, Jacob L. and
                  Jo, Jason and
                  O'Reilly, Randall C. and
                  Bengio, Yoshua},
  editor       = {Rijhwani, Shruti and
                  Liu, Jiangming and
                  Wang, Yizhong and
                  Dror, Rotem},
  title        = {Compositional Generalization by Factorizing Alignment and Translation},
  booktitle    = {Proceedings of the 58th Annual Meeting of the Association for Computational
                  Linguistics: Student Research Workshop, {ACL} 2020, Online, July 5-10,
                  2020},
  pages        = {313--327},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.acl-srw.42},
  doi          = {10.18653/V1/2020.ACL-SRW.42},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/RussinJOB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2020 main-conference paper (pages 6611--6628).
@inproceedings{DBLP:conf/acl/DuLSOBZ20,
  author       = {Du, Wenyu and
                  Lin, Zhouhan and
                  Shen, Yikang and
                  O'Donnell, Timothy J. and
                  Bengio, Yoshua and
                  Zhang, Yue},
  editor       = {Jurafsky, Dan and
                  Chai, Joyce and
                  Schluter, Natalie and
                  Tetreault, Joel R.},
  title        = {Exploiting Syntactic Structure for Better Language Modeling: {A} Syntactic
                  Distance Approach},
  booktitle    = {Proceedings of the 58th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2020, Online, July 5-10, 2020},
  pages        = {6611--6628},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.acl-main.591},
  doi          = {10.18653/V1/2020.ACL-MAIN.591},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/DuLSOBZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AIED 2020 paper, Proceedings Part II, published as LNCS volume 12164.
% `series`/`volume` identify the LNCS book; `pages` are within that book.
@inproceedings{DBLP:conf/aied/SerbanGKVBPCCB20,
  author       = {Serban, Iulian Vlad and
                  Gupta, Varun and
                  Kochmar, Ekaterina and
                  Vu, Dung Do and
                  Belfer, Robert and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Charlin, Laurent and
                  Bengio, Yoshua},
  editor       = {Bittencourt, Ig Ibert and
                  Cukurova, Mutlu and
                  Muldner, Kasia and
                  Luckin, Rose and
                  Mill{\'{a}}n, Eva},
  title        = {A Large-Scale, Open-Domain, Mixed-Interface Dialogue-Based {ITS} for
                  {STEM}},
  booktitle    = {Artificial Intelligence in Education - 21st International Conference,
                  {AIED} 2020, Ifrane, Morocco, July 6-10, 2020, Proceedings, Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12164},
  pages        = {387--392},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-52240-7\_70},
  doi          = {10.1007/978-3-030-52240-7\_70},
  timestamp    = {Tue, 07 Jul 2020 13:05:42 +0200},
  biburl       = {https://dblp.org/rec/conf/aied/SerbanGKVBPCCB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2020 paper, PMLR volume 108 (pages 3503--3513). No DOI is recorded;
% the PMLR page in `url` is the only locator.
% Names use the comma form so that the compound surname "Le Roux" and the
% particle "van" are parsed as intended rather than guessed from word order.
@inproceedings{DBLP:conf/aistats/ThomasPMMBR20,
  author       = {Thomas, Valentin and
                  Pedregosa, Fabian and
                  van Merri{\"{e}}nboer, Bart and
                  Manzagol, Pierre{-}Antoine and
                  Bengio, Yoshua and
                  Le Roux, Nicolas},
  editor       = {Chiappa, Silvia and
                  Calandra, Roberto},
  title        = {On the interplay between noise and curvature and its effect on optimization
                  and generalization},
  booktitle    = {The 23rd International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]},
  series       = {Proceedings of Machine Learning Research},
  volume       = {108},
  pages        = {3503--3513},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v108/thomas20a.html},
  timestamp    = {Mon, 29 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aistats/ThomasPMMBR20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CogSci 2020 paper. The record carries no page range and no DOI; the
% proceedings page in `url` is the only locator.
@inproceedings{DBLP:conf/cogsci/RussinJOB20,
  author       = {Russin, Jacob L. and
                  Jo, Jason and
                  O'Reilly, Randall C. and
                  Bengio, Yoshua},
  editor       = {Denison, Stephanie and
                  Mack, Michael and
                  Xu, Yang and
                  Armstrong, Blair C.},
  title        = {Systematicity in a Recurrent Neural Network by Factorizing Syntax
                  and Semantics},
  booktitle    = {Proceedings of the 42nd Annual Meeting of the Cognitive Science Society
                  - Developing a Mind: Learning in Humans, Animals, and Machines, {CogSci}
                  2020, virtual, July 29 - August 1, 2020},
  publisher    = {cognitivesciencesociety.org},
  year         = {2020},
  url          = {https://cogsci.mindmodeling.org/2020/papers/0027/index.html},
  timestamp    = {Fri, 14 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cogsci/RussinJOB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CPAIOR 2020 paper, published as LNCS volume 12296 (pages 99--111).
@inproceedings{DBLP:conf/cpaior/BengioFLPS20,
  author       = {Bengio, Yoshua and
                  Frejinger, Emma and
                  Lodi, Andrea and
                  Patel, Rahul and
                  Sankaranarayanan, Sriram},
  editor       = {Hebrard, Emmanuel and
                  Musliu, Nysret},
  title        = {A Learning-Based Algorithm to Quickly Compute Good Primal Solutions
                  for Stochastic Integer Programs},
  booktitle    = {Integration of Constraint Programming, Artificial Intelligence, and
                  Operations Research - 17th International Conference, {CPAIOR} 2020,
                  Vienna, Austria, September 21-24, 2020, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {12296},
  pages        = {99--111},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-58942-4\_7},
  doi          = {10.1007/978-3-030-58942-4\_7},
  timestamp    = {Tue, 22 Sep 2020 17:23:47 +0200},
  biburl       = {https://dblp.org/rec/conf/cpaior/BengioFLPS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CVPR Workshops 2020 paper (pages 816--825). `url` points at the CVF
% open-access page, while `doi` is recorded separately.
% NOTE(review): "Ebrahimi Kahou" may be a compound surname; the split below
% mirrors how BibTeX already parsed the original word order -- confirm.
@inproceedings{DBLP:conf/cvpr/ArefinMSKKKB20,
  author       = {Arefin, Md Rifat and
                  Michalski, Vincent and
                  St{-}Charles, Pierre{-}Luc and
                  Kalaitzis, Alfredo and
                  Kim, Sookyung and
                  Kahou, Samira Ebrahimi and
                  Bengio, Yoshua},
  title        = {Multi-Image Super-Resolution for Remote Sensing using Deep Recurrent
                  Networks},
  booktitle    = {2020 {IEEE/CVF} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} Workshops 2020, Seattle, WA, USA, June 14-19, 2020},
  pages        = {816--825},
  publisher    = {Computer Vision Foundation / {IEEE}},
  year         = {2020},
  url          = {https://openaccess.thecvf.com/content\_CVPRW\_2020/html/w11/Arefin\_Multi-Image\_Super-Resolution\_for\_Remote\_Sensing\_Using\_Deep\_Recurrent\_Networks\_CVPRW\_2020\_paper.html},
  doi          = {10.1109/CVPRW50498.2020.00111},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/ArefinMSKKKB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECCV 2020 paper, Proceedings Part VIII, LNCS volume 12353 (pages 590--607).
% The method name "DiVA" is brace-protected so that styles which sentence-case
% titles do not lowercase its inner capitals.
@inproceedings{DBLP:conf/eccv/MilbichRBSBOC20,
  author       = {Milbich, Timo and
                  Roth, Karsten and
                  Bharadhwaj, Homanga and
                  Sinha, Samarth and
                  Bengio, Yoshua and
                  Ommer, Bj{\"{o}}rn and
                  Cohen, Joseph Paul},
  editor       = {Vedaldi, Andrea and
                  Bischof, Horst and
                  Brox, Thomas and
                  Frahm, Jan{-}Michael},
  title        = {{DiVA}: Diverse Visual Feature Aggregation for Deep Metric Learning},
  booktitle    = {Computer Vision - {ECCV} 2020 - 16th European Conference, Glasgow,
                  UK, August 23-28, 2020, Proceedings, Part {VIII}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12353},
  pages        = {590--607},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-58598-3\_35},
  doi          = {10.1007/978-3-030-58598-3\_35},
  timestamp    = {Tue, 10 Nov 2020 13:42:59 +0100},
  biburl       = {https://dblp.org/rec/conf/eccv/MilbichRBSBOC20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2020 main-conference paper (pages 8718--8735).
@inproceedings{DBLP:conf/emnlp/BiskHTABCLLMNPT20,
  author       = {Bisk, Yonatan and
                  Holtzman, Ari and
                  Thomason, Jesse and
                  Andreas, Jacob and
                  Bengio, Yoshua and
                  Chai, Joyce and
                  Lapata, Mirella and
                  Lazaridou, Angeliki and
                  May, Jonathan and
                  Nisnevich, Aleksandr and
                  Pinto, Nicolas and
                  Turian, Joseph P.},
  editor       = {Webber, Bonnie and
                  Cohn, Trevor and
                  He, Yulan and
                  Liu, Yang},
  title        = {Experience Grounds Language},
  booktitle    = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages        = {8718--8735},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.emnlp-main.703},
  doi          = {10.18653/V1/2020.EMNLP-MAIN.703},
  timestamp    = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl       = {https://dblp.org/rec/conf/emnlp/BiskHTABCLLMNPT20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICASSP 2020 paper (pages 6989--6993). An arXiv record with the same author
% list and (up to letter case) the same title is stored in this file under
% the key DBLP:journals/corr/abs-2001-09239.
@inproceedings{DBLP:conf/icassp/RavanelliZPSMTB20,
  author       = {Ravanelli, Mirco and
                  Zhong, Jianyuan and
                  Pascual, Santiago and
                  Swietojanski, Pawel and
                  Monteiro, Jo{\~{a}}o and
                  Trmal, Jan and
                  Bengio, Yoshua},
  title        = {Multi-Task Self-Supervised Learning for Robust Speech Recognition},
  booktitle    = {2020 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2020, Barcelona, Spain, May 4-8, 2020},
  pages        = {6989--6993},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICASSP40776.2020.9053569},
  doi          = {10.1109/ICASSP40776.2020.9053569},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/RavanelliZPSMTB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 paper. The record has no pages or DOI; the OpenReview forum page
% in `url` is the only locator.
@inproceedings{DBLP:conf/iclr/BengioDRKLBGP20,
  author       = {Bengio, Yoshua and
                  Deleu, Tristan and
                  Rahaman, Nasim and
                  Ke, Nan Rosemary and
                  Lachapelle, S{\'{e}}bastien and
                  Bilaniuk, Olexa and
                  Goyal, Anirudh and
                  Pal, Christopher J.},
  title        = {A Meta-Transfer Objective for Learning to Disentangle Causal Mechanisms},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=ryxWIgBFPS},
  timestamp    = {Thu, 07 May 2020 17:11:47 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BengioDRKLBGP20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 paper. The record has no pages or DOI; the OpenReview forum page
% in `url` is the only locator.
@inproceedings{DBLP:conf/iclr/GoyalBBL20,
  author       = {Goyal, Anirudh and
                  Bengio, Yoshua and
                  Botvinick, Matthew M. and
                  Levine, Sergey},
  title        = {The Variational Bandwidth Bottleneck: Stochastic Evaluation on an
                  Information Budget},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=Hye1kTVFDS},
  timestamp    = {Wed, 20 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/GoyalBBL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 paper. The record has no pages or DOI; the OpenReview forum page
% in `url` is the only locator.
@inproceedings{DBLP:conf/iclr/GoyalSBPLB20,
  author       = {Goyal, Anirudh and
                  Sodhani, Shagun and
                  Binas, Jonathan and
                  Peng, Xue Bin and
                  Levine, Sergey and
                  Bengio, Yoshua},
  title        = {Reinforcement Learning with Competitive Ensembles of Information-Constrained
                  Primitives},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=ryxgJTEYDr},
  timestamp    = {Thu, 07 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/GoyalSBPLB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 paper. The record has no pages or DOI; the OpenReview forum page
% in `url` is the only locator. The braces around "N-BEATS:" keep the acronym
% capitalised under sentence-casing styles.
@inproceedings{DBLP:conf/iclr/OreshkinCCB20,
  author       = {Oreshkin, Boris N. and
                  Carpov, Dmitri and
                  Chapados, Nicolas and
                  Bengio, Yoshua},
  title        = {{N-BEATS:} Neural basis expansion analysis for interpretable time
                  series forecasting},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=r1ecqn4YwB},
  timestamp    = {Thu, 07 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/OreshkinCCB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2020 paper. The record has no pages or DOI; the OpenReview forum page
% in `url` is the only locator.
@inproceedings{DBLP:conf/iclr/RahamanWGRB20,
  author       = {Rahaman, Nasim and
                  Wolf, Steffen and
                  Goyal, Anirudh and
                  Remme, Roman and
                  Bengio, Yoshua},
  title        = {Learning the Arrow of Time for Problems in Reinforcement Learning},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=rylJkpEtwS},
  timestamp    = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/RahamanWGRB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper, PMLR volume 119 (pages 3061--3071). No DOI is recorded, so
% `url` is the only locator; it uses the https form of the PMLR address.
@inproceedings{DBLP:conf/icml/FedusRABLRD20,
  author       = {Fedus, William and
                  Ramachandran, Prajit and
                  Agarwal, Rishabh and
                  Bengio, Yoshua and
                  Larochelle, Hugo and
                  Rowland, Mark and
                  Dabney, Will},
  title        = {Revisiting Fundamentals of Experience Replay},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {3061--3071},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v119/fedus20a.html},
  timestamp    = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/FedusRABLRD20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper, PMLR volume 119 (pages 3668--3679). No DOI is recorded, so
% `url` is the only locator; it uses the https form of the PMLR address.
@inproceedings{DBLP:conf/icml/GottipatiSNPWLL20,
  author       = {Gottipati, Sai Krishna and
                  Sattarov, Boris and
                  Niu, Sufeng and
                  Pathak, Yashaswi and
                  Wei, Haoran and
                  Liu, Shengchao and
                  Blackburn, Simon and
                  Thomas, Karam M. J. and
                  Coley, Connor W. and
                  Tang, Jian and
                  Chandar, Sarath and
                  Bengio, Yoshua},
  title        = {Learning to Navigate The Synthetically Accessible Chemical Space Using
                  Reinforcement Learning},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {3668--3679},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v119/gottipati20a.html},
  timestamp    = {Thu, 01 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/GottipatiSNPWLL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper, PMLR volume 119 (pages 6972--6986). No DOI is recorded, so
% `url` is the only locator; it uses the https form of the PMLR address.
@inproceedings{DBLP:conf/icml/MittalLGVSLMB20,
  author       = {Mittal, Sarthak and
                  Lamb, Alex and
                  Goyal, Anirudh and
                  Voleti, Vikram and
                  Shanahan, Murray and
                  Lajoie, Guillaume and
                  Mozer, Michael and
                  Bengio, Yoshua},
  title        = {Learning to Combine Top-Down and Bottom-Up Signals in Recurrent Neural
                  Networks with Attention over Modules},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {6972--6986},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v119/mittal20a.html},
  timestamp    = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/MittalLGVSLMB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper, PMLR volume 119 (pages 9005--9015). No DOI is recorded, so
% `url` is the only locator; it uses the https form of the PMLR address.
% "Small-GAN" is brace-protected like the later "GAN" so that sentence-casing
% styles do not render it as "Small-gan".
@inproceedings{DBLP:conf/icml/SinhaZGBLO20,
  author       = {Sinha, Samarth and
                  Zhang, Han and
                  Goyal, Anirudh and
                  Bengio, Yoshua and
                  Larochelle, Hugo and
                  Odena, Augustus},
  title        = {{Small-GAN}: Speeding up {GAN} Training using Core-Sets},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {9005--9015},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v119/sinha20b.html},
  timestamp    = {Wed, 28 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/SinhaZGBLO20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 paper, PMLR volume 119 (pages 11298--11306). No DOI is recorded,
% so `url` is the only locator; it uses the https form of the PMLR address.
@inproceedings{DBLP:conf/icml/ZhangZLBP20,
  author       = {Zhang, Zijun and
                  Zhang, Ruixiang and
                  Li, Zongpeng and
                  Bengio, Yoshua and
                  Paull, Liam},
  title        = {Perceptual Generative Autoencoders},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {11298--11306},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v119/zhang20ab.html},
  timestamp    = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/ZhangZLBP20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICPR 2020 paper (pages 4054--4061). The booktitle dates the event to
% January 10-15, 2021 while `year` is 2020; both are kept as recorded.
% NOTE(review): "Boukli Hacene" may be a compound surname; the split below
% mirrors how BibTeX already parsed the original word order -- confirm.
@inproceedings{DBLP:conf/icpr/HaceneLGCB20,
  author       = {Hacene, Ghouthi Boukli and
                  Lassance, Carlos and
                  Gripon, Vincent and
                  Courbariaux, Matthieu and
                  Bengio, Yoshua},
  title        = {Attention Based Pruning for Shift Networks},
  booktitle    = {25th International Conference on Pattern Recognition, {ICPR} 2020,
                  Virtual Event / Milan, Italy, January 10-15, 2021},
  pages        = {4054--4061},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ICPR48806.2021.9412859},
  doi          = {10.1109/ICPR48806.2021.9412859},
  timestamp    = {Fri, 07 May 2021 08:42:33 +0200},
  biburl       = {https://dblp.org/rec/conf/icpr/HaceneLGCB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IEEE NEWCAS 2020 paper (pages 206--209).
% NOTE(review): "Boukli Hacene" may be a compound surname; the split below
% mirrors how BibTeX already parsed the original word order -- confirm.
@inproceedings{DBLP:conf/newcas/HaceneGAFB20,
  author       = {Hacene, Ghouthi Boukli and
                  Gripon, Vincent and
                  Arzel, Matthieu and
                  Farrugia, Nicolas and
                  Bengio, Yoshua},
  title        = {Quantized Guided Pruning for Efficient Hardware Implementations of
                  Deep Neural Networks},
  booktitle    = {18th {IEEE} International New Circuits and Systems Conference, {NEWCAS}
                  2020, Montr{\'{e}}al, QC, Canada, June 16-19, 2020},
  pages        = {206--209},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/NEWCAS49341.2020.9159769},
  doi          = {10.1109/NEWCAS49341.2020.9159769},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/newcas/HaceneGAFB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper. The record has no pages, publisher or DOI; the
% proceedings page in `url` is the only locator. The venue acronym in
% `booktitle` is brace-protected, matching the other venue acronyms in this
% file.
@inproceedings{DBLP:conf/nips/CheZSLPCB20,
  author       = {Che, Tong and
                  Zhang, Ruixiang and
                  Sohl{-}Dickstein, Jascha and
                  Larochelle, Hugo and
                  Paull, Liam and
                  Cao, Yuan and
                  Bengio, Yoshua},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Your {GAN} is Secretly an Energy-based Model and You Should Use Discriminator
                  Driven Latent Sampling},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/90525e70b7842930586545c6f1c9310c-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/CheZSLPCB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper. The record has no pages, publisher or DOI; the
% proceedings page in `url` is the only locator. The venue acronym in
% `booktitle` is brace-protected, matching the other venue acronyms in this
% file.
@inproceedings{DBLP:conf/nips/GuptaGKM0B20,
  author       = {Gupta, Prateek and
                  Gasse, Maxime and
                  Khalil, Elias B. and
                  Mudigonda, Pawan Kumar and
                  Lodi, Andrea and
                  Bengio, Yoshua},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Hybrid Models for Learning to Branch},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/d1e946f4e67db4b362ad23818a6fb78a-Abstract.html},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/GuptaGKM0B20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2020 paper. The record has no pages, publisher or DOI; the
% proceedings page in `url` is the only locator. The venue acronym in
% `booktitle` is brace-protected, matching the other venue acronyms in this
% file.
@inproceedings{DBLP:conf/nips/KergKGGBL20,
  author       = {Kerg, Giancarlo and
                  Kanuparthi, Bhargav and
                  Goyal, Anirudh and
                  Goyette, Kyle and
                  Bengio, Yoshua and
                  Lajoie, Guillaume},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Untangling tradeoffs between recurrence and self-attention in artificial
                  neural networks},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, {NeurIPS} 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/e2065cb56f5533494522c46a72f1dfb0-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/KergKGGBL20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2001.00006, filed by DBLP as a CoRR "article". `eprint` and
% `eprinttype` carry the arXiv identifier; `url` uses the https form of the
% abstract page, like the other arXiv records in this file.
@article{DBLP:journals/corr/abs-2001-00006,
  author       = {LaCroix, Travis and
                  Bengio, Yoshua},
  title        = {Learning from Learning Machines: Optimisation, Rules, and Social Norms},
  journal      = {CoRR},
  volume       = {abs/2001.00006},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.00006},
  eprinttype   = {arXiv},
  eprint       = {2001.00006},
  timestamp    = {Fri, 10 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-00006.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2001.04025, filed by DBLP as a CoRR "article". `eprint` and
% `eprinttype` carry the arXiv identifier.
@article{DBLP:journals/corr/abs-2001-04025,
  author       = {Ma, Chen and
                  Ashley, Dylan R. and
                  Wen, Junfeng and
                  Bengio, Yoshua},
  title        = {Universal Successor Features for Transfer Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2001.04025},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.04025},
  eprinttype   = {arXiv},
  eprint       = {2001.04025},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-04025.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2001.09239, filed by DBLP as a CoRR "article". It shares its
% author list and (up to letter case) its title with the ICASSP 2020 record
% DBLP:conf/icassp/RavanelliZPSMTB20 in this file.
@article{DBLP:journals/corr/abs-2001-09239,
  author       = {Ravanelli, Mirco and
                  Zhong, Jianyuan and
                  Pascual, Santiago and
                  Swietojanski, Pawel and
                  Monteiro, Jo{\~{a}}o and
                  Trmal, Jan and
                  Bengio, Yoshua},
  title        = {Multi-task self-supervised learning for Robust Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/2001.09239},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.09239},
  eprinttype   = {arXiv},
  eprint       = {2001.09239},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-09239.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2001.09531, filed by DBLP as a CoRR "article". `eprint` and
% `eprinttype` carry the arXiv identifier.
@article{DBLP:journals/corr/abs-2001-09531,
  author       = {Cosne, Gautier and
                  Juraver, Adrien and
                  Teng, M{\'{e}}lisande and
                  Schmidt, Victor and
                  Vardanyan, Vahe and
                  Luccioni, Alexandra and
                  Bengio, Yoshua},
  title        = {Using Simulated Data to Generate Images of Climate Change},
  journal      = {CoRR},
  volume       = {abs/2001.09531},
  year         = {2020},
  url          = {https://arxiv.org/abs/2001.09531},
  eprinttype   = {arXiv},
  eprint       = {2001.09531},
  timestamp    = {Thu, 30 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2001-09531.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2002.00412, filed by DBLP as a CoRR "article". It shares its
% author list and base title with the AAAI 2020 student-abstract record
% DBLP:conf/aaai/ZolnaSBHCBB20 in this file.
@article{DBLP:journals/corr/abs-2002-00412,
  author       = {Zolna, Konrad and
                  Saharia, Chitwan and
                  Boussioux, L{\'{e}}onard and
                  Hui, David Yu{-}Tung and
                  Chevalier{-}Boisvert, Maxime and
                  Bahdanau, Dzmitry and
                  Bengio, Yoshua},
  title        = {Combating False Negatives in Adversarial Imitation Learning},
  journal      = {CoRR},
  volume       = {abs/2002.00412},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.00412},
  eprinttype   = {arXiv},
  eprint       = {2002.00412},
  timestamp    = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-00412.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-02887,
  author       = {Boris N. Oreshkin and
                  Dmitri Carpov and
                  Nicolas Chapados and
                  Yoshua Bengio},
  title        = {Meta-learning framework with applications to zero-shot time-series
                  forecasting},
  journal      = {CoRR},
  volume       = {abs/2002.02887},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02887},
  eprinttype    = {arXiv},
  eprint       = {2002.02887},
  timestamp    = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02887.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-03090,
  author       = {Milos Nikolic and
                  Ghouthi Boukli Hacene and
                  Ciaran Bannon and
                  Alberto Delmas Lascorz and
                  Matthieu Courbariaux and
                  Yoshua Bengio and
                  Vincent Gripon and
                  Andreas Moshovos},
  title        = {{BitPruning}: Learning Bitlengths for Aggressive and Accurate Quantization},
  journal      = {CoRR},
  volume       = {abs/2002.03090},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.03090},
  eprinttype    = {arXiv},
  eprint       = {2002.03090},
  timestamp    = {Tue, 11 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-03090.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-05120,
  author       = {Giulia Zarpellon and
                  Jason Jo and
                  Andrea Lodi and
                  Yoshua Bengio},
  title        = {Parameterizing Branch-and-Bound Search Trees to Learn Branching Policies},
  journal      = {CoRR},
  volume       = {abs/2002.05120},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.05120},
  eprinttype    = {arXiv},
  eprint       = {2002.05120},
  timestamp    = {Fri, 14 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-05120.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-06460,
  author       = {Michel Deudon and
                  Alfredo Kalaitzis and
                  Israel Goytom and
                  Md Rifat Arefin and
                  Zhichao Lin and
                  Kris Sankaran and
                  Vincent Michalski and
                  Samira Ebrahimi Kahou and
                  Julien Cornebise and
                  Yoshua Bengio},
  title        = {{HighRes-net}: Recursive Fusion for Multi-Frame Super-Resolution of
                  Satellite Imagery},
  journal      = {CoRR},
  volume       = {abs/2002.06460},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.06460},
  eprinttype    = {arXiv},
  eprint       = {2002.06460},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-06460.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-09046,
  author       = {Devansh Arpit and
                  Huan Wang and
                  Caiming Xiong and
                  Richard Socher and
                  Yoshua Bengio},
  title        = {Neural {Bayes}: {A} Generic Parameterization Method for Unsupervised
                  Representation Learning},
  journal      = {CoRR},
  volume       = {abs/2002.09046},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.09046},
  eprinttype    = {arXiv},
  eprint       = {2002.09046},
  timestamp    = {Tue, 03 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-09046.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-12499,
  author       = {William Fedus and
                  Dibya Ghosh and
                  John D. Martin and
                  Marc G. Bellemare and
                  Yoshua Bengio and
                  Hugo Larochelle},
  title        = {On Catastrophic Interference in {Atari} 2600 Games},
  journal      = {CoRR},
  volume       = {abs/2002.12499},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.12499},
  eprinttype    = {arXiv},
  eprint       = {2002.12499},
  timestamp    = {Tue, 05 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-12499.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-00982,
  author       = {Vijay Prakash Dwivedi and
                  Chaitanya K. Joshi and
                  Thomas Laurent and
                  Yoshua Bengio and
                  Xavier Bresson},
  title        = {Benchmarking Graph Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2003.00982},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.00982},
  eprinttype    = {arXiv},
  eprint       = {2003.00982},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-00982.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-04382,
  author       = {Qicheng Lao and
                  Xiang Jiang and
                  Mohammad Havaei and
                  Yoshua Bengio},
  title        = {Continuous Domain Adaptation with Variational Domain-Agnostic Feature
                  Replay},
  journal      = {CoRR},
  volume       = {abs/2003.04382},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.04382},
  eprinttype    = {arXiv},
  eprint       = {2003.04382},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-04382.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-06060,
  author       = {Tong Che and
                  Ruixiang Zhang and
                  Jascha Sohl{-}Dickstein and
                  Hugo Larochelle and
                  Liam Paull and
                  Yuan Cao and
                  Yoshua Bengio},
  title        = {Your {GAN} is Secretly an Energy-based Model and You Should use Discriminator
                  Driven Latent Sampling},
  journal      = {CoRR},
  volume       = {abs/2003.06060},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.06060},
  eprinttype    = {arXiv},
  eprint       = {2003.06060},
  timestamp    = {Tue, 17 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-06060.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-07449,
  author       = {Tristan Sylvain and
                  Pengchuan Zhang and
                  Yoshua Bengio and
                  R. Devon Hjelm and
                  Shikhar Sharma},
  title        = {Object-Centric Image Generation from Layouts},
  journal      = {CoRR},
  volume       = {abs/2003.07449},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.07449},
  eprinttype    = {arXiv},
  eprint       = {2003.07449},
  timestamp    = {Wed, 02 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-07449.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-07213,
  author       = {Miles Brundage and
                  Shahar Avin and
                  Jasmine Wang and
                  Haydn Belfield and
                  Gretchen Krueger and
                  Gillian K. Hadfield and
                  Heidy Khlaaf and
                  Jingying Yang and
                  Helen Toner and
                  Ruth Fong and
                  Tegan Maharaj and
                  Pang Wei Koh and
                  Sara Hooker and
                  Jade Leung and
                  Andrew Trask and
                  Emma Bluemke and
                  Jonathan Lebensold and
                  Cullen O'Keefe and
                  Mark Koren and
                  Th{\'{e}}o Ryffel and
                  J. B. Rubinovitz and
                  Tamay Besiroglu and
                  Federica Carugati and
                  Jack Clark and
                  Peter Eckersley and
                  Sarah de Haas and
                  Maritza Johnson and
                  Ben Laurie and
                  Alex Ingerman and
                  Igor Krawczuk and
                  Amanda Askell and
                  Rosario Cammarota and
                  Andrew Lohn and
                  David Krueger and
                  Charlotte Stix and
                  Peter Henderson and
                  Logan Graham and
                  Carina Prunkl and
                  Bianca Martin and
                  Elizabeth Seger and
                  Noa Zilberman and
                  Se{\'{a}}n {\'{O}} h{\'{E}}igeartaigh and
                  Frens Kroeger and
                  Girish Sastry and
                  Rebecca Kagan and
                  Adrian Weller and
                  Brian Tse and
                  Elizabeth Barnes and
                  Allan Dafoe and
                  Paul Scharre and
                  Ariel Herbert{-}Voss and
                  Martijn Rasser and
                  Shagun Sodhani and
                  Carrick Flynn and
                  Thomas Krendl Gilbert and
                  Lisa Dyer and
                  Saif Khan and
                  Yoshua Bengio and
                  Markus Anderljung},
  title        = {Toward Trustworthy {AI} Development: Mechanisms for Supporting Verifiable
                  Claims},
  journal      = {CoRR},
  volume       = {abs/2004.07213},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.07213},
  eprinttype    = {arXiv},
  eprint       = {2004.07213},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-07213.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-10151,
  author       = {Yonatan Bisk and
                  Ari Holtzman and
                  Jesse Thomason and
                  Jacob Andreas and
                  Yoshua Bengio and
                  Joyce Chai and
                  Mirella Lapata and
                  Angeliki Lazaridou and
                  Jonathan May and
                  Aleksandr Nisnevich and
                  Nicolas Pinto and
                  Joseph P. Turian},
  title        = {Experience Grounds Language},
  journal      = {CoRR},
  volume       = {abs/2004.10151},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.10151},
  eprinttype    = {arXiv},
  eprint       = {2004.10151},
  timestamp    = {Tue, 28 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-10151.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-11935,
  author       = {Anirudh Goyal and
                  Yoshua Bengio and
                  Matthew M. Botvinick and
                  Sergey Levine},
  title        = {The Variational Bandwidth Bottleneck: Stochastic Evaluation on an
                  Information Budget},
  journal      = {CoRR},
  volume       = {abs/2004.11935},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.11935},
  eprinttype    = {arXiv},
  eprint       = {2004.11935},
  timestamp    = {Wed, 20 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-11935.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-12485,
  author       = {Sai Krishna Gottipati and
                  Boris Sattarov and
                  Sufeng Niu and
                  Yashaswi Pathak and
                  Haoran Wei and
                  Shengchao Liu and
                  Karam M. J. Thomas and
                  Simon Blackburn and
                  Connor W. Coley and
                  Jian Tang and
                  Sarath Chandar and
                  Yoshua Bengio},
  title        = {Learning To Navigate The Synthetically Accessible Chemical Space Using
                  Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2004.12485},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.12485},
  eprinttype    = {arXiv},
  eprint       = {2004.12485},
  timestamp    = {Wed, 20 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-12485.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-13458,
  author       = {Timo Milbich and
                  Karsten Roth and
                  Homanga Bharadhwaj and
                  Samarth Sinha and
                  Yoshua Bengio and
                  Bj{\"{o}}rn Ommer and
                  Joseph Paul Cohen},
  title        = {{DiVA}: Diverse Visual Feature Aggregation for Deep Metric Learning},
  journal      = {CoRR},
  volume       = {abs/2004.13458},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.13458},
  eprinttype    = {arXiv},
  eprint       = {2004.13458},
  timestamp    = {Sat, 02 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-13458.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-04168,
  author       = {Maxence Ernoult and
                  Julie Grollier and
                  Damien Querlioz and
                  Yoshua Bengio and
                  Benjamin Scellier},
  title        = {Equilibrium Propagation with Continual Weight Updates},
  journal      = {CoRR},
  volume       = {abs/2005.04168},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.04168},
  eprinttype    = {arXiv},
  eprint       = {2005.04168},
  timestamp    = {Thu, 14 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-04168.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-04169,
  author       = {Maxence Ernoult and
                  Julie Grollier and
                  Damien Querlioz and
                  Yoshua Bengio and
                  Benjamin Scellier},
  title        = {Continual Weight Updates and Convolutional Architectures for Equilibrium
                  Propagation},
  journal      = {CoRR},
  volume       = {abs/2005.04169},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.04169},
  eprinttype    = {arXiv},
  eprint       = {2005.04169},
  timestamp    = {Thu, 14 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-04169.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-05864,
  author       = {Wenyu Du and
                  Zhouhan Lin and
                  Yikang Shen and
                  Timothy J. O'Donnell and
                  Yoshua Bengio and
                  Yue Zhang},
  title        = {Exploiting Syntactic Structure for Better Language Modeling: {A} Syntactic
                  Distance Approach},
  journal      = {CoRR},
  volume       = {abs/2005.05864},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.05864},
  eprinttype    = {arXiv},
  eprint       = {2005.05864},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-05864.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-06616,
  author       = {Iulian Vlad Serban and
                  Varun Gupta and
                  Ekaterina Kochmar and
                  Dung Do Vu and
                  Robert Belfer and
                  Joelle Pineau and
                  Aaron C. Courville and
                  Laurent Charlin and
                  Yoshua Bengio},
  title        = {A Large-Scale, Open-Domain, Mixed-Interface Dialogue-Based {ITS} for
                  {STEM}},
  journal      = {CoRR},
  volume       = {abs/2005.06616},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.06616},
  eprinttype    = {arXiv},
  eprint       = {2005.06616},
  timestamp    = {Fri, 22 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-06616.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-08502,
  author       = {Hannah Alsdurf and
                  Yoshua Bengio and
                  Tristan Deleu and
                  Prateek Gupta and
                  Daphne Ippolito and
                  Richard Janda and
                  Max Jarvie and
                  Tyler Kolody and
                  Sekoul Krastev and
                  Tegan Maharaj and
                  Robert Obryk and
                  Dan Pilat and
                  Valerie Pisano and
                  Benjamin Prud'homme and
                  Meng Qu and
                  Nasim Rahaman and
                  Irina Rish and
                  Jean{-}Fran{\c{c}}ois Rousseau and
                  Abhinav Sharma and
                  Brooke Struck and
                  Jian Tang and
                  Martin Weiss and
                  Yun William Yu},
  title        = {{COVI} White Paper},
  journal      = {CoRR},
  volume       = {abs/2005.08502},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.08502},
  eprinttype    = {arXiv},
  eprint       = {2005.08502},
  timestamp    = {Tue, 13 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-08502.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-09136,
  author       = {R{\'{e}}mi Le Priol and
                  Reza Babanezhad Harikandeh and
                  Yoshua Bengio and
                  Simon Lacoste{-}Julien},
  title        = {An Analysis of the Adaptation Speed of Causal Models},
  journal      = {CoRR},
  volume       = {abs/2005.09136},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.09136},
  eprinttype    = {arXiv},
  eprint       = {2005.09136},
  timestamp    = {Fri, 22 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-09136.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2005-11856,
  author       = {Joseph Paul Cohen and
                  Lan Dao and
                  Paul Morrison and
                  Karsten Roth and
                  Yoshua Bengio and
                  Beiyi Shen and
                  Almas Abbasi and
                  Mahsa Hoshmand{-}Kochi and
                  Marzyeh Ghassemi and
                  Haifang Li and
                  Tim Q. Duong},
  title        = {Predicting {COVID-19} Pneumonia Severity on Chest {X-ray} with Deep
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2005.11856},
  year         = {2020},
  url          = {https://arxiv.org/abs/2005.11856},
  eprinttype    = {arXiv},
  eprint       = {2005.11856},
  timestamp    = {Fri, 29 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2005-11856.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-01981,
  author       = {Jack D. Kendall and
                  Ross D. Pantone and
                  Kalpana Manickavasagam and
                  Yoshua Bengio and
                  Benjamin Scellier},
  title        = {Training End-to-End Analog Neural Networks with Equilibrium Propagation},
  journal      = {CoRR},
  volume       = {abs/2006.01981},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.01981},
  eprinttype    = {arXiv},
  eprint       = {2006.01981},
  timestamp    = {Mon, 08 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-01981.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-03824,
  author       = {Axel Laborieux and
                  Maxence Ernoult and
                  Benjamin Scellier and
                  Yoshua Bengio and
                  Julie Grollier and
                  Damien Querlioz},
  title        = {Scaling Equilibrium Propagation to Deep {ConvNets} by Drastically Reducing
                  its Gradient Estimator Bias},
  journal      = {CoRR},
  volume       = {abs/2006.03824},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.03824},
  eprinttype    = {arXiv},
  eprint       = {2006.03824},
  timestamp    = {Fri, 12 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-03824.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-07461,
  author       = {Khurram Javed and
                  Martha White and
                  Yoshua Bengio},
  title        = {Learning Causal Models Online},
  journal      = {CoRR},
  volume       = {abs/2006.07461},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.07461},
  eprinttype    = {arXiv},
  eprint       = {2006.07461},
  timestamp    = {Wed, 17 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-07461.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-09471,
  author       = {Giancarlo Kerg and
                  Bhargav Kanuparthi and
                  Anirudh Goyal and
                  Kyle Goyette and
                  Yoshua Bengio and
                  Guillaume Lajoie},
  title        = {Untangling tradeoffs between recurrence and self-attention in neural
                  networks},
  journal      = {CoRR},
  volume       = {abs/2006.09471},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.09471},
  eprinttype    = {arXiv},
  eprint       = {2006.09471},
  timestamp    = {Tue, 23 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-09471.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-12278,
  author       = {Yihe Dong and
                  Will Sawin and
                  Yoshua Bengio},
  title        = {{HNHN:} Hypergraph Networks with Hyperedge Neurons},
  journal      = {CoRR},
  volume       = {abs/2006.12278},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.12278},
  eprinttype    = {arXiv},
  eprint       = {2006.12278},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-12278.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-13291,
  author       = {Matthew Amodio and
                  Rim Assouel and
                  Victor Schmidt and
                  Tristan Sylvain and
                  Smita Krishnaswamy and
                  Yoshua Bengio},
  title        = {Image-to-image Mapping with Many Domains by Sparse Attribute Transfer},
  journal      = {CoRR},
  volume       = {abs/2006.13291},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.13291},
  eprinttype    = {arXiv},
  eprint       = {2006.13291},
  timestamp    = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-13291.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-13352,
  author       = {Bo Li and
                  Yezhen Wang and
                  Tong Che and
                  Shanghang Zhang and
                  Sicheng Zhao and
                  Pengfei Xu and
                  Wei Zhou and
                  Yoshua Bengio and
                  Kurt Keutzer},
  title        = {Rethinking Distributional Matching Based Domain Adaptation},
  journal      = {CoRR},
  volume       = {abs/2006.13352},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.13352},
  eprinttype    = {arXiv},
  eprint       = {2006.13352},
  timestamp    = {Mon, 28 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-13352.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-15212,
  author       = {Prateek Gupta and
                  Maxime Gasse and
                  Elias B. Khalil and
                  M. Pawan Kumar and
                  Andrea Lodi and
                  Yoshua Bengio},
  title        = {Hybrid Models for Learning to Branch},
  journal      = {CoRR},
  volume       = {abs/2006.15212},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.15212},
  eprinttype    = {arXiv},
  eprint       = {2006.15212},
  timestamp    = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-15212.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-16225,
  author       = {Anirudh Goyal and
                  Alex Lamb and
                  Phanideep Gampa and
                  Philippe Beaudoin and
                  Sergey Levine and
                  Charles Blundell and
                  Yoshua Bengio and
                  Michael Mozer},
  title        = {Object Files and Schemata: Factorizing Declarative and Procedural
                  Knowledge in Dynamical Systems},
  journal      = {CoRR},
  volume       = {abs/2006.16225},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.16225},
  eprinttype    = {arXiv},
  eprint       = {2006.16225},
  timestamp    = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-16225.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-16981,
  author       = {Sarthak Mittal and
                  Alex Lamb and
                  Anirudh Goyal and
                  Vikram Voleti and
                  Murray Shanahan and
                  Guillaume Lajoie and
                  Michael Mozer and
                  Yoshua Bengio},
  title        = {Learning to Combine Top-Down and Bottom-Up Signals in Recurrent Neural
                  Networks with Attention over Modules},
  journal      = {CoRR},
  volume       = {abs/2006.16981},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.16981},
  eprinttype    = {arXiv},
  eprint       = {2006.16981},
  timestamp    = {Thu, 02 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-16981.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-06533,
  author       = {Nasim Rahaman and
                  Anirudh Goyal and
                  Muhammad Waleed Gondal and
                  Manuel W{\"{u}}thrich and
                  Stefan Bauer and
                  Yash Sharma and
                  Yoshua Bengio and
                  Bernhard Sch{\"{o}}lkopf},
  title        = {{S2RMs}: Spatially Structured Recurrent Modules},
  journal      = {CoRR},
  volume       = {abs/2007.06533},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.06533},
  eprinttype    = {arXiv},
  eprint       = {2007.06533},
  timestamp    = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-06533.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-06700,
  author       = {William Fedus and
                  Prajit Ramachandran and
                  Rishabh Agarwal and
                  Yoshua Bengio and
                  Hugo Larochelle and
                  Mark Rowland and
                  Will Dabney},
  title        = {Revisiting Fundamentals of Experience Replay},
  journal      = {CoRR},
  volume       = {abs/2007.06700},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.06700},
  eprinttype    = {arXiv},
  eprint       = {2007.06700},
  timestamp    = {Tue, 21 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-06700.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-12770,
  author       = {David Yu{-}Tung Hui and
                  Maxime Chevalier{-}Boisvert and
                  Dzmitry Bahdanau and
                  Yoshua Bengio},
  title        = {{BabyAI} 1.1},
  journal      = {CoRR},
  volume       = {abs/2007.12770},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.12770},
  eprinttype    = {arXiv},
  eprint       = {2007.12770},
  timestamp    = {Wed, 29 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-12770.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-15139,
  author       = {Yoshua Bengio},
  title        = {Deriving Differential Target Propagation from Iterating Approximate
                  Inverses},
  journal      = {CoRR},
  volume       = {abs/2007.15139},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.15139},
  eprinttype    = {arXiv},
  eprint       = {2007.15139},
  timestamp    = {Mon, 03 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-15139.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-06456,
  author       = {Lucas Willems and
                  Salem Lahlou and
                  Yoshua Bengio},
  title        = {Mastering Rate based Curriculum Learning},
  journal      = {CoRR},
  volume       = {abs/2008.06456},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.06456},
  eprinttype    = {arXiv},
  eprint       = {2008.06456},
  timestamp    = {Fri, 21 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-06456.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-11783,
  author       = {Taesup Kim and
                  Sungwoong Kim and
                  Yoshua Bengio},
  title        = {Visual Concept Reasoning Networks},
  journal      = {CoRR},
  volume       = {abs/2008.11783},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.11783},
  eprinttype    = {arXiv},
  eprint       = {2008.11783},
  timestamp    = {Tue, 15 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-11783.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-04029,
  author       = {Meng Qu and
                  Junkun Chen and
                  Louis{-}Pascal A. C. Xhonneux and
                  Yoshua Bengio and
                  Jian Tang},
  title        = {{RNNLogic}: Learning Logic Rules for Reasoning on Knowledge Graphs},
  journal      = {CoRR},
  volume       = {abs/2010.04029},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.04029},
  eprinttype    = {arXiv},
  eprint       = {2010.04029},
  timestamp    = {Tue, 13 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-04029.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CausalWorld is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2010-04296,
  author       = {Ossama Ahmed and
                  Frederik Tr{\"{a}}uble and
                  Anirudh Goyal and
                  Alexander Neitz and
                  Manuel W{\"{u}}thrich and
                  Yoshua Bengio and
                  Bernhard Sch{\"{o}}lkopf and
                  Stefan Bauer},
  title        = {{CausalWorld}: {A} Robotic Manipulation Benchmark for Causal Structure
                  and Transfer Learning},
  journal      = {CoRR},
  volume       = {abs/2010.04296},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.04296},
  eprinttype    = {arXiv},
  eprint       = {2010.04296},
  timestamp    = {Tue, 13 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-04296.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-08012,
  author     = {Alex Lamb and
                Anirudh Goyal and
                Agnieszka Slowik and
                Michael Mozer and
                Philippe Beaudoin and
                Yoshua Bengio},
  title      = {Neural Function Modules with Sparse Arguments: {A} Dynamic Approach
                to Integrating Information across Layers},
  journal    = {CoRR},
  volume     = {abs/2010.08012},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2010.08012},
  url        = {https://arxiv.org/abs/2010.08012},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-08012.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2010-10593,
  author     = {Tristan Sylvain and
                Francis Dutil and
                Tess Berthier and
                Lisa Di{-}Jorio and
                Margaux Luck and
                R. Devon Hjelm and
                Yoshua Bengio},
  title      = {Cross-Modal Information Maximization for Medical Imaging: {CMIM}},
  journal    = {CoRR},
  volume     = {abs/2010.10593},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2010.10593},
  url        = {https://arxiv.org/abs/2010.10593},
  timestamp  = {Tue, 27 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-10593.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2010-11362,
  author     = {Rithesh Kumar and
                Kundan Kumar and
                Vicki Anand and
                Yoshua Bengio and
                Aaron C. Courville},
  title      = {{NU-GAN:} High resolution neural upsampling with {GAN}},
  journal    = {CoRR},
  volume     = {abs/2010.11362},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2010.11362},
  url        = {https://arxiv.org/abs/2010.11362},
  timestamp  = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2010-11362.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Satya Ortiz-Gagne's surname is written with its acute accent here, matching
% the spelling used for the same author in DBLP:journals/corr/abs-2010-16004.
@article{DBLP:journals/corr/abs-2010-12536,
  author       = {Yoshua Bengio and
                  Prateek Gupta and
                  Tegan Maharaj and
                  Nasim Rahaman and
                  Martin Weiss and
                  Tristan Deleu and
                  Eilif B. M{\"{u}}ller and
                  Meng Qu and
                  Victor Schmidt and
                  Pierre{-}Luc St{-}Charles and
                  Hannah Alsdurf and
                  Olexa Bilaniuk and
                  David L. Buckeridge and
                  Ga{\'{e}}tan Marceau Caron and
                  Pierre Luc Carrier and
                  Joumana Ghosn and
                  Satya Ortiz{-}Gagn{\'{e}} and
                  Chris Pal and
                  Irina Rish and
                  Bernhard Sch{\"{o}}lkopf and
                  Abhinav Sharma and
                  Jian Tang and
                  Andrew Williams},
  title        = {Predicting Infectiousness for Proactive Contact Tracing},
  journal      = {CoRR},
  volume       = {abs/2010.12536},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.12536},
  eprinttype    = {arXiv},
  eprint       = {2010.12536},
  timestamp    = {Tue, 26 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-12536.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% COVI-AgentSim is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2010-16004,
  author       = {Prateek Gupta and
                  Tegan Maharaj and
                  Martin Weiss and
                  Nasim Rahaman and
                  Hannah Alsdurf and
                  Abhinav Sharma and
                  Nanor Minoyan and
                  Soren Harnois{-}Leblanc and
                  Victor Schmidt and
                  Pierre{-}Luc St{-}Charles and
                  Tristan Deleu and
                  Andrew Williams and
                  Akshay Patel and
                  Meng Qu and
                  Olexa Bilaniuk and
                  Ga{\'{e}}tan Marceau Caron and
                  Pierre Luc Carrier and
                  Satya Ortiz{-}Gagn{\'{e}} and
                  Marc{-}Andre Rousseau and
                  David L. Buckeridge and
                  Joumana Ghosn and
                  Yang Zhang and
                  Bernhard Sch{\"{o}}lkopf and
                  Jian Tang and
                  Irina Rish and
                  Christopher Joseph Pal and
                  Joanna Merckx and
                  Eilif B. M{\"{u}}ller and
                  Yoshua Bengio},
  title        = {{COVI-AgentSim}: an Agent-based Model for Evaluating Methods of Digital
                  Contact Tracing},
  journal      = {CoRR},
  volume       = {abs/2010.16004},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.16004},
  eprinttype    = {arXiv},
  eprint       = {2010.16004},
  timestamp    = {Tue, 26 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-16004.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2011-09468,
  author     = {Mohammad Pezeshki and
                S{\'{e}}kou{-}Oumar Kaba and
                Yoshua Bengio and
                Aaron C. Courville and
                Doina Precup and
                Guillaume Lajoie},
  title      = {Gradient Starvation: {A} Learning Proclivity in Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2011.09468},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2011.09468},
  url        = {https://arxiv.org/abs/2011.09468},
  timestamp  = {Wed, 25 Nov 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-09468.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% RetroGNN is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2011-13042,
  author       = {Cheng{-}Hao Liu and
                  Maksym Korablyov and
                  Stanislaw Jastrzebski and
                  Pawel Wlodarczyk{-}Pruszynski and
                  Yoshua Bengio and
                  Marwin H. S. Segler},
  title        = {{RetroGNN}: Approximating Retrosynthesis by Graph Neural Networks for
                  De Novo Drug Design},
  journal      = {CoRR},
  volume       = {abs/2011.13042},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.13042},
  eprinttype    = {arXiv},
  eprint       = {2011.13042},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-13042.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2011-15091,
  author     = {Anirudh Goyal and
                Yoshua Bengio},
  title      = {Inductive Biases for Deep Learning of Higher-Level Cognition},
  journal    = {CoRR},
  volume     = {abs/2011.15091},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2011.15091},
  url        = {https://arxiv.org/abs/2011.15091},
  timestamp  = {Tue, 01 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-15091.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% The place name Hindu Kush Himalaya is brace-protected so sentence-casing
% styles do not lowercase it.
@article{DBLP:journals/corr/abs-2012-05013,
  author       = {Shimaa Baraka and
                  Benjamin Akera and
                  Bibek Aryal and
                  Tenzing Chogyal Sherpa and
                  Finu Shresta and
                  Anthony Ortiz and
                  Kris Sankaran and
                  Juan Lavista Ferres and
                  Mir Matin and
                  Yoshua Bengio},
  title        = {Machine Learning for Glacier Monitoring in the {Hindu Kush Himalaya}},
  journal      = {CoRR},
  volume       = {abs/2012.05013},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.05013},
  eprinttype    = {arXiv},
  eprint       = {2012.05013},
  timestamp    = {Tue, 15 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-05013.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The doi and url values are stored raw, without backslash-escaped underscores,
% so that verbatim/url-aware styles produce a working link.
@article{DBLP:journals/neco/ScellierB19,
  author       = {Benjamin Scellier and
                  Yoshua Bengio},
  title        = {Equivalence of Equilibrium Propagation and Recurrent Backpropagation},
  journal      = {Neural Comput.},
  volume       = {31},
  number       = {2},
  year         = {2019},
  url          = {https://doi.org/10.1162/neco_a_01160},
  doi          = {10.1162/NECO_A_01160},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/ScellierB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The doi and url values are stored raw, without backslash-escaped underscores,
% so that verbatim/url-aware styles produce a working link.
@article{DBLP:journals/neco/JingGPSTSB19,
  author       = {Li Jing and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  John Peurifoy and
                  Yichen Shen and
                  Max Tegmark and
                  Marin Soljacic and
                  Yoshua Bengio},
  title        = {Gated Orthogonal Recurrent Units: On Learning to Forget},
  journal      = {Neural Comput.},
  volume       = {31},
  number       = {4},
  year         = {2019},
  url          = {https://doi.org/10.1162/neco_a_01174},
  doi          = {10.1162/NECO_A_01174},
  timestamp    = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/JingGPSTSB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ResNets is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/nn/KawaguchiB19,
  author       = {Kenji Kawaguchi and
                  Yoshua Bengio},
  title        = {Depth with nonlinearity creates no bad local minima in {ResNets}},
  journal      = {Neural Networks},
  volume       = {118},
  pages        = {167--174},
  year         = {2019},
  url          = {https://doi.org/10.1016/j.neunet.2019.06.009},
  doi          = {10.1016/J.NEUNET.2019.06.009},
  timestamp    = {Sat, 30 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nn/KawaguchiB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/ChandarSVKB19,
  author     = {Sarath Chandar and
                Chinnadhurai Sankar and
                Eugene Vorontsov and
                Samira Ebrahimi Kahou and
                Yoshua Bengio},
  title      = {Towards Non-Saturating Recurrent Units for Modelling Long-Term Dependencies},
  booktitle  = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                2019, The Thirty-First Innovative Applications of Artificial Intelligence
                Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                USA, January 27 - February 1, 2019},
  pages      = {3280--3287},
  publisher  = {{AAAI} Press},
  year       = {2019},
  doi        = {10.1609/AAAI.V33I01.33013280},
  url        = {https://doi.org/10.1609/aaai.v33i01.33013280},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/ChandarSVKB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/Francois-LavetB19,
  author     = {Vincent Fran{\c{c}}ois{-}Lavet and
                Yoshua Bengio and
                Doina Precup and
                Joelle Pineau},
  title      = {Combined Reinforcement Learning via Abstract Representations},
  booktitle  = {The Thirty-Third {AAAI} Conference on Artificial Intelligence, {AAAI}
                2019, The Thirty-First Innovative Applications of Artificial Intelligence
                Conference, {IAAI} 2019, The Ninth {AAAI} Symposium on Educational
                Advances in Artificial Intelligence, {EAAI} 2019, Honolulu, Hawaii,
                USA, January 27 - February 1, 2019},
  pages      = {3582--3589},
  publisher  = {{AAAI} Press},
  year       = {2019},
  doi        = {10.1609/AAAI.V33I01.33013582},
  url        = {https://doi.org/10.1609/aaai.v33i01.33013582},
  timestamp  = {Tue, 02 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/aaai/Francois-LavetB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% The conference date range in booktitle is spaced evenly around the dash.
@inproceedings{DBLP:conf/acl/SankarSPCB19,
  author       = {Chinnadhurai Sankar and
                  Sandeep Subramanian and
                  Chris Pal and
                  Sarath Chandar and
                  Yoshua Bengio},
  editor       = {Anna Korhonen and
                  David R. Traum and
                  Llu{\'{\i}}s M{\`{a}}rquez},
  title        = {Do Neural Dialog Systems Use the Conversation History Effectively?
                  An Empirical Study},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {32--37},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1004},
  doi          = {10.18653/V1/P19-1004},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SankarSPCB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ccs/LambVKB19,
  author     = {Alex Lamb and
                Vikas Verma and
                Juho Kannala and
                Yoshua Bengio},
  editor     = {Lorenzo Cavallaro and
                Johannes Kinder and
                Sadia Afroz and
                Battista Biggio and
                Nicholas Carlini and
                Yuval Elovici and
                Asaf Shabtai},
  title      = {Interpolated Adversarial Training: Achieving Robust Neural Networks
                Without Sacrificing Too Much Accuracy},
  booktitle  = {Proceedings of the 12th {ACM} Workshop on Artificial Intelligence
                and Security, AISec@CCS 2019, London, UK, November 15, 2019},
  pages      = {95--103},
  publisher  = {{ACM}},
  year       = {2019},
  doi        = {10.1145/3338501.3357369},
  url        = {https://doi.org/10.1145/3338501.3357369},
  timestamp  = {Fri, 30 Dec 2022 23:08:56 +0100},
  biburl     = {https://dblp.org/rec/conf/ccs/LambVKB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/emnlp/YuanCFLPBT19,
  author     = {Xingdi Yuan and
                Marc{-}Alexandre C{\^{o}}t{\'{e}} and
                Jie Fu and
                Zhouhan Lin and
                Chris Pal and
                Yoshua Bengio and
                Adam Trischler},
  editor     = {Kentaro Inui and
                Jing Jiang and
                Vincent Ng and
                Xiaojun Wan},
  title      = {Interactive Language Learning by Question Answering},
  booktitle  = {Proceedings of the 2019 Conference on Empirical Methods in Natural
                Language Processing and the 9th International Joint Conference on
                Natural Language Processing, {EMNLP-IJCNLP} 2019, Hong Kong, China,
                November 3-7, 2019},
  pages      = {2796--2813},
  publisher  = {Association for Computational Linguistics},
  year       = {2019},
  doi        = {10.18653/V1/D19-1280},
  url        = {https://doi.org/10.18653/v1/D19-1280},
  timestamp  = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl     = {https://dblp.org/rec/conf/emnlp/YuanCFLPBT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/ThompsonSBW19,
  author     = {Jessica A. F. Thompson and
                Marc Sch{\"{o}}nwiesner and
                Yoshua Bengio and
                Daniel Willett},
  title      = {How Transferable Are Features in Convolutional Neural Network Acoustic
                Models across Languages?},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages      = {2827--2831},
  publisher  = {{IEEE}},
  year       = {2019},
  doi        = {10.1109/ICASSP.2019.8683043},
  url        = {https://doi.org/10.1109/ICASSP.2019.8683043},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/ThompsonSBW19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/YooSB19,
  author     = {Sanghyun Yoo and
                Inchul Song and
                Yoshua Bengio},
  title      = {A Highly Adaptive Acoustic Model for Accurate Multi-dialect Speech
                Recognition},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages      = {5716--5720},
  publisher  = {{IEEE}},
  year       = {2019},
  doi        = {10.1109/ICASSP.2019.8683705},
  url        = {https://doi.org/10.1109/ICASSP.2019.8683705},
  timestamp  = {Sun, 30 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/YooSB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/KastnerSBC19,
  author     = {Kyle Kastner and
                Jo{\~{a}}o Felipe Santos and
                Yoshua Bengio and
                Aaron C. Courville},
  title      = {Representation Mixing for {TTS} Synthesis},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages      = {5906--5910},
  publisher  = {{IEEE}},
  year       = {2019},
  doi        = {10.1109/ICASSP.2019.8682880},
  url        = {https://doi.org/10.1109/ICASSP.2019.8682880},
  timestamp  = {Sun, 30 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/KastnerSBC19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% The toolkit name PyTorch-Kaldi is brace-protected so sentence-casing styles
% keep its mixed capitalisation.
@inproceedings{DBLP:conf/icassp/RavanelliPB19,
  author       = {Mirco Ravanelli and
                  Titouan Parcollet and
                  Yoshua Bengio},
  title        = {The {PyTorch-Kaldi} Speech Recognition Toolkit},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech and Signal Processing,
                  {ICASSP} 2019, Brighton, United Kingdom, May 12-17, 2019},
  pages        = {6465--6469},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICASSP.2019.8683713},
  doi          = {10.1109/ICASSP.2019.8683713},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/RavanelliPB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccv/SiddiqueeZTFGBL19,
  author     = {Md Mahfuzur Rahman Siddiquee and
                Zongwei Zhou and
                Nima Tajbakhsh and
                Ruibin Feng and
                Michael B. Gotway and
                Yoshua Bengio and
                Jianming Liang},
  title      = {Learning Fixed Points in Generative Adversarial Networks: From Image-to-Image
                Translation to Disease Detection and Localization},
  booktitle  = {2019 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                2019, Seoul, Korea (South), October 27 - November 2, 2019},
  pages      = {191--200},
  publisher  = {{IEEE}},
  year       = {2019},
  doi        = {10.1109/ICCV.2019.00028},
  url        = {https://doi.org/10.1109/ICCV.2019.00028},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iccv/SiddiqueeZTFGBL19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iccv/El-NoubySSHAKBT19,
  author     = {Alaaeldin El{-}Nouby and
                Shikhar Sharma and
                Hannes Schulz and
                R. Devon Hjelm and
                Layla El Asri and
                Samira Ebrahimi Kahou and
                Yoshua Bengio and
                Graham W. Taylor},
  title      = {Tell, Draw, and Repeat: Generating and Modifying Images Based on Continual
                Linguistic Instruction},
  booktitle  = {2019 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
                2019, Seoul, Korea (South), October 27 - November 2, 2019},
  pages      = {10303--10311},
  publisher  = {{IEEE}},
  year       = {2019},
  doi        = {10.1109/ICCV.2019.01040},
  url        = {https://doi.org/10.1109/ICCV.2019.01040},
  timestamp  = {Wed, 02 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iccv/El-NoubySSHAKBT19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% BabyAI is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/iclr/Chevalier-Boisvert19,
  author       = {Maxime Chevalier{-}Boisvert and
                  Dzmitry Bahdanau and
                  Salem Lahlou and
                  Lucas Willems and
                  Chitwan Saharia and
                  Thien Huu Nguyen and
                  Yoshua Bengio},
  title        = {{BabyAI}: {A} Platform to Study the Sample Efficiency of Grounded Language
                  Learning},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=rJeXCo0cYX},
  timestamp    = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Chevalier-Boisvert19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/FarshchianGCBMS19,
  author     = {Ali Farshchian and
                Juan Alvaro Gallego and
                Joseph Paul Cohen and
                Yoshua Bengio and
                Lee E. Miller and
                Sara A. Solla},
  title      = {Adversarial Domain Adaptation for Stable Brain-Machine Interfaces},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=Hyx6Bi0qYm},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/FarshchianGCBMS19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/GoyalBFSLLLB19,
  author     = {Anirudh Goyal and
                Philemon Brakel and
                William Fedus and
                Soumye Singhal and
                Timothy P. Lillicrap and
                Sergey Levine and
                Hugo Larochelle and
                Yoshua Bengio},
  title      = {Recall Traces: Backtracking Models for Efficient Reinforcement Learning},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=HygsfnR9Ym},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/GoyalBFSLLLB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% InfoBot is brace-protected so sentence-casing styles keep its capitalisation.
@inproceedings{DBLP:conf/iclr/GoyalISALBBL19,
  author       = {Anirudh Goyal and
                  Riashat Islam and
                  Daniel Strouse and
                  Zafarali Ahmed and
                  Hugo Larochelle and
                  Matthew M. Botvinick and
                  Yoshua Bengio and
                  Sergey Levine},
  title        = {{InfoBot}: Transfer and Exploration via the Information Bottleneck},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=rJg8yhAqKm},
  timestamp    = {Wed, 20 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/GoyalISALBBL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/HjelmFLGBTB19,
  author     = {R. Devon Hjelm and
                Alex Fedorov and
                Samuel Lavoie{-}Marchildon and
                Karan Grewal and
                Philip Bachman and
                Adam Trischler and
                Yoshua Bengio},
  title      = {Learning deep representations by mutual information estimation and
                maximization},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=Bklr3j0cKX},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/HjelmFLGBTB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/JastrzebskiKBFB19,
  author     = {Stanislaw Jastrzebski and
                Zachary Kenton and
                Nicolas Ballas and
                Asja Fischer and
                Yoshua Bengio and
                Amos J. Storkey},
  title      = {On the Relation Between the Sharpest Directions of {DNN} Loss and
                the {SGD} Step Length},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=SkgEaj05t7},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/JastrzebskiKBFB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/KanuparthiAKKMB19,
  author     = {Bhargav Kanuparthi and
                Devansh Arpit and
                Giancarlo Kerg and
                Nan Rosemary Ke and
                Ioannis Mitliagkas and
                Yoshua Bengio},
  title      = {h-detach: Modifying the {LSTM} Gradient Towards Better Optimization},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=ryf7ioRqFX},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/KanuparthiAKKMB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/KeSTGBPB19,
  author     = {Nan Rosemary Ke and
                Amanpreet Singh and
                Ahmed Touati and
                Anirudh Goyal and
                Yoshua Bengio and
                Devi Parikh and
                Dhruv Batra},
  title      = {Modeling the Long Term Future in Model-Based Reinforcement Learning},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=SkgQBn0cF7},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/KeSTGBPB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/ParcolletRMLTMB19,
  author     = {Titouan Parcollet and
                Mirco Ravanelli and
                Mohamed Morchid and
                Georges Linar{\`{e}}s and
                Chiheb Trabelsi and
                Renato De Mori and
                Yoshua Bengio},
  title      = {Quaternion Recurrent Neural Networks},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=ByMHvs0cFQ},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ParcolletRMLTMB19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% The proper noun Monte Carlo is brace-protected so sentence-casing styles do
% not lowercase it.
@inproceedings{DBLP:conf/iclr/PicheTIBP19,
  author       = {Alexandre Pich{\'{e}} and
                  Valentin Thomas and
                  Cyril Ibrahim and
                  Yoshua Bengio and
                  Chris Pal},
  title        = {Probabilistic Planning with Sequential {Monte Carlo} methods},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=ByetGn0cYX},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/PicheTIBP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/TonevaSCTBG19,
  author     = {Mariya Toneva and
                Alessandro Sordoni and
                Remi Tachet des Combes and
                Adam Trischler and
                Yoshua Bengio and
                Geoffrey J. Gordon},
  title      = {An Empirical Study of Example Forgetting during Deep Neural Network
                Learning},
  booktitle  = {7th International Conference on Learning Representations, {ICLR} 2019,
                New Orleans, LA, USA, May 6-9, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=BJlxm30cKm},
  timestamp  = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/TonevaSCTBG19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2019 paper; names use the unambiguous "Last, First" form.
@inproceedings{DBLP:conf/iclr/VelickovicFHLBH19,
  author       = {Velickovic, Petar and
                  Fedus, William and
                  Hamilton, William L. and
                  Li{\`{o}}, Pietro and
                  Bengio, Yoshua and
                  Hjelm, R. Devon},
  title        = {Deep Graph Infomax},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=rklz9iAcKQ},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/VelickovicFHLBH19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2019 workshop paper (Deep Generative Models for Highly Structured Data);
% names use the unambiguous "Last, First" form.
@inproceedings{DBLP:conf/iclr/ZhangZLBP19,
  author       = {Zhang, Zijun and
                  Zhang, Ruixiang and
                  Li, Zongpeng and
                  Bengio, Yoshua and
                  Paull, Liam},
  title        = {Perceptual Generative Autoencoders},
  booktitle    = {Deep Generative Models for Highly Structured Data, {ICLR} 2019 Workshop,
                  New Orleans, Louisiana, United States, May 6, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=rkxkr8UKuN},
  timestamp    = {Thu, 25 Jul 2019 16:26:32 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ZhangZLBP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 paper (PMLR volume 97); author and editor names use the
% unambiguous "Last, First" form.
@inproceedings{DBLP:conf/icml/LambBGSMBM19,
  author       = {Lamb, Alex and
                  Binas, Jonathan and
                  Goyal, Anirudh and
                  Subramanian, Sandeep and
                  Mitliagkas, Ioannis and
                  Bengio, Yoshua and
                  Mozer, Michael},
  editor       = {Chaudhuri, Kamalika and
                  Salakhutdinov, Ruslan},
  title        = {State-Reification Networks: Improving Generalization by Modeling the
                  Distribution of Hidden Representations},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {3622--3631},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/lamb19a.html},
  timestamp    = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/LambBGSMBM19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 paper (PMLR volume 97). The proper noun "Markov" is brace-protected
% so sentence-casing styles keep its capital; names are in "Last, First" form.
@inproceedings{DBLP:conf/icml/QuBT19,
  author       = {Qu, Meng and
                  Bengio, Yoshua and
                  Tang, Jian},
  editor       = {Chaudhuri, Kamalika and
                  Salakhutdinov, Ruslan},
  title        = {{GMNN:} Graph {Markov} Neural Networks},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {5241--5250},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/qu19a.html},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/QuBT19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 paper (PMLR volume 97); author and editor names use the
% unambiguous "Last, First" form.
@inproceedings{DBLP:conf/icml/RahamanBADLHBC19,
  author       = {Rahaman, Nasim and
                  Baratin, Aristide and
                  Arpit, Devansh and
                  Draxler, Felix and
                  Lin, Min and
                  Hamprecht, Fred A. and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  editor       = {Chaudhuri, Kamalika and
                  Salakhutdinov, Ruslan},
  title        = {On the Spectral Bias of Neural Networks},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {5301--5310},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/rahaman19a.html},
  timestamp    = {Wed, 29 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/RahamanBADLHBC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2019 paper (PMLR volume 97); author and editor names use the
% unambiguous "Last, First" form.
@inproceedings{DBLP:conf/icml/VermaLBNMLB19,
  author       = {Verma, Vikas and
                  Lamb, Alex and
                  Beckham, Christopher and
                  Najafi, Amir and
                  Mitliagkas, Ioannis and
                  Lopez{-}Paz, David and
                  Bengio, Yoshua},
  editor       = {Chaudhuri, Kamalika and
                  Salakhutdinov, Ruslan},
  title        = {Manifold Mixup: Better Representations by Interpolating Hidden States},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {6438--6447},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/verma19a.html},
  timestamp    = {Fri, 05 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/VermaLBNMLB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICRA 2019 paper (IEEE); names use the unambiguous "Last, First" form.
@inproceedings{DBLP:conf/icra/BharadhwajWBP19,
  author       = {Bharadhwaj, Homanga and
                  Wang, Zihan and
                  Bengio, Yoshua and
                  Paull, Liam},
  title        = {A Data-Efficient Framework for Training and Sim-to-Real Transfer of
                  Navigation Policies},
  booktitle    = {International Conference on Robotics and Automation, {ICRA} 2019,
                  Montreal, QC, Canada, May 20-24, 2019},
  pages        = {782--788},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICRA.2019.8794310},
  doi          = {10.1109/ICRA.2019.8794310},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/BharadhwajWBP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% IJCAI 2019 paper; author and editor names use the unambiguous
% "Last, First" form.
@inproceedings{DBLP:conf/ijcai/VermaLKBL19,
  author       = {Verma, Vikas and
                  Lamb, Alex and
                  Kannala, Juho and
                  Bengio, Yoshua and
                  Lopez{-}Paz, David},
  editor       = {Kraus, Sarit},
  title        = {Interpolation Consistency Training for Semi-supervised Learning},
  booktitle    = {Proceedings of the Twenty-Eighth International Joint Conference on
                  Artificial Intelligence, {IJCAI} 2019, Macao, China, August 10-16,
                  2019},
  pages        = {3635--3641},
  publisher    = {ijcai.org},
  year         = {2019},
  url          = {https://doi.org/10.24963/ijcai.2019/504},
  doi          = {10.24963/IJCAI.2019/504},
  timestamp    = {Tue, 20 Aug 2019 16:18:18 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcai/VermaLKBL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2019 paper (ISCA); author and editor names use the unambiguous
% "Last, First" form.
@inproceedings{DBLP:conf/interspeech/PascualRSBB19,
  author       = {Pascual, Santiago and
                  Ravanelli, Mirco and
                  Serr{\`{a}}, Joan and
                  Bonafonte, Antonio and
                  Bengio, Yoshua},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {Learning Problem-Agnostic Speech Representations from Multiple Self-Supervised
                  Tasks},
  booktitle    = {Interspeech 2019, 20th Annual Conference of the International Speech
                  Communication Association, Graz, Austria, 15-19 September 2019},
  pages        = {161--165},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2605},
  doi          = {10.21437/INTERSPEECH.2019-2605},
  timestamp    = {Fri, 29 Jan 2021 17:41:10 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/PascualRSBB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2019 paper (ISCA); author and editor names use the unambiguous
% "Last, First" form, split exactly where BibTeX split the original strings.
@inproceedings{DBLP:conf/interspeech/LugoschRITB19,
  author       = {Lugosch, Loren and
                  Ravanelli, Mirco and
                  Ignoto, Patrick and
                  Tomar, Vikrant Singh and
                  Bengio, Yoshua},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {Speech Model Pre-Training for End-to-End Spoken Language Understanding},
  booktitle    = {Interspeech 2019, 20th Annual Conference of the International Speech
                  Communication Association, Graz, Austria, 15-19 September 2019},
  pages        = {814--818},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2396},
  doi          = {10.21437/INTERSPEECH.2019-2396},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/LugoschRITB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2019 paper (ISCA); author and editor names use the unambiguous
% "Last, First" form.
@inproceedings{DBLP:conf/interspeech/RavanelliB19,
  author       = {Ravanelli, Mirco and
                  Bengio, Yoshua},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {Learning Speaker Representations with Mutual Information},
  booktitle    = {Interspeech 2019, 20th Annual Conference of the International Speech
                  Communication Association, Graz, Austria, 15-19 September 2019},
  pages        = {1153--1157},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-2380},
  doi          = {10.21437/INTERSPEECH.2019-2380},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/RavanelliB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% MICCAI 2019 paper (LNCS 11769). The CamelCase name "InfoMask" is
% brace-protected so sentence-casing styles do not render it "Infomask";
% names are in "Last, First" form, split where BibTeX split the originals.
@inproceedings{DBLP:conf/miccai/TaghanakiHBDDHB19,
  author       = {Taghanaki, Saeid Asgari and
                  Havaei, Mohammad and
                  Berthier, Tess and
                  Dutil, Francis and
                  Di{-}Jorio, Lisa and
                  Hamarneh, Ghassan and
                  Bengio, Yoshua},
  editor       = {Shen, Dinggang and
                  Liu, Tianming and
                  Peters, Terry M. and
                  Staib, Lawrence H. and
                  Essert, Caroline and
                  Zhou, Sean and
                  Yap, Pew{-}Thian and
                  Khan, Ali R.},
  title        = {{InfoMask}: Masked Variational Latent Representation to Localize Chest
                  Disease},
  booktitle    = {Medical Image Computing and Computer Assisted Intervention - {MICCAI}
                  2019 - 22nd International Conference, Shenzhen, China, October 13-17,
                  2019, Proceedings, Part {VI}},
  series       = {Lecture Notes in Computer Science},
  volume       = {11769},
  pages        = {739--747},
  publisher    = {Springer},
  year         = {2019},
  url          = {https://doi.org/10.1007/978-3-030-32226-7\_82},
  doi          = {10.1007/978-3-030-32226-7\_82},
  timestamp    = {Mon, 19 Feb 2024 14:24:13 +0100},
  biburl       = {https://dblp.org/rec/conf/miccai/TaghanakiHBDDHB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper. The mixed-case acronym "NeurIPS" in booktitle is now
% brace-protected like the other venue acronyms in this file; names are in
% "Last, First" form.
@inproceedings{DBLP:conf/nips/BeckhamHVLGHBP19,
  author       = {Beckham, Christopher and
                  Honari, Sina and
                  Verma, Vikas and
                  Lamb, Alex and
                  Ghadiri, Farnoosh and
                  Hjelm, R. Devon and
                  Bengio, Yoshua and
                  Pal, Chris},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {On Adversarial Mixup Resynthesis},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {4348--4359},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/f708f064faaf32a43e4d3c784e6af9ea-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BeckhamHVLGHBP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper. The mixed-case acronym "NeurIPS" in booktitle is now
% brace-protected like the other venue acronyms in this file; names are in
% "Last, First" form.
@inproceedings{DBLP:conf/nips/ErnoultGQBS19,
  author       = {Ernoult, Maxence and
                  Grollier, Julie and
                  Querlioz, Damien and
                  Bengio, Yoshua and
                  Scellier, Benjamin},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {Updates of Equilibrium Prop Match Gradients of Backprop Through Time
                  in an {RNN} with Static Input},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {7079--7089},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/67974233917cea0e42a49a2fb7eb4cf4-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ErnoultGQBS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper. "Atari" (title) and "NeurIPS" (booktitle) are
% brace-protected so recasing styles keep their capitals; names are in
% "Last, First" form.
@inproceedings{DBLP:conf/nips/AnandROBCH19,
  author       = {Anand, Ankesh and
                  Racah, Evan and
                  Ozair, Sherjil and
                  Bengio, Yoshua and
                  C{\^{o}}t{\'{e}}, Marc{-}Alexandre and
                  Hjelm, R. Devon},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {Unsupervised State Representation Learning in {Atari}},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {8766--8779},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/6fb52e71b837628ac16539c1ff911667-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/AnandROBCH19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper. "WeightNorm" and "ResNets" (title) and "NeurIPS"
% (booktitle) are brace-protected so recasing styles keep their inner
% capitals; names are in "Last, First" form.
@inproceedings{DBLP:conf/nips/ArpitCB19,
  author       = {Arpit, Devansh and
                  Campos, V{\'{\i}}ctor and
                  Bengio, Yoshua},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {How to Initialize your Network? Robust Initialization for {WeightNorm}
                  {\&} {ResNets}},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {10900--10909},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/e520f70ac3930490458892665cda6620-Abstract.html},
  timestamp    = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ArpitCB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper. The mixed-case acronym "NeurIPS" in booktitle is now
% brace-protected like the other venue acronyms in this file; names are in
% "Last, First" form.
@inproceedings{DBLP:conf/nips/KimAB19,
  author       = {Kim, Taesup and
                  Ahn, Sungjin and
                  Bengio, Yoshua},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {Variational Temporal Abstraction},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {11566--11575},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/b5d3ad899f70013367f24e0b1fa75944-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/KimAB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper. The mixed-case acronym "NeurIPS" in booktitle is now
% brace-protected like the other venue acronyms in this file; names are in
% "Last, First" form. The title is stored in sentence case as received.
@inproceedings{DBLP:conf/nips/AljundiLGB19,
  author       = {Aljundi, Rahaf and
                  Lin, Min and
                  Goujaud, Baptiste and
                  Bengio, Yoshua},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {Gradient based sample selection for online continual learning},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {11816--11825},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/e562cd9c0768d5464b64cf61da7fc6bb-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/AljundiLGB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper. "nnRNN" (title) and "NeurIPS" (booktitle) are
% brace-protected so recasing styles keep their capitals; names are in
% "Last, First" form, split where BibTeX split the original strings.
@inproceedings{DBLP:conf/nips/KergGTGVBL19,
  author       = {Kerg, Giancarlo and
                  Goyette, Kyle and
                  Touzel, Maximilian Puelma and
                  Gidel, Gauthier and
                  Vorontsov, Eugene and
                  Bengio, Yoshua and
                  Lajoie, Guillaume},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {Non-normal Recurrent Neural Network ({nnRNN}): learning long time dependencies
                  while improving expressivity with transient dynamics},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {13591--13601},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/9d7099d87947faa8d07a272dd6954b80-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/KergGTGVBL19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper. "MelGAN" (title) and "NeurIPS" (booktitle) are
% brace-protected so recasing styles keep their inner capitals; names are in
% "Last, First" form with the lowercase particles kept as the von part.
@inproceedings{DBLP:conf/nips/KumarKBGTSBBC19,
  author       = {Kumar, Kundan and
                  Kumar, Rithesh and
                  de Boissiere, Thibault and
                  Gestin, Lucas and
                  Teoh, Wei Zhen and
                  Sotelo, Jose and
                  de Br{\'{e}}bisson, Alexandre and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {{MelGAN}: Generative Adversarial Networks for Conditional Waveform Synthesis},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {14881--14892},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/6804c9bca0a615bdb9374d00a9fcba59-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/KumarKBGTSBBC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2019 paper. The mixed-case acronym "NeurIPS" in booktitle is now
% brace-protected like the other venue acronyms in this file; names are in
% "Last, First" form with "van den" kept as the von part.
@inproceedings{DBLP:conf/nips/OzairLBOLS19,
  author       = {Ozair, Sherjil and
                  Lynch, Corey and
                  Bengio, Yoshua and
                  van den Oord, A{\"{a}}ron and
                  Levine, Sergey and
                  Sermanet, Pierre},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {Wasserstein Dependency Measure for Representation Learning},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, {NeurIPS} 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {15578--15588},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/f9209b7866c9f69823201c1732cc8645-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/OzairLBOLS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1901.03611 (CoRR). "ReLU" is brace-protected so sentence-casing
% styles keep its capitals; names are in "Last, First" form and the eprinttype
% line is realigned with the other fields.
@article{DBLP:journals/corr/abs-1901-03611,
  author       = {Arpit, Devansh and
                  Bengio, Yoshua},
  title        = {The Benefits of Over-parameterization at Initialization in Deep {ReLU}
                  Networks},
  journal      = {CoRR},
  volume       = {abs/1901.03611},
  year         = {2019},
  url          = {http://arxiv.org/abs/1901.03611},
  eprinttype   = {arXiv},
  eprint       = {1901.03611},
  timestamp    = {Sun, 03 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-03611.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1901.08508 (CoRR); names in "Last, First" form, eprinttype
% line realigned with the other fields.
@article{DBLP:journals/corr/abs-1901-08508,
  author       = {Kumar, Rithesh and
                  Goyal, Anirudh and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {Maximum Entropy Generators for Energy-Based Models},
  journal      = {CoRR},
  volume       = {abs/1901.08508},
  year         = {2019},
  url          = {http://arxiv.org/abs/1901.08508},
  eprinttype   = {arXiv},
  eprint       = {1901.08508},
  timestamp    = {Sat, 02 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-08508.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1901.10902 (CoRR). The CamelCase name "InfoBot" is
% brace-protected so sentence-casing styles do not render it "Infobot"; names
% are in "Last, First" form and the eprinttype line is realigned.
@article{DBLP:journals/corr/abs-1901-10902,
  author       = {Goyal, Anirudh and
                  Islam, Riashat and
                  Strouse, Daniel and
                  Ahmed, Zafarali and
                  Botvinick, Matthew M. and
                  Larochelle, Hugo and
                  Levine, Sergey and
                  Bengio, Yoshua},
  title        = {{InfoBot}: Transfer and Exploration via the Information Bottleneck},
  journal      = {CoRR},
  volume       = {abs/1901.10902},
  year         = {2019},
  url          = {http://arxiv.org/abs/1901.10902},
  eprinttype   = {arXiv},
  eprint       = {1901.10902},
  timestamp    = {Wed, 20 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-10902.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1901.10912 (CoRR); names in "Last, First" form (split where
% BibTeX split the original strings), eprinttype line realigned.
@article{DBLP:journals/corr/abs-1901-10912,
  author       = {Bengio, Yoshua and
                  Deleu, Tristan and
                  Rahaman, Nasim and
                  Ke, Nan Rosemary and
                  Lachapelle, S{\'{e}}bastien and
                  Bilaniuk, Olexa and
                  Goyal, Anirudh and
                  Pal, Christopher J.},
  title        = {A Meta-Transfer Objective for Learning to Disentangle Causal Mechanisms},
  journal      = {CoRR},
  volume       = {abs/1901.10912},
  year         = {2019},
  url          = {http://arxiv.org/abs/1901.10912},
  eprinttype   = {arXiv},
  eprint       = {1901.10912},
  timestamp    = {Sun, 03 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-10912.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1902.06704 (CoRR); names in "Last, First" form (split where
% BibTeX split the original strings), eprinttype line realigned.
@article{DBLP:journals/corr/abs-1902-06704,
  author       = {Chandar, Sarath and
                  Sankar, Chinnadhurai and
                  Vorontsov, Eugene and
                  Kahou, Samira Ebrahimi and
                  Bengio, Yoshua},
  title        = {Towards Non-saturating Recurrent Units for Modelling Long-term Dependencies},
  journal      = {CoRR},
  volume       = {abs/1902.06704},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.06704},
  eprinttype   = {arXiv},
  eprint       = {1902.06704},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-06704.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1902.06865 (CoRR); names in "Last, First" form, eprinttype
% line realigned with the other fields.
@article{DBLP:journals/corr/abs-1902-06865,
  author       = {Fedus, William and
                  Gelada, Carles and
                  Bengio, Yoshua and
                  Bellemare, Marc G. and
                  Larochelle, Hugo},
  title        = {Hyperbolic Discounting and Learning over Multiple Horizons},
  journal      = {CoRR},
  volume       = {abs/1902.06865},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.06865},
  eprinttype   = {arXiv},
  eprint       = {1902.06865},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-06865.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.01599 (CoRR); names in "Last, First" form (split where
% BibTeX split the original strings), eprinttype line realigned.
@article{DBLP:journals/corr/abs-1903-01599,
  author       = {Ke, Nan Rosemary and
                  Singh, Amanpreet and
                  Touati, Ahmed and
                  Goyal, Anirudh and
                  Bengio, Yoshua and
                  Parikh, Devi and
                  Batra, Dhruv},
  title        = {Learning Dynamics Model in Reinforcement Learning by Incorporating
                  the Long Term Future},
  journal      = {CoRR},
  volume       = {abs/1903.01599},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.01599},
  eprinttype   = {arXiv},
  eprint       = {1903.01599},
  timestamp    = {Tue, 02 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-01599.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.03825 (CoRR); names in "Last, First" form, eprinttype
% line realigned with the other fields.
@article{DBLP:journals/corr/abs-1903-03825,
  author       = {Verma, Vikas and
                  Lamb, Alex and
                  Kannala, Juho and
                  Bengio, Yoshua and
                  Lopez{-}Paz, David},
  title        = {Interpolation Consistency Training for Semi-Supervised Learning},
  journal      = {CoRR},
  volume       = {abs/1903.03825},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.03825},
  eprinttype   = {arXiv},
  eprint       = {1903.03825},
  timestamp    = {Tue, 02 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-03825.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.08671 (CoRR); names in "Last, First" form, eprinttype
% line realigned. The title is stored in sentence case as received.
@article{DBLP:journals/corr/abs-1903-08671,
  author       = {Aljundi, Rahaf and
                  Lin, Min and
                  Goujaud, Baptiste and
                  Bengio, Yoshua},
  title        = {Online continual learning with no task boundaries},
  journal      = {CoRR},
  volume       = {abs/1903.08671},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.08671},
  eprinttype   = {arXiv},
  eprint       = {1903.08671},
  timestamp    = {Mon, 01 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-08671.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.11741 (CoRR). The CamelCase name "InfoMask" is
% brace-protected so sentence-casing styles do not render it "Infomask"; names
% are in "Last, First" form and the eprinttype line is realigned.
@article{DBLP:journals/corr/abs-1903-11741,
  author       = {Taghanaki, Saeid Asgari and
                  Havaei, Mohammad and
                  Berthier, Tess and
                  Dutil, Francis and
                  Di{-}Jorio, Lisa and
                  Hamarneh, Ghassan and
                  Bengio, Yoshua},
  title        = {{InfoMask}: Masked Variational Latent Representation to Localize Chest
                  Disease},
  journal      = {CoRR},
  volume       = {abs/1903.11741},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.11741},
  eprinttype   = {arXiv},
  eprint       = {1903.11741},
  timestamp    = {Tue, 02 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-11741.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.11780 (CoRR); names in "Last, First" form with "van den"
% kept as the von part, eprinttype line realigned.
@article{DBLP:journals/corr/abs-1903-11780,
  author       = {Ozair, Sherjil and
                  Lynch, Corey and
                  Bengio, Yoshua and
                  van den Oord, A{\"{a}}ron and
                  Levine, Sergey and
                  Sermanet, Pierre},
  title        = {Wasserstein Dependency Measure for Representation Learning},
  journal      = {CoRR},
  volume       = {abs/1903.11780},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.11780},
  eprinttype   = {arXiv},
  eprint       = {1903.11780},
  timestamp    = {Tue, 02 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-11780.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1903.12262 (CoRR). The place name "Montreal" is
% brace-protected so sentence-casing styles keep its capital; names are in
% "Last, First" form and the eprinttype line is realigned.
@article{DBLP:journals/corr/abs-1903-12262,
  author       = {Benjamin, Misha and
                  Gagnon, Paul and
                  Rostamzadeh, Negar and
                  Pal, Chris and
                  Bengio, Yoshua and
                  Shee, Alex},
  title        = {Towards Standardization of Data Licenses: The {Montreal} Data License},
  journal      = {CoRR},
  volume       = {abs/1903.12262},
  year         = {2019},
  url          = {http://arxiv.org/abs/1903.12262},
  eprinttype   = {arXiv},
  eprint       = {1903.12262},
  timestamp    = {Tue, 02 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-12262.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1904.03416 (CoRR); names in "Last, First" form, eprinttype
% line realigned with the other fields.
@article{DBLP:journals/corr/abs-1904-03416,
  author       = {Pascual, Santiago and
                  Ravanelli, Mirco and
                  Serr{\`{a}}, Joan and
                  Bonafonte, Antonio and
                  Bengio, Yoshua},
  title        = {Learning Problem-agnostic Speech Representations from Multiple Self-supervised
                  Tasks},
  journal      = {CoRR},
  volume       = {abs/1904.03416},
  year         = {2019},
  url          = {http://arxiv.org/abs/1904.03416},
  eprinttype   = {arXiv},
  eprint       = {1904.03416},
  timestamp    = {Wed, 24 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-03416.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1904-03438,
  author       = {Zolna, Konrad and
                  Rostamzadeh, Negar and
                  Bengio, Yoshua and
                  Ahn, Sungjin and
                  Pinheiro, Pedro O.},
  title        = {Reinforced Imitation in Heterogeneous Action Space},
  journal      = {CoRR},
  volume       = {abs/1904.03438},
  year         = {2019},
  url          = {http://arxiv.org/abs/1904.03438},
  eprinttype   = {arXiv},
  eprint       = {1904.03438},
  timestamp    = {Wed, 24 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-03438.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1904-03670,
  author       = {Lugosch, Loren and
                  Ravanelli, Mirco and
                  Ignoto, Patrick and
                  Tomar, Vikrant Singh and
                  Bengio, Yoshua},
  title        = {Speech Model Pre-training for End-to-End Spoken Language Understanding},
  journal      = {CoRR},
  volume       = {abs/1904.03670},
  year         = {2019},
  url          = {http://arxiv.org/abs/1904.03670},
  eprinttype   = {arXiv},
  eprint       = {1904.03670},
  timestamp    = {Fri, 26 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-03670.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1904-07478,
  author       = {Simpson, Becks and
                  Dutil, Francis and
                  Bengio, Yoshua and
                  Cohen, Joseph Paul},
  title        = {{GradMask}: Reduce Overfitting by Regularizing Saliency},
  journal      = {CoRR},
  volume       = {abs/1904.07478},
  year         = {2019},
  url          = {http://arxiv.org/abs/1904.07478},
  eprinttype   = {arXiv},
  eprint       = {1904.07478},
  timestamp    = {Thu, 25 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-07478.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1904-09708,
  author       = {Russin, Jake and
                  Jo, Jason and
                  O'Reilly, Randall C. and
                  Bengio, Yoshua},
  title        = {Compositional generalization in a deep seq2seq model by separating
                  syntax and semantics},
  journal      = {CoRR},
  volume       = {abs/1904.09708},
  year         = {2019},
  url          = {http://arxiv.org/abs/1904.09708},
  eprinttype   = {arXiv},
  eprint       = {1904.09708},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-09708.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-03709,
  author       = {Schmidt, Victor and
                  Luccioni, Alexandra and
                  Mukkavilli, S. Karthik and
                  Balasooriya, Narmada and
                  Sankaran, Kris and
                  Chayes, Jennifer T. and
                  Bengio, Yoshua},
  title        = {Visualizing the Consequences of Climate Change Using Cycle-Consistent
                  Adversarial Networks},
  journal      = {CoRR},
  volume       = {abs/1905.03709},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.03709},
  eprinttype   = {arXiv},
  eprint       = {1905.03709},
  timestamp    = {Wed, 09 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-03709.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-06214,
  author       = {Qu, Meng and
                  Bengio, Yoshua and
                  Tang, Jian},
  title        = {{GMNN:} Graph {Markov} Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1905.06214},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.06214},
  eprinttype   = {arXiv},
  eprint       = {1905.06214},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-06214.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-09334,
  author       = {Binas, Jonathan and
                  Ozair, Sherjil and
                  Bengio, Yoshua},
  title        = {The Journey is the Reward: Unsupervised Learning of Influential Trajectories},
  journal      = {CoRR},
  volume       = {abs/1905.09334},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.09334},
  eprinttype   = {arXiv},
  eprint       = {1905.09334},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-09334.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-10437,
  author       = {Oreshkin, Boris N. and
                  Carpov, Dmitri and
                  Chapados, Nicolas and
                  Bengio, Yoshua},
  title        = {{N-BEATS:} Neural basis expansion analysis for interpretable time
                  series forecasting},
  journal      = {CoRR},
  volume       = {abs/1905.10437},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.10437},
  eprinttype   = {arXiv},
  eprint       = {1905.10437},
  timestamp    = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-10437.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-11382,
  author       = {Lamb, Alex and
                  Binas, Jonathan and
                  Goyal, Anirudh and
                  Subramanian, Sandeep and
                  Mitliagkas, Ioannis and
                  Kazakov, Denis and
                  Bengio, Yoshua and
                  Mozer, Michael C.},
  title        = {State-Reification Networks: Improving Generalization by Modeling the
                  Distribution of Hidden Representations},
  journal      = {CoRR},
  volume       = {abs/1905.11382},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.11382},
  eprinttype   = {arXiv},
  eprint       = {1905.11382},
  timestamp    = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-11382.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-12080,
  author       = {Kerg, Giancarlo and
                  Goyette, Kyle and
                  Touzel, Maximilian Puelma and
                  Gidel, Gauthier and
                  Vorontsov, Eugene and
                  Bengio, Yoshua and
                  Lajoie, Guillaume},
  title        = {Non-normal Recurrent Neural Network ({nnRNN}): learning long time dependencies
                  while improving expressivity with transient dynamics},
  journal      = {CoRR},
  volume       = {abs/1905.12080},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.12080},
  eprinttype   = {arXiv},
  eprint       = {1905.12080},
  timestamp    = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-12080.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-12300,
  author       = {Hacene, Ghouthi Boukli and
                  Lassance, Carlos Eduardo Rosar K{\'{o}}s and
                  Gripon, Vincent and
                  Courbariaux, Matthieu and
                  Bengio, Yoshua},
  title        = {Attention Based Pruning for Shift Networks},
  journal      = {CoRR},
  volume       = {abs/1905.12300},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.12300},
  eprinttype   = {arXiv},
  eprint       = {1905.12300},
  timestamp    = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-12300.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-13633,
  author       = {Ernoult, Maxence and
                  Grollier, Julie and
                  Querlioz, Damien and
                  Bengio, Yoshua and
                  Scellier, Benjamin},
  title        = {Updates of Equilibrium Prop Match Gradients of Backprop Through Time
                  in an {RNN} with Static Input},
  journal      = {CoRR},
  volume       = {abs/1905.13633},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.13633},
  eprinttype   = {arXiv},
  eprint       = {1905.13633},
  timestamp    = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-13633.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-01603,
  author       = {Sankar, Chinnadhurai and
                  Subramanian, Sandeep and
                  Pal, Christopher J. and
                  Chandar, Sarath and
                  Bengio, Yoshua},
  title        = {Do Neural Dialog Systems Use the Conversation History Effectively?
                  An Empirical Study},
  journal      = {CoRR},
  volume       = {abs/1906.01603},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.01603},
  eprinttype   = {arXiv},
  eprint       = {1906.01603},
  timestamp    = {Thu, 13 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-01603.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-02341,
  author       = {Arpit, Devansh and
                  Campos, Victor and
                  Bengio, Yoshua},
  title        = {How to Initialize your Network? Robust Initialization for {WeightNorm}
                  {\&} {ResNets}},
  journal      = {CoRR},
  volume       = {abs/1906.02341},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.02341},
  eprinttype   = {arXiv},
  eprint       = {1906.02341},
  timestamp    = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-02341.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-04355,
  author       = {Sodhani, Shagun and
                  Goyal, Anirudh and
                  Deleu, Tristan and
                  Bengio, Yoshua and
                  Levine, Sergey and
                  Tang, Jian},
  title        = {Learning Powerful Policies by Using Consistent Dynamics Model},
  journal      = {CoRR},
  volume       = {abs/1906.04355},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.04355},
  eprinttype   = {arXiv},
  eprint       = {1906.04355},
  timestamp    = {Wed, 20 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-04355.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-05433,
  author       = {Rolnick, David and
                  Donti, Priya L. and
                  Kaack, Lynn H. and
                  Kochanski, Kelly and
                  Lacoste, Alexandre and
                  Sankaran, Kris and
                  Ross, Andrew Slavin and
                  Milojevic{-}Dupont, Nikola and
                  Jaques, Natasha and
                  Waldman{-}Brown, Anna and
                  Luccioni, Alexandra and
                  Maharaj, Tegan and
                  Sherwin, Evan D. and
                  Mukkavilli, S. Karthik and
                  K{\"{o}}rding, Konrad P. and
                  Gomes, Carla P. and
                  Ng, Andrew Y. and
                  Hassabis, Demis and
                  Platt, John C. and
                  Creutzig, Felix and
                  Chayes, Jennifer T. and
                  Bengio, Yoshua},
  title        = {Tackling Climate Change with Machine Learning},
  journal      = {CoRR},
  volume       = {abs/1906.05433},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.05433},
  eprinttype   = {arXiv},
  eprint       = {1906.05433},
  timestamp    = {Wed, 09 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-05433.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-06635,
  author       = {Lin, Min and
                  Fu, Jie and
                  Bengio, Yoshua},
  title        = {Conditional Computation for Continual Learning},
  journal      = {CoRR},
  volume       = {abs/1906.06635},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.06635},
  eprinttype   = {arXiv},
  eprint       = {1906.06635},
  timestamp    = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-06635.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-06784,
  author       = {Lamb, Alex and
                  Verma, Vikas and
                  Kannala, Juho and
                  Bengio, Yoshua},
  title        = {Interpolated Adversarial Training: Achieving Robust Neural Networks
                  without Sacrificing Accuracy},
  journal      = {CoRR},
  volume       = {abs/1906.06784},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.06784},
  eprinttype   = {arXiv},
  eprint       = {1906.06784},
  timestamp    = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-06784.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-07774,
  author       = {Thomas, Valentin and
                  Pedregosa, Fabian and
                  van Merri{\"{e}}nboer, Bart and
                  Manzagol, Pierre{-}Antoine and
                  Bengio, Yoshua and
                  Le Roux, Nicolas},
  title        = {Information matrices and generalization},
  journal      = {CoRR},
  volume       = {abs/1906.07774},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.07774},
  eprinttype   = {arXiv},
  eprint       = {1906.07774},
  timestamp    = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-07774.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-08226,
  author       = {Anand, Ankesh and
                  Racah, Evan and
                  Ozair, Sherjil and
                  Bengio, Yoshua and
                  C{\^{o}}t{\'{e}}, Marc{-}Alexandre and
                  Hjelm, R. Devon},
  title        = {Unsupervised State Representation Learning in {Atari}},
  journal      = {CoRR},
  volume       = {abs/1906.08226},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.08226},
  eprinttype   = {arXiv},
  eprint       = {1906.08226},
  timestamp    = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-08226.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-10335,
  author       = {Zhang, Zijun and
                  Zhang, Ruixiang and
                  Li, Zongpeng and
                  Bengio, Yoshua and
                  Paull, Liam},
  title        = {Perceptual Generative Autoencoders},
  journal      = {CoRR},
  volume       = {abs/1906.10335},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.10335},
  eprinttype   = {arXiv},
  eprint       = {1906.10335},
  timestamp    = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-10335.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1906-10667,
  author       = {Goyal, Anirudh and
                  Sodhani, Shagun and
                  Binas, Jonathan and
                  Peng, Xue Bin and
                  Levine, Sergey and
                  Bengio, Yoshua},
  title        = {Reinforcement Learning with Competitive Ensembles of Information-Constrained
                  Primitives},
  journal      = {CoRR},
  volume       = {abs/1906.10667},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.10667},
  eprinttype   = {arXiv},
  eprint       = {1906.10667},
  timestamp    = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-10667.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1907-01285,
  author       = {Rahaman, Nasim and
                  Wolf, Steffen and
                  Goyal, Anirudh and
                  Remme, Roman and
                  Bengio, Yoshua},
  title        = {Learning the Arrow of Time},
  journal      = {CoRR},
  volume       = {abs/1907.01285},
  year         = {2019},
  url          = {http://arxiv.org/abs/1907.01285},
  eprinttype   = {arXiv},
  eprint       = {1907.01285},
  timestamp    = {Wed, 01 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-01285.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1907-03179,
  author       = {Qu, Meng and
                  Tang, Jian and
                  Bengio, Yoshua},
  title        = {Weakly-supervised Knowledge Graph Alignment with Adversarial Learning},
  journal      = {CoRR},
  volume       = {abs/1907.03179},
  year         = {2019},
  url          = {http://arxiv.org/abs/1907.03179},
  eprinttype   = {arXiv},
  eprint       = {1907.03179},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-03179.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1908-06965,
  author       = {Siddiquee, Md Mahfuzur Rahman and
                  Zhou, Zongwei and
                  Tajbakhsh, Nima and
                  Feng, Ruibin and
                  Gotway, Michael B. and
                  Bengio, Yoshua and
                  Liang, Jianming},
  title        = {Learning Fixed Points in Generative Adversarial Networks: From Image-to-Image
                  Translation to Disease Detection and Localization},
  journal      = {CoRR},
  volume       = {abs/1908.06965},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.06965},
  eprinttype   = {arXiv},
  eprint       = {1908.06965},
  timestamp    = {Mon, 26 Aug 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-06965.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1908-10909,
  author       = {Yuan, Xingdi and
                  C{\^{o}}t{\'{e}}, Marc{-}Alexandre and
                  Fu, Jie and
                  Lin, Zhouhan and
                  Pal, Christopher J. and
                  Bengio, Yoshua and
                  Trischler, Adam},
  title        = {Interactive Language Learning by Question Answering},
  journal      = {CoRR},
  volume       = {abs/1908.10909},
  year         = {2019},
  url          = {http://arxiv.org/abs/1908.10909},
  eprinttype   = {arXiv},
  eprint       = {1908.10909},
  timestamp    = {Wed, 04 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1908-10909.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-00949,
  author       = {Hoffmann, Jordan and
                  Maestrati, Louis and
                  Sawada, Yoshihide and
                  Tang, Jian and
                  Sellier, Jean Michel D. and
                  Bengio, Yoshua},
  title        = {Data-Driven Approach to Encoding and Decoding {3-D} Crystal Structures},
  journal      = {CoRR},
  volume       = {abs/1909.00949},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.00949},
  eprinttype   = {arXiv},
  eprint       = {1909.00949},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-00949.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-06576,
  author       = {Deleu, Tristan and
                  W{\"{u}}rfl, Tobias and
                  Samiei, Mandana and
                  Cohen, Joseph Paul and
                  Bengio, Yoshua},
  title        = {{Torchmeta}: {A} Meta-Learning library for {PyTorch}},
  journal      = {CoRR},
  volume       = {abs/1909.06576},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.06576},
  eprinttype   = {arXiv},
  eprint       = {1909.06576},
  timestamp    = {Mon, 23 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-06576.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-10893,
  author       = {Goyal, Anirudh and
                  Lamb, Alex and
                  Hoffmann, Jordan and
                  Sodhani, Shagun and
                  Levine, Sergey and
                  Bengio, Yoshua and
                  Sch{\"{o}}lkopf, Bernhard},
  title        = {Recurrent Independent Mechanisms},
  journal      = {CoRR},
  volume       = {abs/1909.10893},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.10893},
  eprinttype   = {arXiv},
  eprint       = {1909.10893},
  timestamp    = {Fri, 27 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-10893.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-11228,
  author       = {Venuto, David and
                  Boussioux, L{\'{e}}onard and
                  Wang, Junhao and
                  Dali, Rola and
                  Chakravorty, Jhelum and
                  Bengio, Yoshua and
                  Precup, Doina},
  title        = {Avoidance Learning Using Observational Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1909.11228},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.11228},
  eprinttype   = {arXiv},
  eprint       = {1909.11228},
  timestamp    = {Fri, 27 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-11228.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-11715,
  author       = {Verma, Vikas and
                  Qu, Meng and
                  Lamb, Alex and
                  Bengio, Yoshua and
                  Kannala, Juho and
                  Tang, Jian},
  title        = {{GraphMix}: Regularized Training of Graph Neural Networks for Semi-Supervised
                  Learning},
  journal      = {CoRR},
  volume       = {abs/1909.11715},
  year         = {2019},
  url          = {http://arxiv.org/abs/1909.11715},
  eprinttype   = {arXiv},
  eprint       = {1909.11715},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-11715.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-00199,
  author       = {Viviano, Joseph D. and
                  Simpson, Becks and
                  Dutil, Francis and
                  Bengio, Yoshua and
                  Cohen, Joseph Paul},
  title        = {Underwhelming Generalization Improvements From Controlling Feature
                  Attribution},
  journal      = {CoRR},
  volume       = {abs/1910.00199},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.00199},
  eprinttype   = {arXiv},
  eprint       = {1910.00199},
  timestamp    = {Fri, 04 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-00199.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-00775,
  author       = {Kim, Taesup and
                  Ahn, Sungjin and
                  Bengio, Yoshua},
  title        = {Variational Temporal Abstraction},
  journal      = {CoRR},
  volume       = {abs/1910.00775},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.00775},
  eprinttype   = {arXiv},
  eprint       = {1910.00775},
  timestamp    = {Fri, 04 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-00775.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-01075,
  author       = {Ke, Nan Rosemary and
                  Bilaniuk, Olexa and
                  Goyal, Anirudh and
                  Bauer, Stefan and
                  Larochelle, Hugo and
                  Pal, Chris and
                  Bengio, Yoshua},
  title        = {Learning Neural Causal Models from Unknown Interventions},
  journal      = {CoRR},
  volume       = {abs/1910.01075},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.01075},
  eprinttype   = {arXiv},
  eprint       = {1910.01075},
  timestamp    = {Fri, 04 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-01075.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-06711,
  author       = {Kumar, Kundan and
                  Kumar, Rithesh and
                  de Boissiere, Thibault and
                  Gestin, Lucas and
                  Teoh, Wei Zhen and
                  Sotelo, Jose and
                  de Br{\'{e}}bisson, Alexandre and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  title        = {{MelGAN}: Generative Adversarial Networks for Conditional Waveform Synthesis},
  journal      = {CoRR},
  volume       = {abs/1910.06711},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.06711},
  eprinttype   = {arXiv},
  eprint       = {1910.06711},
  timestamp    = {Wed, 16 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-06711.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-08922,
  author       = {Min, Yimeng and
                  Mukkavilli, S. Karthik and
                  Bengio, Yoshua},
  title        = {Predicting ice flow using machine learning},
  journal      = {CoRR},
  volume       = {abs/1910.08922},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.08922},
  eprinttype   = {arXiv},
  eprint       = {1910.08922},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-08922.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-09570,
  author       = {Tan, Shawn and
                  Androz, Guillaume and
                  Chamseddine, Ahmad and
                  Fecteau, Pierre and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Cohen, Joseph Paul},
  title        = {{Icentia11K}: An Unsupervised Representation Learning Dataset for Arrhythmia
                  Subtype Discovery},
  journal      = {CoRR},
  volume       = {abs/1910.09570},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.09570},
  eprinttype   = {arXiv},
  eprint       = {1910.09570},
  timestamp    = {Fri, 25 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-09570.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-10143,
  author       = {Zhou, Sharon and
                  Luccioni, Alexandra and
                  Cosne, Gautier and
                  Bernstein, Michael S. and
                  Bengio, Yoshua},
  title        = {Establishing an Evaluation Metric to Quantify Climate Change Image
                  Realism},
  journal      = {CoRR},
  volume       = {abs/1910.10143},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.10143},
  eprinttype   = {arXiv},
  eprint       = {1910.10143},
  timestamp    = {Fri, 25 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-10143.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-13540,
  author       = {Sinha, Samarth and
                  Zhang, Han and
                  Goyal, Anirudh and
                  Bengio, Yoshua and
                  Larochelle, Hugo and
                  Odena, Augustus},
  title        = {{Small-GAN}: Speeding Up {GAN} Training Using Core-sets},
  journal      = {CoRR},
  volume       = {abs/1910.13540},
  year         = {2019},
  url          = {http://arxiv.org/abs/1910.13540},
  eprinttype   = {arXiv},
  eprint       = {1910.13540},
  timestamp    = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-13540.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1911-07421,
  author       = {Che, Tong and
                  Liu, Xiaofeng and
                  Li, Site and
                  Ge, Yubin and
                  Zhang, Ruixiang and
                  Xiong, Caiming and
                  Bengio, Yoshua},
  title        = {Deep Verifier Networks: Verification of Deep Discriminative Models
                  with Deep Generative Models},
  journal      = {CoRR},
  volume       = {abs/1911.07421},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.07421},
  eprinttype   = {arXiv},
  eprint       = {1911.07421},
  timestamp    = {Fri, 14 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-07421.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1911-08585,
  author       = {Mesnard, Thomas and
                  Vignoud, Ga{\"{e}}tan and
                  Sacramento, Jo{\~{a}}o and
                  Senn, Walter and
                  Bengio, Yoshua},
  title        = {Ghost Units Yield Biologically Plausible Backprop in Deep Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1911.08585},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.08585},
  eprinttype   = {arXiv},
  eprint       = {1911.08585},
  timestamp    = {Wed, 04 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-08585.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-00444,
  author       = {Srinivasan, Anirudh and
                  Bahdanau, Dzmitry and
                  Chevalier{-}Boisvert, Maxime and
                  Bengio, Yoshua},
  title        = {Automated curriculum generation for Policy Gradients from Demonstrations},
  journal      = {CoRR},
  volume       = {abs/1912.00444},
  year         = {2019},
  url          = {http://arxiv.org/abs/1912.00444},
  eprinttype   = {arXiv},
  eprint       = {1912.00444},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-00444.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-00957,
  author       = {Gonzalez, Jessenia and
                  Bhowmick, Debjani and
                  Beltran, Cesar and
                  Sankaran, Kris and
                  Bengio, Yoshua},
  title        = {Applying Knowledge Transfer for Water Body Segmentation in {Peru}},
  journal      = {CoRR},
  volume       = {abs/1912.00957},
  year         = {2019},
  url          = {http://arxiv.org/abs/1912.00957},
  eprinttype   = {arXiv},
  eprint       = {1912.00957},
  timestamp    = {Tue, 07 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-00957.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-02260,
  author = {Thompson, Jessica A. F. and Bengio, Yoshua and
    Sch{\"{o}}nwiesner, Marc},
  title = {The effect of task and training on intermediate representations
    in convolutional neural networks revealed with modified {RV}
    similarity analysis},
  journal = {CoRR},
  volume = {abs/1912.02260},
  year = {2019},
  url = {http://arxiv.org/abs/1912.02260},
  eprinttype = {arXiv},
  eprint = {1912.02260},
  timestamp = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1912-02260.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-05783,
  author = {Bahdanau, Dzmitry and de Vries, Harm and
    O'Donnell, Timothy J. and Murty, Shikhar and
    Beaudoin, Philippe and Bengio, Yoshua and
    Courville, Aaron C.},
  title = {{CLOSURE:} Assessing Systematic Generalization of {CLEVR} Models},
  journal = {CoRR},
  volume = {abs/1912.05783},
  year = {2019},
  url = {http://arxiv.org/abs/1912.05783},
  eprinttype = {arXiv},
  eprint = {1912.05783},
  timestamp = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1912-05783.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-06994,
  author = {Yoo, ByungIn and Sylvain, Tristan and
    Bengio, Yoshua and Kim, Junmo},
  title = {Joint Learning of Generative Translator and Classifier
    for Visually Similar Classes},
  journal = {CoRR},
  volume = {abs/1912.06994},
  year = {2019},
  url = {http://arxiv.org/abs/1912.06994},
  eprinttype = {arXiv},
  eprint = {1912.06994},
  timestamp = {Fri, 03 Jan 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1912-06994.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-08112,
  author = {Bengio, Yoshua and Frejinger, Emma and Lodi, Andrea and
    Patel, Rahul and Sankaranarayanan, Sriram},
  title = {A learning-based algorithm to quickly compute good
    primal solutions for Stochastic Integer Programs},
  journal = {CoRR},
  volume = {abs/1912.08112},
  year = {2019},
  url = {http://arxiv.org/abs/1912.08112},
  eprinttype = {arXiv},
  eprint = {1912.08112},
  timestamp = {Wed, 08 Jan 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1912-08112.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-11945,
  author = {Luccioni, Alexandra and Bengio, Yoshua},
  title = {On the Morality of Artificial Intelligence},
  journal = {CoRR},
  volume = {abs/1912.11945},
  year = {2019},
  url = {http://arxiv.org/abs/1912.11945},
  eprinttype = {arXiv},
  eprint = {1912.11945},
  timestamp = {Fri, 03 Jan 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/corr/abs-1912-11945.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/bioinformatics/DerevyankoGBL18,
  author = {Derevyanko, Georgy and Grudinin, Sergei and
    Bengio, Yoshua and Lamoureux, Guillaume},
  title = {Deep convolutional networks for quality assessment of protein folds},
  journal = {Bioinform.},
  volume = {34},
  number = {23},
  pages = {4046--4053},
  year = {2018},
  url = {https://doi.org/10.1093/bioinformatics/bty494},
  doi = {10.1093/BIOINFORMATICS/BTY494},
  timestamp = {Sat, 30 May 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/bioinformatics/DerevyankoGBL18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijon/ChoiCB18,
  author = {Choi, Heeyoul and Cho, Kyunghyun and Bengio, Yoshua},
  title = {Fine-grained attention mechanism for neural machine translation},
  journal = {Neurocomputing},
  volume = {284},
  pages = {171--176},
  year = {2018},
  url = {https://doi.org/10.1016/j.neucom.2018.01.007},
  doi = {10.1016/J.NEUCOM.2018.01.007},
  timestamp = {Mon, 19 Mar 2018 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/ijon/ChoiCB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/mia/DrozdzalCVSDTRB18,
  author = {Drozdzal, Michal and Chartrand, Gabriel and
    Vorontsov, Eugene and Shakeri, Mahsa and
    Di{-}Jorio, Lisa and Tang, An and
    Romero, Adriana and Bengio, Yoshua and
    Pal, Chris and Kadoury, Samuel},
  title = {Learning normalized inputs for iterative estimation
    in medical image segmentation},
  journal = {Medical Image Anal.},
  volume = {44},
  pages = {1--13},
  year = {2018},
  url = {https://doi.org/10.1016/j.media.2017.11.005},
  doi = {10.1016/J.MEDIA.2017.11.005},
  timestamp = {Mon, 24 Feb 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/mia/DrozdzalCVSDTRB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Turing is brace-protected against sentence-casing styles.
% NOTE(review): page range 857--884 for Neural Computation 30(4) should be confirmed against the publisher record.
@article{DBLP:journals/neco/GulcehreCCB18,
  author       = {{\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Sarath Chandar and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {Dynamic Neural {Turing} Machine with Continuous and Discrete Addressing
                  Schemes},
  journal      = {Neural Comput.},
  volume       = {30},
  number       = {4},
  pages        = {857--884},
  year         = {2018},
  url          = {https://doi.org/10.1162/neco\_a\_01060},
  doi          = {10.1162/NECO\_A\_01060},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/GulcehreCCB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Chinese is brace-protected in the title so sentence-casing styles keep its capital.
@article{DBLP:journals/pami/ZhangYZLB18,
  author       = {Xu{-}Yao Zhang and
                  Fei Yin and
                  Yan{-}Ming Zhang and
                  Cheng{-}Lin Liu and
                  Yoshua Bengio},
  title        = {Drawing and Recognizing {Chinese} Characters with Recurrent Neural Network},
  journal      = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume       = {40},
  number       = {4},
  pages        = {849--862},
  year         = {2018},
  url          = {https://doi.org/10.1109/TPAMI.2017.2695539},
  doi          = {10.1109/TPAMI.2017.2695539},
  timestamp    = {Tue, 16 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/pami/ZhangYZLB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tetci/RavanelliBOB18,
  author = {Ravanelli, Mirco and Brakel, Philemon and
    Omologo, Maurizio and Bengio, Yoshua},
  title = {Light Gated Recurrent Units for Speech Recognition},
  journal = {{IEEE} Trans. Emerg. Top. Comput. Intell.},
  volume = {2},
  number = {2},
  pages = {92--102},
  year = {2018},
  url = {https://doi.org/10.1109/TETCI.2017.2762739},
  doi = {10.1109/TETCI.2017.2762739},
  timestamp = {Tue, 14 Jul 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/tetci/RavanelliBOB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Booktitle uses a single article before Thirty-Second (no doubled "the The").
@inproceedings{DBLP:conf/aaai/JingGPSTSB18,
  author       = {Li Jing and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  John Peurifoy and
                  Yichen Shen and
                  Max Tegmark and
                  Marin Soljacic and
                  Yoshua Bengio},
  title        = {Gated Orthogonal Recurrent Units: On Learning to Forget},
  booktitle    = {The Workshops of the Thirty-Second {AAAI} Conference on Artificial
                  Intelligence, New Orleans, Louisiana, USA, February 2-7, 2018},
  series       = {{AAAI} Technical Report},
  volume       = {{WS-18}},
  pages        = {720--726},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://aaai.org/ocs/index.php/WS/AAAIW18/paper/view/16901},
  timestamp    = {Mon, 04 Sep 2023 16:46:41 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/JingGPSTSB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SubramanianWYZT18,
  author = {Subramanian, Sandeep and Wang, Tong and
    Yuan, Xingdi and Zhang, Saizheng and
    Trischler, Adam and Bengio, Yoshua},
  editor = {Choi, Eunsol and Seo, Minjoon and Chen, Danqi and
    Jia, Robin and Berant, Jonathan},
  title = {Neural Models for Key Phrase Extraction and Question Generation},
  booktitle = {Proceedings of the Workshop on Machine Reading for
    Question Answering@ACL 2018, Melbourne, Australia, July 19, 2018},
  pages = {78--88},
  publisher = {Association for Computational Linguistics},
  year = {2018},
  url = {https://aclanthology.org/W18-2609/},
  doi = {10.18653/V1/W18-2609},
  timestamp = {Thu, 14 Dec 2023 18:03:42 +0100},
  biburl = {https://dblp.org/rec/conf/acl/SubramanianWYZT18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/BengioSCJLS18,
  author = {Shen, Yikang and Lin, Zhouhan and
    Jacob, Athul Paul and Sordoni, Alessandro and
    Courville, Aaron C. and Bengio, Yoshua},
  editor = {Gurevych, Iryna and Miyao, Yusuke},
  title = {Straight to the Tree: Constituency Parsing with Neural Syntactic Distance},
  booktitle = {Proceedings of the 56th Annual Meeting of the Association
    for Computational Linguistics, {ACL} 2018, Melbourne, Australia,
    July 15-20, 2018, Volume 1: Long Papers},
  pages = {1171--1180},
  publisher = {Association for Computational Linguistics},
  year = {2018},
  url = {https://aclanthology.org/P18-1108/},
  doi = {10.18653/V1/P18-1108},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/acl/BengioSCJLS18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/CasanovaCDRB18,
  author = {Casanova, Arantxa and Cucurull, Guillem and
    Drozdzal, Michal and Romero, Adriana and
    Bengio, Yoshua},
  title = {On the Iterative Refinement of Densely Connected
    Representation Levels for Semantic Segmentation},
  booktitle = {2018 {IEEE} Conference on Computer Vision and Pattern
    Recognition Workshops, {CVPR} Workshops 2018, Salt Lake City,
    UT, USA, June 18-22, 2018},
  pages = {978--987},
  publisher = {Computer Vision Foundation / {IEEE} Computer Society},
  year = {2018},
  url = {http://openaccess.thecvf.com/content\_cvpr\_2018\_workshops/w14/html/Casanova\_On\_the\_Iterative\_CVPR\_2018\_paper.html},
  doi = {10.1109/CVPRW.2018.00144},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/cvpr/CasanovaCDRB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% HotpotQA is brace-protected so sentence-casing styles do not render it as Hotpotqa.
@inproceedings{DBLP:conf/emnlp/Yang0ZBCSM18,
  author       = {Zhilin Yang and
                  Peng Qi and
                  Saizheng Zhang and
                  Yoshua Bengio and
                  William W. Cohen and
                  Ruslan Salakhutdinov and
                  Christopher D. Manning},
  editor       = {Ellen Riloff and
                  David Chiang and
                  Julia Hockenmaier and
                  Jun'ichi Tsujii},
  title        = {{HotpotQA}: {A} Dataset for Diverse, Explainable Multi-hop Question
                  Answering},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                  Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages        = {2369--2380},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1259},
  doi          = {10.18653/V1/D18-1259},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/Yang0ZBCSM18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icann/JastrzebskiKABF18,
  author = {Jastrzebski, Stanislaw and Kenton, Zachary and
    Arpit, Devansh and Ballas, Nicolas and
    Fischer, Asja and Bengio, Yoshua and
    Storkey, Amos J.},
  editor = {Kurkov{\'{a}}, Vera and Manolopoulos, Yannis and
    Hammer, Barbara and Iliadis, Lazaros S. and
    Maglogiannis, Ilias},
  title = {Width of Minima Reached by Stochastic Gradient Descent
    is Influenced by Learning Rate to Batch Size Ratio},
  booktitle = {Artificial Neural Networks and Machine Learning - {ICANN} 2018 -
    27th International Conference on Artificial Neural Networks,
    Rhodes, Greece, October 4-7, 2018, Proceedings, Part {III}},
  series = {Lecture Notes in Computer Science},
  volume = {11141},
  pages = {392--402},
  publisher = {Springer},
  year = {2018},
  url = {https://doi.org/10.1007/978-3-030-01424-7\_39},
  doi = {10.1007/978-3-030-01424-7\_39},
  timestamp = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icann/JastrzebskiKABF18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/MimilakisDSSVB18,
  author = {Mimilakis, Stylianos Ioannis and Drossos, Konstantinos and
    Santos, Jo{\~{a}}o Felipe and Schuller, Gerald and
    Virtanen, Tuomas and Bengio, Yoshua},
  title = {Monaural Singing Voice Separation with Skip-Filtering
    Connections and Recurrent Inference of Time-Frequency Mask},
  booktitle = {2018 {IEEE} International Conference on Acoustics,
    Speech and Signal Processing, {ICASSP} 2018, Calgary, AB, Canada,
    April 15-20, 2018},
  pages = {721--725},
  publisher = {{IEEE}},
  year = {2018},
  url = {https://doi.org/10.1109/ICASSP.2018.8461822},
  doi = {10.1109/ICASSP.2018.8461822},
  timestamp = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/icassp/MimilakisDSSVB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SongCKB18,
  author = {Song, Inchul and Chung, Junyoung and
    Kim, Taesup and Bengio, Yoshua},
  title = {Dynamic Frame Skipping for Fast Speech Recognition
    in Recurrent Neural Network Based Acoustic Models},
  booktitle = {2018 {IEEE} International Conference on Acoustics,
    Speech and Signal Processing, {ICASSP} 2018, Calgary, AB, Canada,
    April 15-20, 2018},
  pages = {4984--4988},
  publisher = {{IEEE}},
  year = {2018},
  url = {https://doi.org/10.1109/ICASSP.2018.8462615},
  doi = {10.1109/ICASSP.2018.8462615},
  timestamp = {Tue, 18 Sep 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icassp/SongCKB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/SerdyukWFKLB18,
  author = {Serdyuk, Dmitriy and Wang, Yongqiang and
    Fuegen, Christian and Kumar, Anuj and
    Liu, Baiyang and Bengio, Yoshua},
  title = {Towards End-to-end Spoken Language Understanding},
  booktitle = {2018 {IEEE} International Conference on Acoustics,
    Speech and Signal Processing, {ICASSP} 2018, Calgary, AB, Canada,
    April 15-20, 2018},
  pages = {5754--5758},
  publisher = {{IEEE}},
  year = {2018},
  url = {https://doi.org/10.1109/ICASSP.2018.8461785},
  doi = {10.1109/ICASSP.2018.8461785},
  timestamp = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/icassp/SerdyukWFKLB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% GANs is brace-protected so sentence-casing styles do not lowercase the acronym.
@inproceedings{DBLP:conf/iclr/HjelmJTCCB18,
  author       = {R. Devon Hjelm and
                  Athul Paul Jacob and
                  Adam Trischler and
                  Gerry Che and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {Boundary Seeking {GANs}},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=rkTS8lZAb},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/HjelmJTCCB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/JastrzebskiABVC18,
  author = {Jastrzebski, Stanislaw and Arpit, Devansh and
    Ballas, Nicolas and Verma, Vikas and
    Che, Tong and Bengio, Yoshua},
  title = {Residual Connections Encourage Iterative Inference},
  booktitle = {6th International Conference on Learning Representations,
    {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
    Conference Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=SJa9iHgAZ},
  timestamp = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/JastrzebskiABVC18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/JastrzebskiKABF18,
  author = {Jastrzebski, Stanislaw and Kenton, Zachary and
    Arpit, Devansh and Ballas, Nicolas and
    Fischer, Asja and Bengio, Yoshua and
    Storkey, Amos J.},
  title = {Finding Flatter Minima with {SGD}},
  booktitle = {6th International Conference on Learning Representations,
    {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
    Workshop Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=r1VF9dCUG},
  timestamp = {Thu, 04 Apr 2019 13:20:09 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/JastrzebskiKABF18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% FigureQA is brace-protected so sentence-casing styles do not render it as Figureqa.
@inproceedings{DBLP:conf/iclr/KahouMAKTB18,
  author       = {Samira Ebrahimi Kahou and
                  Vincent Michalski and
                  Adam Atkinson and
                  {\'{A}}kos K{\'{a}}d{\'{a}}r and
                  Adam Trischler and
                  Yoshua Bengio},
  title        = {{FigureQA}: An Annotated Figure Dataset for Visual Reasoning},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=H1mz0OyDz},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/KahouMAKTB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/MaWB18,
  author = {Ma, Chen and Wen, Junfeng and Bengio, Yoshua},
  title = {Universal Successor Representations for Transfer Reinforcement Learning},
  booktitle = {6th International Conference on Learning Representations,
    {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
    Workshop Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=HJ\_CpYyDz},
  timestamp = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/MaWB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ScellierGBMB18,
  author = {Scellier, Benjamin and Goyal, Anirudh and
    Binas, Jonathan and Mesnard, Thomas and
    Bengio, Yoshua},
  title = {Extending the Framework of Equilibrium Propagation to General Dynamics},
  booktitle = {6th International Conference on Learning Representations,
    {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
    Workshop Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=BJ5V4ICIG},
  timestamp = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/ScellierGBMB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/SerdyukKSTPB18,
  author = {Serdyuk, Dmitriy and Ke, Nan Rosemary and
    Sordoni, Alessandro and Trischler, Adam and
    Pal, Chris and Bengio, Yoshua},
  title = {Twin Networks: Matching the Future for Sequence Generation},
  booktitle = {6th International Conference on Learning Representations,
    {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
    Conference Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=BydLzGb0Z},
  timestamp = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/SerdyukKSTPB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ChatPainter is brace-protected so sentence-casing styles do not render it as Chatpainter.
@inproceedings{DBLP:conf/iclr/SharmaSMKB18,
  author       = {Shikhar Sharma and
                  Dendi Suhubdy and
                  Vincent Michalski and
                  Samira Ebrahimi Kahou and
                  Yoshua Bengio},
  title        = {{ChatPainter}: Improving Text to Image Generation using Dialogue},
  booktitle    = {6th International Conference on Learning Representations, {ICLR} 2018,
                  Vancouver, BC, Canada, April 30 - May 3, 2018, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2018},
  url          = {https://openreview.net/forum?id=rJsnEYJwG},
  timestamp    = {Wed, 02 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/SharmaSMKB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/SubramanianTBP18,
  author = {Subramanian, Sandeep and Trischler, Adam and
    Bengio, Yoshua and Pal, Christopher J.},
  title = {Learning General Purpose Distributed Sentence Representations
    via Large Scale Multi-task Learning},
  booktitle = {6th International Conference on Learning Representations,
    {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
    Conference Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=B18WgG-CZ},
  timestamp = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/SubramanianTBP18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/TrabelsiBZSSSMR18,
  author = {Trabelsi, Chiheb and Bilaniuk, Olexa and
    Zhang, Ying and Serdyuk, Dmitriy and
    Subramanian, Sandeep and Santos, Jo{\~{a}}o Felipe and
    Mehri, Soroush and Rostamzadeh, Negar and
    Bengio, Yoshua and Pal, Christopher J.},
  title = {Deep Complex Networks},
  booktitle = {6th International Conference on Learning Representations,
    {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
    Conference Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=H1T2hmZAb},
  timestamp = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/TrabelsiBZSSSMR18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/VelickovicCCRLB18,
  author = {Velickovic, Petar and Cucurull, Guillem and
    Casanova, Arantxa and Romero, Adriana and
    Li{\`{o}}, Pietro and Bengio, Yoshua},
  title = {Graph Attention Networks},
  booktitle = {6th International Conference on Learning Representations,
    {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
    Conference Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=rJXMpikCZ},
  timestamp = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/VelickovicCCRLB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ZolnaASB18,
  author = {Zolna, Konrad and Arpit, Devansh and
    Suhubdy, Dendi and Bengio, Yoshua},
  title = {Fraternal Dropout},
  booktitle = {6th International Conference on Learning Representations,
    {ICLR} 2018, Vancouver, BC, Canada, April 30 - May 3, 2018,
    Conference Track Proceedings},
  publisher = {OpenReview.net},
  year = {2018},
  url = {https://openreview.net/forum?id=SJyVzQ-C-},
  timestamp = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/iclr/ZolnaASB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/BelghaziBROBHC18,
  author = {Belghazi, Mohamed Ishmael and Baratin, Aristide and
    Rajeswar, Sai and Ozair, Sherjil and
    Bengio, Yoshua and Hjelm, R. Devon and
    Courville, Aaron C.},
  editor = {Dy, Jennifer G. and Krause, Andreas},
  title = {Mutual Information Neural Estimation},
  booktitle = {Proceedings of the 35th International Conference on
    Machine Learning, {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm,
    Sweden, July 10-15, 2018},
  series = {Proceedings of Machine Learning Research},
  volume = {80},
  pages = {530--539},
  publisher = {{PMLR}},
  year = {2018},
  url = {http://proceedings.mlr.press/v80/belghazi18a.html},
  timestamp = {Sat, 28 Sep 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icml/BelghaziBROBHC18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% RNNs is brace-protected so sentence-casing styles do not lowercase the acronym.
@inproceedings{DBLP:conf/icml/KeZSLTBPCP18,
  author       = {Nan Rosemary Ke and
                  Konrad Zolna and
                  Alessandro Sordoni and
                  Zhouhan Lin and
                  Adam Trischler and
                  Yoshua Bengio and
                  Joelle Pineau and
                  Laurent Charlin and
                  Christopher J. Pal},
  editor       = {Jennifer G. Dy and
                  Andreas Krause},
  title        = {Focused Hierarchical {RNNs} for Conditional Sequence Processing},
  booktitle    = {Proceedings of the 35th International Conference on Machine Learning,
                  {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                  10-15, 2018},
  series       = {Proceedings of Machine Learning Research},
  volume       = {80},
  pages        = {2559--2568},
  publisher    = {{PMLR}},
  year         = {2018},
  url          = {http://proceedings.mlr.press/v80/ke18a.html},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KeZSLTBPCP18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% MaD and TwinNet are brace-protected so sentence-casing styles keep the system name's mixed case.
@inproceedings{DBLP:conf/ijcnn/DrossosMSSVB18,
  author       = {Konstantinos Drossos and
                  Stylianos Ioannis Mimilakis and
                  Dmitriy Serdyuk and
                  Gerald Schuller and
                  Tuomas Virtanen and
                  Yoshua Bengio},
  title        = {{MaD} {TwinNet}: Masker-Denoiser Architecture with Twin Networks for
                  Monaural Sound Source Separation},
  booktitle    = {2018 International Joint Conference on Neural Networks, {IJCNN} 2018,
                  Rio de Janeiro, Brazil, July 8-13, 2018},
  pages        = {1--8},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/IJCNN.2018.8489565},
  doi          = {10.1109/IJCNN.2018.8489565},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcnn/DrossosMSSVB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ParcolletZMTLMB18,
  author = {Parcollet, Titouan and Zhang, Ying and
    Morchid, Mohamed and Trabelsi, Chiheb and
    Linar{\`{e}}s, Georges and de Mori, Renato and
    Bengio, Yoshua},
  editor = {Yegnanarayana, B.},
  title = {Quaternion Convolutional Neural Networks for End-to-End
    Automatic Speech Recognition},
  booktitle = {Interspeech 2018, 19th Annual Conference of the
    International Speech Communication Association, Hyderabad, India,
    2-6 September 2018},
  pages = {22--26},
  publisher = {{ISCA}},
  year = {2018},
  url = {https://doi.org/10.21437/Interspeech.2018-1898},
  doi = {10.21437/INTERSPEECH.2018-1898},
  timestamp = {Fri, 21 May 2021 08:16:43 +0200},
  biburl = {https://dblp.org/rec/conf/interspeech/ParcolletZMTLMB18.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Interspeech 2018 entry. DBLP:journals/corr/abs-1804-05374 lists the same authors
% and the same title apart from capitalization.
@inproceedings{DBLP:conf/interspeech/RavanelliSB18,
  author       = {Ravanelli, Mirco and
                  Serdyuk, Dmitriy and
                  Bengio, Yoshua},
  editor       = {Yegnanarayana, B.},
  title        = {Twin Regularization for Online Speech Recognition},
  booktitle    = {Interspeech 2018, 19th Annual Conference of the International Speech
                  Communication Association, Hyderabad, India, 2-6 September 2018},
  pages        = {3718--3722},
  publisher    = {{ISCA}},
  year         = {2018},
  url          = {https://doi.org/10.21437/Interspeech.2018-1407},
  doi          = {10.21437/INTERSPEECH.2018-1407},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/RavanelliSB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 entry. DBLP:journals/corr/abs-1805-09730 carries the same title and
% author list.
@inproceedings{DBLP:conf/nips/Gonzalez-Garcia18,
  author       = {Gonzalez{-}Garcia, Abel and
                  van de Weijer, Joost and
                  Bengio, Yoshua},
  editor       = {Bengio, Samy and
                  Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Grauman, Kristen and
                  Cesa{-}Bianchi, Nicol{\`{o}} and
                  Garnett, Roman},
  title        = {Image-to-image translation for cross-domain disentanglement},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, NeurIPS 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {1294--1305},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/dc6a70712a252123c40d2adba6a11d84-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/Gonzalez-Garcia18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "MetaGAN" is brace-protected so sentence-casing styles do not render it "Metagan".
@inproceedings{DBLP:conf/nips/ZhangCGBS18,
  author       = {Zhang, Ruixiang and
                  Che, Tong and
                  Ghahramani, Zoubin and
                  Bengio, Yoshua and
                  Song, Yangqiu},
  editor       = {Bengio, Samy and
                  Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Grauman, Kristen and
                  Cesa{-}Bianchi, Nicol{\`{o}} and
                  Garnett, Roman},
  title        = {{MetaGAN}: An Adversarial Approach to Few-Shot Learning},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, NeurIPS 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {2371--2380},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/4e4e53aa080247bc31d0eb4e7aeb07a0-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ZhangCGBS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2018 entry. DBLP:journals/corr/abs-1806-03836 has the same title and the
% same six authors, with the first two listed in the opposite order.
@inproceedings{DBLP:conf/nips/YoonKDKBA18,
  author       = {Yoon, Jaesik and
                  Kim, Taesup and
                  Dia, Ousmane and
                  Kim, Sungwoong and
                  Bengio, Yoshua and
                  Ahn, Sungjin},
  editor       = {Bengio, Samy and
                  Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Grauman, Kristen and
                  Cesa{-}Bianchi, Nicol{\`{o}} and
                  Garnett, Roman},
  title        = {Bayesian Model-Agnostic Meta-Learning},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, NeurIPS 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {7343--7353},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/e1021d43911ca2c1845910d84f40aeae-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YoonKDKBA18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/KeGBBMPB18,
  author       = {Ke, Nan Rosemary and
                  Goyal, Anirudh and
                  Bilaniuk, Olexa and
                  Binas, Jonathan and
                  Mozer, Michael C. and
                  Pal, Chris and
                  Bengio, Yoshua},
  editor       = {Bengio, Samy and
                  Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Grauman, Kristen and
                  Cesa{-}Bianchi, Nicol{\`{o}} and
                  Garnett, Roman},
  title        = {Sparse Attentive Backtracking: Temporal Credit Assignment Through
                  Reminding},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, NeurIPS 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {7651--7662},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/e16e74a63567ecb44ade5c87002bb1d9-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/KeGBBMPB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SacramentoCBS18,
  author       = {Sacramento, Jo{\~{a}}o and
                  Costa, Rui Ponte and
                  Bengio, Yoshua and
                  Senn, Walter},
  editor       = {Bengio, Samy and
                  Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Grauman, Kristen and
                  Cesa{-}Bianchi, Nicol{\`{o}} and
                  Garnett, Roman},
  title        = {Dendritic cortical microcircuits approximate the backpropagation algorithm},
  booktitle    = {Advances in Neural Information Processing Systems 31: Annual Conference
                  on Neural Information Processing Systems 2018, NeurIPS 2018, December
                  3-8, 2018, Montr{\'{e}}al, Canada},
  pages        = {8735--8746},
  year         = {2018},
  url          = {https://proceedings.neurips.cc/paper/2018/hash/1dc3a89d0d440ba31729b0ba74b93a33-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/SacramentoCBS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/rep4nlp/JacobLSB18,
  author       = {Jacob, Athul Paul and
                  Lin, Zhouhan and
                  Sordoni, Alessandro and
                  Bengio, Yoshua},
  editor       = {Augenstein, Isabelle and
                  Cao, Kris and
                  He, He and
                  Hill, Felix and
                  Gella, Spandana and
                  Kiros, Jamie and
                  Mei, Hongyuan and
                  Misra, Dipendra},
  title        = {Learning Hierarchical Structures On-The-Fly with a Recurrent-Recursive
                  Model for Sequences},
  booktitle    = {Proceedings of The Third Workshop on Representation Learning for NLP,
                  Rep4NLP@ACL 2018, Melbourne, Australia, July 20, 2018},
  pages        = {154--158},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/w18-3020},
  doi          = {10.18653/V1/W18-3020},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/rep4nlp/JacobLSB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "SincNet" is brace-protected so sentence-casing styles do not render it "sincnet".
@inproceedings{DBLP:conf/slt/RavanelliB18,
  author       = {Ravanelli, Mirco and
                  Bengio, Yoshua},
  title        = {Speaker Recognition from Raw Waveform with {SincNet}},
  booktitle    = {2018 {IEEE} Spoken Language Technology Workshop, {SLT} 2018, Athens,
                  Greece, December 18-21, 2018},
  pages        = {1021--1028},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/SLT.2018.8639585},
  doi          = {10.1109/SLT.2018.8639585},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/slt/RavanelliB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1801-00062,
  author       = {Sacramento, Jo{\~{a}}o and
                  Costa, Rui Ponte and
                  Bengio, Yoshua and
                  Senn, Walter},
  title        = {Dendritic error backpropagation in deep cortical microcircuits},
  journal      = {CoRR},
  volume       = {abs/1801.00062},
  year         = {2018},
  url          = {http://arxiv.org/abs/1801.00062},
  eprinttype   = {arXiv},
  eprint       = {1801.00062},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-00062.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "ObamaNet" is brace-protected: sentence-casing styles keep only the first letter of
% the title, so the unprotected word would render as "Obamanet".
@article{DBLP:journals/corr/abs-1801-01442,
  author       = {Kumar, Rithesh and
                  Sotelo, Jose and
                  Kumar, Kundan and
                  de Br{\'{e}}bisson, Alexandre and
                  Bengio, Yoshua},
  title        = {{ObamaNet}: Photo-realistic lip-sync from text},
  journal      = {CoRR},
  volume       = {abs/1801.01442},
  year         = {2018},
  url          = {http://arxiv.org/abs/1801.01442},
  eprinttype   = {arXiv},
  eprint       = {1801.01442},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-01442.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1801-04055,
  author       = {Erraqabi, Akram and
                  Baratin, Aristide and
                  Bengio, Yoshua and
                  Lacoste{-}Julien, Simon},
  title        = {{A3T:} Adversarially Augmented Adversarial Training},
  journal      = {CoRR},
  volume       = {abs/1801.04055},
  year         = {2018},
  url          = {http://arxiv.org/abs/1801.04055},
  eprinttype   = {arXiv},
  eprint       = {1801.04055},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-04055.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1801-06700,
  author       = {Serban, Iulian Vlad and
                  Sankar, Chinnadhurai and
                  Germain, Mathieu and
                  Zhang, Saizheng and
                  Lin, Zhouhan and
                  Subramanian, Sandeep and
                  Kim, Taesup and
                  Pieper, Michael and
                  Chandar, Sarath and
                  Ke, Nan Rosemary and
                  Rajeswar, Sai and
                  de Br{\'{e}}bisson, Alexandre and
                  Sotelo, Jose M. R. and
                  Suhubdy, Dendi and
                  Michalski, Vincent and
                  Nguyen, Alexandre and
                  Pineau, Joelle and
                  Bengio, Yoshua},
  title        = {A Deep Reinforcement Learning Chatbot (Short Version)},
  journal      = {CoRR},
  volume       = {abs/1801.06700},
  year         = {2018},
  url          = {http://arxiv.org/abs/1801.06700},
  eprinttype   = {arXiv},
  eprint       = {1801.06700},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-06700.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) entry. DBLP:conf/ijcnn/DrossosMSSVB18 carries the same title and
% author list.
% "MaD" and "TwinNet" are brace-protected so sentence-casing styles keep their capitals.
@article{DBLP:journals/corr/abs-1802-00300,
  author       = {Drossos, Konstantinos and
                  Mimilakis, Stylianos Ioannis and
                  Serdyuk, Dmitriy and
                  Schuller, Gerald and
                  Virtanen, Tuomas and
                  Bengio, Yoshua},
  title        = {{MaD} {TwinNet}: Masker-Denoiser Architecture with Twin Networks for Monaural
                  Sound Source Separation},
  journal      = {CoRR},
  volume       = {abs/1802.00300},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.00300},
  eprinttype   = {arXiv},
  eprint       = {1802.00300},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-00300.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-07426,
  author       = {Kawaguchi, Kenji and
                  Bengio, Yoshua},
  title        = {Generalization in Machine Learning via Analytical Learning Theory},
  journal      = {CoRR},
  volume       = {abs/1802.07426},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.07426},
  eprinttype   = {arXiv},
  eprint       = {1802.07426},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-07426.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "ChatPainter" is brace-protected: sentence-casing styles keep only the first letter
% of the title, so the unprotected word would render as "Chatpainter".
@article{DBLP:journals/corr/abs-1802-08216,
  author       = {Sharma, Shikhar and
                  Suhubdy, Dendi and
                  Michalski, Vincent and
                  Kahou, Samira Ebrahimi and
                  Bengio, Yoshua},
  title        = {{ChatPainter}: Improving Text to Image Generation using Dialogue},
  journal      = {CoRR},
  volume       = {abs/1802.08216},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.08216},
  eprinttype   = {arXiv},
  eprint       = {1802.08216},
  timestamp    = {Wed, 02 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-08216.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-08395,
  author       = {Serdyuk, Dmitriy and
                  Wang, Yongqiang and
                  Fuegen, Christian and
                  Kumar, Anuj and
                  Liu, Baiyang and
                  Bengio, Yoshua},
  title        = {Towards end-to-end spoken language understanding},
  journal      = {CoRR},
  volume       = {abs/1802.08395},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.08395},
  eprinttype   = {arXiv},
  eprint       = {1802.08395},
  timestamp    = {Wed, 02 Nov 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-08395.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-08770,
  author       = {Xing, Chen and
                  Arpit, Devansh and
                  Tsirigotis, Christos and
                  Bengio, Yoshua},
  title        = {A Walk with {SGD}},
  journal      = {CoRR},
  volume       = {abs/1802.08770},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.08770},
  eprinttype   = {arXiv},
  eprint       = {1802.08770},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-08770.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-09386,
  author       = {Feutry, Cl{\'{e}}ment and
                  Piantanida, Pablo and
                  Bengio, Yoshua and
                  Duhamel, Pierre},
  title        = {Learning Anonymized Representations with Adversarial Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1802.09386},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.09386},
  eprinttype   = {arXiv},
  eprint       = {1802.09386},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-09386.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-09484,
  author       = {Thomas, Valentin and
                  Bengio, Emmanuel and
                  Fedus, William and
                  Pondard, Jules and
                  Beaudoin, Philippe and
                  Larochelle, Hugo and
                  Pineau, Joelle and
                  Precup, Doina and
                  Bengio, Yoshua},
  title        = {Disentangling the independently controllable factors of variation
                  by interacting with the world},
  journal      = {CoRR},
  volume       = {abs/1802.09484},
  year         = {2018},
  url          = {http://arxiv.org/abs/1802.09484},
  eprinttype   = {arXiv},
  eprint       = {1802.09484},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-09484.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1803-10225,
  author       = {Ravanelli, Mirco and
                  Brakel, Philemon and
                  Omologo, Maurizio and
                  Bengio, Yoshua},
  title        = {Light Gated Recurrent Units for Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1803.10225},
  year         = {2018},
  url          = {http://arxiv.org/abs/1803.10225},
  eprinttype   = {arXiv},
  eprint       = {1803.10225},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1803-10225.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1803-11407,
  author       = {Choi, Heeyoul and
                  Cho, Kyunghyun and
                  Bengio, Yoshua},
  title        = {Fine-Grained Attention Mechanism for Neural Machine Translation},
  journal      = {CoRR},
  volume       = {abs/1803.11407},
  year         = {2018},
  url          = {http://arxiv.org/abs/1803.11407},
  eprinttype   = {arXiv},
  eprint       = {1803.11407},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1803-11407.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-00079,
  author       = {Subramanian, Sandeep and
                  Trischler, Adam and
                  Bengio, Yoshua and
                  Pal, Christopher J.},
  title        = {Learning General Purpose Distributed Sentence Representations via
                  Large Scale Multi-task Learning},
  journal      = {CoRR},
  volume       = {abs/1804.00079},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.00079},
  eprinttype   = {arXiv},
  eprint       = {1804.00079},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-00079.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-00379,
  author       = {Goyal, Anirudh and
                  Brakel, Philemon and
                  Fedus, William and
                  Lillicrap, Timothy P. and
                  Levine, Sergey and
                  Larochelle, Hugo and
                  Bengio, Yoshua},
  title        = {Recall Traces: Backtracking Models for Efficient Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1804.00379},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.00379},
  eprinttype   = {arXiv},
  eprint       = {1804.00379},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-00379.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-02485,
  author       = {Lamb, Alex and
                  Binas, Jonathan and
                  Goyal, Anirudh and
                  Serdyuk, Dmitriy and
                  Subramanian, Sandeep and
                  Mitliagkas, Ioannis and
                  Bengio, Yoshua},
  title        = {Fortified Networks: Improving the Robustness of Deep Networks by Modeling
                  the Manifold of Hidden Representations},
  journal      = {CoRR},
  volume       = {abs/1804.02485},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.02485},
  eprinttype   = {arXiv},
  eprint       = {1804.02485},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-02485.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-03758,
  author       = {Ma, Chen and
                  Wen, Junfeng and
                  Bengio, Yoshua},
  title        = {Universal Successor Representations for Transfer Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1804.03758},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.03758},
  eprinttype   = {arXiv},
  eprint       = {1804.03758},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-03758.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) entry. DBLP:conf/interspeech/RavanelliSB18 lists the same authors and
% the same title apart from capitalization.
@article{DBLP:journals/corr/abs-1804-05374,
  author       = {Ravanelli, Mirco and
                  Serdyuk, Dmitriy and
                  Bengio, Yoshua},
  title        = {Twin Regularization for online speech recognition},
  journal      = {CoRR},
  volume       = {abs/1804.05374},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.05374},
  eprinttype   = {arXiv},
  eprint       = {1804.05374},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-05374.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-09259,
  author       = {Jastrzebski, Stanislaw and
                  Bahdanau, Dzmitry and
                  Hosseini, Seyedarian and
                  Noukhovitch, Michael and
                  Bengio, Yoshua and
                  Cheung, Jackie Chi Kit},
  title        = {Commonsense mining as knowledge base completion? {A} study on the
                  impact of novelty},
  journal      = {CoRR},
  volume       = {abs/1804.09259},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.09259},
  eprinttype   = {arXiv},
  eprint       = {1804.09259},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-09259.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-10727,
  author       = {Binas, Jonathan and
                  Bengio, Yoshua},
  title        = {Low-memory convolutional neural networks through incremental depth-first
                  processing},
  journal      = {CoRR},
  volume       = {abs/1804.10727},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.10727},
  eprinttype   = {arXiv},
  eprint       = {1804.10727},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-10727.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-11332,
  author       = {Casanova, Arantxa and
                  Cucurull, Guillem and
                  Drozdzal, Michal and
                  Romero, Adriana and
                  Bengio, Yoshua},
  title        = {On the iterative refinement of densely connected representation levels
                  for semantic segmentation},
  journal      = {CoRR},
  volume       = {abs/1804.11332},
  year         = {2018},
  url          = {http://arxiv.org/abs/1804.11332},
  eprinttype   = {arXiv},
  eprint       = {1804.11332},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-11332.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) entry. DBLP:conf/nips/Gonzalez-Garcia18 carries the same title and
% author list.
@article{DBLP:journals/corr/abs-1805-09730,
  author       = {Gonzalez{-}Garcia, Abel and
                  van de Weijer, Joost and
                  Bengio, Yoshua},
  title        = {Image-to-image translation for cross-domain disentanglement},
  journal      = {CoRR},
  volume       = {abs/1805.09730},
  year         = {2018},
  url          = {http://arxiv.org/abs/1805.09730},
  eprinttype   = {arXiv},
  eprint       = {1805.09730},
  timestamp    = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-09730.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-01984,
  author       = {Luck, Margaux and
                  Sylvain, Tristan and
                  Cohen, Joseph Paul and
                  Cardinal, H{\'{e}}lo{\"{\i}}se and
                  Lodi, Andrea and
                  Bengio, Yoshua},
  title        = {Learning to rank for censored survival data},
  journal      = {CoRR},
  volume       = {abs/1806.01984},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.01984},
  eprinttype   = {arXiv},
  eprint       = {1806.01984},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-01984.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) entry. DBLP:conf/nips/YoonKDKBA18 has the same title and the same six
% authors, with the first two listed in the opposite order.
@article{DBLP:journals/corr/abs-1806-03836,
  author       = {Kim, Taesup and
                  Yoon, Jaesik and
                  Dia, Ousmane and
                  Kim, Sungwoong and
                  Bengio, Yoshua and
                  Ahn, Sungjin},
  title        = {Bayesian Model-Agnostic Meta-Learning},
  journal      = {CoRR},
  volume       = {abs/1806.03836},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.03836},
  eprinttype   = {arXiv},
  eprint       = {1806.03836},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-03836.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-04168,
  author       = {Shen, Yikang and
                  Lin, Zhouhan and
                  Jacob, Athul Paul and
                  Sordoni, Alessandro and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {Straight to the Tree: Constituency Parsing with Neural Syntactic Distance},
  journal      = {CoRR},
  volume       = {abs/1806.04168},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.04168},
  eprinttype   = {arXiv},
  eprint       = {1806.04168},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-04168.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The acronym "RNNs" is brace-protected so sentence-casing styles do not render it "rnns".
@article{DBLP:journals/corr/abs-1806-04342,
  author       = {Ke, Nan Rosemary and
                  Zolna, Konrad and
                  Sordoni, Alessandro and
                  Lin, Zhouhan and
                  Trischler, Adam and
                  Bengio, Yoshua and
                  Pineau, Joelle and
                  Charlin, Laurent and
                  Pal, Chris},
  title        = {Focused Hierarchical {RNNs} for Conditional Sequence Processing},
  journal      = {CoRR},
  volume       = {abs/1806.04342},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.04342},
  eprinttype   = {arXiv},
  eprint       = {1806.04342},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-04342.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "De Mori" is given in comma form: written as "Renato De Mori", BibTeX would take
% only "Mori" as the last name and treat "De" as a second given name.
@article{DBLP:journals/corr/abs-1806-04418,
  author       = {Parcollet, Titouan and
                  Ravanelli, Mirco and
                  Morchid, Mohamed and
                  Linar{\`{e}}s, Georges and
                  Trabelsi, Chiheb and
                  De Mori, Renato and
                  Bengio, Yoshua},
  title        = {Quaternion Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1806.04418},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.04418},
  eprinttype   = {arXiv},
  eprint       = {1806.04418},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-04418.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-05236,
  author       = {Verma, Vikas and
                  Lamb, Alex and
                  Beckham, Christopher and
                  Courville, Aaron C. and
                  Mitliagkas, Ioannis and
                  Bengio, Yoshua},
  title        = {Manifold Mixup: Encouraging Meaningful On-Manifold Interpolation as
                  a Regularizer},
  journal      = {CoRR},
  volume       = {abs/1806.05236},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.05236},
  eprinttype   = {arXiv},
  eprint       = {1806.05236},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-05236.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-06765,
  author       = {Jo, Jason and
                  Verma, Vikas and
                  Bengio, Yoshua},
  title        = {Modularity Matters: Learning Invariant Relational Reasoning Tasks},
  journal      = {CoRR},
  volume       = {abs/1806.06765},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.06765},
  eprinttype   = {arXiv},
  eprint       = {1806.06765},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-06765.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-06975,
  author       = {Dutil, Francis and
                  Cohen, Joseph Paul and
                  Weiss, Martin and
                  Derevyanko, Georgy and
                  Bengio, Yoshua},
  title        = {Towards Gene Expression Convolutions using Gene Interaction Graphs},
  journal      = {CoRR},
  volume       = {abs/1806.06975},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.06975},
  eprinttype   = {arXiv},
  eprint       = {1806.06975},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-06975.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) entry. DBLP:conf/interspeech/ParcolletZMTLMB18 has the same title and
% author list.
% "De Mori" is given in comma form: written as "Renato De Mori", BibTeX would take
% only "Mori" as the last name and treat "De" as a second given name.
@article{DBLP:journals/corr/abs-1806-07789,
  author       = {Parcollet, Titouan and
                  Zhang, Ying and
                  Morchid, Mohamed and
                  Trabelsi, Chiheb and
                  Linar{\`{e}}s, Georges and
                  De Mori, Renato and
                  Bengio, Yoshua},
  title        = {Quaternion Convolutional Neural Networks for End-to-End Automatic
                  Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1806.07789},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.07789},
  eprinttype   = {arXiv},
  eprint       = {1806.07789},
  timestamp    = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-07789.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1806-08734,
  author       = {Rahaman, Nasim and
                  Arpit, Devansh and
                  Baratin, Aristide and
                  Draxler, Felix and
                  Lin, Min and
                  Hamprecht, Fred A. and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  title        = {On the Spectral Bias of Deep Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1806.08734},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.08734},
  eprinttype   = {arXiv},
  eprint       = {1806.08734},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-08734.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-04723,
  author       = {Serban, Iulian Vlad and
                  Sankar, Chinnadhurai and
                  Pieper, Michael and
                  Pineau, Joelle and
                  Bengio, Yoshua},
  title        = {The Bottleneck Simulator: {A} Model-based Deep Reinforcement Learning
                  Approach},
  journal      = {CoRR},
  volume       = {abs/1807.04723},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.04723},
  eprinttype   = {arXiv},
  eprint       = {1807.04723},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-04723.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The acronym DNN is brace-protected so sentence-casing styles do not render it as "Dnn's".
@article{DBLP:journals/corr/abs-1807-05031,
  author       = {Jastrzebski, Stanislaw and
                  Kenton, Zachary and
                  Ballas, Nicolas and
                  Fischer, Asja and
                  Bengio, Yoshua and
                  Storkey, Amos J.},
  title        = {{DNN}'s Sharpest Directions Along the {SGD} Trajectory},
  journal      = {CoRR},
  volume       = {abs/1807.05031},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.05031},
  eprinttype   = {arXiv},
  eprint       = {1807.05031},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-05031.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1807-11876,
  author       = {Larsen, Eric and
                  Lachapelle, S{\'{e}}bastien and
                  Bengio, Yoshua and
                  Frejinger, Emma and
                  Lacoste{-}Julien, Simon and
                  Lodi, Andrea},
  title        = {Predicting Solution Summaries to Integer Linear Programs under Imperfect
                  Information with Machine Learning},
  journal      = {CoRR},
  volume       = {abs/1807.11876},
  year         = {2018},
  url          = {http://arxiv.org/abs/1807.11876},
  eprinttype   = {arXiv},
  eprint       = {1807.11876},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-11876.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The model name SincNet is brace-protected so sentence-casing styles keep its camel case.
@article{DBLP:journals/corr/abs-1808-00158,
  author       = {Ravanelli, Mirco and
                  Bengio, Yoshua},
  title        = {Speaker Recognition from raw waveform with {SincNet}},
  journal      = {CoRR},
  volume       = {abs/1808.00158},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.00158},
  eprinttype   = {arXiv},
  eprint       = {1808.00158},
  timestamp    = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-00158.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-04873,
  author       = {Scellier, Benjamin and
                  Goyal, Anirudh and
                  Binas, Jonathan and
                  Mesnard, Thomas and
                  Bengio, Yoshua},
  title        = {Generalization of Equilibrium Propagation to Vector Field Dynamics},
  journal      = {CoRR},
  volume       = {abs/1808.04873},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.04873},
  eprinttype   = {arXiv},
  eprint       = {1808.04873},
  timestamp    = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-04873.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1808-06670,
  author       = {Hjelm, R. Devon and
                  Fedorov, Alex and
                  Lavoie{-}Marchildon, Samuel and
                  Grewal, Karan and
                  Trischler, Adam and
                  Bengio, Yoshua},
  title        = {Learning deep representations by mutual information estimation and
                  maximization},
  journal      = {CoRR},
  volume       = {abs/1808.06670},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.06670},
  eprinttype   = {arXiv},
  eprint       = {1808.06670},
  timestamp    = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-06670.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Title typo fixed: the words "Credit" and "Assignment" were run together.
@article{DBLP:journals/corr/abs-1809-03702,
  author       = {Ke, Nan Rosemary and
                  Goyal, Anirudh and
                  Bilaniuk, Olexa and
                  Binas, Jonathan and
                  Mozer, Michael C. and
                  Pal, Chris and
                  Bengio, Yoshua},
  title        = {Sparse Attentive Backtracking: Temporal Credit Assignment Through
                  Reminding},
  journal      = {CoRR},
  volume       = {abs/1809.03702},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.03702},
  eprinttype   = {arXiv},
  eprint       = {1809.03702},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-03702.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-04506,
  author       = {Fran{\c{c}}ois{-}Lavet, Vincent and
                  Bengio, Yoshua and
                  Precup, Doina and
                  Pineau, Joelle},
  title        = {Combined Reinforcement Learning via Abstract Representations},
  journal      = {CoRR},
  volume       = {abs/1809.04506},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.04506},
  eprinttype   = {arXiv},
  eprint       = {1809.04506},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-04506.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The surname "Tachet des Combes" is braced as one unit; otherwise the lowercase "des" is parsed as a von-part and the surname becomes "Combes".
@article{DBLP:journals/corr/abs-1809-06848,
  author       = {{Tachet des Combes}, Remi and
                  Pezeshki, Mohammad and
                  Shabanian, Samira and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {On the Learning Dynamics of Deep Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1809.06848},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.06848},
  eprinttype   = {arXiv},
  eprint       = {1809.06848},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-06848.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The dataset name HotpotQA is brace-protected so sentence-casing styles do not render it as "Hotpotqa".
@article{DBLP:journals/corr/abs-1809-09600,
  author       = {Yang, Zhilin and
                  Qi, Peng and
                  Zhang, Saizheng and
                  Bengio, Yoshua and
                  Cohen, William W. and
                  Salakhutdinov, Ruslan and
                  Manning, Christopher D.},
  title        = {{HotpotQA}: {A} Dataset for Diverse, Explainable Multi-hop Question
                  Answering},
  journal      = {CoRR},
  volume       = {abs/1809.09600},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.09600},
  eprinttype   = {arXiv},
  eprint       = {1809.09600},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-09600.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1809-10341,
  author       = {Velickovic, Petar and
                  Fedus, William and
                  Hamilton, William L. and
                  Li{\`{o}}, Pietro and
                  Bengio, Yoshua and
                  Hjelm, R. Devon},
  title        = {Deep Graph Infomax},
  journal      = {CoRR},
  volume       = {abs/1809.10341},
  year         = {2018},
  url          = {http://arxiv.org/abs/1809.10341},
  eprinttype   = {arXiv},
  eprint       = {1809.10341},
  timestamp    = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1809-10341.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-00045,
  author       = {Farshchian, Ali and
                  Gallego, Juan Alvaro and
                  Cohen, Joseph Paul and
                  Bengio, Yoshua and
                  Miller, Lee E. and
                  Solla, Sara A.},
  title        = {Adversarial Domain Adaptation for Stable Brain-Machine Interfaces},
  journal      = {CoRR},
  volume       = {abs/1810.00045},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.00045},
  eprinttype   = {arXiv},
  eprint       = {1810.00045},
  timestamp    = {Tue, 30 Oct 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-00045.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-03023,
  author       = {Arpit, Devansh and
                  Kanuparthi, Bhargav and
                  Kerg, Giancarlo and
                  Ke, Nan Rosemary and
                  Mitliagkas, Ioannis and
                  Bengio, Yoshua},
  title        = {h-detach: Modifying the {LSTM} Gradient Towards Better Optimization},
  journal      = {CoRR},
  volume       = {abs/1810.03023},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.03023},
  eprinttype   = {arXiv},
  eprint       = {1810.03023},
  timestamp    = {Thu, 01 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-03023.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-03442,
  author       = {Trofimov, Assya and
                  Dutil, Francis and
                  Perreault, Claude and
                  Lemieux, S{\'{e}}bastien and
                  Bengio, Yoshua and
                  Cohen, Joseph Paul},
  title        = {Towards the Latent Transcriptome},
  journal      = {CoRR},
  volume       = {abs/1810.03442},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.03442},
  eprinttype   = {arXiv},
  eprint       = {1810.03442},
  timestamp    = {Thu, 01 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-03442.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-04871,
  author       = {Bharadhwaj, Homanga and
                  Wang, Zihan and
                  Bengio, Yoshua and
                  Paull, Liam},
  title        = {A Data-Efficient Framework for Training and Sim-to-Real Transfer of
                  Navigation Policies},
  journal      = {CoRR},
  volume       = {abs/1810.04871},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.04871},
  eprinttype   = {arXiv},
  eprint       = {1810.04871},
  timestamp    = {Tue, 30 Oct 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-04871.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The platform name BabyAI is brace-protected so sentence-casing styles do not render it as "Babyai".
@article{DBLP:journals/corr/abs-1810-08272,
  author       = {Chevalier{-}Boisvert, Maxime and
                  Bahdanau, Dzmitry and
                  Lahlou, Salem and
                  Willems, Lucas and
                  Saharia, Chitwan and
                  Nguyen, Thien Huu and
                  Bengio, Yoshua},
  title        = {{BabyAI}: First Steps Towards Grounded Language Learning With a Human
                  In the Loop},
  journal      = {CoRR},
  volume       = {abs/1810.08272},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.08272},
  eprinttype   = {arXiv},
  eprint       = {1810.08272},
  timestamp    = {Wed, 31 Oct 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-08272.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-08651,
  author       = {Thompson, Jessica A. F. and
                  Bengio, Yoshua and
                  Formisano, Elia and
                  Sch{\"{o}}nwiesner, Marc},
  title        = {How can deep learning advance computational modeling of sensory information
                  processing?},
  journal      = {CoRR},
  volume       = {abs/1810.08651},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.08651},
  eprinttype   = {arXiv},
  eprint       = {1810.08651},
  timestamp    = {Wed, 31 Oct 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-08651.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The architecture name ResNets is brace-protected so sentence-casing styles do not render it as "resnets".
@article{DBLP:journals/corr/abs-1810-09038,
  author       = {Kawaguchi, Kenji and
                  Bengio, Yoshua},
  title        = {Depth with Nonlinearity Creates No Bad Local Minima in {ResNets}},
  journal      = {CoRR},
  volume       = {abs/1810.09038},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.09038},
  eprinttype   = {arXiv},
  eprint       = {1810.09038},
  timestamp    = {Thu, 01 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-09038.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1810-11393,
  author       = {Sacramento, Jo{\~{a}}o and
                  Costa, Rui Ponte and
                  Bengio, Yoshua and
                  Senn, Walter},
  title        = {Dendritic cortical microcircuits approximate the backpropagation algorithm},
  journal      = {CoRR},
  volume       = {abs/1810.11393},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.11393},
  eprinttype   = {arXiv},
  eprint       = {1810.11393},
  timestamp    = {Thu, 01 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-11393.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-06128,
  author       = {Bengio, Yoshua and
                  Lodi, Andrea and
                  Prouvost, Antoine},
  title        = {Machine Learning for Combinatorial Optimization: a Methodological
                  Tour d'Horizon},
  journal      = {CoRR},
  volume       = {abs/1811.06128},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.06128},
  eprinttype   = {arXiv},
  eprint       = {1811.06128},
  timestamp    = {Sun, 25 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-06128.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-07017,
  author       = {Sodhani, Shagun and
                  Chandar, Sarath and
                  Bengio, Yoshua},
  title        = {On Training Recurrent Neural Networks for Lifelong Learning},
  journal      = {CoRR},
  volume       = {abs/1811.07017},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.07017},
  eprinttype   = {arXiv},
  eprint       = {1811.07017},
  timestamp    = {Sun, 25 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-07017.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-07240,
  author       = {Kastner, Kyle and
                  Santos, Jo{\~{a}}o Felipe and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  title        = {Representation Mixing for {TTS} Synthesis},
  journal      = {CoRR},
  volume       = {abs/1811.07240},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.07240},
  eprinttype   = {arXiv},
  eprint       = {1811.07240},
  timestamp    = {Sun, 25 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-07240.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The toolkit name PyTorch-Kaldi is brace-protected so sentence-casing styles do not render it as "pytorch-kaldi".
@article{DBLP:journals/corr/abs-1811-07453,
  author       = {Ravanelli, Mirco and
                  Parcollet, Titouan and
                  Bengio, Yoshua},
  title        = {The {PyTorch-Kaldi} Speech Recognition Toolkit},
  journal      = {CoRR},
  volume       = {abs/1811.07453},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.07453},
  eprinttype   = {arXiv},
  eprint       = {1811.07453},
  timestamp    = {Mon, 26 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-07453.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The model name SincNet is brace-protected so sentence-casing styles keep its camel case.
@article{DBLP:journals/corr/abs-1811-09725,
  author       = {Ravanelli, Mirco and
                  Bengio, Yoshua},
  title        = {Interpretable Convolutional Filters with {SincNet}},
  journal      = {CoRR},
  volume       = {abs/1811.09725},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.09725},
  eprinttype   = {arXiv},
  eprint       = {1811.09725},
  timestamp    = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-09725.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The model name DEFactor is brace-protected so sentence-casing styles do not render it as "Defactor".
@article{DBLP:journals/corr/abs-1811-09766,
  author       = {Assouel, Rim and
                  Ahmed, Mohamed and
                  Segler, Marwin H. S. and
                  Saffari, Amir and
                  Bengio, Yoshua},
  title        = {{DEFactor}: Differentiable Edge Factorization-based Probabilistic Graph
                  Generation},
  journal      = {CoRR},
  volume       = {abs/1811.09766},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.09766},
  eprinttype   = {arXiv},
  eprint       = {1811.09766},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-09766.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The compound surname "El Asri" is given in comma form so it is not split into given name "El" + surname "Asri".
@article{DBLP:journals/corr/abs-1811-09845,
  author       = {El{-}Nouby, Alaaeldin and
                  Sharma, Shikhar and
                  Schulz, Hannes and
                  Hjelm, R. Devon and
                  El Asri, Layla and
                  Kahou, Samira Ebrahimi and
                  Bengio, Yoshua and
                  Taylor, Graham W.},
  title        = {Keep Drawing It: Iterative language-based image generation and editing},
  journal      = {CoRR},
  volume       = {abs/1811.09845},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.09845},
  eprinttype   = {arXiv},
  eprint       = {1811.09845},
  timestamp    = {Wed, 02 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-09845.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1812-00271,
  author       = {Ravanelli, Mirco and
                  Bengio, Yoshua},
  title        = {Learning Speaker Representations with Mutual Information},
  journal      = {CoRR},
  volume       = {abs/1812.00271},
  year         = {2018},
  url          = {http://arxiv.org/abs/1812.00271},
  eprinttype   = {arXiv},
  eprint       = {1812.00271},
  timestamp    = {Thu, 03 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1812-00271.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The method name Model-Agnostic Meta-Learning is brace-protected so sentence-casing styles keep the capitals that mark it as a name.
@article{DBLP:journals/corr/abs-1812-02159,
  author       = {Deleu, Tristan and
                  Bengio, Yoshua},
  title        = {The effects of negative adaptation in {Model-Agnostic Meta-Learning}},
  journal      = {CoRR},
  volume       = {abs/1812.02159},
  year         = {2018},
  url          = {http://arxiv.org/abs/1812.02159},
  eprinttype   = {arXiv},
  eprint       = {1812.02159},
  timestamp    = {Tue, 01 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1812-02159.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The surname "Tachet des Combes" is braced as one unit; otherwise the lowercase "des" is parsed as a von-part and the surname becomes "Combes".
@article{DBLP:journals/corr/abs-1812-05159,
  author       = {Toneva, Mariya and
                  Sordoni, Alessandro and
                  {Tachet des Combes}, Remi and
                  Trischler, Adam and
                  Bengio, Yoshua and
                  Gordon, Geoffrey J.},
  title        = {An Empirical Study of Example Forgetting during Deep Neural Network
                  Learning},
  journal      = {CoRR},
  volume       = {abs/1812.05159},
  year         = {2018},
  url          = {http://arxiv.org/abs/1812.05159},
  eprinttype   = {arXiv},
  eprint       = {1812.05159},
  timestamp    = {Tue, 01 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1812-05159.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The model name SincNet is brace-protected so sentence-casing styles keep its camel case.
@article{DBLP:journals/corr/abs-1812-05920,
  author       = {Ravanelli, Mirco and
                  Bengio, Yoshua},
  title        = {Speech and Speaker Recognition from Raw Waveform with {SincNet}},
  journal      = {CoRR},
  volume       = {abs/1812.05920},
  year         = {2018},
  url          = {http://arxiv.org/abs/1812.05920},
  eprinttype   = {arXiv},
  eprint       = {1812.05920},
  timestamp    = {Thu, 03 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1812-05920.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The compound surname "Boukli Hacene" is given in comma form so "Boukli" is not parsed as a given name.
@article{DBLP:journals/corr/abs-1812-11337,
  author       = {Boukli Hacene, Ghouthi and
                  Gripon, Vincent and
                  Arzel, Matthieu and
                  Farrugia, Nicolas and
                  Bengio, Yoshua},
  title        = {Quantized Guided Pruning for Efficient Hardware Implementations of
                  Convolutional Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1812.11337},
  year         = {2018},
  url          = {http://arxiv.org/abs/1812.11337},
  eprinttype   = {arXiv},
  eprint       = {1812.11337},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1812-11337.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/GulcehreFXCB17,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Firat, Orhan and
                  Xu, Kelvin and
                  Cho, Kyunghyun and
                  Bengio, Yoshua},
  title        = {On integrating a language model into neural machine translation},
  journal      = {Comput. Speech Lang.},
  volume       = {45},
  pages        = {137--148},
  year         = {2017},
  url          = {https://doi.org/10.1016/j.csl.2017.01.014},
  doi          = {10.1016/J.CSL.2017.01.014},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csl/GulcehreFXCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/ChoiCB17,
  author       = {Choi, Heeyoul and
                  Cho, Kyunghyun and
                  Bengio, Yoshua},
  title        = {Context-dependent word representation for neural machine translation},
  journal      = {Comput. Speech Lang.},
  volume       = {45},
  pages        = {149--160},
  year         = {2017},
  url          = {https://doi.org/10.1016/j.csl.2017.01.007},
  doi          = {10.1016/J.CSL.2017.01.007},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csl/ChoiCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/csl/FiratCSYB17,
  author       = {Firat, Orhan and
                  Cho, Kyunghyun and
                  Sankaran, Baskaran and
                  Yarman{-}Vural, Fatos T. and
                  Bengio, Yoshua},
  title        = {Multi-way, multilingual neural machine translation},
  journal      = {Comput. Speech Lang.},
  volume       = {45},
  pages        = {236--252},
  year         = {2017},
  url          = {https://doi.org/10.1016/j.csl.2016.10.006},
  doi          = {10.1016/J.CSL.2016.10.006},
  timestamp    = {Thu, 20 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csl/FiratCSYB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ficn/ScellierB17,
  author       = {Scellier, Benjamin and
                  Bengio, Yoshua},
  title        = {Equilibrium Propagation: Bridging the Gap between Energy-Based Models
                  and Backpropagation},
  journal      = {Frontiers Comput. Neurosci.},
  volume       = {11},
  pages        = {24},
  year         = {2017},
  url          = {https://doi.org/10.3389/fncom.2017.00024},
  doi          = {10.3389/FNCOM.2017.00024},
  timestamp    = {Sat, 23 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ficn/ScellierB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/HubaraCSEB17,
  author       = {Hubara, Itay and
                  Courbariaux, Matthieu and
                  Soudry, Daniel and
                  El{-}Yaniv, Ran and
                  Bengio, Yoshua},
  title        = {Quantized Neural Networks: Training Neural Networks with Low Precision
                  Weights and Activations},
  journal      = {J. Mach. Learn. Res.},
  volume       = {18},
  pages        = {187:1--187:30},
  year         = {2017},
  url          = {http://jmlr.org/papers/v18/16-456.html},
  timestamp    = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/HubaraCSEB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/mia/HavaeiDWBCBPJL17,
  author       = {Havaei, Mohammad and
                  Davy, Axel and
                  Warde{-}Farley, David and
                  Biard, Antoine and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Pal, Chris and
                  Jodoin, Pierre{-}Marc and
                  Larochelle, Hugo},
  title        = {Brain tumor segmentation with Deep Neural Networks},
  journal      = {Medical Image Anal.},
  volume       = {35},
  pages        = {18--31},
  year         = {2017},
  url          = {https://doi.org/10.1016/j.media.2016.05.004},
  doi          = {10.1016/J.MEDIA.2016.05.004},
  timestamp    = {Mon, 24 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/mia/HavaeiDWBCBPJL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/mt/HillCJB17,
  author       = {Hill, Felix and
                  Cho, Kyunghyun and
                  Jean, S{\'{e}}bastien and
                  Bengio, Yoshua},
  title        = {The representational geometry of word meanings acquired by neural
                  machine translation models},
  journal      = {Mach. Transl.},
  volume       = {31},
  number       = {1-2},
  pages        = {3--18},
  year         = {2017},
  url          = {https://doi.org/10.1007/s10590-017-9194-2},
  doi          = {10.1007/S10590-017-9194-2},
  timestamp    = {Tue, 24 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/mt/HillCJB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The acronym STDP is brace-protected so sentence-casing styles do not render it as "Stdp".
@article{DBLP:journals/neco/BengioMFZW17,
  author       = {Bengio, Yoshua and
                  Mesnard, Thomas and
                  Fischer, Asja and
                  Zhang, Saizheng and
                  Wu, Yuhuai},
  title        = {{STDP}-Compatible Approximation of Backpropagation in an Energy-Based
                  Model},
  journal      = {Neural Comput.},
  volume       = {29},
  number       = {3},
  pages        = {555--577},
  year         = {2017},
  url          = {https://doi.org/10.1162/NECO\_a\_00934},
  doi          = {10.1162/NECO\_A\_00934},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/neco/BengioMFZW17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The proper adjective Chinese is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/pr/ZhangBL17,
  author       = {Zhang, Xu{-}Yao and
                  Bengio, Yoshua and
                  Liu, Cheng{-}Lin},
  title        = {Online and offline handwritten {Chinese} character recognition: {A}
                  comprehensive study and new benchmark},
  journal      = {Pattern Recognit.},
  volume       = {61},
  pages        = {348--360},
  year         = {2017},
  url          = {https://doi.org/10.1016/j.patcog.2016.08.005},
  doi          = {10.1016/J.PATCOG.2016.08.005},
  timestamp    = {Tue, 16 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/pr/ZhangBL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/thms/ZhangXLB17,
  author       = {Zhang, Xu{-}Yao and
                  Xie, Guo{-}Sen and
                  Liu, Cheng{-}Lin and
                  Bengio, Yoshua},
  title        = {End-to-End Online Writer Identification With Recurrent Neural Network},
  journal      = {{IEEE} Trans. Hum. Mach. Syst.},
  volume       = {47},
  number       = {2},
  pages        = {285--292},
  year         = {2017},
  url          = {https://doi.org/10.1109/THMS.2016.2634921},
  doi          = {10.1109/THMS.2016.2634921},
  timestamp    = {Tue, 16 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/thms/ZhangXLB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/ImAMB17,
  author       = {Im, Daniel Jiwoong and
                  Ahn, Sungjin and
                  Memisevic, Roland and
                  Bengio, Yoshua},
  editor       = {Singh, Satinder and
                  Markovitch, Shaul},
  title        = {Denoising Criterion for Variational Auto-Encoding Framework},
  booktitle    = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
                  February 4-9, 2017, San Francisco, California, {USA}},
  pages        = {2059--2065},
  publisher    = {{AAAI} Press},
  year         = {2017},
  url          = {https://doi.org/10.1609/aaai.v31i1.10777},
  doi          = {10.1609/AAAI.V31I1.10777},
  timestamp    = {Mon, 04 Sep 2023 14:40:32 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/ImAMB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SerbanKTTZBC17,
  author       = {Serban, Iulian Vlad and
                  Klinger, Tim and
                  Tesauro, Gerald and
                  Talamadupula, Kartik and
                  Zhou, Bowen and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  editor       = {Singh, Satinder and
                  Markovitch, Shaul},
  title        = {Multiresolution Recurrent Neural Networks: An Application to Dialogue
                  Response Generation},
  booktitle    = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
                  February 4-9, 2017, San Francisco, California, {USA}},
  pages        = {3288--3294},
  publisher    = {{AAAI} Press},
  year         = {2017},
  url          = {https://doi.org/10.1609/aaai.v31i1.10984},
  doi          = {10.1609/AAAI.V31I1.10984},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/SerbanKTTZBC17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/SerbanSLCPCB17,
  author       = {Serban, Iulian Vlad and
                  Sordoni, Alessandro and
                  Lowe, Ryan and
                  Charlin, Laurent and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  editor       = {Singh, Satinder and
                  Markovitch, Shaul},
  title        = {A Hierarchical Latent Variable Encoder-Decoder Model for Generating
                  Dialogues},
  booktitle    = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
                  February 4-9, 2017, San Francisco, California, {USA}},
  pages        = {3295--3301},
  publisher    = {{AAAI} Press},
  year         = {2017},
  url          = {https://doi.org/10.1609/aaai.v31i1.10983},
  doi          = {10.1609/AAAI.V31I1.10983},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/SerbanSLCPCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Turing" is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/acl/LoweNSABP17,
  author       = {Lowe, Ryan and
                  Noseworthy, Michael D. and
                  Serban, Iulian Vlad and
                  Angelard{-}Gontier, Nicolas and
                  Bengio, Yoshua and
                  Pineau, Joelle},
  editor       = {Barzilay, Regina and
                  Kan, Min{-}Yen},
  title        = {Towards an Automatic {Turing} Test: Learning to Evaluate Dialogue Responses},
  booktitle    = {Proceedings of the 55th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Volume
                  1: Long Papers},
  pages        = {1116--1126},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/P17-1103},
  doi          = {10.18653/V1/P17-1103},
  timestamp    = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/LoweNSABP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "DenseNets" is brace-protected in the title so sentence-casing styles keep its camel-case spelling.
@inproceedings{DBLP:conf/cvpr/JegouDVRB17,
  author       = {J{\'{e}}gou, Simon and
                  Drozdzal, Michal and
                  V{\'{a}}zquez, David and
                  Romero, Adriana and
                  Bengio, Yoshua},
  title        = {The One Hundred Layers Tiramisu: Fully Convolutional {DenseNets} for
                  Semantic Segmentation},
  booktitle    = {2017 {IEEE} Conference on Computer Vision and Pattern Recognition
                  Workshops, {CVPR} Workshops 2017, Honolulu, HI, USA, July 21-26, 2017},
  pages        = {1175--1183},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/CVPRW.2017.156},
  doi          = {10.1109/CVPRW.2017.156},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/JegouDVRB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/NguyenCBDY17,
  author       = {Nguyen, Anh and
                  Clune, Jeff and
                  Bengio, Yoshua and
                  Dosovitskiy, Alexey and
                  Yosinski, Jason},
  title        = {Plug {\&} Play Generative Networks: Conditional Iterative Generation
                  of Images in Latent Space},
  booktitle    = {2017 {IEEE} Conference on Computer Vision and Pattern Recognition,
                  {CVPR} 2017, Honolulu, HI, USA, July 21-26, 2017},
  pages        = {3510--3520},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/CVPR.2017.374},
  doi          = {10.1109/CVPR.2017.374},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/NguyenCBDY17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The plural acronym is written "CNNs" (brace-protected); the all-caps "CNNS" looked like a casing artefact -- TODO confirm against the published paper.
@inproceedings{DBLP:conf/icassp/MongiaKEB17,
  author       = {Mongia, Mihir and
                  Kumar, Kundan and
                  Erraqabi, Akram and
                  Bengio, Yoshua},
  title        = {On random weights for texture generation in one layer {CNNs}},
  booktitle    = {2017 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages        = {2207--2211},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICASSP.2017.7952548},
  doi          = {10.1109/ICASSP.2017.7952548},
  timestamp    = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/MongiaKEB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/RavanelliBOB17,
  author       = {Ravanelli, Mirco and
                  Brakel, Philemon and
                  Omologo, Maurizio and
                  Bengio, Yoshua},
  title        = {A network of deep neural networks for Distant Speech Recognition},
  booktitle    = {2017 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2017, New Orleans, LA, USA, March 5-9, 2017},
  pages        = {4880--4884},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICASSP.2017.7953084},
  doi          = {10.1109/ICASSP.2017.7953084},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/RavanelliBOB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iccvw/CohenBGLB17,
  author       = {Cohen, Joseph Paul and
                  Boucher, Genevi{\`{e}}ve and
                  Glastonbury, Craig A. and
                  Lo, Henry Z. and
                  Bengio, Yoshua},
  title        = {Count-ception: Counting by Fully Convolutional Redundant Counting},
  booktitle    = {2017 {IEEE} International Conference on Computer Vision Workshops,
                  {ICCV} Workshops 2017, Venice, Italy, October 22-29, 2017},
  pages        = {18--26},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICCVW.2017.9},
  doi          = {10.1109/ICCVW.2017.9},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccvw/CohenBGLB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/AlainB17,
  author       = {Alain, Guillaume and
                  Bengio, Yoshua},
  title        = {Understanding intermediate layers using linear classifier probes},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=HJ4-rAVtl},
  timestamp    = {Thu, 04 Apr 2019 13:20:08 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/AlainB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/BahdanauBXGLPCB17,
  author       = {Bahdanau, Dzmitry and
                  Brakel, Philemon and
                  Xu, Kelvin and
                  Goyal, Anirudh and
                  Lowe, Ryan and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {An Actor-Critic Algorithm for Sequence Prediction},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=SJDaqqveg},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/BahdanauBXGLPCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/CheLJBL17,
  author       = {Che, Tong and
                  Li, Yanran and
                  Jacob, Athul Paul and
                  Bengio, Yoshua and
                  Li, Wenjie},
  title        = {Mode Regularized Generative Adversarial Networks},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=HJKkY35le},
  timestamp    = {Wed, 15 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/CheLJBL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ChungAB17,
  author       = {Chung, Junyoung and
                  Ahn, Sungjin and
                  Bengio, Yoshua},
  title        = {Hierarchical Multiscale Recurrent Neural Networks},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=S1di0sfgl},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ChungAB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/GulcehreMVB17,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Moczulski, Marcin and
                  Visin, Francesco and
                  Bengio, Yoshua},
  title        = {Mollifying Networks},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=r1G4z8cge},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/GulcehreMVB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The acronym "RNNs" is brace-protected in the title so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/iclr/KruegerMKPBKGBC17,
  author       = {Krueger, David and
                  Maharaj, Tegan and
                  Kram{\'{a}}r, J{\'{a}}nos and
                  Pezeshki, Mohammad and
                  Ballas, Nicolas and
                  Ke, Nan Rosemary and
                  Goyal, Anirudh and
                  Bengio, Yoshua and
                  Courville, Aaron C. and
                  Pal, Christopher J.},
  title        = {Zoneout: Regularizing {RNNs} by Randomly Preserving Hidden Activations},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=rJqBEPcxe},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/KruegerMKPBKGBC17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The url field stores the raw address with a literal underscore; a TeX-escaped underscore leaves a stray backslash in the link when the field is handled verbatim.
@inproceedings{DBLP:conf/iclr/LinFSYXZB17,
  author       = {Lin, Zhouhan and
                  Feng, Minwei and
                  dos Santos, C{\'{\i}}cero Nogueira and
                  Yu, Mo and
                  Xiang, Bing and
                  Zhou, Bowen and
                  Bengio, Yoshua},
  title        = {A Structured Self-Attentive Sentence Embedding},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=BJC_jUqxe},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/LinFSYXZB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Turing" is brace-protected in the title so sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/iclr/LoweNSABP17,
  author       = {Lowe, Ryan and
                  Noseworthy, Michael D. and
                  Serban, Iulian Vlad and
                  Angelard{-}Gontier, Nicolas and
                  Bengio, Yoshua and
                  Pineau, Joelle},
  title        = {Towards an automatic {Turing} test: Learning to evaluate dialogue responses},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=Sk7c3yVYg},
  timestamp    = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/LoweNSABP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "SampleRNN" is brace-protected in the title; sentence-casing styles would otherwise keep only its first capital.
@inproceedings{DBLP:conf/iclr/MehriKGKJSCB17,
  author       = {Mehri, Soroush and
                  Kumar, Kundan and
                  Gulrajani, Ishaan and
                  Kumar, Rithesh and
                  Jain, Shubham and
                  Sotelo, Jose and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {{SampleRNN}: An Unconditional End-to-End Neural Audio Generation Model},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=SkxKPDv5xl},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/MehriKGKJSCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/MirzaCB17,
  author       = {Mirza, Mehdi and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {Generalizable Features From Unsupervised Learning},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=BynzZolYg},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/MirzaCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/RomeroCESADLDHB17,
  author       = {Romero, Adriana and
                  Carrier, Pierre Luc and
                  Erraqabi, Akram and
                  Sylvain, Tristan and
                  Auvolat, Alex and
                  Dejoie, Etienne and
                  Legault, Marc{-}Andr{\'{e}} and
                  Dub{\'{e}}, Marie{-}Pierre and
                  Hussin, Julie G. and
                  Bengio, Yoshua},
  title        = {Diet Networks: Thin Parameters for Fat Genomics},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=Sk-oDY9ge},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/RomeroCESADLDHB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Char2Wav" is brace-protected in the title so sentence-casing styles keep its mixed-case spelling.
@inproceedings{DBLP:conf/iclr/SoteloMKSKCB17,
  author       = {Sotelo, Jose and
                  Mehri, Soroush and
                  Kumar, Kundan and
                  Santos, Jo{\~{a}}o Felipe and
                  Kastner, Kyle and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {{Char2Wav}: End-to-End Speech Synthesis},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Workshop Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=B1VWyySKx},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/SoteloMKSKCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/Warde-FarleyB17,
  author       = {Warde{-}Farley, David and
                  Bengio, Yoshua},
  title        = {Improving Generative Adversarial Networks with Denoising Feature Matching},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017,
                  Toulon, France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=S1X7nhsxl},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Warde-FarleyB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ArpitJBKBKMFCBL17,
  author       = {Arpit, Devansh and
                  Jastrzebski, Stanislaw and
                  Ballas, Nicolas and
                  Krueger, David and
                  Bengio, Emmanuel and
                  Kanwal, Maxinder S. and
                  Maharaj, Tegan and
                  Fischer, Asja and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Lacoste{-}Julien, Simon},
  editor       = {Precup, Doina and
                  Teh, Yee Whye},
  title        = {A Closer Look at Memorization in Deep Networks},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {233--242},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {http://proceedings.mlr.press/v70/arpit17a.html},
  timestamp    = {Wed, 24 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ArpitJBKBKMFCBL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/DinhPBB17,
  author       = {Dinh, Laurent and
                  Pascanu, Razvan and
                  Bengio, Samy and
                  Bengio, Yoshua},
  editor       = {Precup, Doina and
                  Teh, Yee Whye},
  title        = {Sharp Minima Can Generalize For Deep Nets},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {1019--1028},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {http://proceedings.mlr.press/v70/dinh17b.html},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/DinhPBB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnn/GulcehreSMB17,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Sotelo, Jose and
                  Moczulski, Marcin and
                  Bengio, Yoshua},
  title        = {A robust adaptive stochastic gradient method for deep learning},
  booktitle    = {2017 International Joint Conference on Neural Networks, {IJCNN} 2017,
                  Anchorage, AK, USA, May 14-19, 2017},
  pages        = {125--132},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/IJCNN.2017.7965845},
  doi          = {10.1109/IJCNN.2017.7965845},
  timestamp    = {Wed, 16 Oct 2019 14:14:55 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnn/GulcehreSMB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/RavanelliBOB17,
  author       = {Ravanelli, Mirco and
                  Brakel, Philemon and
                  Omologo, Maurizio and
                  Bengio, Yoshua},
  editor       = {Lacerda, Francisco},
  title        = {Improving Speech Recognition by Revising Gated Recurrent Units},
  booktitle    = {Interspeech 2017, 18th Annual Conference of the International Speech
                  Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages        = {1308--1312},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-775},
  doi          = {10.21437/INTERSPEECH.2017-775},
  timestamp    = {Sun, 06 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/RavanelliBOB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/KimSB17,
  author       = {Kim, Taesup and
                  Song, Inchul and
                  Bengio, Yoshua},
  editor       = {Lacerda, Francisco},
  title        = {Dynamic Layer Normalization for Adaptive Neural Acoustic Modeling
                  in Speech Recognition},
  booktitle    = {Interspeech 2017, 18th Annual Conference of the International Speech
                  Communication Association, Stockholm, Sweden, August 20-24, 2017},
  pages        = {2411--2415},
  publisher    = {{ISCA}},
  year         = {2017},
  url          = {https://doi.org/10.21437/Interspeech.2017-556},
  doi          = {10.21437/INTERSPEECH.2017-556},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/KimSB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/isca/Bengio17,
  author       = {Bengio, Yoshua},
  title        = {Towards more hardware-friendly deep learning},
  booktitle    = {Proceedings of the Workshop on Trends in Machine-Learning (and impact
                  on computer architecture), TIML@ISCA 2017, Toronto, ON, Canada, June
                  25, 2017},
  pages        = {5},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {https://doi.org/10.1145/3149166.3149171},
  doi          = {10.1145/3149166.3149171},
  timestamp    = {Tue, 06 Nov 2018 11:07:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isca/Bengio17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GoyalKGB17,
  author       = {Goyal, Anirudh and
                  Ke, Nan Rosemary and
                  Ganguli, Surya and
                  Bengio, Yoshua},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Variational Walkback: Learning a Transition Operator as a Stochastic
                  Recurrent Net},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {4392--4402},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/46a558d97954d0692411c861cf78ef79-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/GoyalKGB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "GibbsNet" is brace-protected in the title so sentence-casing styles keep its camel-case spelling.
@inproceedings{DBLP:conf/nips/LambHGCCB17,
  author       = {Lamb, Alex and
                  Hjelm, R. Devon and
                  Ganin, Yaroslav and
                  Cohen, Joseph Paul and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {{GibbsNet}: Iterative Adversarial Inference for Deep Graphical Models},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {5089--5098},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/30f8f6b940d1073d8b6a5eebc46dd6e5-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/LambHGCCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GulcehreDTB17,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Dutil, Francis and
                  Trischler, Adam and
                  Bengio, Yoshua},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Plan, Attend, Generate: Planning for Sequence-to-Sequence Models},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {5474--5483},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/b030afbb3a8af8fb0759241c97466ee4-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/GulcehreDTB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GoyalSCKB17,
  author       = {Goyal, Anirudh and
                  Sordoni, Alessandro and
                  C{\^{o}}t{\'{e}}, Marc{-}Alexandre and
                  Ke, Nan Rosemary and
                  Bengio, Yoshua},
  editor       = {Guyon, Isabelle and
                  von Luxburg, Ulrike and
                  Bengio, Samy and
                  Wallach, Hanna M. and
                  Fergus, Rob and
                  Vishwanathan, S. V. N. and
                  Garnett, Roman},
  title        = {Z-Forcing: Training Stochastic Recurrent Networks},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference
                  on Neural Information Processing Systems 2017, December 4-9, 2017,
                  Long Beach, CA, {USA}},
  pages        = {6713--6723},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/900c563bfd2c48c16701acca83ad858a-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/GoyalSCKB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/rep4nlp/GulcehreDTB17,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Dutil, Francis and
                  Trischler, Adam and
                  Bengio, Yoshua},
  editor       = {Blunsom, Phil and
                  Bordes, Antoine and
                  Cho, Kyunghyun and
                  Cohen, Shay B. and
                  Dyer, Chris and
                  Grefenstette, Edward and
                  Hermann, Karl Moritz and
                  Rimell, Laura and
                  Weston, Jason and
                  Yih, Scott},
  title        = {Plan, Attend, Generate: Character-Level Neural Machine Translation
                  with Planning},
  booktitle    = {Proceedings of the 2nd Workshop on Representation Learning for NLP,
                  Rep4NLP@ACL 2017, Vancouver, Canada, August 3, 2017},
  pages        = {228--234},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/w17-2627},
  doi          = {10.18653/V1/W17-2627},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/rep4nlp/GulcehreDTB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZhangPBZLBC17,
  author       = {Zhang, Ying and
                  Pezeshki, Mohammad and
                  Brakel, Philemon and
                  Zhang, Saizheng and
                  Laurent, C{\'{e}}sar and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  title        = {Towards End-to-End Speech Recognition with Deep Convolutional Neural
                  Networks},
  journal      = {CoRR},
  volume       = {abs/1701.02720},
  year         = {2017},
  url          = {http://arxiv.org/abs/1701.02720},
  eprinttype   = {arXiv},
  eprint       = {1701.02720},
  timestamp    = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ZhangPBZLBC17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GulcehreCB17,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Chandar, Sarath and
                  Bengio, Yoshua},
  title        = {Memory Augmented Neural Networks with Wormhole Connections},
  journal      = {CoRR},
  volume       = {abs/1701.08718},
  year         = {2017},
  url          = {http://arxiv.org/abs/1701.08718},
  eprinttype   = {arXiv},
  eprint       = {1701.08718},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GulcehreCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/DrozdzalCVDTRBP17,
  author       = {Drozdzal, Michal and
                  Chartrand, Gabriel and
                  Vorontsov, Eugene and
                  Di{-}Jorio, Lisa and
                  Tang, An and
                  Romero, Adriana and
                  Bengio, Yoshua and
                  Pal, Chris and
                  Kadoury, Samuel},
  title        = {Learning Normalized Inputs for Iterative Estimation in Medical Image
                  Segmentation},
  journal      = {CoRR},
  volume       = {abs/1702.05174},
  year         = {2017},
  url          = {http://arxiv.org/abs/1702.05174},
  eprinttype   = {arXiv},
  eprint       = {1702.05174},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DrozdzalCVDTRBP17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/CheLZHLSB17,
  author       = {Che, Tong and
                  Li, Yanran and
                  Zhang, Ruixiang and
                  Hjelm, R. Devon and
                  Li, Wenjie and
                  Song, Yangqiu and
                  Bengio, Yoshua},
  title        = {Maximum-Likelihood Augmented Discrete Generative Adversarial Networks},
  journal      = {CoRR},
  volume       = {abs/1702.07983},
  year         = {2017},
  url          = {http://arxiv.org/abs/1702.07983},
  eprinttype   = {arXiv},
  eprint       = {1702.07983},
  timestamp    = {Wed, 15 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/CheLZHLSB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HjelmJCCB17,
  author       = {Hjelm, R. Devon and
                  Jacob, Athul Paul and
                  Che, Tong and
                  Cho, Kyunghyun and
                  Bengio, Yoshua},
  title        = {Boundary-Seeking Generative Adversarial Networks},
  journal      = {CoRR},
  volume       = {abs/1702.08431},
  year         = {2017},
  url          = {http://arxiv.org/abs/1702.08431},
  eprinttype   = {arXiv},
  eprint       = {1702.08431},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HjelmJCCB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GulcehreSMB17,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Sotelo, Jose and
                  Moczulski, Marcin and
                  Bengio, Yoshua},
  title        = {A Robust Adaptive Stochastic Gradient Method for Deep Learning},
  journal      = {CoRR},
  volume       = {abs/1703.00788},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.00788},
  eprinttype   = {arXiv},
  eprint       = {1703.00788},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GulcehreSMB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LinFSYXZB17,
  author       = {Lin, Zhouhan and
                  Feng, Minwei and
                  dos Santos, C{\'{\i}}cero Nogueira and
                  Yu, Mo and
                  Xiang, Bing and
                  Zhou, Bowen and
                  Bengio, Yoshua},
  title        = {A Structured Self-attentive Sentence Embedding},
  journal      = {CoRR},
  volume       = {abs/1703.03130},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.03130},
  eprinttype   = {arXiv},
  eprint       = {1703.03130},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LinFSYXZB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/DinhPBB17,
  author       = {Dinh, Laurent and
                  Pascanu, Razvan and
                  Bengio, Samy and
                  Bengio, Yoshua},
  title        = {Sharp Minima Can Generalize For Deep Nets},
  journal      = {CoRR},
  volume       = {abs/1703.04933},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.04933},
  eprinttype   = {arXiv},
  eprint       = {1703.04933},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DinhPBB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/BengioTPPB17,
  author       = {Bengio, Emmanuel and
                  Thomas, Valentin and
                  Pineau, Joelle and
                  Precup, Doina and
                  Bengio, Yoshua},
  title        = {Independently Controllable Features},
  journal      = {CoRR},
  volume       = {abs/1703.07718},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.07718},
  eprinttype   = {arXiv},
  eprint       = {1703.07718},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioTPPB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/RavanelliBOB17,
  author       = {Ravanelli, Mirco and
                  Brakel, Philemon and
                  Omologo, Maurizio and
                  Bengio, Yoshua},
  title        = {A network of deep neural networks for distant speech recognition},
  journal      = {CoRR},
  volume       = {abs/1703.08002},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.08002},
  eprinttype   = {arXiv},
  eprint       = {1703.08002},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RavanelliBOB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/RavanelliBOB17a,
  author       = {Ravanelli, Mirco and
                  Brakel, Philemon and
                  Omologo, Maurizio and
                  Bengio, Yoshua},
  title        = {Batch-normalized joint training for {DNN}-based distant speech recognition},
  journal      = {CoRR},
  volume       = {abs/1703.08471},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.08471},
  eprinttype   = {arXiv},
  eprint       = {1703.08471},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RavanelliBOB17a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/CohenLB17,
  author       = {Cohen, Joseph Paul and
                  Lo, Henry Z. and
                  Bengio, Yoshua},
  title        = {Count-ception: Counting by Fully Convolutional Redundant Counting},
  journal      = {CoRR},
  volume       = {abs/1703.08710},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.08710},
  eprinttype   = {arXiv},
  eprint       = {1703.08710},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/CohenLB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/RomeroDEJB17,
  author       = {Romero, Adriana and
                  Drozdzal, Michal and
                  Erraqabi, Akram and
                  J{\'{e}}gou, Simon and
                  Bengio, Yoshua},
  title        = {Image Segmentation by Iterative Inference from Conditional Score Estimation},
  journal      = {CoRR},
  volume       = {abs/1705.07450},
  year         = {2017},
  url          = {http://arxiv.org/abs/1705.07450},
  eprinttype   = {arXiv},
  eprint       = {1705.07450},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RomeroDEJB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/TrabelsiBSSSMRB17,
  author       = {Trabelsi, Chiheb and
                  Bilaniuk, Olexa and
                  Serdyuk, Dmitriy and
                  Subramanian, Sandeep and
                  Santos, Jo{\~{a}}o Felipe and
                  Mehri, Soroush and
                  Rostamzadeh, Negar and
                  Bengio, Yoshua and
                  Pal, Christopher J.},
  title        = {Deep Complex Networks},
  journal      = {CoRR},
  volume       = {abs/1705.09792},
  year         = {2017},
  url          = {http://arxiv.org/abs/1705.09792},
  eprinttype   = {arXiv},
  eprint       = {1705.09792},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/TrabelsiBSSSMRB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/LuckSCLB17,
  author       = {Luck, Margaux and
                  Sylvain, Tristan and
                  Cardinal, H{\'{e}}lo{\"{\i}}se and
                  Lodi, Andrea and
                  Bengio, Yoshua},
  title        = {Deep Learning for Patient-Specific Kidney Graft Survival Analysis},
  journal      = {CoRR},
  volume       = {abs/1705.10245},
  year         = {2017},
  url          = {http://arxiv.org/abs/1705.10245},
  eprinttype   = {arXiv},
  eprint       = {1705.10245},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LuckSCLB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/BahdanauBJGVB17,
  author       = {Bahdanau, Dzmitry and
                  Bosc, Tom and
                  Jastrzebski, Stanislaw and
                  Grefenstette, Edward and
                  Vincent, Pascal and
                  Bengio, Yoshua},
  title        = {Learning to Compute Word Embeddings On the Fly},
  journal      = {CoRR},
  volume       = {abs/1706.00286},
  year         = {2017},
  url          = {http://arxiv.org/abs/1706.00286},
  eprinttype   = {arXiv},
  eprint       = {1706.00286},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauBJGVB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/JingGPSTSB17,
  author       = {Jing, Li and
                  G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Peurifoy, John and
                  Shen, Yichen and
                  Tegmark, Max and
                  Soljacic, Marin and
                  Bengio, Yoshua},
  title        = {Gated Orthogonal Recurrent Units: On Learning to Forget},
  journal      = {CoRR},
  volume       = {abs/1706.02761},
  year         = {2017},
  url          = {http://arxiv.org/abs/1706.02761},
  eprinttype   = {arXiv},
  eprint       = {1706.02761},
  timestamp    = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/JingGPSTSB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/GulcehreDTB17,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Dutil, Francis and
                  Trischler, Adam and
                  Bengio, Yoshua},
  title        = {Plan, Attend, Generate: Character-level Neural Machine Translation
                  with Planning in the Decoder},
  journal      = {CoRR},
  volume       = {abs/1706.05087},
  year         = {2017},
  url          = {http://arxiv.org/abs/1706.05087},
  eprinttype   = {arXiv},
  eprint       = {1706.05087},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GulcehreDTB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/ArpitJBKBKMFCBL17,
  author       = {Arpit, Devansh and
                  Jastrzebski, Stanislaw and
                  Ballas, Nicolas and
                  Krueger, David and
                  Bengio, Emmanuel and
                  Kanwal, Maxinder S. and
                  Maharaj, Tegan and
                  Fischer, Asja and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Lacoste{-}Julien, Simon},
  title        = {A Closer Look at Memorization in Deep Networks},
  journal      = {CoRR},
  volume       = {abs/1706.05394},
  year         = {2017},
  url          = {http://arxiv.org/abs/1706.05394},
  eprinttype   = {arXiv},
  eprint       = {1706.05394},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ArpitJBKBKMFCBL17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/MerrienboerSLB17,
  author       = {van Merri{\"{e}}nboer, Bart and
                  Sanyal, Amartya and
                  Larochelle, Hugo and
                  Bengio, Yoshua},
  title        = {Multiscale sequence modeling with a learned dictionary},
  journal      = {CoRR},
  volume       = {abs/1707.00762},
  year         = {2017},
  url          = {http://arxiv.org/abs/1707.00762},
  eprinttype   = {arXiv},
  eprint       = {1707.00762},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/MerrienboerSLB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/KimSB17,
  author       = {Kim, Taesup and
                  Song, Inchul and
                  Bengio, Yoshua},
  title        = {Dynamic Layer Normalization for Adaptive Neural Acoustic Modeling
                  in Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1707.06065},
  year         = {2017},
  url          = {http://arxiv.org/abs/1707.06065},
  eprinttype   = {arXiv},
  eprint       = {1707.06065},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KimSB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1708-01289,
  author       = {Thomas, Valentin and
                  Pondard, Jules and
                  Bengio, Emmanuel and
                  Sarfati, Marc and
                  Beaudoin, Philippe and
                  Meurs, Marie{-}Jean and
                  Pineau, Joelle and
                  Precup, Doina and
                  Bengio, Yoshua},
  title        = {Independently Controllable Factors},
  journal      = {CoRR},
  volume       = {abs/1708.01289},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.01289},
  eprinttype   = {arXiv},
  eprint       = {1708.01289},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-01289.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1708-06742,
  author       = {Serdyuk, Dmitriy and
                  Ke, Nan Rosemary and
                  Sordoni, Alessandro and
                  Pal, Chris and
                  Bengio, Yoshua},
  title        = {Twin Networks: Using the Future as a Regularizer},
  journal      = {CoRR},
  volume       = {abs/1708.06742},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.06742},
  eprinttype   = {arXiv},
  eprint       = {1708.06742},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-06742.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1708-07149,
  author       = {Lowe, Ryan and
                  Noseworthy, Michael D. and
                  Serban, Iulian Vlad and
                  Angelard{-}Gontier, Nicolas and
                  Bengio, Yoshua and
                  Pineau, Joelle},
  title        = {Towards an Automatic {Turing} Test: Learning to Evaluate Dialogue Responses},
  journal      = {CoRR},
  volume       = {abs/1708.07149},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.07149},
  eprinttype   = {arXiv},
  eprint       = {1708.07149},
  timestamp    = {Fri, 28 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-07149.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1709-02349,
  author       = {Serban, Iulian Vlad and
                  Sankar, Chinnadhurai and
                  Germain, Mathieu and
                  Zhang, Saizheng and
                  Lin, Zhouhan and
                  Subramanian, Sandeep and
                  Kim, Taesup and
                  Pieper, Michael and
                  Chandar, Sarath and
                  Ke, Nan Rosemary and
                  Mudumba, Sai and
                  de Br{\'{e}}bisson, Alexandre and
                  Sotelo, Jose and
                  Suhubdy, Dendi and
                  Michalski, Vincent and
                  Nguyen, Alexandre and
                  Pineau, Joelle and
                  Bengio, Yoshua},
  title        = {A Deep Reinforcement Learning Chatbot},
  journal      = {CoRR},
  volume       = {abs/1709.02349},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.02349},
  eprinttype   = {arXiv},
  eprint       = {1709.02349},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-02349.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1709-08568,
  author       = {Bengio, Yoshua},
  title        = {The Consciousness Prior},
  journal      = {CoRR},
  volume       = {abs/1709.08568},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.08568},
  eprinttype   = {arXiv},
  eprint       = {1709.08568},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-08568.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1710-00641,
  author       = {Ravanelli, Mirco and
                  Brakel, Philemon and
                  Omologo, Maurizio and
                  Bengio, Yoshua},
  title        = {Improving speech recognition by revising gated recurrent units},
  journal      = {CoRR},
  volume       = {abs/1710.00641},
  year         = {2017},
  url          = {http://arxiv.org/abs/1710.00641},
  eprinttype   = {arXiv},
  eprint       = {1710.00641},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-00641.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1710-04773,
  author       = {Jastrzebski, Stanislaw and
                  Arpit, Devansh and
                  Ballas, Nicolas and
                  Verma, Vikas and
                  Che, Tong and
                  Bengio, Yoshua},
  title        = {Residual Connections Encourage Iterative Inference},
  journal      = {CoRR},
  volume       = {abs/1710.04773},
  year         = {2017},
  url          = {http://arxiv.org/abs/1710.04773},
  eprinttype   = {arXiv},
  eprint       = {1710.04773},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-04773.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1710-05468,
  author       = {Kawaguchi, Kenji and
                  Kaelbling, Leslie Pack and
                  Bengio, Yoshua},
  title        = {Generalization in Deep Learning},
  journal      = {CoRR},
  volume       = {abs/1710.05468},
  year         = {2017},
  url          = {http://arxiv.org/abs/1710.05468},
  eprinttype   = {arXiv},
  eprint       = {1710.05468},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-05468.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1710-07300,
  author       = {Kahou, Samira Ebrahimi and
                  Atkinson, Adam and
                  Michalski, Vincent and
                  K{\'{a}}d{\'{a}}r, {\'{A}}kos and
                  Trischler, Adam and
                  Bengio, Yoshua},
  title        = {{FigureQA}: An Annotated Figure Dataset for Visual Reasoning},
  journal      = {CoRR},
  volume       = {abs/1710.07300},
  year         = {2017},
  url          = {http://arxiv.org/abs/1710.07300},
  eprinttype   = {arXiv},
  eprint       = {1710.07300},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-07300.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1710-10903,
  author       = {Velickovic, Petar and
                  Cucurull, Guillem and
                  Casanova, Arantxa and
                  Romero, Adriana and
                  Li{\`{o}}, Pietro and
                  Bengio, Yoshua},
  title        = {Graph Attention Networks},
  journal      = {CoRR},
  volume       = {abs/1710.10903},
  year         = {2017},
  url          = {http://arxiv.org/abs/1710.10903},
  eprinttype   = {arXiv},
  eprint       = {1710.10903},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-10903.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-00066,
  author       = {Zolna, Konrad and
                  Arpit, Devansh and
                  Suhubdy, Dendi and
                  Bengio, Yoshua},
  title        = {Fraternal Dropout},
  journal      = {CoRR},
  volume       = {abs/1711.00066},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.00066},
  eprinttype   = {arXiv},
  eprint       = {1711.00066},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-00066.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-01437,
  author       = {Mimilakis, Stylianos Ioannis and
                  Drossos, Konstantinos and
                  Santos, Jo{\~{a}}o Felipe and
                  Schuller, Gerald and
                  Virtanen, Tuomas and
                  Bengio, Yoshua},
  title        = {Monaural Singing Voice Separation with Skip-Filtering Connections
                  and Recurrent Inference of Time-Frequency Mask},
  journal      = {CoRR},
  volume       = {abs/1711.01437},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.01437},
  eprinttype   = {arXiv},
  eprint       = {1711.01437},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-01437.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-02282,
  author       = {Goyal, Anirudh and
                  Ke, Nan Rosemary and
                  Ganguli, Surya and
                  Bengio, Yoshua},
  title        = {Variational Walkback: Learning a Transition Operator as a Stochastic
                  Recurrent Net},
  journal      = {CoRR},
  volume       = {abs/1711.02282},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.02282},
  eprinttype   = {arXiv},
  eprint       = {1711.02282},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-02282.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-02326,
  author       = {Ke, Nan Rosemary and
                  Goyal, Anirudh and
                  Bilaniuk, Olexa and
                  Binas, Jonathan and
                  Charlin, Laurent and
                  Pal, Chris and
                  Bengio, Yoshua},
  title        = {Sparse Attentive Backtracking: Long-Range Credit Assignment in Recurrent
                  Networks},
  journal      = {CoRR},
  volume       = {abs/1711.02326},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.02326},
  eprinttype   = {arXiv},
  eprint       = {1711.02326},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-02326.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-04623,
  author       = {Jastrzebski, Stanislaw and
                  Kenton, Zachary and
                  Arpit, Devansh and
                  Ballas, Nicolas and
                  Fischer, Asja and
                  Bengio, Yoshua and
                  Storkey, Amos J.},
  title        = {Three Factors Influencing Minima in {SGD}},
  journal      = {CoRR},
  volume       = {abs/1711.04623},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.04623},
  eprinttype   = {arXiv},
  eprint       = {1711.04623},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-04623.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-04755,
  author       = {Goyal, Anirudh and
                  Ke, Nan Rosemary and
                  Lamb, Alex and
                  Hjelm, R. Devon and
                  Pal, Chris and
                  Pineau, Joelle and
                  Bengio, Yoshua},
  title        = {{ACtuAL}: Actor-Critic Under Adversarial Learning},
  journal      = {CoRR},
  volume       = {abs/1711.04755},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.04755},
  eprinttype   = {arXiv},
  eprint       = {1711.04755},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-04755.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-05411,
  author       = {Goyal, Anirudh and
                  Sordoni, Alessandro and
                  C{\^{o}}t{\'{e}}, Marc{-}Alexandre and
                  Ke, Nan Rosemary and
                  Bengio, Yoshua},
  title        = {Z-Forcing: Training Stochastic Recurrent Networks},
  journal      = {CoRR},
  volume       = {abs/1711.05411},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.05411},
  eprinttype   = {arXiv},
  eprint       = {1711.05411},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-05411.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-05717,
  author       = {Shabanian, Samira and
                  Arpit, Devansh and
                  Trischler, Adam and
                  Bengio, Yoshua},
  title        = {Variational {Bi-LSTMs}},
  journal      = {CoRR},
  volume       = {abs/1711.05717},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.05717},
  eprinttype   = {arXiv},
  eprint       = {1711.05717},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-05717.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-08416,
  author       = {Scellier, Benjamin and
                  Bengio, Yoshua},
  title        = {Equivalence of Equilibrium Propagation and Recurrent Backpropagation},
  journal      = {CoRR},
  volume       = {abs/1711.08416},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.08416},
  eprinttype   = {arXiv},
  eprint       = {1711.08416},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-08416.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-10462,
  author       = {Dutil, Francis and
                  G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Trischler, Adam and
                  Bengio, Yoshua},
  title        = {Plan, Attend, Generate: Planning for Sequence-to-Sequence Models},
  journal      = {CoRR},
  volume       = {abs/1711.10462},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.10462},
  eprinttype   = {arXiv},
  eprint       = {1711.10462},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-10462.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-11561,
  author       = {Jo, Jason and
                  Bengio, Yoshua},
  title        = {Measuring the tendency of {CNNs} to Learn Surface Statistical Regularities},
  journal      = {CoRR},
  volume       = {abs/1711.11561},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.11561},
  eprinttype   = {arXiv},
  eprint       = {1711.11561},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-11561.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1712-04120,
  author       = {Lamb, Alex and
                  Hjelm, R. Devon and
                  Ganin, Yaroslav and
                  Cohen, Joseph Paul and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {{GibbsNet}: Iterative Adversarial Inference for Deep Graphical Models},
  journal      = {CoRR},
  volume       = {abs/1712.04120},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.04120},
  eprinttype   = {arXiv},
  eprint       = {1712.04120},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-04120.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@book{DBLP:books/daglib/0040158,
  author       = {Goodfellow, Ian J. and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  title        = {Deep Learning},
  series       = {Adaptive computation and machine learning},
  publisher    = {{MIT} Press},
  year         = {2016},
  url          = {http://www.deeplearningbook.org/},
  isbn         = {978-0-262-03561-3},
  timestamp    = {Sat, 25 Mar 2017 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/books/daglib/0040158.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jmlr/GulcehreB16,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Bengio, Yoshua},
  title        = {Knowledge Matters: Importance of Prior Information for Optimization},
  journal      = {J. Mach. Learn. Res.},
  volume       = {17},
  pages        = {8:1--8:32},
  year         = {2016},
  url          = {http://jmlr.org/papers/v17/gulchere16a.html},
  timestamp    = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/GulcehreB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jmui/KahouBLGMKJFDBF16,
  author       = {Kahou, Samira Ebrahimi and
                  Bouthillier, Xavier and
                  Lamblin, Pascal and
                  G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Michalski, Vincent and
                  Konda, Kishore and
                  Jean, S{\'{e}}bastien and
                  Froumenty, Pierre and
                  Dauphin, Yann N. and
                  Boulanger{-}Lewandowski, Nicolas and
                  Ferrari, Raul Chandias and
                  Mirza, Mehdi and
                  Warde{-}Farley, David and
                  Courville, Aaron C. and
                  Vincent, Pascal and
                  Memisevic, Roland and
                  Pal, Christopher Joseph and
                  Bengio, Yoshua},
  title        = {{EmoNets}: Multimodal deep learning approaches for emotion recognition
                  in video},
  journal      = {J. Multimodal User Interfaces},
  volume       = {10},
  number       = {2},
  pages        = {99--111},
  year         = {2016},
  url          = {https://doi.org/10.1007/s12193-015-0195-2},
  doi          = {10.1007/S12193-015-0195-2},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmui/KahouBLGMKJFDBF16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/pieee/HaykinWB16,
  author       = {Haykin, Simon and
                  Wright, Stephen J. and
                  Bengio, Yoshua},
  title        = {Big Data: Theoretical Aspects [Scanning the Issue]},
  journal      = {Proc. {IEEE}},
  volume       = {104},
  number       = {1},
  pages        = {8--10},
  year         = {2016},
  url          = {https://doi.org/10.1109/JPROC.2015.2507658},
  doi          = {10.1109/JPROC.2015.2507658},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/pieee/HaykinWB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tacl/HillCKB16,
  author       = {Hill, Felix and
                  Cho, Kyunghyun and
                  Korhonen, Anna and
                  Bengio, Yoshua},
  title        = {Learning to Understand Phrases by Embedding the Dictionary},
  journal      = {Trans. Assoc. Comput. Linguistics},
  volume       = {4},
  pages        = {17--30},
  year         = {2016},
  url          = {https://doi.org/10.1162/tacl\_a\_00080},
  doi          = {10.1162/TACL\_A\_00080},
  timestamp    = {Fri, 10 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tacl/HillCKB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/SerbanSBCP16,
  author       = {Serban, Iulian Vlad and
                  Sordoni, Alessandro and
                  Bengio, Yoshua and
                  Courville, Aaron C. and
                  Pineau, Joelle},
  editor       = {Schuurmans, Dale and
                  Wellman, Michael P.},
  title        = {Building End-To-End Dialogue Systems Using Generative Hierarchical
                  Neural Network Models},
  booktitle    = {Proceedings of the Thirtieth {AAAI} Conference on Artificial Intelligence,
                  February 12-17, 2016, Phoenix, Arizona, {USA}},
  pages        = {3776--3784},
  publisher    = {{AAAI} Press},
  year         = {2016},
  url          = {https://doi.org/10.1609/aaai.v30i1.9883},
  doi          = {10.1609/AAAI.V30I1.9883},
  timestamp    = {Mon, 04 Sep 2023 15:08:28 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/SerbanSBCP16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/acl/ChungCB16,
  author       = {Junyoung Chung and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {A Character-level Decoder without Explicit Segmentation for Neural
                  Machine Translation},
  booktitle    = {Proceedings of the 54th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2016, August 7-12, 2016, Berlin, Germany, Volume
                  1: Long Papers},
  publisher    = {The Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/p16-1160},
  doi          = {10.18653/V1/P16-1160},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/ChungCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/GulcehreANZB16,
  author       = {{\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Sungjin Ahn and
                  Ramesh Nallapati and
                  Bowen Zhou and
                  Yoshua Bengio},
  title        = {Pointing the Unknown Words},
  booktitle    = {Proceedings of the 54th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2016, August 7-12, 2016, Berlin, Germany, Volume
                  1: Long Papers},
  publisher    = {The Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/p16-1014},
  doi          = {10.18653/V1/P16-1014},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/GulcehreANZB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SerbanGGACCB16,
  author       = {Iulian Vlad Serban and
                  Alberto Garc{\'{\i}}a{-}Dur{\'{a}}n and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Sungjin Ahn and
                  Sarath Chandar and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Generating Factoid Questions With Recurrent Neural Networks: The {30M}
                  Factoid Question-Answer Corpus},
  booktitle    = {Proceedings of the 54th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2016, August 7-12, 2016, Berlin, Germany, Volume
                  1: Long Papers},
  publisher    = {The Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/p16-1056},
  doi          = {10.18653/V1/P16-1056},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SerbanGGACCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/bmvc/YaoBCSB16,
  author       = {Yao, Li and
                  Ballas, Nicolas and
                  Cho, Kyunghyun and
                  Smith, John R. and
                  Bengio, Yoshua},
  editor       = {Wilson, Richard C. and
                  Hancock, Edwin R. and
                  Smith, William A. P.},
  title        = {Oracle Performance for Visual Captioning},
  booktitle    = {Proceedings of the British Machine Vision Conference 2016, {BMVC}
                  2016, York, UK, September 19-22, 2016},
  publisher    = {{BMVA} Press},
  year         = {2016},
  url          = {http://www.bmva.org/bmvc/2016/papers/paper141/index.html},
  timestamp    = {Wed, 03 Feb 2021 08:36:18 +0100},
  biburl       = {https://dblp.org/rec/conf/bmvc/YaoBCSB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/VisinRCMCKBC16,
  author       = {Francesco Visin and
                  Adriana Romero and
                  Kyunghyun Cho and
                  Matteo Matteucci and
                  Marco Ciccone and
                  Kyle Kastner and
                  Yoshua Bengio and
                  Aaron C. Courville},
  title        = {{ReSeg}: {A} Recurrent Neural Network-Based Model for Semantic Segmentation},
  booktitle    = {2016 {IEEE} Conference on Computer Vision and Pattern Recognition
                  Workshops, {CVPR} Workshops 2016, Las Vegas, NV, USA, June 26 - July
                  1, 2016},
  pages        = {426--433},
  publisher    = {{IEEE} Computer Society},
  year         = {2016},
  url          = {https://doi.org/10.1109/CVPRW.2016.60},
  doi          = {10.1109/CVPRW.2016.60},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/VisinRCMCKBC16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/LaurentPBZB16,
  author       = {Laurent, C{\'{e}}sar and
                  Pereyra, Gabriel and
                  Brakel, Philemon and
                  Zhang, Ying and
                  Bengio, Yoshua},
  title        = {Batch normalized recurrent neural networks},
  booktitle    = {2016 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages        = {2657--2661},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/ICASSP.2016.7472159},
  doi          = {10.1109/ICASSP.2016.7472159},
  timestamp    = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/LaurentPBZB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/BahdanauCSBB16,
  author       = {Bahdanau, Dzmitry and
                  Chorowski, Jan and
                  Serdyuk, Dmitriy and
                  Brakel, Philemon and
                  Bengio, Yoshua},
  title        = {End-to-end attention-based large vocabulary speech recognition},
  booktitle    = {2016 {IEEE} International Conference on Acoustics, Speech and Signal
                  Processing, {ICASSP} 2016, Shanghai, China, March 20-25, 2016},
  pages        = {4945--4949},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/ICASSP.2016.7472618},
  doi          = {10.1109/ICASSP.2016.7472618},
  timestamp    = {Sat, 19 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BahdanauCSBB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ArjovskySB16,
  author       = {Mart{\'{\i}}n Arjovsky and
                  Amar Shah and
                  Yoshua Bengio},
  editor       = {Maria{-}Florina Balcan and
                  Kilian Q. Weinberger},
  title        = {Unitary Evolution Recurrent Neural Networks},
  booktitle    = {Proceedings of the 33rd International Conference on Machine Learning,
                  {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {48},
  pages        = {1120--1128},
  publisher    = {JMLR.org},
  year         = {2016},
  url          = {http://proceedings.mlr.press/v48/arjovsky16.html},
  timestamp    = {Wed, 29 May 2019 08:41:46 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ArjovskySB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/PezeshkiFBCB16,
  author       = {Mohammad Pezeshki and
                  Linxi Fan and
                  Philemon Brakel and
                  Aaron C. Courville and
                  Yoshua Bengio},
  editor       = {Maria{-}Florina Balcan and
                  Kilian Q. Weinberger},
  title        = {Deconstructing the Ladder Network Architecture},
  booktitle    = {Proceedings of the 33rd International Conference on Machine Learning,
                  {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {48},
  pages        = {2368--2376},
  publisher    = {JMLR.org},
  year         = {2016},
  url          = {http://proceedings.mlr.press/v48/pezeshki16.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/PezeshkiFBCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/BornscheinSFB16,
  author       = {J{\"{o}}rg Bornschein and
                  Samira Shabanian and
                  Asja Fischer and
                  Yoshua Bengio},
  editor       = {Maria{-}Florina Balcan and
                  Kilian Q. Weinberger},
  title        = {Bidirectional {Helmholtz} Machines},
  booktitle    = {Proceedings of the 33rd International Conference on Machine Learning,
                  {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {48},
  pages        = {2511--2519},
  publisher    = {JMLR.org},
  year         = {2016},
  url          = {http://proceedings.mlr.press/v48/bornschein16.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/BornscheinSFB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/GulcehreMDB16,
  author       = {{\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Marcin Moczulski and
                  Misha Denil and
                  Yoshua Bengio},
  editor       = {Maria{-}Florina Balcan and
                  Kilian Q. Weinberger},
  title        = {Noisy Activation Functions},
  booktitle    = {Proceedings of the 33rd International Conference on Machine Learning,
                  {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {48},
  pages        = {3059--3068},
  publisher    = {JMLR.org},
  year         = {2016},
  url          = {http://proceedings.mlr.press/v48/gulcehre16.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/GulcehreMDB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/ZhangPBZLBC16,
  author       = {Zhang, Ying and
                  Pezeshki, Mohammad and
                  Brakel, Phil{\'{e}}mon and
                  Zhang, Saizheng and
                  Laurent, C{\'{e}}sar and
                  Bengio, Yoshua and
                  Courville, Aaron C.},
  editor       = {Morgan, Nelson},
  title        = {Towards End-to-End Speech Recognition with Deep Convolutional Neural
                  Networks},
  booktitle    = {Interspeech 2016, 17th Annual Conference of the International Speech
                  Communication Association, San Francisco, CA, USA, September 8-12,
                  2016},
  pages        = {410--414},
  publisher    = {{ISCA}},
  year         = {2016},
  url          = {https://doi.org/10.21437/Interspeech.2016-1446},
  doi          = {10.21437/INTERSPEECH.2016-1446},
  timestamp    = {Mon, 26 Jun 2023 16:43:56 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/ZhangPBZLBC16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/miccai/HavaeiGCB16,
  author       = {Mohammad Havaei and
                  Nicolas Guizard and
                  Nicolas Chapados and
                  Yoshua Bengio},
  editor       = {S{\'{e}}bastien Ourselin and
                  Leo Joskowicz and
                  Mert R. Sabuncu and
                  G{\"{o}}zde B. {\"{U}}nal and
                  Wells, III, William M.},
  title        = {{HeMIS}: Hetero-Modal Image Segmentation},
  booktitle    = {Medical Image Computing and Computer-Assisted Intervention - {MICCAI}
                  2016 - 19th International Conference, Athens, Greece, October 17-21,
                  2016, Proceedings, Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {9901},
  pages        = {469--477},
  publisher    = {Springer},
  year         = {2016},
  url          = {https://doi.org/10.1007/978-3-319-46723-8\_54},
  doi          = {10.1007/978-3-319-46723-8\_54},
  timestamp    = {Fri, 08 Apr 2022 11:01:35 +0200},
  biburl       = {https://dblp.org/rec/conf/miccai/HavaeiGCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/FiratCB16,
  author       = {Orhan Firat and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  editor       = {Kevin Knight and
                  Ani Nenkova and
                  Owen Rambow},
  title        = {Multi-Way, Multilingual Neural Machine Translation with a Shared Attention
                  Mechanism},
  booktitle    = {{NAACL} {HLT} 2016, The 2016 Conference of the North American Chapter
                  of the Association for Computational Linguistics: Human Language Technologies,
                  San Diego, California, USA, June 12-17, 2016},
  pages        = {866--875},
  publisher    = {The Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/n16-1101},
  doi          = {10.18653/V1/N16-1101},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/FiratCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ZhangWCLMSB16,
  author       = {Zhang, Saizheng and
                  Wu, Yuhuai and
                  Che, Tong and
                  Lin, Zhouhan and
                  Memisevic, Roland and
                  Salakhutdinov, Ruslan and
                  Bengio, Yoshua},
  editor       = {Lee, Daniel D. and
                  Sugiyama, Masashi and
                  von Luxburg, Ulrike and
                  Guyon, Isabelle and
                  Garnett, Roman},
  title        = {Architectural Complexity Measures of Recurrent Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 29: Annual Conference
                  on Neural Information Processing Systems 2016, December 5-10, 2016,
                  Barcelona, Spain},
  pages        = {1822--1830},
  year         = {2016},
  url          = {https://proceedings.neurips.cc/paper/2016/hash/860320be12a1c050cd7731794e231bd3-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/ZhangWCLMSB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/WuZZBS16,
  author       = {Wu, Yuhuai and
                  Zhang, Saizheng and
                  Zhang, Ying and
                  Bengio, Yoshua and
                  Salakhutdinov, Ruslan},
  editor       = {Lee, Daniel D. and
                  Sugiyama, Masashi and
                  von Luxburg, Ulrike and
                  Guyon, Isabelle and
                  Garnett, Roman},
  title        = {On Multiplicative Integration with Recurrent Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 29: Annual Conference
                  on Neural Information Processing Systems 2016, December 5-10, 2016,
                  Barcelona, Spain},
  pages        = {2856--2864},
  year         = {2016},
  url          = {https://proceedings.neurips.cc/paper/2016/hash/f69e505b08403ad2298b9f262659929a-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/WuZZBS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/HubaraCSEB16,
  author       = {Hubara, Itay and
                  Courbariaux, Matthieu and
                  Soudry, Daniel and
                  El{-}Yaniv, Ran and
                  Bengio, Yoshua},
  editor       = {Lee, Daniel D. and
                  Sugiyama, Masashi and
                  von Luxburg, Ulrike and
                  Guyon, Isabelle and
                  Garnett, Roman},
  title        = {Binarized Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 29: Annual Conference
                  on Neural Information Processing Systems 2016, December 5-10, 2016,
                  Barcelona, Spain},
  pages        = {4107--4115},
  year         = {2016},
  url          = {https://proceedings.neurips.cc/paper/2016/hash/d8330f857a17c53d217014ee776bfd50-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/HubaraCSEB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GoyalLZZCB16,
  author       = {Goyal, Anirudh and
                  Lamb, Alex and
                  Zhang, Ying and
                  Zhang, Saizheng and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  editor       = {Lee, Daniel D. and
                  Sugiyama, Masashi and
                  von Luxburg, Ulrike and
                  Guyon, Isabelle and
                  Garnett, Roman},
  title        = {Professor Forcing: {A} New Algorithm for Training Recurrent Networks},
  booktitle    = {Advances in Neural Information Processing Systems 29: Annual Conference
                  on Neural Information Processing Systems 2016, December 5-10, 2016,
                  Barcelona, Spain},
  pages        = {4601--4609},
  year         = {2016},
  url          = {https://proceedings.neurips.cc/paper/2016/hash/16026d60ff9b54410b3435b403afd226-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/GoyalLZZCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/slt/RavanelliBOB16,
  author       = {Mirco Ravanelli and
                  Philemon Brakel and
                  Maurizio Omologo and
                  Yoshua Bengio},
  title        = {Batch-normalized joint training for {DNN}-based distant speech recognition},
  booktitle    = {2016 {IEEE} Spoken Language Technology Workshop, {SLT} 2016, San Diego,
                  CA, USA, December 13-16, 2016},
  pages        = {28--34},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/SLT.2016.7846241},
  doi          = {10.1109/SLT.2016.7846241},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/slt/RavanelliBOB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/wmt/ChungCB16,
  author       = {Junyoung Chung and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {{NYU-MILA} Neural Machine Translation Systems for {WMT}'16},
  booktitle    = {Proceedings of the First Conference on Machine Translation, {WMT}
                  2016, colocated with {ACL} 2016, August 11-12, Berlin, Germany},
  pages        = {268--271},
  publisher    = {The Association for Computational Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/w16-2309},
  doi          = {10.18653/V1/W16-2309},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/wmt/ChungCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/LinCMB15,
  author       = {Zhouhan Lin and
                  Matthieu Courbariaux and
                  Roland Memisevic and
                  Yoshua Bengio},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {Neural Networks with Few Multiplications},
  booktitle    = {4th International Conference on Learning Representations, {ICLR} 2016,
                  San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year         = {2016},
  url          = {http://arxiv.org/abs/1510.03009},
  eprinttype   = {arXiv},
  eprint       = {1510.03009},
  timestamp    = {Wed, 17 Jul 2019 10:40:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LinCMB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/iclr/2016,
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {4th International Conference on Learning Representations, {ICLR} 2016,
                  San Juan, Puerto Rico, May 2-4, 2016, Conference Track Proceedings},
  year         = {2016},
  url          = {https://iclr.cc/archive/www/doku.php\%3Fid=iclr2016:accepted-main.html},
  timestamp    = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/2016.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/FiratCB16,
  author       = {Orhan Firat and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {Multi-Way, Multilingual Neural Machine Translation with a Shared Attention
                  Mechanism},
  journal      = {CoRR},
  volume       = {abs/1601.01073},
  year         = {2016},
  url          = {http://arxiv.org/abs/1601.01073},
  eprinttype   = {arXiv},
  eprint       = {1601.01073},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/FiratCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/CourbariauxB16,
  author       = {Matthieu Courbariaux and
                  Yoshua Bengio},
  title        = {{BinaryNet}: Training Deep Neural Networks with Weights and Activations
                  Constrained to +1 or -1},
  journal      = {CoRR},
  volume       = {abs/1602.02830},
  year         = {2016},
  url          = {http://arxiv.org/abs/1602.02830},
  eprinttype   = {arXiv},
  eprint       = {1602.02830},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/CourbariauxB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ScellierB16,
  author       = {Scellier, Benjamin and
                  Bengio, Yoshua},
  title        = {Towards a Biologically Plausible Backprop},
  journal      = {CoRR},
  volume       = {abs/1602.05179},
  year         = {2016},
  url          = {http://arxiv.org/abs/1602.05179},
  eprinttype   = {arXiv},
  eprint       = {1602.05179},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ScellierB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZhangWCLMSB16,
  author       = {Zhang, Saizheng and
                  Wu, Yuhuai and
                  Che, Tong and
                  Lin, Zhouhan and
                  Memisevic, Roland and
                  Salakhutdinov, Ruslan and
                  Bengio, Yoshua},
  title        = {Architectural Complexity Measures of Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1602.08210},
  year         = {2016},
  url          = {http://arxiv.org/abs/1602.08210},
  eprinttype   = {arXiv},
  eprint       = {1602.08210},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ZhangWCLMSB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GulcehreMDB16,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Moczulski, Marcin and
                  Denil, Misha and
                  Bengio, Yoshua},
  title        = {Noisy Activation Functions},
  journal      = {CoRR},
  volume       = {abs/1603.00391},
  year         = {2016},
  url          = {http://arxiv.org/abs/1603.00391},
  eprinttype   = {arXiv},
  eprint       = {1603.00391},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GulcehreMDB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChungCB16,
  author       = {Chung, Junyoung and
                  Cho, Kyunghyun and
                  Bengio, Yoshua},
  title        = {A Character-level Decoder without Explicit Segmentation for Neural
                  Machine Translation},
  journal      = {CoRR},
  volume       = {abs/1603.06147},
  year         = {2016},
  url          = {http://arxiv.org/abs/1603.06147},
  eprinttype   = {arXiv},
  eprint       = {1603.06147},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChungCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SerbanGGACCB16,
  author       = {Iulian Vlad Serban and
                  Alberto Garc{\'{\i}}a{-}Dur{\'{a}}n and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Sungjin Ahn and
                  Sarath Chandar and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Generating Factoid Questions With Recurrent Neural Networks: The {30M}
                  Factoid Question-Answer Corpus},
  journal      = {CoRR},
  volume       = {abs/1603.06807},
  year         = {2016},
  url          = {http://arxiv.org/abs/1603.06807},
  eprinttype   = {arXiv},
  eprint       = {1603.06807},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerbanGGACCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GulcehreANZB16,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Ahn, Sungjin and
                  Nallapati, Ramesh and
                  Zhou, Bowen and
                  Bengio, Yoshua},
  title        = {Pointing the Unknown Words},
  journal      = {CoRR},
  volume       = {abs/1603.08148},
  year         = {2016},
  url          = {http://arxiv.org/abs/1603.08148},
  eprinttype   = {arXiv},
  eprint       = {1603.08148},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GulcehreANZB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/Al-RfouAAa16,
  author       = {Rami Al{-}Rfou and
                  Guillaume Alain and
                  Amjad Almahairi and
                  Christof Angerm{\"{u}}ller and
                  Dzmitry Bahdanau and
                  Nicolas Ballas and
                  Fr{\'{e}}d{\'{e}}ric Bastien and
                  Justin Bayer and
                  Anatoly Belikov and
                  Alexander Belopolsky and
                  Yoshua Bengio and
                  Arnaud Bergeron and
                  James Bergstra and
                  Valentin Bisson and
                  Josh Bleecher Snyder and
                  Nicolas Bouchard and
                  Nicolas Boulanger{-}Lewandowski and
                  Xavier Bouthillier and
                  Alexandre de Br{\'{e}}bisson and
                  Olivier Breuleux and
                  Pierre Luc Carrier and
                  Kyunghyun Cho and
                  Jan Chorowski and
                  Paul F. Christiano and
                  Tim Cooijmans and
                  Marc{-}Alexandre C{\^{o}}t{\'{e}} and
                  Myriam C{\^{o}}t{\'{e}} and
                  Aaron C. Courville and
                  Yann N. Dauphin and
                  Olivier Delalleau and
                  Julien Demouth and
                  Guillaume Desjardins and
                  Sander Dieleman and
                  Laurent Dinh and
                  Melanie Ducoffe and
                  Vincent Dumoulin and
                  Samira Ebrahimi Kahou and
                  Dumitru Erhan and
                  Ziye Fan and
                  Orhan Firat and
                  Mathieu Germain and
                  Xavier Glorot and
                  Ian J. Goodfellow and
                  Matthew Graham and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Philippe Hamel and
                  Iban Harlouchet and
                  Jean{-}Philippe Heng and
                  Bal{\'{a}}zs Hidasi and
                  Sina Honari and
                  Arjun Jain and
                  S{\'{e}}bastien Jean and
                  Kai Jia and
                  Mikhail Korobov and
                  Vivek Kulkarni and
                  Alex Lamb and
                  Pascal Lamblin and
                  Eric Larsen and
                  C{\'{e}}sar Laurent and
                  Sean Lee and
                  Simon Lefran{\c{c}}ois and
                  Simon Lemieux and
                  Nicholas L{\'{e}}onard and
                  Zhouhan Lin and
                  Jesse A. Livezey and
                  Cory Lorenz and
                  Jeremiah Lowin and
                  Qianli Ma and
                  Pierre{-}Antoine Manzagol and
                  Olivier Mastropietro and
                  Robert McGibbon and
                  Roland Memisevic and
                  Bart van Merri{\"{e}}nboer and
                  Vincent Michalski and
                  Mehdi Mirza and
                  Alberto Orlandi and
                  Christopher Joseph Pal and
                  Razvan Pascanu and
                  Mohammad Pezeshki and
                  Colin Raffel and
                  Daniel Renshaw and
                  Matthew Rocklin and
                  Adriana Romero and
                  Markus Roth and
                  Peter Sadowski and
                  John Salvatier and
                  Fran{\c{c}}ois Savard and
                  Jan Schl{\"{u}}ter and
                  John Schulman and
                  Gabriel Schwartz and
                  Iulian Vlad Serban and
                  Dmitriy Serdyuk and
                  Samira Shabanian and
                  {\'{E}}tienne Simon and
                  Sigurd Spieckermann and
                  S. Ramana Subramanyam and
                  Jakub Sygnowski and
                  J{\'{e}}r{\'{e}}mie Tanguay and
                  Gijs van Tulder and
                  Joseph P. Turian and
                  Sebastian Urban and
                  Pascal Vincent and
                  Francesco Visin and
                  Harm de Vries and
                  David Warde{-}Farley and
                  Dustin J. Webb and
                  Matthew Willson and
                  Kelvin Xu and
                  Lijun Xue and
                  Li Yao and
                  Saizheng Zhang and
                  Ying Zhang},
  title        = {Theano: {A} {Python} framework for fast computation of mathematical
                  expressions},
  journal      = {CoRR},
  volume       = {abs/1605.02688},
  year         = {2016},
  url          = {http://arxiv.org/abs/1605.02688},
  eprinttype   = {arXiv},
  eprint       = {1605.02688},
  timestamp    = {Thu, 30 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/Al-RfouAAa16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SerbanSLCPCB16,
  author       = {Serban, Iulian Vlad and
                  Sordoni, Alessandro and
                  Lowe, Ryan and
                  Charlin, Laurent and
                  Pineau, Joelle and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {A Hierarchical Latent Variable Encoder-Decoder Model for Generating
                  Dialogues},
  journal      = {CoRR},
  volume       = {abs/1605.06069},
  year         = {2016},
  url          = {http://arxiv.org/abs/1605.06069},
  eprinttype   = {arXiv},
  eprint       = {1605.06069},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerbanSLCPCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChandarALVTB16,
  author       = {Sarath Chandar and
                  Sungjin Ahn and
                  Hugo Larochelle and
                  Pascal Vincent and
                  Gerald Tesauro and
                  Yoshua Bengio},
  title        = {Hierarchical Memory Networks},
  journal      = {CoRR},
  volume       = {abs/1605.07427},
  year         = {2016},
  url          = {http://arxiv.org/abs/1605.07427},
  eprinttype    = {arXiv},
  eprint       = {1605.07427},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChandarALVTB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SerbanKTTZBC16,
  author       = {Iulian Vlad Serban and
                  Tim Klinger and
                  Gerald Tesauro and
                  Kartik Talamadupula and
                  Bowen Zhou and
                  Yoshua Bengio and
                  Aaron C. Courville},
  title        = {Multiresolution Recurrent Neural Networks: An Application to Dialogue
                  Response Generation},
  journal      = {CoRR},
  volume       = {abs/1606.00776},
  year         = {2016},
  url          = {http://arxiv.org/abs/1606.00776},
  eprinttype    = {arXiv},
  eprint       = {1606.00776},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerbanKTTZBC16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/KruegerMKPBKGBL16,
  author       = {David Krueger and
                  Tegan Maharaj and
                  J{\'{a}}nos Kram{\'{a}}r and
                  Mohammad Pezeshki and
                  Nicolas Ballas and
                  Nan Rosemary Ke and
                  Anirudh Goyal and
                  Yoshua Bengio and
                  Hugo Larochelle and
                  Aaron C. Courville and
                  Chris Pal},
  title        = {Zoneout: Regularizing {RNNs} by Randomly Preserving Hidden Activations},
  journal      = {CoRR},
  volume       = {abs/1606.01305},
  year         = {2016},
  url          = {http://arxiv.org/abs/1606.01305},
  eprinttype    = {arXiv},
  eprint       = {1606.01305},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KruegerMKPBKGBL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BengioSBSS16,
  author       = {Yoshua Bengio and
                  Benjamin Scellier and
                  Olexa Bilaniuk and
                  Jo{\~{a}}o Sacramento and
                  Walter Senn},
  title        = {Feedforward Initialization for Fast Inference of Deep Generative Networks
                  is biologically plausible},
  journal      = {CoRR},
  volume       = {abs/1606.01651},
  year         = {2016},
  url          = {http://arxiv.org/abs/1606.01651},
  eprinttype    = {arXiv},
  eprint       = {1606.01651},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioSBSS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SordoniBB16,
  author       = {Alessandro Sordoni and
                  Philip Bachman and
                  Yoshua Bengio},
  title        = {Iterative Alternating Neural Attention for Machine Reading},
  journal      = {CoRR},
  volume       = {abs/1606.02245},
  year         = {2016},
  url          = {http://arxiv.org/abs/1606.02245},
  eprinttype    = {arXiv},
  eprint       = {1606.02245},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SordoniBB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/KimB16,
  author       = {Taesup Kim and
                  Yoshua Bengio},
  title        = {Deep Directed Generative Models with Energy-Based Probability Estimation},
  journal      = {CoRR},
  volume       = {abs/1606.03439},
  year         = {2016},
  url          = {http://arxiv.org/abs/1606.03439},
  eprinttype    = {arXiv},
  eprint       = {1606.03439},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KimB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZhangBL16,
  author       = {Xu{-}Yao Zhang and
                  Yoshua Bengio and
                  Cheng{-}Lin Liu},
  title        = {Online and Offline Handwritten {Chinese} Character Recognition: {A}
                  Comprehensive Study and New Benchmark},
  journal      = {CoRR},
  volume       = {abs/1606.05763},
  year         = {2016},
  url          = {http://arxiv.org/abs/1606.05763},
  eprinttype    = {arXiv},
  eprint       = {1606.05763},
  timestamp    = {Tue, 16 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/ZhangBL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ZhangYZLB16,
  author       = {Xu{-}Yao Zhang and
                  Fei Yin and
                  Yan{-}Ming Zhang and
                  Cheng{-}Lin Liu and
                  Yoshua Bengio},
  title        = {Drawing and Recognizing {Chinese} Characters with Recurrent Neural Network},
  journal      = {CoRR},
  volume       = {abs/1606.06539},
  year         = {2016},
  url          = {http://arxiv.org/abs/1606.06539},
  eprinttype    = {arXiv},
  eprint       = {1606.06539},
  timestamp    = {Tue, 16 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/ZhangYZLB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/WuZZBS16,
  author       = {Yuhuai Wu and
                  Saizheng Zhang and
                  Ying Zhang and
                  Yoshua Bengio and
                  Ruslan Salakhutdinov},
  title        = {On Multiplicative Integration with Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1606.06630},
  year         = {2016},
  url          = {http://arxiv.org/abs/1606.06630},
  eprinttype    = {arXiv},
  eprint       = {1606.06630},
  timestamp    = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/WuZZBS16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GulcehreCCB16,
  author       = {{\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Sarath Chandar and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {Dynamic Neural {Turing} Machine with Soft and Hard Addressing Schemes},
  journal      = {CoRR},
  volume       = {abs/1607.00036},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.00036},
  eprinttype    = {arXiv},
  eprint       = {1607.00036},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GulcehreCCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChoiCB16,
  author       = {Heeyoul Choi and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {Context-Dependent Word Representation for Neural Machine Translation},
  journal      = {CoRR},
  volume       = {abs/1607.00578},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.00578},
  eprinttype    = {arXiv},
  eprint       = {1607.00578},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChoiCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HavaeiGCB16,
  author       = {Mohammad Havaei and
                  Nicolas Guizard and
                  Nicolas Chapados and
                  Yoshua Bengio},
  title        = {{HeMIS}: Hetero-Modal Image Segmentation},
  journal      = {CoRR},
  volume       = {abs/1607.05194},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.05194},
  eprinttype    = {arXiv},
  eprint       = {1607.05194},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HavaeiGCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BahdanauBXGLPCB16,
  author       = {Dzmitry Bahdanau and
                  Philemon Brakel and
                  Kelvin Xu and
                  Anirudh Goyal and
                  Ryan Lowe and
                  Joelle Pineau and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {An Actor-Critic Algorithm for Sequence Prediction},
  journal      = {CoRR},
  volume       = {abs/1607.07086},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.07086},
  eprinttype    = {arXiv},
  eprint       = {1607.07086},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauBXGLPCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/AhnCPB16,
  author       = {Sungjin Ahn and
                  Heeyoul Choi and
                  Tanel P{\"{a}}rnamaa and
                  Yoshua Bengio},
  title        = {A Neural Knowledge Language Model},
  journal      = {CoRR},
  volume       = {abs/1608.00318},
  year         = {2016},
  url          = {http://arxiv.org/abs/1608.00318},
  eprinttype    = {arXiv},
  eprint       = {1608.00318},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AhnCPB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GulcehreMVB16,
  author       = {{\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Marcin Moczulski and
                  Francesco Visin and
                  Yoshua Bengio},
  title        = {Mollifying Networks},
  journal      = {CoRR},
  volume       = {abs/1608.04980},
  year         = {2016},
  url          = {http://arxiv.org/abs/1608.04980},
  eprinttype    = {arXiv},
  eprint       = {1608.04980},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GulcehreMVB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/OttLZLB16,
  author       = {Joachim Ott and
                  Zhouhan Lin and
                  Ying Zhang and
                  Shih{-}Chii Liu and
                  Yoshua Bengio},
  title        = {Recurrent Neural Networks With Limited Numerical Precision},
  journal      = {CoRR},
  volume       = {abs/1608.06902},
  year         = {2016},
  url          = {http://arxiv.org/abs/1608.06902},
  eprinttype    = {arXiv},
  eprint       = {1608.06902},
  timestamp    = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/OttLZLB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChungAB16,
  author       = {Junyoung Chung and
                  Sungjin Ahn and
                  Yoshua Bengio},
  title        = {Hierarchical Multiscale Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1609.01704},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.01704},
  eprinttype    = {arXiv},
  eprint       = {1609.01704},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChungAB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HubaraCSEB16,
  author       = {Itay Hubara and
                  Matthieu Courbariaux and
                  Daniel Soudry and
                  Ran El{-}Yaniv and
                  Yoshua Bengio},
  title        = {Quantized Neural Networks: Training Neural Networks with Low Precision
                  Weights and Activations},
  journal      = {CoRR},
  volume       = {abs/1609.07061},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.07061},
  eprinttype    = {arXiv},
  eprint       = {1609.07061},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HubaraCSEB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/AlainB16,
  author       = {Guillaume Alain and
                  Yoshua Bengio},
  title        = {Understanding intermediate layers using linear classifier probes},
  journal      = {CoRR},
  volume       = {abs/1610.01644},
  year         = {2016},
  url          = {http://arxiv.org/abs/1610.01644},
  eprinttype    = {arXiv},
  eprint       = {1610.01644},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AlainB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LambGZZCB16,
  author       = {Alex Lamb and
                  Anirudh Goyal and
                  Ying Zhang and
                  Saizheng Zhang and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Professor Forcing: {A} New Algorithm for Training Recurrent Networks},
  journal      = {CoRR},
  volume       = {abs/1610.09038},
  year         = {2016},
  url          = {http://arxiv.org/abs/1610.09038},
  eprinttype    = {arXiv},
  eprint       = {1610.09038},
  timestamp    = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LambGZZCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/OttLZLB16a,
  author       = {Joachim Ott and
                  Zhouhan Lin and
                  Ying Zhang and
                  Shih{-}Chii Liu and
                  Yoshua Bengio},
  title        = {Recurrent Neural Networks With Limited Numerical Precision},
  journal      = {CoRR},
  volume       = {abs/1611.07065},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.07065},
  eprinttype    = {arXiv},
  eprint       = {1611.07065},
  timestamp    = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/OttLZLB16a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/JegouDVRB16,
  author       = {Simon J{\'{e}}gou and
                  Michal Drozdzal and
                  David V{\'{a}}zquez and
                  Adriana Romero and
                  Yoshua Bengio},
  title        = {The One Hundred Layers Tiramisu: Fully Convolutional {DenseNets} for
                  Semantic Segmentation},
  journal      = {CoRR},
  volume       = {abs/1611.09326},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.09326},
  eprinttype    = {arXiv},
  eprint       = {1611.09326},
  timestamp    = {Fri, 14 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/JegouDVRB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/RomeroCESADLDHB16,
  author       = {Adriana Romero and
                  Pierre Luc Carrier and
                  Akram Erraqabi and
                  Tristan Sylvain and
                  Alex Auvolat and
                  Etienne Dejoie and
                  Marc{-}Andr{\'{e}} Legault and
                  Marie{-}Pierre Dub{\'{e}} and
                  Julie G. Hussin and
                  Yoshua Bengio},
  title        = {Diet Networks: Thin Parameters for Fat Genomics},
  journal      = {CoRR},
  volume       = {abs/1611.09340},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.09340},
  eprinttype    = {arXiv},
  eprint       = {1611.09340},
  timestamp    = {Fri, 27 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/RomeroCESADLDHB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/NguyenYBDC16,
  author       = {Anh Nguyen and
                  Jason Yosinski and
                  Yoshua Bengio and
                  Alexey Dosovitskiy and
                  Jeff Clune},
  title        = {Plug {\&} Play Generative Networks: Conditional Iterative Generation
                  of Images in Latent Space},
  journal      = {CoRR},
  volume       = {abs/1612.00005},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.00005},
  eprinttype    = {arXiv},
  eprint       = {1612.00005},
  timestamp    = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/NguyenYBDC16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SerdyukABRTB16,
  author       = {Dmitriy Serdyuk and
                  Kartik Audhkhasi and
                  Philemon Brakel and
                  Bhuvana Ramabhadran and
                  Samuel Thomas and
                  Yoshua Bengio},
  title        = {Invariant Representations for Noisy Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1612.01928},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.01928},
  eprinttype    = {arXiv},
  eprint       = {1612.01928},
  timestamp    = {Fri, 03 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerdyukABRTB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/CheLJBL16,
  author       = {Tong Che and
                  Yanran Li and
                  Athul Paul Jacob and
                  Yoshua Bengio and
                  Wenjie Li},
  title        = {Mode Regularized Generative Adversarial Networks},
  journal      = {CoRR},
  volume       = {abs/1612.02136},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.02136},
  eprinttype    = {arXiv},
  eprint       = {1612.02136},
  timestamp    = {Wed, 15 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/CheLJBL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MirzaCB16,
  author       = {Mehdi Mirza and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Generalizable Features From Unsupervised Learning},
  journal      = {CoRR},
  volume       = {abs/1612.03809},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.03809},
  eprinttype    = {arXiv},
  eprint       = {1612.03809},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/MirzaCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MongiaKEB16,
  author       = {Mihir Mongia and
                  Kundan Kumar and
                  Akram Erraqabi and
                  Yoshua Bengio},
  title        = {On Random Weights for Texture Generation in One Layer Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1612.06070},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.06070},
  eprinttype    = {arXiv},
  eprint       = {1612.06070},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/MongiaKEB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MehriKGKJSCB16,
  author       = {Soroush Mehri and
                  Kundan Kumar and
                  Ishaan Gulrajani and
                  Rithesh Kumar and
                  Shubham Jain and
                  Jose Sotelo and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {{SampleRNN}: An Unconditional End-to-End Neural Audio Generation Model},
  journal      = {CoRR},
  volume       = {abs/1612.07837},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.07837},
  eprinttype    = {arXiv},
  eprint       = {1612.07837},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/MehriKGKJSCB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nature/LeCunBH15,
  author       = {Yann LeCun and
                  Yoshua Bengio and
                  Geoffrey E. Hinton},
  title        = {Deep learning},
  journal      = {Nat.},
  volume       = {521},
  number       = {7553},
  pages        = {436--444},
  year         = {2015},
  url          = {https://doi.org/10.1038/nature14539},
  doi          = {10.1038/NATURE14539},
  timestamp    = {Mon, 08 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/nature/LeCunBH15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/BengioL15,
  author       = {Yoshua Bengio and
                  Honglak Lee},
  title        = {Editorial introduction to the Neural Networks special issue on Deep
                  Learning of Representations},
  journal      = {Neural Networks},
  volume       = {64},
  pages        = {1--3},
  year         = {2015},
  url          = {https://doi.org/10.1016/j.neunet.2014.12.006},
  doi          = {10.1016/J.NEUNET.2014.12.006},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nn/BengioL15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/GoodfellowECCMH15,
  author       = {Ian J. Goodfellow and
                  Dumitru Erhan and
                  Pierre Luc Carrier and
                  Aaron C. Courville and
                  Mehdi Mirza and
                  Benjamin Hamner and
                  William Cukierski and
                  Yichuan Tang and
                  David Thaler and
                  Dong{-}Hyun Lee and
                  Yingbo Zhou and
                  Chetan Ramaiah and
                  Fangxiang Feng and
                  Ruifan Li and
                  Xiaojie Wang and
                  Dimitris Athanasakis and
                  John Shawe{-}Taylor and
                  Maxim Milakov and
                  John Park and
                  Radu Tudor Ionescu and
                  Marius Popescu and
                  Cristian Grozea and
                  James Bergstra and
                  Jingjing Xie and
                  Lukasz Romaszko and
                  Bing Xu and
                  Zhang Chuang and
                  Yoshua Bengio},
  title        = {Challenges in representation learning: {A} report on three machine
                  learning contests},
  journal      = {Neural Networks},
  volume       = {64},
  pages        = {59--63},
  year         = {2015},
  url          = {https://doi.org/10.1016/j.neunet.2014.09.005},
  doi          = {10.1016/J.NEUNET.2014.09.005},
  timestamp    = {Mon, 15 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/nn/GoodfellowECCMH15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/taslp/MesnilDYBDHHHTY15,
  author       = {Gr{\'{e}}goire Mesnil and
                  Yann N. Dauphin and
                  Kaisheng Yao and
                  Yoshua Bengio and
                  Li Deng and
                  Dilek Hakkani{-}T{\"{u}}r and
                  Xiaodong He and
                  Larry P. Heck and
                  G{\"{o}}khan T{\"{u}}r and
                  Dong Yu and
                  Geoffrey Zweig},
  title        = {Using Recurrent Neural Networks for Slot Filling in Spoken Language
                  Understanding},
  journal      = {{IEEE} {ACM} Trans. Audio Speech Lang. Process.},
  volume       = {23},
  number       = {3},
  pages        = {530--539},
  year         = {2015},
  url          = {https://doi.org/10.1109/TASLP.2014.2383614},
  doi          = {10.1109/TASLP.2014.2383614},
  timestamp    = {Fri, 13 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/taslp/MesnilDYBDHHHTY15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tmm/ChoCB15,
  author       = {Kyunghyun Cho and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Describing Multimedia Content Using Attention-Based Encoder-Decoder
                  Networks},
  journal      = {{IEEE} Trans. Multim.},
  volume       = {17},
  number       = {11},
  pages        = {1875--1886},
  year         = {2015},
  url          = {https://doi.org/10.1109/TMM.2015.2477044},
  doi          = {10.1109/TMM.2015.2477044},
  timestamp    = {Thu, 01 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tmm/ChoCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/JeanCMB15,
  author       = {S{\'{e}}bastien Jean and
                  Kyunghyun Cho and
                  Roland Memisevic and
                  Yoshua Bengio},
  title        = {On Using Very Large Target Vocabulary for Neural Machine Translation},
  booktitle    = {Proceedings of the 53rd Annual Meeting of the Association for Computational
                  Linguistics and the 7th International Joint Conference on Natural
                  Language Processing of the Asian Federation of Natural Language Processing,
                  {ACL} 2015, July 26-31, 2015, Beijing, China, Volume 1: Long Papers},
  pages        = {1--10},
  publisher    = {The Association for Computational Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.3115/v1/p15-1001},
  doi          = {10.3115/V1/P15-1001},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/JeanCMB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acpr/Bengio15,
  author       = {Yoshua Bengio},
  title        = {{IAPR} keynote lecture {IV:} Deep learning},
  booktitle    = {3rd {IAPR} Asian Conference on Pattern Recognition, {ACPR} 2015, Kuala
                  Lumpur, Malaysia, November 3-6, 2015},
  pages        = {xx},
  publisher    = {{IEEE}},
  year         = {2015},
  url          = {https://doi.org/10.1109/ACPR.2015.7486451},
  doi          = {10.1109/ACPR.2015.7486451},
  timestamp    = {Wed, 16 Oct 2019 14:14:56 +0200},
  biburl       = {https://dblp.org/rec/conf/acpr/Bengio15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cikm/SordoniBVLSN15,
  author       = {Alessandro Sordoni and
                  Yoshua Bengio and
                  Hossein Vahabi and
                  Christina Lioma and
                  Jakob Grue Simonsen and
                  Jian{-}Yun Nie},
  editor       = {James Bailey and
                  Alistair Moffat and
                  Charu C. Aggarwal and
                  Maarten de Rijke and
                  Ravi Kumar and
                  Vanessa Murdock and
                  Timos K. Sellis and
                  Jeffrey Xu Yu},
  title        = {A Hierarchical Recurrent Encoder-Decoder for Generative Context-Aware
                  Query Suggestion},
  booktitle    = {Proceedings of the 24th {ACM} International Conference on Information
                  and Knowledge Management, {CIKM} 2015, Melbourne, VIC, Australia,
                  October 19 - 23, 2015},
  pages        = {553--562},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {https://doi.org/10.1145/2806416.2806493},
  doi          = {10.1145/2806416.2806493},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cikm/SordoniBVLSN15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/GouwsBC15,
  author       = {Stephan Gouws and
                  Yoshua Bengio and
                  Greg Corrado},
  editor       = {Francis R. Bach and
                  David M. Blei},
  title        = {{BilBOWA}: Fast Bilingual Distributed Representations without Word Alignments},
  booktitle    = {Proceedings of the 32nd International Conference on Machine Learning,
                  {ICML} 2015, Lille, France, 6-11 July 2015},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {37},
  pages        = {748--756},
  publisher    = {JMLR.org},
  year         = {2015},
  url          = {http://proceedings.mlr.press/v37/gouws15.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/GouwsBC15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/XuBKCCSZB15,
  author       = {Kelvin Xu and
                  Jimmy Ba and
                  Ryan Kiros and
                  Kyunghyun Cho and
                  Aaron C. Courville and
                  Ruslan Salakhutdinov and
                  Richard S. Zemel and
                  Yoshua Bengio},
  editor       = {Francis R. Bach and
                  David M. Blei},
  title        = {Show, Attend and Tell: Neural Image Caption Generation with Visual
                  Attention},
  booktitle    = {Proceedings of the 32nd International Conference on Machine Learning,
                  {ICML} 2015, Lille, France, 6-11 July 2015},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {37},
  pages        = {2048--2057},
  publisher    = {JMLR.org},
  year         = {2015},
  url          = {http://proceedings.mlr.press/v37/xuc15.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/XuBKCCSZB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/ChungGCB15,
  author       = {Junyoung Chung and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  editor       = {Francis R. Bach and
                  David M. Blei},
  title        = {Gated Feedback Recurrent Neural Networks},
  booktitle    = {Proceedings of the 32nd International Conference on Machine Learning,
                  {ICML} 2015, Lille, France, 6-11 July 2015},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {37},
  pages        = {2067--2075},
  publisher    = {JMLR.org},
  year         = {2015},
  url          = {http://proceedings.mlr.press/v37/chung15.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ChungGCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChorowskiBSCB15,
  author       = {Jan Chorowski and
                  Dzmitry Bahdanau and
                  Dmitriy Serdyuk and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  editor       = {Corinna Cortes and
                  Neil D. Lawrence and
                  Daniel D. Lee and
                  Masashi Sugiyama and
                  Roman Garnett},
  title        = {Attention-Based Models for Speech Recognition},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {577--585},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/1068c6e4c8051cfd4e9ea8072e3189e2-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/ChorowskiBSCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DauphinVB15,
  author       = {Dauphin, Yann N. and
                  de Vries, Harm and
                  Bengio, Yoshua},
  editor       = {Cortes, Corinna and
                  Lawrence, Neil D. and
                  Lee, Daniel D. and
                  Sugiyama, Masashi and
                  Garnett, Roman},
  title        = {Equilibrated adaptive learning rates for non-convex optimization},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {1504--1512},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/430c3626b879b4005d41b8a46172e0c0-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DauphinVB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChungKDGCB15,
  author       = {Chung, Junyoung and
                  Kastner, Kyle and
                  Dinh, Laurent and
                  Goel, Kratarth and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  editor       = {Cortes, Corinna and
                  Lawrence, Neil D. and
                  Lee, Daniel D. and
                  Sugiyama, Masashi and
                  Garnett, Roman},
  title        = {A Recurrent Latent Variable Model for Sequential Data},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {2980--2988},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/b618c3210e934362ac261db280128c22-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ChungKDGCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/CourbariauxBD15,
  author       = {Courbariaux, Matthieu and
                  Bengio, Yoshua and
                  David, Jean{-}Pierre},
  editor       = {Cortes, Corinna and
                  Lawrence, Neil D. and
                  Lee, Daniel D. and
                  Sugiyama, Masashi and
                  Garnett, Roman},
  title        = {{BinaryConnect}: Training Deep Neural Networks with binary weights during
                  propagations},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {3123--3131},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/3e15cc11f979ed25912dff5b0669f2cd-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/CourbariauxBD15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/BrebissonSAVB15,
  author       = {de Br{\'{e}}bisson, Alexandre and
                  Simon, {\'{E}}tienne and
                  Auvolat, Alex and
                  Vincent, Pascal and
                  Bengio, Yoshua},
  editor       = {Us{\'{o}}, Adolfo Mart{\'{\i}}nez and
                  Mendes{-}Moreira, Jo{\~{a}}o and
                  Moreira{-}Matias, Lu{\'{\i}}s and
                  Kull, Meelis and
                  Lachiche, Nicolas},
  title        = {Artificial Neural Networks Applied to Taxi Destination Prediction},
  booktitle    = {Proceedings of the {ECML/PKDD} 2015 Discovery Challenges co-located
                  with European Conference on Machine Learning and Principles and Practice
                  of Knowledge Discovery in Databases ({ECML-PKDD} 2015), Porto, Portugal,
                  September 7-11, 2015},
  series       = {{CEUR} Workshop Proceedings},
  volume       = {1526},
  publisher    = {CEUR-WS.org},
  year         = {2015},
  url          = {https://ceur-ws.org/Vol-1526/paper21.pdf},
  timestamp    = {Mon, 03 Apr 2023 18:25:50 +0200},
  biburl       = {https://dblp.org/rec/conf/pkdd/BrebissonSAVB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/LeeZFB15,
  author       = {Lee, Dong{-}Hyun and
                  Zhang, Saizheng and
                  Fischer, Asja and
                  Bengio, Yoshua},
  editor       = {Appice, Annalisa and
                  Rodrigues, Pedro Pereira and
                  Costa, V{\'{\i}}tor Santos and
                  Soares, Carlos and
                  Gama, Jo{\~{a}}o and
                  Jorge, Al{\'{\i}}pio},
  title        = {Difference Target Propagation},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases - European Conference,
                  {ECML} {PKDD} 2015, Porto, Portugal, September 7-11, 2015, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {9284},
  pages        = {498--515},
  publisher    = {Springer},
  year         = {2015},
  url          = {https://doi.org/10.1007/978-3-319-23528-8\_31},
  doi          = {10.1007/978-3-319-23528-8\_31},
  timestamp    = {Mon, 30 Nov 2020 08:47:26 +0100},
  biburl       = {https://dblp.org/rec/conf/pkdd/LeeZFB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/wmt/JeanFCMB15,
  author       = {Jean, S{\'{e}}bastien and
                  Firat, Orhan and
                  Cho, Kyunghyun and
                  Memisevic, Roland and
                  Bengio, Yoshua},
  title        = {Montreal Neural Machine Translation Systems for {WMT'15}},
  booktitle    = {Proceedings of the Tenth Workshop on Statistical Machine Translation,
                  WMT@EMNLP 2015, 17-18 September 2015, Lisbon, Portugal},
  pages        = {134--140},
  publisher    = {The Association for Computer Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.18653/v1/w15-3014},
  doi          = {10.18653/V1/W15-3014},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/wmt/JeanFCMB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/BahdanauCB14,
  author       = {Bahdanau, Dzmitry and
                  Cho, Kyunghyun and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Neural Machine Translation by Jointly Learning to Align and Translate},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1409.0473},
  timestamp    = {Wed, 17 Jul 2019 10:40:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/BornscheinB14,
  author       = {Bornschein, J{\"{o}}rg and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Reweighted Wake-Sleep},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1406.2751},
  timestamp    = {Fri, 29 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/BornscheinB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/CourbariauxBD14,
  author       = {Courbariaux, Matthieu and
                  Bengio, Yoshua and
                  David, Jean{-}Pierre},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Low precision arithmetic for deep learning},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Workshop Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1412.7024},
  timestamp    = {Wed, 17 Jul 2019 10:40:54 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/CourbariauxBD14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/DinhKB14,
  author       = {Dinh, Laurent and
                  Krueger, David and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {{NICE:} Non-linear Independent Components Estimation},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Workshop Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1410.8516},
  timestamp    = {Fri, 29 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/DinhKB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/HillCJDB14a,
  author       = {Hill, Felix and
                  Cho, Kyunghyun and
                  Jean, S{\'{e}}bastien and
                  Devin, Coline and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Embedding Word Similarity with Neural Machine Translation},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Workshop Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1412.6448},
  timestamp    = {Fri, 29 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/HillCJDB14a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/LeeZBB14,
  author       = {Lee, Dong{-}Hyun and
                  Zhang, Saizheng and
                  Biard, Antoine and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Target Propagation},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Workshop Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1412.7525},
  timestamp    = {Fri, 29 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/LeeZBB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/MesnilMRB14,
  author       = {Mesnil, Gr{\'{e}}goire and
                  Mikolov, Tom{\'{a}}s and
                  Ranzato, Marc'Aurelio and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Ensemble of Generative and Discriminative Techniques for Sentiment
                  Analysis of Movie Reviews},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Workshop Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1412.5335},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/MesnilMRB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/RomeroBKCGB14,
  author       = {Romero, Adriana and
                  Ballas, Nicolas and
                  Kahou, Samira Ebrahimi and
                  Chassang, Antoine and
                  Gatta, Carlo and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {{FitNets}: Hints for Thin Deep Nets},
  booktitle    = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year         = {2015},
  url          = {http://arxiv.org/abs/1412.6550},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RomeroBKCGB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/iclr/2015,
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Conference Track Proceedings},
  year         = {2015},
  url          = {https://iclr.cc/archive/www/doku.php\%3Fid=iclr2015:accepted-main.html},
  timestamp    = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/2015.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/iclr/2015w,
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {3rd International Conference on Learning Representations, {ICLR} 2015,
                  San Diego, CA, USA, May 7-9, 2015, Workshop Track Proceedings},
  year         = {2015},
  url          = {https://iclr.cc/archive/www/doku.php\%3Fid=iclr2015:accepted-main.html},
  timestamp    = {Wed, 17 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/2015w.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChungGCB15,
  author       = {Chung, Junyoung and
                  G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Cho, Kyunghyun and
                  Bengio, Yoshua},
  title        = {Gated Feedback Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1502.02367},
  year         = {2015},
  url          = {http://arxiv.org/abs/1502.02367},
  eprinttype   = {arXiv},
  eprint       = {1502.02367},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChungGCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/XuBKCCSZB15,
  author       = {Xu, Kelvin and
                  Ba, Jimmy and
                  Kiros, Ryan and
                  Cho, Kyunghyun and
                  Courville, Aaron C. and
                  Salakhutdinov, Ruslan and
                  Zemel, Richard S. and
                  Bengio, Yoshua},
  title        = {Show, Attend and Tell: Neural Image Caption Generation with Visual
                  Attention},
  journal      = {CoRR},
  volume       = {abs/1502.03044},
  year         = {2015},
  url          = {http://arxiv.org/abs/1502.03044},
  eprinttype   = {arXiv},
  eprint       = {1502.03044},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/XuBKCCSZB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BengioLBL15,
  author       = {Bengio, Yoshua and
                  Lee, Dong{-}Hyun and
                  Bornschein, J{\"{o}}rg and
                  Lin, Zhouhan},
  title        = {Towards Biologically Plausible Deep Learning},
  journal      = {CoRR},
  volume       = {abs/1502.04156},
  year         = {2015},
  url          = {http://arxiv.org/abs/1502.04156},
  eprinttype   = {arXiv},
  eprint       = {1502.04156},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioLBL15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/DauphinVCB15,
  author       = {Dauphin, Yann N. and
                  de Vries, Harm and
                  Chung, Junyoung and
                  Bengio, Yoshua},
  title        = {{RMSProp} and equilibrated adaptive learning rates for non-convex optimization},
  journal      = {CoRR},
  volume       = {abs/1502.04390},
  year         = {2015},
  url          = {http://arxiv.org/abs/1502.04390},
  eprinttype   = {arXiv},
  eprint       = {1502.04390},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DauphinVCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/KahouBLGMKJFDBF15,
  author       = {Kahou, Samira Ebrahimi and
                  Bouthillier, Xavier and
                  Lamblin, Pascal and
                  G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Michalski, Vincent and
                  Konda, Kishore Reddy and
                  Jean, S{\'{e}}bastien and
                  Froumenty, Pierre and
                  Dauphin, Yann N. and
                  Boulanger{-}Lewandowski, Nicolas and
                  Ferrari, Raul Chandias and
                  Mirza, Mehdi and
                  Warde{-}Farley, David and
                  Courville, Aaron C. and
                  Vincent, Pascal and
                  Memisevic, Roland and
                  Pal, Christopher J. and
                  Bengio, Yoshua},
  title        = {{EmoNets}: Multimodal deep learning approaches for emotion recognition
                  in video},
  journal      = {CoRR},
  volume       = {abs/1503.01800},
  year         = {2015},
  url          = {http://arxiv.org/abs/1503.01800},
  eprinttype   = {arXiv},
  eprint       = {1503.01800},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KahouBLGMKJFDBF15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GulcehreFXCBLBS15,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Firat, Orhan and
                  Xu, Kelvin and
                  Cho, Kyunghyun and
                  Barrault, Lo{\"{\i}}c and
                  Lin, Huei{-}Chi and
                  Bougares, Fethi and
                  Schwenk, Holger and
                  Bengio, Yoshua},
  title        = {On Using Monolingual Corpora in Neural Machine Translation},
  journal      = {CoRR},
  volume       = {abs/1503.03535},
  year         = {2015},
  url          = {http://arxiv.org/abs/1503.03535},
  eprinttype   = {arXiv},
  eprint       = {1503.03535},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GulcehreFXCBLBS15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/AlainBYYTZV15,
  author       = {Alain, Guillaume and
                  Bengio, Yoshua and
                  Yao, Li and
                  Yosinski, Jason and
                  Thibodeau{-}Laufer, Eric and
                  Zhang, Saizheng and
                  Vincent, Pascal},
  title        = {{GSNs} : Generative Stochastic Networks},
  journal      = {CoRR},
  volume       = {abs/1503.05571},
  year         = {2015},
  url          = {http://arxiv.org/abs/1503.05571},
  eprinttype   = {arXiv},
  eprint       = {1503.05571},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AlainBYYTZV15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HillCKB15,
  author       = {Hill, Felix and
                  Cho, Kyunghyun and
                  Korhonen, Anna and
                  Bengio, Yoshua},
  title        = {Learning to Understand Phrases by Embedding the Dictionary},
  journal      = {CoRR},
  volume       = {abs/1504.00548},
  year         = {2015},
  url          = {http://arxiv.org/abs/1504.00548},
  eprinttype   = {arXiv},
  eprint       = {1504.00548},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HillCKB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/VisinKCMCB15,
  author       = {Visin, Francesco and
                  Kastner, Kyle and
                  Cho, Kyunghyun and
                  Matteucci, Matteo and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {{ReNet}: {A} Recurrent Neural Network Based Alternative to Convolutional
                  Networks},
  journal      = {CoRR},
  volume       = {abs/1505.00393},
  year         = {2015},
  url          = {http://arxiv.org/abs/1505.00393},
  eprinttype   = {arXiv},
  eprint       = {1505.00393},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/VisinKCMCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/HavaeiDWBCBPJL15,
  author       = {Havaei, Mohammad and
                  Davy, Axel and
                  Warde{-}Farley, David and
                  Biard, Antoine and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Pal, Chris and
                  Jodoin, Pierre{-}Marc and
                  Larochelle, Hugo},
  title        = {Brain Tumor Segmentation with Deep Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1505.03540},
  year         = {2015},
  url          = {http://arxiv.org/abs/1505.03540},
  eprinttype   = {arXiv},
  eprint       = {1505.03540},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/HavaeiDWBCBPJL15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/MerrienboerBDSW15,
  author       = {van Merri{\"{e}}nboer, Bart and
                  Bahdanau, Dzmitry and
                  Dumoulin, Vincent and
                  Serdyuk, Dmitriy and
                  Warde{-}Farley, David and
                  Chorowski, Jan and
                  Bengio, Yoshua},
  title        = {{Blocks} and {Fuel}: Frameworks for deep learning},
  journal      = {CoRR},
  volume       = {abs/1506.00619},
  year         = {2015},
  url          = {http://arxiv.org/abs/1506.00619},
  eprinttype   = {arXiv},
  eprint       = {1506.00619},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/MerrienboerBDSW15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChungKDGCB15,
  author       = {Chung, Junyoung and
                  Kastner, Kyle and
                  Dinh, Laurent and
                  Goel, Kratarth and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {A Recurrent Latent Variable Model for Sequential Data},
  journal      = {CoRR},
  volume       = {abs/1506.02216},
  year         = {2015},
  url          = {http://arxiv.org/abs/1506.02216},
  eprinttype   = {arXiv},
  eprint       = {1506.02216},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChungKDGCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BornscheinSFB15,
  author       = {Bornschein, J{\"{o}}rg and
                  Shabanian, Samira and
                  Fischer, Asja and
                  Bengio, Yoshua},
  title        = {Training opposing directed models using geometric mean matching},
  journal      = {CoRR},
  volume       = {abs/1506.03877},
  year         = {2015},
  url          = {http://arxiv.org/abs/1506.03877},
  eprinttype   = {arXiv},
  eprint       = {1506.03877},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BornscheinSFB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChorowskiBSCB15,
  author       = {Chorowski, Jan and
                  Bahdanau, Dzmitry and
                  Serdyuk, Dmitriy and
                  Cho, Kyunghyun and
                  Bengio, Yoshua},
  title        = {Attention-Based Models for Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1506.07503},
  year         = {2015},
  url          = {http://arxiv.org/abs/1506.07503},
  eprinttype   = {arXiv},
  eprint       = {1506.07503},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChorowskiBSCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ChoCB15,
  author       = {Cho, Kyunghyun and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {Describing Multimedia Content using Attention-based Encoder-Decoder
                  Networks},
  journal      = {CoRR},
  volume       = {abs/1507.01053},
  year         = {2015},
  url          = {http://arxiv.org/abs/1507.01053},
  eprinttype   = {arXiv},
  eprint       = {1507.01053},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ChoCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SordoniBVLSN15,
  author       = {Sordoni, Alessandro and
                  Bengio, Yoshua and
                  Vahabi, Hossein and
                  Lioma, Christina and
                  Simonsen, Jakob Grue and
                  Nie, Jian{-}Yun},
  title        = {A Hierarchical Recurrent Encoder-Decoder For Generative Context-Aware
                  Query Suggestion},
  journal      = {CoRR},
  volume       = {abs/1507.02221},
  year         = {2015},
  url          = {http://arxiv.org/abs/1507.02221},
  eprinttype   = {arXiv},
  eprint       = {1507.02221},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SordoniBVLSN15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/SerbanSBCP15,
  author       = {Serban, Iulian Vlad and
                  Sordoni, Alessandro and
                  Bengio, Yoshua and
                  Courville, Aaron C. and
                  Pineau, Joelle},
  title        = {Hierarchical Neural Network Generative Models for Movie Dialogues},
  journal      = {CoRR},
  volume       = {abs/1507.04808},
  year         = {2015},
  url          = {http://arxiv.org/abs/1507.04808},
  eprinttype   = {arXiv},
  eprint       = {1507.04808},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SerbanSBCP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BrebissonSAVB15,
  author       = {de Br{\'{e}}bisson, Alexandre and
                  Simon, {\'{E}}tienne and
                  Auvolat, Alex and
                  Vincent, Pascal and
                  Bengio, Yoshua},
  title        = {Artificial Neural Networks Applied to Taxi Destination Prediction},
  journal      = {CoRR},
  volume       = {abs/1508.00021},
  year         = {2015},
  url          = {http://arxiv.org/abs/1508.00021},
  eprinttype   = {arXiv},
  eprint       = {1508.00021},
  timestamp    = {Fri, 27 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/BrebissonSAVB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BahdanauCSBB15,
  author       = {Bahdanau, Dzmitry and
                  Chorowski, Jan and
                  Serdyuk, Dmitriy and
                  Brakel, Philemon and
                  Bengio, Yoshua},
  title        = {End-to-End Attention-based Large Vocabulary Speech Recognition},
  journal      = {CoRR},
  volume       = {abs/1508.04395},
  year         = {2015},
  url          = {http://arxiv.org/abs/1508.04395},
  eprinttype   = {arXiv},
  eprint       = {1508.04395},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauCSBB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BengioMFZW15,
  author       = {Bengio, Yoshua and
                  Mesnard, Thomas and
                  Fischer, Asja and
                  Zhang, Saizheng and
                  Wu, Yuhai},
  title        = {An objective function for {STDP}},
  journal      = {CoRR},
  volume       = {abs/1509.05936},
  year         = {2015},
  url          = {http://arxiv.org/abs/1509.05936},
  eprinttype   = {arXiv},
  eprint       = {1509.05936},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioMFZW15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/LaurentPBZB15,
  author       = {Laurent, C{\'{e}}sar and
                  Pereyra, Gabriel and
                  Brakel, Philemon and
                  Zhang, Ying and
                  Bengio, Yoshua},
  title        = {Batch Normalized Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1510.01378},
  year         = {2015},
  url          = {http://arxiv.org/abs/1510.01378},
  eprinttype   = {arXiv},
  eprint       = {1510.01378},
  timestamp    = {Fri, 03 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LaurentPBZB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/Bengio15,
  author       = {Bengio, Yoshua},
  title        = {Early Inference in Energy-Based Models Approximates Back-Propagation},
  journal      = {CoRR},
  volume       = {abs/1510.02777},
  year         = {2015},
  url          = {http://arxiv.org/abs/1510.02777},
  eprinttype   = {arXiv},
  eprint       = {1510.02777},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/Bengio15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/CourbariauxBD15,
  author       = {Courbariaux, Matthieu and
                  Bengio, Yoshua and
                  David, Jean{-}Pierre},
  title        = {{BinaryConnect}: Training Deep Neural Networks with binary weights during
                  propagations},
  journal      = {CoRR},
  volume       = {abs/1511.00363},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.00363},
  eprinttype   = {arXiv},
  eprint       = {1511.00363},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/CourbariauxBD15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/YaoBCSB15,
  author       = {Yao, Li and
                  Ballas, Nicolas and
                  Cho, Kyunghyun and
                  Smith, John R. and
                  Bengio, Yoshua},
  title        = {Trainable performance upper bounds for image and video captioning},
  journal      = {CoRR},
  volume       = {abs/1511.04590},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.04590},
  eprinttype   = {arXiv},
  eprint       = {1511.04590},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/YaoBCSB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/ImAMB15,
  author       = {Im, Daniel Jiwoong and
                  Ahn, Sungjin and
                  Memisevic, Roland and
                  Bengio, Yoshua},
  title        = {Denoising Criterion for Variational Auto-Encoding Framework},
  journal      = {CoRR},
  volume       = {abs/1511.06406},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.06406},
  eprinttype   = {arXiv},
  eprint       = {1511.06406},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ImAMB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1511.06430 (CoRR, 2015); this record carries no journal or
% conference venue other than CoRR.
@article{DBLP:journals/corr/PezeshkiFBCB15,
  author       = {Mohammad Pezeshki and
                  Linxi Fan and
                  Philemon Brakel and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Deconstructing the Ladder Network Architecture},
  journal      = {CoRR},
  volume       = {abs/1511.06430},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.06430},
  eprinttype    = {arXiv},
  eprint       = {1511.06430},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/PezeshkiFBCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1511.06456 (CoRR, 2015); this record carries no journal or
% conference venue other than CoRR.
@article{DBLP:journals/corr/BahdanauSBKCCB15,
  author       = {Dzmitry Bahdanau and
                  Dmitriy Serdyuk and
                  Philemon Brakel and
                  Nan Rosemary Ke and
                  Jan Chorowski and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Task Loss Estimation for Sequence Prediction},
  journal      = {CoRR},
  volume       = {abs/1511.06456},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.06456},
  eprinttype    = {arXiv},
  eprint       = {1511.06456},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BahdanauSBKCCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1511.06464 (CoRR, 2015). The first author's given name uses
% a LaTeX-escaped accented dotless i, so the file stays 7-bit clean.
@article{DBLP:journals/corr/ArjovskySB15,
  author       = {Mart{\'{\i}}n Arjovsky and
                  Amar Shah and
                  Yoshua Bengio},
  title        = {Unitary Evolution Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1511.06464},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.06464},
  eprinttype    = {arXiv},
  eprint       = {1511.06464},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ArjovskySB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1511.06481 (CoRR, 2015). The acronym SGD in the title is
% brace-protected against style-driven lowercasing.
@article{DBLP:journals/corr/AlainLSCB15,
  author       = {Guillaume Alain and
                  Alex Lamb and
                  Chinnadhurai Sankar and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Variance Reduction in {SGD} by Distributed Importance Sampling},
  journal      = {CoRR},
  volume       = {abs/1511.06481},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.06481},
  eprinttype    = {arXiv},
  eprint       = {1511.06481},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/AlainLSCB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1511.07053 (CoRR, 2015).
% The model name ReSeg is wrapped in braces so that sentence-casing
% bibliography styles do not flatten its internal capital.
@article{DBLP:journals/corr/VisinKCBMC15,
  author       = {Francesco Visin and
                  Kyle Kastner and
                  Aaron C. Courville and
                  Yoshua Bengio and
                  Matteo Matteucci and
                  KyungHyun Cho},
  title        = {{ReSeg}: {A} Recurrent Neural Network for Object Segmentation},
  journal      = {CoRR},
  volume       = {abs/1511.07053},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.07053},
  eprinttype    = {arXiv},
  eprint       = {1511.07053},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/VisinKCBMC15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Biol. Cybern. 108(1), 2014. The doi field holds the
% upper-cased form of the DOI that appears in lower case inside url.
@article{DBLP:journals/bc/RivestKB14,
  author       = {Fran{\c{c}}ois Rivest and
                  John Kalaska and
                  Yoshua Bengio},
  title        = {Conditioning and time representation in long short-term memory networks},
  journal      = {Biol. Cybern.},
  volume       = {108},
  number       = {1},
  pages        = {23--48},
  year         = {2014},
  url          = {https://doi.org/10.1007/s00422-013-0575-1},
  doi          = {10.1007/S00422-013-0575-1},
  timestamp    = {Thu, 17 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/bc/RivestKB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. Mach. Learn. Res. 15(1), 2014. Unlike most records here,
% url points at the ACM Digital Library page for the 10.5555 identifier
% rather than at a doi.org resolver link.
@article{DBLP:journals/jmlr/AlainB14,
  author       = {Guillaume Alain and
                  Yoshua Bengio},
  title        = {What regularized auto-encoders learn from the data-generating distribution},
  journal      = {J. Mach. Learn. Res.},
  volume       = {15},
  number       = {1},
  pages        = {3563--3593},
  year         = {2014},
  url          = {https://dl.acm.org/doi/10.5555/2627435.2750359},
  doi          = {10.5555/2627435.2750359},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/AlainB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Mach. Learn. 94(2), 2014. It appears in the same volume
% and issue as DBLP:journals/ml/MesnilBWCB14.
@article{DBLP:journals/ml/BordesGWB14,
  author       = {Antoine Bordes and
                  Xavier Glorot and
                  Jason Weston and
                  Yoshua Bengio},
  title        = {A semantic matching energy function for learning with multi-relational
                  data - Application to word-sense disambiguation},
  journal      = {Mach. Learn.},
  volume       = {94},
  number       = {2},
  pages        = {233--259},
  year         = {2014},
  url          = {https://doi.org/10.1007/s10994-013-5363-6},
  doi          = {10.1007/S10994-013-5363-6},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ml/BordesGWB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, Mach. Learn. 94(2), 2014. It appears in the same volume
% and issue as DBLP:journals/ml/BordesGWB14.
@article{DBLP:journals/ml/MesnilBWCB14,
  author       = {Gr{\'{e}}goire Mesnil and
                  Antoine Bordes and
                  Jason Weston and
                  Gal Chechik and
                  Yoshua Bengio},
  title        = {Learning semantic representations of objects and their parts},
  journal      = {Mach. Learn.},
  volume       = {94},
  number       = {2},
  pages        = {281--301},
  year         = {2014},
  url          = {https://doi.org/10.1007/s10994-013-5336-9},
  doi          = {10.1007/S10994-013-5336-9},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ml/MesnilBWCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, IEEE Trans. Pattern Anal. Mach. Intell. 36(9), 2014.
% The acronyms RBM (title) and IEEE (journal) are brace-protected.
@article{DBLP:journals/pami/CourvilleDBB14,
  author       = {Aaron C. Courville and
                  Guillaume Desjardins and
                  James Bergstra and
                  Yoshua Bengio},
  title        = {The Spike-and-Slab {RBM} and Extensions to Discrete and Sparse Data
                  Distributions},
  journal      = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume       = {36},
  number       = {9},
  pages        = {1874--1887},
  year         = {2014},
  url          = {https://doi.org/10.1109/TPAMI.2013.238},
  doi          = {10.1109/TPAMI.2013.238},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/pami/CourvilleDBB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2014 conference paper.
% The acronym RBMs is brace-protected so sentence-casing styles keep its
% capitals; the conference date range is written without a stray space.
@inproceedings{DBLP:conf/aaai/DumoulinGCB14,
  author       = {Vincent Dumoulin and
                  Ian J. Goodfellow and
                  Aaron C. Courville and
                  Yoshua Bengio},
  editor       = {Carla E. Brodley and
                  Peter Stone},
  title        = {On the Challenges of Physical Implementations of {RBMs}},
  booktitle    = {Proceedings of the Twenty-Eighth {AAAI} Conference on Artificial Intelligence,
                  July 27-31, 2014, Qu{\'{e}}bec City, Qu{\'{e}}bec, Canada},
  pages        = {1199--1205},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {https://doi.org/10.1609/aaai.v28i1.8924},
  doi          = {10.1609/AAAI.V28I1.8924},
  timestamp    = {Mon, 04 Sep 2023 15:06:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DumoulinGCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2014 conference paper.
% The conference date range in booktitle is written without a stray space.
@inproceedings{DBLP:conf/aaai/SordoniBN14,
  author       = {Alessandro Sordoni and
                  Yoshua Bengio and
                  Jian{-}Yun Nie},
  editor       = {Carla E. Brodley and
                  Peter Stone},
  title        = {Learning Concept Embeddings for Query Expansion by Quantum Entropy
                  Minimization},
  booktitle    = {Proceedings of the Twenty-Eighth {AAAI} Conference on Artificial Intelligence,
                  July 27-31, 2014, Qu{\'{e}}bec City, Qu{\'{e}}bec, Canada},
  pages        = {1586--1592},
  publisher    = {{AAAI} Press},
  year         = {2014},
  url          = {https://doi.org/10.1609/aaai.v28i1.8933},
  doi          = {10.1609/AAAI.V28I1.8933},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/SordoniBN14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2014 conference version. A preprint record with the same title exists
% as DBLP:journals/corr/ChoMGBSB14; that record lists six authors (without
% Dzmitry Bahdanau). Cite only one of the two per bibliography.
@inproceedings{DBLP:conf/emnlp/ChoMGBBSB14,
  author       = {Kyunghyun Cho and
                  Bart van Merrienboer and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Dzmitry Bahdanau and
                  Fethi Bougares and
                  Holger Schwenk and
                  Yoshua Bengio},
  editor       = {Alessandro Moschitti and
                  Bo Pang and
                  Walter Daelemans},
  title        = {Learning Phrase Representations using {RNN} Encoder-Decoder for Statistical
                  Machine Translation},
  booktitle    = {Proceedings of the 2014 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2014, October 25-29, 2014, Doha, Qatar,
                  {A} meeting of SIGDAT, a Special Interest Group of the {ACL}},
  pages        = {1724--1734},
  publisher    = {{ACL}},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/d14-1179},
  doi          = {10.3115/V1/D14-1179},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/ChoMGBBSB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Two-page single-author contribution in the GECCO 2014 companion proceedings.
@inproceedings{DBLP:conf/gecco/Bengio14,
  author       = {Yoshua Bengio},
  editor       = {Dirk V. Arnold and
                  Enrique Alba},
  title        = {Deep learning and cultural evolution},
  booktitle    = {Genetic and Evolutionary Computation Conference, {GECCO} '14, Vancouver,
                  BC, Canada, July 12-16, 2014, Companion Material Proceedings},
  pages        = {1--2},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2598394.2598395},
  doi          = {10.1145/2598394.2598395},
  timestamp    = {Wed, 13 Jul 2022 16:15:15 +0200},
  biburl       = {https://dblp.org/rec/conf/gecco/Bengio14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2014 conference paper (JMLR Workshop and Conference Proceedings 32).
% No editor or doi field is recorded; the proceedings URL is the only locator.
@inproceedings{DBLP:conf/icml/BengioLAY14,
  author       = {Yoshua Bengio and
                  Eric Laufer and
                  Guillaume Alain and
                  Jason Yosinski},
  title        = {Deep Generative Stochastic Networks Trainable by Backprop},
  booktitle    = {Proceedings of the 31st International Conference on Machine Learning,
                  {ICML} 2014, Beijing, China, 21-26 June 2014},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {32},
  pages        = {226--234},
  publisher    = {JMLR.org},
  year         = {2014},
  url          = {http://proceedings.mlr.press/v32/bengio14.html},
  timestamp    = {Wed, 29 May 2019 08:41:45 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/BengioLAY14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2014 conference paper (JMLR Workshop and Conference Proceedings 32).
% No editor or doi field is recorded; the proceedings URL is the only locator.
@inproceedings{DBLP:conf/icml/ChenWSB14,
  author       = {Minmin Chen and
                  Kilian Q. Weinberger and
                  Fei Sha and
                  Yoshua Bengio},
  title        = {Marginalized Denoising Auto-encoders for Nonlinear Representations},
  booktitle    = {Proceedings of the 31st International Conference on Machine Learning,
                  {ICML} 2014, Beijing, China, 21-26 June 2014},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {32},
  pages        = {1476--1484},
  publisher    = {JMLR.org},
  year         = {2014},
  url          = {http://proceedings.mlr.press/v32/cheng14.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/ChenWSB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Single-author, single-page item in the KDD 2014 proceedings; pages holds one
% page number rather than a range.
@inproceedings{DBLP:conf/kdd/Bengio14,
  author       = {Yoshua Bengio},
  editor       = {Sofus A. Macskassy and
                  Claudia Perlich and
                  Jure Leskovec and
                  Wei Wang and
                  Rayid Ghani},
  title        = {Scaling up deep learning},
  booktitle    = {The 20th {ACM} {SIGKDD} International Conference on Knowledge Discovery
                  and Data Mining, {KDD} '14, New York, NY, {USA} - August 24 - 27,
                  2014},
  pages        = {1966},
  publisher    = {{ACM}},
  year         = {2014},
  url          = {https://doi.org/10.1145/2623330.2630802},
  doi          = {10.1145/2623330.2630802},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/kdd/Bengio14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2014 (Advances in Neural Information Processing Systems 27) version.
% The model name NADE-k is brace-protected so sentence-casing styles keep the
% acronym in capitals. A preprint record for the same work exists as
% DBLP:journals/corr/RaikoYCB14; cite only one of the two per bibliography.
@inproceedings{DBLP:conf/nips/RaikoLCB14,
  author       = {Tapani Raiko and
                  Li Yao and
                  KyungHyun Cho and
                  Yoshua Bengio},
  editor       = {Zoubin Ghahramani and
                  Max Welling and
                  Corinna Cortes and
                  Neil D. Lawrence and
                  Kilian Q. Weinberger},
  title        = {Iterative Neural Autoregressive Distribution Estimator {NADE-k}},
  booktitle    = {Advances in Neural Information Processing Systems 27: Annual Conference
                  on Neural Information Processing Systems 2014, December 8-13 2014,
                  Montreal, Quebec, Canada},
  pages        = {325--333},
  year         = {2014},
  url          = {https://proceedings.neurips.cc/paper/2014/hash/555d6702c950ecb729a966504af0a635-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/RaikoLCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2014 (Advances in Neural Information Processing Systems 27) paper.
% No publisher or doi field is recorded; the proceedings URL is the only locator.
@inproceedings{DBLP:conf/nips/GoodfellowPMXWOCB14,
  author       = {Ian J. Goodfellow and
                  Jean Pouget{-}Abadie and
                  Mehdi Mirza and
                  Bing Xu and
                  David Warde{-}Farley and
                  Sherjil Ozair and
                  Aaron C. Courville and
                  Yoshua Bengio},
  editor       = {Zoubin Ghahramani and
                  Max Welling and
                  Corinna Cortes and
                  Neil D. Lawrence and
                  Kilian Q. Weinberger},
  title        = {Generative Adversarial Nets},
  booktitle    = {Advances in Neural Information Processing Systems 27: Annual Conference
                  on Neural Information Processing Systems 2014, December 8-13 2014,
                  Montreal, Quebec, Canada},
  pages        = {2672--2680},
  year         = {2014},
  url          = {https://proceedings.neurips.cc/paper/2014/hash/5ca3e9b122f61f8f06494c97b1afccf3-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/GoodfellowPMXWOCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2014 (Advances in Neural Information Processing Systems 27) version.
% A preprint record with the same title and authors exists as
% DBLP:journals/corr/MontufarPCB14; cite only one of the two per bibliography.
@inproceedings{DBLP:conf/nips/MontufarPCB14,
  author       = {Guido Mont{\'{u}}far and
                  Razvan Pascanu and
                  KyungHyun Cho and
                  Yoshua Bengio},
  editor       = {Zoubin Ghahramani and
                  Max Welling and
                  Corinna Cortes and
                  Neil D. Lawrence and
                  Kilian Q. Weinberger},
  title        = {On the Number of Linear Regions of Deep Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 27: Annual Conference
                  on Neural Information Processing Systems 2014, December 8-13 2014,
                  Montreal, Quebec, Canada},
  pages        = {2924--2932},
  year         = {2014},
  url          = {https://proceedings.neurips.cc/paper/2014/hash/109d2dd3608f669ca17920c511c2a41e-Abstract.html},
  timestamp    = {Mon, 02 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/MontufarPCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2014 (Advances in Neural Information Processing Systems 27) version.
% A preprint record with the same title exists as
% DBLP:journals/corr/DauphinPGCGB14; cite only one of the two per bibliography.
@inproceedings{DBLP:conf/nips/DauphinPGCGB14,
  author       = {Yann N. Dauphin and
                  Razvan Pascanu and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  KyungHyun Cho and
                  Surya Ganguli and
                  Yoshua Bengio},
  editor       = {Zoubin Ghahramani and
                  Max Welling and
                  Corinna Cortes and
                  Neil D. Lawrence and
                  Kilian Q. Weinberger},
  title        = {Identifying and attacking the saddle point problem in high-dimensional
                  non-convex optimization},
  booktitle    = {Advances in Neural Information Processing Systems 27: Annual Conference
                  on Neural Information Processing Systems 2014, December 8-13 2014,
                  Montreal, Quebec, Canada},
  pages        = {2933--2941},
  year         = {2014},
  url          = {https://proceedings.neurips.cc/paper/2014/hash/17e23e50bedc63b4095e3d8204ce063b-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DauphinPGCGB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2014 (Advances in Neural Information Processing Systems 27) paper.
% No publisher or doi field is recorded; the proceedings URL is the only locator.
@inproceedings{DBLP:conf/nips/YosinskiCBL14,
  author       = {Jason Yosinski and
                  Jeff Clune and
                  Yoshua Bengio and
                  Hod Lipson},
  editor       = {Zoubin Ghahramani and
                  Max Welling and
                  Corinna Cortes and
                  Neil D. Lawrence and
                  Kilian Q. Weinberger},
  title        = {How transferable are features in deep neural networks?},
  booktitle    = {Advances in Neural Information Processing Systems 27: Annual Conference
                  on Neural Information Processing Systems 2014, December 8-13 2014,
                  Montreal, Quebec, Canada},
  pages        = {3320--3328},
  year         = {2014},
  url          = {https://proceedings.neurips.cc/paper/2014/hash/375c71349b295fbe2dcdca9206f20a06-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YosinskiCBL14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECML PKDD 2014, Part III (Lecture Notes in Computer Science 8726).
% The underscore in url and doi is stored as backslash-underscore.
% NOTE(review): url-aware styles may print that backslash literally; confirm
% against the bibliography style in use.
@inproceedings{DBLP:conf/pkdd/YaoOCB14,
  author       = {Li Yao and
                  Sherjil Ozair and
                  KyungHyun Cho and
                  Yoshua Bengio},
  editor       = {Toon Calders and
                  Floriana Esposito and
                  Eyke H{\"{u}}llermeier and
                  Rosa Meo},
  title        = {On the Equivalence between Deep {NADE} and Generative Stochastic Networks},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases - European Conference,
                  {ECML} {PKDD} 2014, Nancy, France, September 15-19, 2014. Proceedings,
                  Part {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {8726},
  pages        = {322--336},
  publisher    = {Springer},
  year         = {2014},
  url          = {https://doi.org/10.1007/978-3-662-44845-8\_21},
  doi          = {10.1007/978-3-662-44845-8\_21},
  timestamp    = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pkdd/YaoOCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ECML PKDD 2014, Part I (Lecture Notes in Computer Science 8724).
% The underscore in url and doi is stored as backslash-underscore.
% NOTE(review): url-aware styles may print that backslash literally; confirm
% against the bibliography style in use.
@inproceedings{DBLP:conf/pkdd/GulcehreCPB14,
  author       = {{\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  KyungHyun Cho and
                  Razvan Pascanu and
                  Yoshua Bengio},
  editor       = {Toon Calders and
                  Floriana Esposito and
                  Eyke H{\"{u}}llermeier and
                  Rosa Meo},
  title        = {Learned-Norm Pooling for Deep Feedforward and Recurrent Neural Networks},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases - European Conference,
                  {ECML} {PKDD} 2014, Nancy, France, September 15-19, 2014. Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {8724},
  pages        = {530--546},
  publisher    = {Springer},
  year         = {2014},
  url          = {https://doi.org/10.1007/978-3-662-44848-9\_34},
  doi          = {10.1007/978-3-662-44848-9\_34},
  timestamp    = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/pkdd/GulcehreCPB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper from SSST 2014 (held with EMNLP 2014 in Doha).
% url points at the ACL Anthology page, while doi carries the 10.3115 identifier.
@inproceedings{DBLP:conf/ssst/Pouget-AbadieBM14,
  author       = {Jean Pouget{-}Abadie and
                  Dzmitry Bahdanau and
                  Bart van Merrienboer and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  editor       = {Dekai Wu and
                  Marine Carpuat and
                  Xavier Carreras and
                  Eva Maria Vecchi},
  title        = {Overcoming the Curse of Sentence Length for Neural Machine Translation
                  using Automatic Segmentation},
  booktitle    = {Proceedings of SSST@EMNLP 2014, Eighth Workshop on Syntax, Semantics
                  and Structure in Statistical Translation, Doha, Qatar, 25 October
                  2014},
  pages        = {78--85},
  publisher    = {Association for Computational Linguistics},
  year         = {2014},
  url          = {https://aclanthology.org/W14-4009/},
  doi          = {10.3115/V1/W14-4009},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssst/Pouget-AbadieBM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper from SSST 2014 (held with EMNLP 2014 in Doha).
% url points at the ACL Anthology page, while doi carries the 10.3115 identifier.
@inproceedings{DBLP:conf/ssst/ChoMBB14,
  author       = {Kyunghyun Cho and
                  Bart van Merrienboer and
                  Dzmitry Bahdanau and
                  Yoshua Bengio},
  editor       = {Dekai Wu and
                  Marine Carpuat and
                  Xavier Carreras and
                  Eva Maria Vecchi},
  title        = {On the Properties of Neural Machine Translation: Encoder-Decoder Approaches},
  booktitle    = {Proceedings of SSST@EMNLP 2014, Eighth Workshop on Syntax, Semantics
                  and Structure in Statistical Translation, Doha, Qatar, 25 October
                  2014},
  pages        = {103--111},
  publisher    = {Association for Computational Linguistics},
  year         = {2014},
  url          = {https://aclanthology.org/W14-4012/},
  doi          = {10.3115/V1/W14-4012},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ssst/ChoMBB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2014 conference-track paper. The cite key sits in the journals/corr
% namespace although the record type is inproceedings; the arXiv URL is the
% only locator (no pages, doi or eprint fields).
@inproceedings{DBLP:journals/corr/BengioY13,
  author       = {Yoshua Bengio and
                  Li Yao},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {Bounding the Test Log-Likelihood of Generative Models},
  booktitle    = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Conference Track Proceedings},
  year         = {2014},
  url          = {http://arxiv.org/abs/1311.6184},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioY13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2014 conference-track paper. The cite key sits in the journals/corr
% namespace although the record type is inproceedings; the arXiv URL is the
% only locator (no pages, doi or eprint fields).
@inproceedings{DBLP:journals/corr/GoodfellowMDCB13,
  author       = {Ian J. Goodfellow and
                  Mehdi Mirza and
                  Xia Da and
                  Aaron C. Courville and
                  Yoshua Bengio},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {An Empirical Investigation of Catastrophic Forgetting in Gradient-Based
                  Neural Networks},
  booktitle    = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Conference Track Proceedings},
  year         = {2014},
  url          = {http://arxiv.org/abs/1312.6211},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GoodfellowMDCB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2014 workshop-track paper (booktitle names the Workshop Track
% Proceedings). The cite key sits in the journals/corr namespace although the
% record type is inproceedings; the arXiv URL is the only locator.
@inproceedings{DBLP:journals/corr/OzairYB13,
  author       = {Sherjil Ozair and
                  Li Yao and
                  Yoshua Bengio},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {Multimodal Transitions for Generative Stochastic Networks},
  booktitle    = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Workshop Track Proceedings},
  year         = {2014},
  url          = {http://arxiv.org/abs/1312.5578},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/OzairYB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2014 conference-track paper. The cite key sits in the journals/corr
% namespace although the record type is inproceedings; the arXiv URL is the
% only locator (no pages, doi or eprint fields).
@inproceedings{DBLP:journals/corr/PascanuGCB13,
  author       = {Razvan Pascanu and
                  {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {How to Construct Deep Recurrent Neural Networks},
  booktitle    = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Conference Track Proceedings},
  year         = {2014},
  url          = {http://arxiv.org/abs/1312.6026},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/PascanuGCB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2014 conference-track paper. The cite key sits in the journals/corr
% namespace although the record type is inproceedings; the arXiv URL is the
% only locator (no pages, doi or eprint fields).
@inproceedings{DBLP:journals/corr/PascanuMB13,
  author       = {Razvan Pascanu and
                  Guido Mont{\'{u}}far and
                  Yoshua Bengio},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {On the number of inference regions of deep feed forward networks with
                  piece-wise linear activations},
  booktitle    = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Conference Track Proceedings},
  year         = {2014},
  url          = {http://arxiv.org/abs/1312.6098},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/PascanuMB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2014 conference-track paper. The cite key sits in the journals/corr
% namespace although the record type is inproceedings; the arXiv URL is the
% only locator (no pages, doi or eprint fields).
@inproceedings{DBLP:journals/corr/Warde-FarleyGCB13,
  author       = {David Warde{-}Farley and
                  Ian J. Goodfellow and
                  Aaron C. Courville and
                  Yoshua Bengio},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {An empirical analysis of dropout in piecewise linear networks},
  booktitle    = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Conference Track Proceedings},
  year         = {2014},
  url          = {http://arxiv.org/abs/1312.6197},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/Warde-FarleyGCB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2014 conference-track paper. The cite key is built from the arXiv
% identifier 1301.3584 in the journals/corr namespace although the record
% type is inproceedings; the arXiv URL is the only locator.
@inproceedings{DBLP:journals/corr/abs-1301-3584,
  author       = {Razvan Pascanu and
                  Yoshua Bengio},
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {Revisiting Natural Gradient for Deep Networks},
  booktitle    = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Conference Track Proceedings},
  year         = {2014},
  url          = {http://arxiv.org/abs/1301.3584},
  timestamp    = {Fri, 29 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-3584.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Book chapter in an edited Springer volume (Studies in Computational
% Intelligence 557). The underscore in url and doi is stored as
% backslash-underscore.
@incollection{DBLP:series/sci/Bengio14,
  author       = {Yoshua Bengio},
  editor       = {Taras Kowaliw and
                  Nicolas Bred{\`{e}}che and
                  Ren{\'{e}} Doursat},
  title        = {Evolving Culture Versus Local Minima},
  booktitle    = {Growing Adaptive Machines - Combining Development and Learning in
                  Artificial Neural Networks},
  series       = {Studies in Computational Intelligence},
  volume       = {557},
  pages        = {109--138},
  publisher    = {Springer},
  year         = {2014},
  url          = {https://doi.org/10.1007/978-3-642-55337-0\_3},
  doi          = {10.1007/978-3-642-55337-0\_3},
  timestamp    = {Tue, 24 Oct 2017 16:58:47 +0200},
  biburl       = {https://dblp.org/rec/series/sci/Bengio14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume for the ICLR 2014 conference track. Its title matches the
% booktitle of the conference-track paper records, and it shares its url with
% the workshop-track volume DBLP:conf/iclr/2014w.
@proceedings{DBLP:conf/iclr/2014,
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Conference Track Proceedings},
  year         = {2014},
  url          = {https://openreview.net/group?id=ICLR.cc/2014},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/2014.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume for the ICLR 2014 workshop track. It differs from
% DBLP:conf/iclr/2014 only in key, track name and biburl; both share one url.
@proceedings{DBLP:conf/iclr/2014w,
  editor       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {2nd International Conference on Learning Representations, {ICLR} 2014,
                  Banff, AB, Canada, April 14-16, 2014, Workshop Track Proceedings},
  year         = {2014},
  url          = {https://openreview.net/group?id=ICLR.cc/2014},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/2014w.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1402.1869 (CoRR, 2014). A conference record with the same
% title and authors exists as DBLP:conf/nips/MontufarPCB14; cite only one of
% the two per bibliography.
@article{DBLP:journals/corr/MontufarPCB14,
  author       = {Guido Mont{\'{u}}far and
                  Razvan Pascanu and
                  Kyunghyun Cho and
                  Yoshua Bengio},
  title        = {On the Number of Linear Regions of Deep Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1402.1869},
  year         = {2014},
  url          = {http://arxiv.org/abs/1402.1869},
  eprinttype    = {arXiv},
  eprint       = {1402.1869},
  timestamp    = {Mon, 02 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/MontufarPCB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1405.4604 (CoRR, 2014).
% NOTE(review): overlapping authors and topic suggest this may be an earlier
% version of DBLP:conf/nips/DauphinPGCGB14 -- confirm before treating the two
% as the same work.
@article{DBLP:journals/corr/PascanuDGB14,
  author       = {Razvan Pascanu and
                  Yann N. Dauphin and
                  Surya Ganguli and
                  Yoshua Bengio},
  title        = {On the saddle point problem for non-convex optimization},
  journal      = {CoRR},
  volume       = {abs/1405.4604},
  year         = {2014},
  url          = {http://arxiv.org/abs/1405.4604},
  eprinttype    = {arXiv},
  eprint       = {1405.4604},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/PascanuDGB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR record for arXiv eprint 1406.1078.
@article{DBLP:journals/corr/ChoMGBSB14,
  author     = {Kyunghyun Cho and Bart van Merrienboer and {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and Fethi Bougares and Holger Schwenk and Yoshua Bengio},
  title      = {Learning Phrase Representations using {RNN} Encoder-Decoder for Statistical Machine Translation},
  journal    = {CoRR},
  volume     = {abs/1406.1078},
  year       = {2014},
  url        = {http://arxiv.org/abs/1406.1078},
  eprinttype = {arXiv},
  eprint     = {1406.1078},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ChoMGBSB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1406.1485.
% The acronym NADE is brace-protected in the title so that styles applying
% sentence casing do not lower-case it.
@article{DBLP:journals/corr/RaikoYCB14,
  author     = {Tapani Raiko and Li Yao and Kyunghyun Cho and Yoshua Bengio},
  title      = {Iterative Neural Autoregressive Distribution Estimator ({NADE}-k)},
  journal    = {CoRR},
  volume     = {abs/1406.1485},
  year       = {2014},
  url        = {http://arxiv.org/abs/1406.1485},
  eprinttype = {arXiv},
  eprint     = {1406.1485},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/RaikoYCB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1406.2572.
@article{DBLP:journals/corr/DauphinPGCGB14,
  author     = {Yann N. Dauphin and Razvan Pascanu and {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and Kyunghyun Cho and Surya Ganguli and Yoshua Bengio},
  title      = {Identifying and attacking the saddle point problem in high-dimensional non-convex optimization},
  journal    = {CoRR},
  volume     = {abs/1406.2572},
  year       = {2014},
  url        = {http://arxiv.org/abs/1406.2572},
  eprinttype = {arXiv},
  eprint     = {1406.2572},
  timestamp  = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/DauphinPGCGB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1406.2661.
@article{DBLP:journals/corr/GoodfellowPMXWOCB14,
  author     = {Ian J. Goodfellow and Jean Pouget{-}Abadie and Mehdi Mirza and Bing Xu and David Warde{-}Farley and Sherjil Ozair and Aaron C. Courville and Yoshua Bengio},
  title      = {Generative Adversarial Networks},
  journal    = {CoRR},
  volume     = {abs/1406.2661},
  year       = {2014},
  url        = {http://arxiv.org/abs/1406.2661},
  eprinttype = {arXiv},
  eprint     = {1406.2661},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/GoodfellowPMXWOCB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1406.7362.
@article{DBLP:journals/corr/ChoB14,
  author     = {Kyunghyun Cho and Yoshua Bengio},
  title      = {Exponentially Increasing the Capacity-to-Computation Ratio for Conditional Computation in Deep Learning},
  journal    = {CoRR},
  volume     = {abs/1406.7362},
  year       = {2014},
  url        = {http://arxiv.org/abs/1406.7362},
  eprinttype = {arXiv},
  eprint     = {1406.7362},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ChoB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1407.7906 (single-author).
@article{DBLP:journals/corr/Bengio14,
  author     = {Yoshua Bengio},
  title      = {How Auto-Encoders Could Provide Credit Assignment in Deep Networks via Target Propagation},
  journal    = {CoRR},
  volume     = {abs/1407.7906},
  year       = {2014},
  url        = {http://arxiv.org/abs/1407.7906},
  eprinttype = {arXiv},
  eprint     = {1407.7906},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/Bengio14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1409.0585.
@article{DBLP:journals/corr/YaoOCB14,
  author     = {Li Yao and Sherjil Ozair and Kyunghyun Cho and Yoshua Bengio},
  title      = {On the Equivalence Between Deep {NADE} and Generative Stochastic Networks},
  journal    = {CoRR},
  volume     = {abs/1409.0585},
  year       = {2014},
  url        = {http://arxiv.org/abs/1409.0585},
  eprinttype = {arXiv},
  eprint     = {1409.0585},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/YaoOCB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1409.1257.
% The fourth author is written "Kyunghyun Cho", the spelling used for this
% person in most entries of this bibliography, so that author indexes and
% sorting treat all of them as one name.
@article{DBLP:journals/corr/Pouget-AbadieBMCB14,
  author     = {Jean Pouget{-}Abadie and Dzmitry Bahdanau and Bart van Merrienboer and Kyunghyun Cho and Yoshua Bengio},
  title      = {Overcoming the Curse of Sentence Length for Neural Machine Translation using Automatic Segmentation},
  journal    = {CoRR},
  volume     = {abs/1409.1257},
  year       = {2014},
  url        = {http://arxiv.org/abs/1409.1257},
  eprinttype = {arXiv},
  eprint     = {1409.1257},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/Pouget-AbadieBMCB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1409.1259.
% The first author is written "Kyunghyun Cho", the spelling used for this
% person in most entries of this bibliography, so that author indexes and
% sorting treat all of them as one name.
@article{DBLP:journals/corr/ChoMBB14,
  author     = {Kyunghyun Cho and Bart van Merrienboer and Dzmitry Bahdanau and Yoshua Bengio},
  title      = {On the Properties of Neural Machine Translation: Encoder-Decoder Approaches},
  journal    = {CoRR},
  volume     = {abs/1409.1259},
  year       = {2014},
  url        = {http://arxiv.org/abs/1409.1259},
  eprinttype = {arXiv},
  eprint     = {1409.1259},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ChoMBB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1410.0123.
@article{DBLP:journals/corr/DesjardinsLCB14,
  author     = {Guillaume Desjardins and Heng Luo and Aaron C. Courville and Yoshua Bengio},
  title      = {Deep Tempering},
  journal    = {CoRR},
  volume     = {abs/1410.0123},
  year       = {2014},
  url        = {http://arxiv.org/abs/1410.0123},
  eprinttype = {arXiv},
  eprint     = {1410.0123},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/DesjardinsLCB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1410.0630.
@article{DBLP:journals/corr/OzairB14,
  author     = {Sherjil Ozair and Yoshua Bengio},
  title      = {Deep Directed Generative Autoencoders},
  journal    = {CoRR},
  volume     = {abs/1410.0630},
  year       = {2014},
  url        = {http://arxiv.org/abs/1410.0630},
  eprinttype = {arXiv},
  eprint     = {1410.0630},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/OzairB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1410.0718.
% The second author is written "Kyunghyun Cho", the spelling used for this
% person in most entries of this bibliography, so that author indexes and
% sorting treat all of them as one name.
@article{DBLP:journals/corr/HillCJDB14,
  author     = {Felix Hill and Kyunghyun Cho and S{\'{e}}bastien Jean and Coline Devin and Yoshua Bengio},
  title      = {Not All Neural Embeddings are Born Equal},
  journal    = {CoRR},
  volume     = {abs/1410.0718},
  year       = {2014},
  url        = {http://arxiv.org/abs/1410.0718},
  eprinttype = {arXiv},
  eprint     = {1410.0718},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/HillCJDB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1410.2455.
% The mixed-case method name BilBOWA is brace-protected in the title so that
% styles applying sentence casing keep its capitalisation.
@article{DBLP:journals/corr/GouwsBC14,
  author     = {Stephan Gouws and Yoshua Bengio and Greg Corrado},
  title      = {{BilBOWA}: Fast Bilingual Distributed Representations without Word Alignments},
  journal    = {CoRR},
  volume     = {abs/1410.2455},
  year       = {2014},
  url        = {http://arxiv.org/abs/1410.2455},
  eprinttype = {arXiv},
  eprint     = {1410.2455},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/GouwsBC14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1411.1792.
@article{DBLP:journals/corr/YosinskiCBL14,
  author     = {Jason Yosinski and Jeff Clune and Yoshua Bengio and Hod Lipson},
  title      = {How transferable are features in deep neural networks?},
  journal    = {CoRR},
  volume     = {abs/1411.1792},
  year       = {2014},
  url        = {http://arxiv.org/abs/1411.1792},
  eprinttype = {arXiv},
  eprint     = {1411.1792},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/YosinskiCBL14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1412.1602.
@article{DBLP:journals/corr/ChorowskiBCB14,
  author     = {Jan Chorowski and Dzmitry Bahdanau and Kyunghyun Cho and Yoshua Bengio},
  title      = {End-to-end Continuous Speech Recognition using Attention-based Recurrent {NN:} First Results},
  journal    = {CoRR},
  volume     = {abs/1412.1602},
  year       = {2014},
  url        = {http://arxiv.org/abs/1412.1602},
  eprinttype = {arXiv},
  eprint     = {1412.1602},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ChorowskiBCB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1412.2007.
@article{DBLP:journals/corr/JeanCMB14,
  author     = {S{\'{e}}bastien Jean and Kyunghyun Cho and Roland Memisevic and Yoshua Bengio},
  title      = {On Using Very Large Target Vocabulary for Neural Machine Translation},
  journal    = {CoRR},
  volume     = {abs/1412.2007},
  year       = {2014},
  url        = {http://arxiv.org/abs/1412.2007},
  eprinttype = {arXiv},
  eprint     = {1412.2007},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/JeanCMB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1412.3555.
% The third author is written "Kyunghyun Cho", the spelling used for this
% person in most entries of this bibliography, so that author indexes and
% sorting treat all of them as one name.
@article{DBLP:journals/corr/ChungGCB14,
  author     = {Junyoung Chung and {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and Kyunghyun Cho and Yoshua Bengio},
  title      = {Empirical Evaluation of Gated Recurrent Neural Networks on Sequence Modeling},
  journal    = {CoRR},
  volume     = {abs/1412.3555},
  year       = {2014},
  url        = {http://arxiv.org/abs/1412.3555},
  eprinttype = {arXiv},
  eprint     = {1412.3555},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/ChungGCB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR record for arXiv eprint 1412.7419.
@article{DBLP:journals/corr/GulcehreB14,
  author     = {{\c{C}}aglar G{\"{u}}l{\c{c}}ehre and Yoshua Bengio},
  title      = {{ADASECANT:} Robust Adaptive Secant Method for Stochastic Gradient},
  journal    = {CoRR},
  volume     = {abs/1412.7419},
  year       = {2014},
  url        = {http://arxiv.org/abs/1412.7419},
  eprinttype = {arXiv},
  eprint     = {1412.7419},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/GulcehreB14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, IEEE Comput. Intell. Mag. 8(2), 2013.
@article{DBLP:journals/cim/MartinezBY13,
  author     = {H{\'{e}}ctor Perez Mart{\'{\i}}nez and Yoshua Bengio and Georgios N. Yannakakis},
  title      = {Learning Deep Physiological Models of Affect},
  journal    = {{IEEE} Comput. Intell. Mag.},
  volume     = {8},
  number     = {2},
  pages      = {20--33},
  year       = {2013},
  url        = {https://doi.org/10.1109/MCI.2013.2247823},
  doi        = {10.1109/MCI.2013.2247823},
  timestamp  = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/cim/MartinezBY13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, IEEE Trans. Pattern Anal. Mach. Intell. 35(8), 2013.
@article{DBLP:journals/pami/BengioCV13,
  author     = {Yoshua Bengio and Aaron C. Courville and Pascal Vincent},
  title      = {Representation Learning: {A} Review and New Perspectives},
  journal    = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume     = {35},
  number     = {8},
  pages      = {1798--1828},
  year       = {2013},
  url        = {https://doi.org/10.1109/TPAMI.2013.50},
  doi        = {10.1109/TPAMI.2013.50},
  timestamp  = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/pami/BengioCV13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, IEEE Trans. Pattern Anal. Mach. Intell. 35(8), 2013.
@article{DBLP:journals/pami/GoodfellowCB13,
  author     = {Ian J. Goodfellow and Aaron C. Courville and Yoshua Bengio},
  title      = {Scaling Up Spike-and-Slab Models for Unsupervised Feature Learning},
  journal    = {{IEEE} Trans. Pattern Anal. Mach. Intell.},
  volume     = {35},
  number     = {8},
  pages      = {1902--1914},
  year       = {2013},
  url        = {https://doi.org/10.1109/TPAMI.2012.273},
  doi        = {10.1109/TPAMI.2012.273},
  timestamp  = {Mon, 16 Sep 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/pami/GoodfellowCB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, AISTATS 2013 (JMLR W&CP volume 31).
% The acronym RBMs is brace-protected in the title so that styles applying
% sentence casing do not lower-case it.
@inproceedings{DBLP:conf/aistats/LuoCCB13,
  author     = {Heng Luo and Pierre Luc Carrier and Aaron C. Courville and Yoshua Bengio},
  title      = {Texture Modeling with Convolutional Spike-and-Slab {RBMs} and Deep Extensions},
  booktitle  = {Proceedings of the Sixteenth International Conference on Artificial Intelligence and Statistics, {AISTATS} 2013, Scottsdale, AZ, USA, April 29 - May 1, 2013},
  series     = {{JMLR} Workshop and Conference Proceedings},
  volume     = {31},
  pages      = {415--423},
  publisher  = {JMLR.org},
  year       = {2013},
  url        = {http://proceedings.mlr.press/v31/luo13a.html},
  timestamp  = {Wed, 29 May 2019 08:41:44 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/LuoCCB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, IEEE CIG 2013.
% The booktitle spells the venue "Computational Intelligence in Games" and
% braces the acronym CIG like the other venue acronyms in this bibliography.
@inproceedings{DBLP:conf/cig/Thibodeau-LauferFYDB13,
  author     = {Eric Thibodeau{-}Laufer and Raul Chandias Ferrari and Li Yao and Olivier Delalleau and Yoshua Bengio},
  title      = {Stacked calibration of off-policy policy evaluation for video game matchmaking},
  booktitle  = {2013 {IEEE} Conference on Computational Intelligence in Games ({CIG}), Niagara Falls, ON, Canada, August 11-13, 2013},
  pages      = {1--8},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/CIG.2013.6633642},
  doi        = {10.1109/CIG.2013.6633642},
  timestamp  = {Wed, 16 Oct 2019 14:14:56 +0200},
  biburl     = {https://dblp.org/rec/conf/cig/Thibodeau-LauferFYDB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ICASSP 2013.
@inproceedings{DBLP:conf/icassp/Boulanger-LewandowskiBV13,
  author     = {Nicolas Boulanger{-}Lewandowski and Yoshua Bengio and Pascal Vincent},
  title      = {High-dimensional sequence transduction},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages      = {3178--3182},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/ICASSP.2013.6638244},
  doi        = {10.1109/ICASSP.2013.6638244},
  timestamp  = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl     = {https://dblp.org/rec/conf/icassp/Boulanger-LewandowskiBV13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ICASSP 2013.
@inproceedings{DBLP:conf/icassp/BengioBP13,
  author     = {Yoshua Bengio and Nicolas Boulanger{-}Lewandowski and Razvan Pascanu},
  title      = {Advances in optimizing recurrent networks},
  booktitle  = {{IEEE} International Conference on Acoustics, Speech and Signal Processing, {ICASSP} 2013, Vancouver, BC, Canada, May 26-31, 2013},
  pages      = {8624--8628},
  publisher  = {{IEEE}},
  year       = {2013},
  url        = {https://doi.org/10.1109/ICASSP.2013.6639349},
  doi        = {10.1109/ICASSP.2013.6639349},
  timestamp  = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icassp/BengioBP13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ICMI 2013 (27 authors; the list is wrapped several names per line).
@inproceedings{DBLP:conf/icmi/KanouPBFGMVCBFMJCDBAZLRDPWTSBKW13,
  author     = {Samira Ebrahimi Kahou and Christopher J. Pal and Xavier Bouthillier and
                Pierre Froumenty and {\c{C}}aglar G{\"{u}}l{\c{c}}ehre and Roland Memisevic and
                Pascal Vincent and Aaron C. Courville and Yoshua Bengio and
                Raul Chandias Ferrari and Mehdi Mirza and S{\'{e}}bastien Jean and
                Pierre Luc Carrier and Yann N. Dauphin and Nicolas Boulanger{-}Lewandowski and
                Abhishek Aggarwal and Jeremie Zumer and Pascal Lamblin and
                Jean{-}Philippe Raymond and Guillaume Desjardins and Razvan Pascanu and
                David Warde{-}Farley and Atousa Torabi and Arjun Sharma and
                Emmanuel Bengio and Kishore Reddy Konda and Zhenzhou Wu},
  editor     = {Julien Epps and Fang Chen and Sharon L. Oviatt and Kenji Mase and
                Andrew Sears and Kristiina Jokinen and Bj{\"{o}}rn W. Schuller},
  title      = {Combining modality specific deep neural networks for emotion recognition in video},
  booktitle  = {2013 International Conference on Multimodal Interaction, {ICMI} '13, Sydney, NSW, Australia, December 9-13, 2013},
  pages      = {543--550},
  publisher  = {{ACM}},
  year       = {2013},
  url        = {https://doi.org/10.1145/2522848.2531745},
  doi        = {10.1145/2522848.2531745},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icmi/KanouPBFGMVCBFMJCDBAZLRDPWTSBKW13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ICML 2013 (JMLR W&CP volume 28).
@inproceedings{DBLP:conf/icml/BengioMDR13,
  author     = {Yoshua Bengio and Gr{\'{e}}goire Mesnil and Yann N. Dauphin and Salah Rifai},
  title      = {Better Mixing via Deep Representations},
  booktitle  = {Proceedings of the 30th International Conference on Machine Learning, {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series     = {{JMLR} Workshop and Conference Proceedings},
  volume     = {28},
  pages      = {552--560},
  publisher  = {JMLR.org},
  year       = {2013},
  url        = {http://proceedings.mlr.press/v28/bengio13.html},
  timestamp  = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/BengioMDR13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ICML 2013 (JMLR W&CP volume 28).
@inproceedings{DBLP:conf/icml/PascanuMB13,
  author     = {Razvan Pascanu and Tom{\'{a}}s Mikolov and Yoshua Bengio},
  title      = {On the difficulty of training recurrent neural networks},
  booktitle  = {Proceedings of the 30th International Conference on Machine Learning, {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series     = {{JMLR} Workshop and Conference Proceedings},
  volume     = {28},
  pages      = {1310--1318},
  publisher  = {JMLR.org},
  year       = {2013},
  url        = {http://proceedings.mlr.press/v28/pascanu13.html},
  timestamp  = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/PascanuMB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ICML 2013 (JMLR W&CP volume 28).
@inproceedings{DBLP:conf/icml/GoodfellowWMCB13,
  author     = {Ian J. Goodfellow and David Warde{-}Farley and Mehdi Mirza and Aaron C. Courville and Yoshua Bengio},
  title      = {Maxout Networks},
  booktitle  = {Proceedings of the 30th International Conference on Machine Learning, {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series     = {{JMLR} Workshop and Conference Proceedings},
  volume     = {28},
  pages      = {1319--1327},
  publisher  = {JMLR.org},
  year       = {2013},
  url        = {http://proceedings.mlr.press/v28/goodfellow13.html},
  timestamp  = {Wed, 29 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/GoodfellowWMCB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ICONIP 2013, LNCS volume 8228 (28 authors; the list is wrapped several names per line).
@inproceedings{DBLP:conf/iconip/GoodfellowECCMHCTTLZRFLWASMPIPGBXRXZB13,
  author     = {Ian J. Goodfellow and Dumitru Erhan and Pierre Luc Carrier and Aaron C. Courville and
                Mehdi Mirza and Benjamin Hamner and William Cukierski and Yichuan Tang and
                David Thaler and Dong{-}Hyun Lee and Yingbo Zhou and Chetan Ramaiah and
                Fangxiang Feng and Ruifan Li and Xiaojie Wang and Dimitris Athanasakis and
                John Shawe{-}Taylor and Maxim Milakov and John Park and Radu Tudor Ionescu and
                Marius Popescu and Cristian Grozea and James Bergstra and Jingjing Xie and
                Lukasz Romaszko and Bing Xu and Chuang Zhang and Yoshua Bengio},
  editor     = {Minho Lee and Akira Hirose and Zeng{-}Guang Hou and Rhee Man Kil},
  title      = {Challenges in Representation Learning: {A} Report on Three Machine Learning Contests},
  booktitle  = {Neural Information Processing - 20th International Conference, {ICONIP} 2013, Daegu, Korea, November 3-7, 2013. Proceedings, Part {III}},
  series     = {Lecture Notes in Computer Science},
  volume     = {8228},
  pages      = {117--124},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-642-42051-1\_16},
  doi        = {10.1007/978-3-642-42051-1\_16},
  timestamp  = {Mon, 15 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/iconip/GoodfellowECCMHCTTLZRFLWASMPIPGBXRXZB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Paper in the ICPRAM 2013 revised selected papers volume (Advances in
% Intelligent Systems and Computing 318).
% The editor "De Marsico, Maria" is given in comma form so the compound
% surname "De Marsico" is not split into a middle name plus "Marsico".
@inproceedings{DBLP:conf/icpram/MesnilRBGBV13a,
  author     = {Gr{\'{e}}goire Mesnil and Salah Rifai and Antoine Bordes and Xavier Glorot and Yoshua Bengio and Pascal Vincent},
  editor     = {Ana L. N. Fred and De Marsico, Maria},
  title      = {Unsupervised Learning of Semantics of Object Detections for Scene Categorization},
  booktitle  = {Pattern Recognition Applications and Methods - International Conference, {ICPRAM} 2013 Barcelona, Spain, February 15-18, 2013 Revised Selected Papers},
  series     = {Advances in Intelligent Systems and Computing},
  volume     = {318},
  pages      = {209--224},
  publisher  = {Springer},
  year       = {2013},
  url        = {https://doi.org/10.1007/978-3-319-12610-4\_13},
  doi        = {10.1007/978-3-319-12610-4\_13},
  timestamp  = {Thu, 15 Jun 2017 21:36:18 +0200},
  biburl     = {https://dblp.org/rec/conf/icpram/MesnilRBGBV13a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ICPRAM 2013 (SciTePress proceedings; no url or doi recorded).
% The editor "De Marsico, Maria" is given in comma form so the compound
% surname "De Marsico" is not split into a middle name plus "Marsico".
@inproceedings{DBLP:conf/icpram/MesnilRBGBV13,
  author     = {Gr{\'{e}}goire Mesnil and Salah Rifai and Antoine Bordes and Xavier Glorot and Yoshua Bengio and Pascal Vincent},
  editor     = {De Marsico, Maria and Ana L. N. Fred},
  title      = {Unsupervised and Transfer Learning under Uncertainty - From Object Detections to Scene Categorization},
  booktitle  = {{ICPRAM} 2013 - Proceedings of the 2nd International Conference on Pattern Recognition Applications and Methods, Barcelona, Spain, 15-18 February, 2013},
  pages      = {345--354},
  publisher  = {SciTePress},
  year       = {2013},
  timestamp  = {Tue, 01 Oct 2013 13:16:05 +0200},
  biburl     = {https://dblp.org/rec/conf/icpram/MesnilRBGBV13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, INTERSPEECH 2013.
@inproceedings{DBLP:conf/interspeech/MesnilHDB13,
  author     = {Gr{\'{e}}goire Mesnil and Xiaodong He and Li Deng and Yoshua Bengio},
  editor     = {Fr{\'{e}}d{\'{e}}ric Bimbot and Christophe Cerisara and C{\'{e}}cile Fougeron and Guillaume Gravier and Lori Lamel and Fran{\c{c}}ois Pellegrino and Pascal Perrier},
  title      = {Investigation of recurrent-neural-network architectures and learning methods for spoken language understanding},
  booktitle  = {{INTERSPEECH} 2013, 14th Annual Conference of the International Speech Communication Association, Lyon, France, August 25-29, 2013},
  pages      = {3771--3775},
  publisher  = {{ISCA}},
  year       = {2013},
  url        = {https://doi.org/10.21437/Interspeech.2013-596},
  doi        = {10.21437/INTERSPEECH.2013-596},
  timestamp  = {Fri, 23 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/interspeech/MesnilHDB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, ISMIR 2013 (no publisher or doi recorded).
% The first editor uses the "von Last, Jr, First" form so that the suffix
% "Jr." is parsed as a name suffix rather than as part of the surname.
@inproceedings{DBLP:conf/ismir/Boulanger-LewandowskiBV13,
  author     = {Nicolas Boulanger{-}Lewandowski and Yoshua Bengio and Pascal Vincent},
  editor     = {de Souza Britto, Jr., Alceu and Fabien Gouyon and Simon Dixon},
  title      = {Audio Chord Recognition with Recurrent Neural Networks},
  booktitle  = {Proceedings of the 14th International Society for Music Information Retrieval Conference, {ISMIR} 2013, Curitiba, Brazil, November 4-8, 2013},
  pages      = {335--340},
  year       = {2013},
  url        = {http://www.ppgia.pucpr.br/ismir2013/wp-content/uploads/2013/09/243\_Paper.pdf},
  timestamp  = {Thu, 05 Dec 2013 18:14:04 +0100},
  biburl     = {https://dblp.org/rec/conf/ismir/Boulanger-LewandowskiBV13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, NIPS 2013 (Advances in Neural Information Processing Systems 26).
% The proper noun Boltzmann is brace-protected in the title so that styles
% applying sentence casing do not lower-case it.
@inproceedings{DBLP:conf/nips/GoodfellowMCB13,
  author     = {Ian J. Goodfellow and Mehdi Mirza and Aaron C. Courville and Yoshua Bengio},
  editor     = {Christopher J. C. Burges and L{\'{e}}on Bottou and Zoubin Ghahramani and Kilian Q. Weinberger},
  title      = {Multi-Prediction Deep {Boltzmann} Machines},
  booktitle  = {Advances in Neural Information Processing Systems 26: 27th Annual Conference on Neural Information Processing Systems 2013. Proceedings of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages      = {548--556},
  year       = {2013},
  url        = {https://proceedings.neurips.cc/paper/2013/hash/0bb4aec1710521c12ee76289d9440817-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/GoodfellowMCB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, NIPS 2013 (Advances in Neural Information Processing Systems 26).
@inproceedings{DBLP:conf/nips/BengioYAV13,
  author     = {Yoshua Bengio and Li Yao and Guillaume Alain and Pascal Vincent},
  editor     = {Christopher J. C. Burges and L{\'{e}}on Bottou and Zoubin Ghahramani and Kilian Q. Weinberger},
  title      = {Generalized Denoising Auto-Encoders as Generative Models},
  booktitle  = {Advances in Neural Information Processing Systems 26: 27th Annual Conference on Neural Information Processing Systems 2013. Proceedings of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages      = {899--907},
  year       = {2013},
  url        = {https://proceedings.neurips.cc/paper/2013/hash/559cb990c9dffd8675f6bc2186971dc2-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/BengioYAV13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper, NIPS 2013 (Advances in Neural Information Processing Systems 26).
% The acronym RBMs is brace-protected in the title so that styles applying
% sentence casing do not lower-case it.
@inproceedings{DBLP:conf/nips/DauphinB13,
  author     = {Yann N. Dauphin and Yoshua Bengio},
  editor     = {Christopher J. C. Burges and L{\'{e}}on Bottou and Zoubin Ghahramani and Kilian Q. Weinberger},
  title      = {Stochastic Ratio Matching of {RBMs} for Sparse High-Dimensional Inputs},
  booktitle  = {Advances in Neural Information Processing Systems 26: 27th Annual Conference on Neural Information Processing Systems 2013. Proceedings of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages      = {1340--1348},
  year       = {2013},
  url        = {https://proceedings.neurips.cc/paper/2013/hash/7f5d04d189dfb634e6a85bb9d9adf21e-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/DauphinB13.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/sigir/SordoniNB13,
  author       = {Sordoni, Alessandro and
                  Nie, Jian{-}Yun and
                  Bengio, Yoshua},
  editor       = {Jones, Gareth J. F. and
                  Sheridan, Paraic and
                  Kelly, Diane and
                  de Rijke, Maarten and
                  Sakai, Tetsuya},
  title        = {Modeling term dependencies with quantum language models for {IR}},
  booktitle    = {The 36th International {ACM} {SIGIR} conference on research and development
                  in Information Retrieval, {SIGIR} '13, Dublin, Ireland - July 28 -
                  August 01, 2013},
  pages        = {653--662},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://doi.org/10.1145/2484028.2484098},
  doi          = {10.1145/2484028.2484098},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sigir/SordoniNB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Same author and title as the CoRR record DBLP:journals/corr/abs-1305-0445 in this file
% (presumably its arXiv preprint; confirm before citing both).
@inproceedings{DBLP:conf/slsp/Bengio13,
  author       = {Bengio, Yoshua},
  editor       = {Dediu, Adrian{-}Horia and
                  Mart{\'{\i}}n{-}Vide, Carlos and
                  Mitkov, Ruslan and
                  Truthe, Bianca},
  title        = {Deep Learning of Representations: Looking Forward},
  booktitle    = {Statistical Language and Speech Processing - First International Conference,
                  {SLSP} 2013, Tarragona, Spain, July 29-31, 2013. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {7978},
  pages        = {1--37},
  publisher    = {Springer},
  year         = {2013},
  url          = {https://doi.org/10.1007/978-3-642-39593-2\_1},
  doi          = {10.1007/978-3-642-39593-2\_1},
  timestamp    = {Sun, 02 Oct 2022 16:15:34 +0200},
  biburl       = {https://dblp.org/rec/conf/slsp/Bengio13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2013 conference-track paper; the key keeps the journals/corr prefix used in biburl.
@inproceedings{DBLP:journals/corr/abs-1211-4246,
  author       = {Alain, Guillaume and
                  Bengio, Yoshua and
                  Rifai, Salah},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Regularized Auto-Encoders Estimate Local Statistics},
  booktitle    = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Conference Track Proceedings},
  year         = {2013},
  url          = {http://arxiv.org/abs/1211.4246},
  timestamp    = {Thu, 04 Apr 2019 13:20:07 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1211-4246.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/abs-1301-3485,
  author       = {Glorot, Xavier and
                  Bordes, Antoine and
                  Weston, Jason and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {A Semantic Matching Energy Function for Learning with Multi-relational
                  Data},
  booktitle    = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Workshop Track Proceedings},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.3485},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-3485.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun Boltzmann is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:journals/corr/abs-1301-3545,
  author       = {Desjardins, Guillaume and
                  Pascanu, Razvan and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Metric-Free Natural Gradient for Joint-Training of {Boltzmann} Machines},
  booktitle    = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Conference Track Proceedings},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.3545},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-3545.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun Boltzmann is brace-protected so sentence-casing styles keep its capital.
@inproceedings{DBLP:journals/corr/abs-1301-3568,
  author       = {Goodfellow, Ian J. and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Joint Training Deep {Boltzmann} Machines for Classification},
  booktitle    = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Workshop Track Proceedings},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.3568},
  timestamp    = {Fri, 29 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-3568.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/abs-1301-3583,
  author       = {Dauphin, Yann N. and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Big Neural Networks Waste Capacity},
  booktitle    = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Workshop Track Proceedings},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.3583},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-3583.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Key and url both carry the v4 suffix, i.e. they point at one specific arXiv version.
@inproceedings{DBLP:journals/corr/abs-1301-3584v4,
  author       = {Pascanu, Razvan and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Natural Gradient Revisited},
  booktitle    = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Workshop Track Proceedings},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.3584v4},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-3584v4.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/corr/abs-1301-4083,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {Knowledge Matters: Importance of Prior Information for Optimization},
  booktitle    = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Conference Track Proceedings},
  year         = {2013},
  url          = {http://arxiv.org/abs/1301.4083},
  timestamp    = {Fri, 29 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1301-4083.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:series/isrl/BengioC13,
  author       = {Bengio, Yoshua and
                  Courville, Aaron C.},
  editor       = {Bianchini, Monica and
                  Maggini, Marco and
                  Jain, Lakhmi C.},
  title        = {Deep Learning of Representations},
  booktitle    = {Handbook on Neural Information Processing},
  series       = {Intelligent Systems Reference Library},
  volume       = {49},
  pages        = {1--28},
  publisher    = {Springer},
  year         = {2013},
  url          = {https://doi.org/10.1007/978-3-642-36657-4\_1},
  doi          = {10.1007/978-3-642-36657-4\_1},
  timestamp    = {Tue, 16 May 2017 14:24:22 +0200},
  biburl       = {https://dblp.org/rec/series/isrl/BengioC13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Whole-proceedings record for the ICLR 2013 conference track.
@proceedings{DBLP:conf/iclr/2013,
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Conference Track Proceedings},
  year         = {2013},
  url          = {https://openreview.net/group?id=ICLR.cc/2013},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/2013.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Whole-proceedings record for the ICLR 2013 workshop track.
@proceedings{DBLP:conf/iclr/2013w,
  editor       = {Bengio, Yoshua and
                  LeCun, Yann},
  title        = {1st International Conference on Learning Representations, {ICLR} 2013,
                  Scottsdale, Arizona, USA, May 2-4, 2013, Workshop Track Proceedings},
  year         = {2013},
  url          = {https://openreview.net/group?id=ICLR.cc/2013},
  timestamp    = {Thu, 04 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/2013w.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1302-4389,
  author       = {Goodfellow, Ian J. and
                  Warde{-}Farley, David and
                  Mirza, Mehdi and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {Maxout Networks},
  journal      = {CoRR},
  volume       = {abs/1302.4389},
  year         = {2013},
  url          = {http://arxiv.org/abs/1302.4389},
  eprinttype   = {arXiv},
  eprint       = {1302.4389},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1302-4389.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Same author and title as the SLSP 2013 record DBLP:conf/slsp/Bengio13 in this file
% (presumably the arXiv preprint of that paper; confirm before citing both).
@article{DBLP:journals/corr/abs-1305-0445,
  author       = {Bengio, Yoshua},
  title        = {Deep Learning of Representations: Looking Forward},
  journal      = {CoRR},
  volume       = {abs/1305.0445},
  year         = {2013},
  url          = {http://arxiv.org/abs/1305.0445},
  eprinttype   = {arXiv},
  eprint       = {1305.0445},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1305-0445.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1305-2982,
  author       = {Bengio, Yoshua},
  title        = {Estimating or Propagating Gradients Through Stochastic Neurons},
  journal      = {CoRR},
  volume       = {abs/1305.2982},
  year         = {2013},
  url          = {http://arxiv.org/abs/1305.2982},
  eprinttype   = {arXiv},
  eprint       = {1305.2982},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1305-2982.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Same authors and title as the NIPS 2013 record DBLP:conf/nips/BengioYAV13 in this file
% (presumably the arXiv preprint of that paper; confirm before citing both).
@article{DBLP:journals/corr/abs-1305-6663,
  author       = {Bengio, Yoshua and
                  Yao, Li and
                  Alain, Guillaume and
                  Vincent, Pascal},
  title        = {Generalized Denoising Auto-Encoders as Generative Models},
  journal      = {CoRR},
  volume       = {abs/1305.6663},
  year         = {2013},
  url          = {http://arxiv.org/abs/1305.6663},
  eprinttype   = {arXiv},
  eprint       = {1305.6663},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1305-6663.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BengioT13,
  author       = {Bengio, Yoshua and
                  Thibodeau{-}Laufer, Eric and
                  Yosinski, Jason},
  title        = {Deep Generative Stochastic Networks Trainable by Backprop},
  journal      = {CoRR},
  volume       = {abs/1306.1091},
  year         = {2013},
  url          = {http://arxiv.org/abs/1306.1091},
  eprinttype   = {arXiv},
  eprint       = {1306.1091},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioT13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GoodfellowECCMHCTTLZRFLWASMPIPGBXRXZB13,
  author       = {Goodfellow, Ian J. and
                  Erhan, Dumitru and
                  Carrier, Pierre Luc and
                  Courville, Aaron C. and
                  Mirza, Mehdi and
                  Hamner, Benjamin and
                  Cukierski, William and
                  Tang, Yichuan and
                  Thaler, David and
                  Lee, Dong{-}Hyun and
                  Zhou, Yingbo and
                  Ramaiah, Chetan and
                  Feng, Fangxiang and
                  Li, Ruifan and
                  Wang, Xiaojie and
                  Athanasakis, Dimitris and
                  Shawe{-}Taylor, John and
                  Milakov, Maxim and
                  Park, John and
                  Ionescu, Radu Tudor and
                  Popescu, Marius and
                  Grozea, Cristian and
                  Bergstra, James and
                  Xie, Jingjing and
                  Romaszko, Lukasz and
                  Xu, Bing and
                  Zhang, Chuang and
                  Bengio, Yoshua},
  title        = {Challenges in Representation Learning: {A} report on three machine
                  learning contests},
  journal      = {CoRR},
  volume       = {abs/1307.0414},
  year         = {2013},
  url          = {http://arxiv.org/abs/1307.0414},
  eprinttype   = {arXiv},
  eprint       = {1307.0414},
  timestamp    = {Mon, 15 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/GoodfellowECCMHCTTLZRFLWASMPIPGBXRXZB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/BengioLC13,
  author       = {Bengio, Yoshua and
                  L{\'{e}}onard, Nicholas and
                  Courville, Aaron C.},
  title        = {Estimating or Propagating Gradients Through Stochastic Neurons for
                  Conditional Computation},
  journal      = {CoRR},
  volume       = {abs/1308.3432},
  year         = {2013},
  url          = {http://arxiv.org/abs/1308.3432},
  eprinttype   = {arXiv},
  eprint       = {1308.3432},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioLC13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GoodfellowWLDMPBBB13,
  author       = {Goodfellow, Ian J. and
                  Warde{-}Farley, David and
                  Lamblin, Pascal and
                  Dumoulin, Vincent and
                  Mirza, Mehdi and
                  Pascanu, Razvan and
                  Bergstra, James and
                  Bastien, Fr{\'{e}}d{\'{e}}ric and
                  Bengio, Yoshua},
  title        = {Pylearn2: a machine learning research library},
  journal      = {CoRR},
  volume       = {abs/1308.4214},
  year         = {2013},
  url          = {http://arxiv.org/abs/1308.4214},
  eprinttype   = {arXiv},
  eprint       = {1308.4214},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GoodfellowWLDMPBBB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/GulcehreCPB13,
  author       = {G{\"{u}}l{\c{c}}ehre, {\c{C}}aglar and
                  Cho, Kyunghyun and
                  Pascanu, Razvan and
                  Bengio, Yoshua},
  title        = {Learned-norm pooling for deep neural networks},
  journal      = {CoRR},
  volume       = {abs/1311.1780},
  year         = {2013},
  url          = {http://arxiv.org/abs/1311.1780},
  eprinttype   = {arXiv},
  eprint       = {1311.1780},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GulcehreCPB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The acronym RBMs is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/DumoulinGCB13,
  author       = {Dumoulin, Vincent and
                  Goodfellow, Ian J. and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {On the Challenges of Physical Implementations of {RBMs}},
  journal      = {CoRR},
  volume       = {abs/1312.5258},
  year         = {2013},
  url          = {http://arxiv.org/abs/1312.5258},
  eprinttype   = {arXiv},
  eprint       = {1312.5258},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DumoulinGCB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Title is stored in consistent title case; the proper noun Boltzmann is brace-protected
% so sentence-casing styles keep its capital.
@article{DBLP:journals/ci/BengioCDLSHL12,
  author       = {Bengio, Yoshua and
                  Chapados, Nicolas and
                  Delalleau, Olivier and
                  Larochelle, Hugo and
                  Saint{-}Mleux, Xavier and
                  Hudon, Christian and
                  Louradour, J{\'{e}}r{\^{o}}me},
  title        = {Detonation Classification from Acoustic Signature with the Restricted
                  {Boltzmann} Machine},
  journal      = {Comput. Intell.},
  volume       = {28},
  number       = {2},
  pages        = {261--288},
  year         = {2012},
  url          = {https://doi.org/10.1111/j.1467-8640.2012.00419.x},
  doi          = {10.1111/J.1467-8640.2012.00419.X},
  timestamp    = {Sun, 15 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ci/BengioCDLSHL12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/BergstraB12,
  author       = {Bergstra, James and
                  Bengio, Yoshua},
  title        = {Random Search for Hyper-Parameter Optimization},
  journal      = {J. Mach. Learn. Res.},
  volume       = {13},
  pages        = {281--305},
  year         = {2012},
  url          = {https://dl.acm.org/doi/10.5555/2503308.2188395},
  doi          = {10.5555/2503308.2188395},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/BergstraB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun Boltzmann is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/jmlr/LarochelleMPB12,
  author       = {Larochelle, Hugo and
                  Mandel, Michael I. and
                  Pascanu, Razvan and
                  Bengio, Yoshua},
  title        = {Learning Algorithms for the Classification Restricted {Boltzmann} Machine},
  journal      = {J. Mach. Learn. Res.},
  volume       = {13},
  pages        = {643--669},
  year         = {2012},
  url          = {https://dl.acm.org/doi/10.5555/2503308.2188407},
  doi          = {10.5555/2503308.2188407},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/LarochelleMPB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The product name Ghost Recon Online is brace-protected so sentence-casing styles keep
% its capitals.
% NOTE(review): the fourth author is kept as BibTeX parsed the original (surname Ferrari);
% confirm whether the surname is actually the compound Chandias Ferrari.
@article{DBLP:journals/tciaig/DelalleauCTFBZ12,
  author       = {Delalleau, Olivier and
                  Contal, Emile and
                  Thibodeau{-}Laufer, Eric and
                  Ferrari, Raul Chandias and
                  Bengio, Yoshua and
                  Zhang, Frank},
  title        = {Beyond Skill Rating: Advanced Matchmaking in {Ghost Recon Online}},
  journal      = {{IEEE} Trans. Comput. Intell. {AI} Games},
  volume       = {4},
  number       = {3},
  pages        = {167--177},
  year         = {2012},
  url          = {https://doi.org/10.1109/TCIAIG.2012.2188833},
  doi          = {10.1109/TCIAIG.2012.2188833},
  timestamp    = {Wed, 13 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tciaig/DelalleauCTFBZ12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Publisher uses the society name exactly as the booktitle spells it
% (Association for Computational Linguistics).
@inproceedings{DBLP:conf/acl/SocherBM12,
  author       = {Socher, Richard and
                  Bengio, Yoshua and
                  Manning, Christopher D.},
  title        = {Deep Learning for {NLP} (without Magic)},
  booktitle    = {The 50th Annual Meeting of the Association for Computational Linguistics,
                  Tutorial Abstracts, July 8, 2012, Jeju Island, Korea},
  pages        = {5},
  publisher    = {Association for Computational Linguistics},
  year         = {2012},
  url          = {https://aclanthology.org/P12-4005/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SocherBM12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eccv/RifaiBCVM12,
  author       = {Rifai, Salah and
                  Bengio, Yoshua and
                  Courville, Aaron C. and
                  Vincent, Pascal and
                  Mirza, Mehdi},
  editor       = {Fitzgibbon, Andrew W. and
                  Lazebnik, Svetlana and
                  Perona, Pietro and
                  Sato, Yoichi and
                  Schmid, Cordelia},
  title        = {Disentangling Factors of Variation for Facial Expression Recognition},
  booktitle    = {Computer Vision - {ECCV} 2012 - 12th European Conference on Computer
                  Vision, Florence, Italy, October 7-13, 2012, Proceedings, Part {VI}},
  series       = {Lecture Notes in Computer Science},
  volume       = {7577},
  pages        = {808--822},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-33783-3\_58},
  doi          = {10.1007/978-3-642-33783-3\_58},
  timestamp    = {Thu, 27 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eccv/RifaiBCVM12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/Boulanger-LewandowskiBV12,
  author       = {Boulanger{-}Lewandowski, Nicolas and
                  Bengio, Yoshua and
                  Vincent, Pascal},
  title        = {Modeling Temporal Dependencies in High-Dimensional Sequences: Application
                  to Polyphonic Music Generation and Transcription},
  booktitle    = {Proceedings of the 29th International Conference on Machine Learning,
                  {ICML} 2012, Edinburgh, Scotland, UK, June 26 - July 1, 2012},
  publisher    = {icml.cc / Omnipress},
  year         = {2012},
  url          = {http://icml.cc/2012/papers/590.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/Boulanger-LewandowskiBV12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/GoodfellowCB12,
  author       = {Goodfellow, Ian J. and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {Large-Scale Feature Learning With Spike-and-Slab Sparse Coding},
  booktitle    = {Proceedings of the 29th International Conference on Machine Learning,
                  {ICML} 2012, Edinburgh, Scotland, UK, June 26 - July 1, 2012},
  publisher    = {icml.cc / Omnipress},
  year         = {2012},
  url          = {http://icml.cc/2012/papers/718.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/GoodfellowCB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/RifaiDVB12,
  author       = {Rifai, Salah and
                  Dauphin, Yann N. and
                  Vincent, Pascal and
                  Bengio, Yoshua},
  title        = {A Generative Process for Contractive Auto-Encoders},
  booktitle    = {Proceedings of the 29th International Conference on Machine Learning,
                  {ICML} 2012, Edinburgh, Scotland, UK, June 26 - July 1, 2012},
  publisher    = {icml.cc / Omnipress},
  year         = {2012},
  url          = {http://icml.cc/2012/papers/910.pdf},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/RifaiDVB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/Boulanger-LewandowskiBV12,
  author       = {Boulanger{-}Lewandowski, Nicolas and
                  Bengio, Yoshua and
                  Vincent, Pascal},
  editor       = {Gouyon, Fabien and
                  Herrera, Perfecto and
                  Martins, Luis Gustavo and
                  M{\"{u}}ller, Meinard},
  title        = {Discriminative Non-negative Matrix Factorization for Multiple Pitch
                  Estimation},
  booktitle    = {Proceedings of the 13th International Society for Music Information
                  Retrieval Conference, {ISMIR} 2012, Mosteiro S.Bento Da Vit{\'{o}}ria,
                  Porto, Portugal, October 8-12, 2012},
  pages        = {205--210},
  publisher    = {{FEUP} Edi{\c{c}}{\~{o}}es},
  year         = {2012},
  url          = {http://ismir2012.ismir.net/event/papers/205-ismir-2012.pdf},
  timestamp    = {Tue, 04 Jan 2022 10:38:10 +0100},
  biburl       = {https://dblp.org/rec/conf/ismir/Boulanger-LewandowskiBV12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/HamelBE12,
  author       = {Hamel, Philippe and
                  Bengio, Yoshua and
                  Eck, Douglas},
  editor       = {Gouyon, Fabien and
                  Herrera, Perfecto and
                  Martins, Luis Gustavo and
                  M{\"{u}}ller, Meinard},
  title        = {Building Musically-relevant Audio Features through Multiple Timescale
                  Representations},
  booktitle    = {Proceedings of the 13th International Society for Music Information
                  Retrieval Conference, {ISMIR} 2012, Mosteiro S.Bento Da Vit{\'{o}}ria,
                  Porto, Portugal, October 8-12, 2012},
  pages        = {553--558},
  publisher    = {{FEUP} Edi{\c{c}}{\~{o}}es},
  year         = {2012},
  url          = {http://ismir2012.ismir.net/event/papers/553-ismir-2012.pdf},
  timestamp    = {Tue, 04 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ismir/HamelBE12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper in JMLR Proceedings volume 27; the key keeps the journals/jmlr prefix
% used in biburl.
@inproceedings{DBLP:journals/jmlr/Bengio12,
  author       = {Bengio, Yoshua},
  editor       = {Guyon, Isabelle and
                  Dror, Gideon and
                  Lemaire, Vincent and
                  Taylor, Graham W. and
                  Silver, Daniel L.},
  title        = {Deep Learning of Representations for Unsupervised and Transfer Learning},
  booktitle    = {Unsupervised and Transfer Learning - Workshop held at {ICML} 2011,
                  Bellevue, Washington, USA, July 2, 2011},
  series       = {{JMLR} Proceedings},
  volume       = {27},
  pages        = {17--36},
  publisher    = {JMLR.org},
  year         = {2012},
  url          = {http://proceedings.mlr.press/v27/bengio12a.html},
  timestamp    = {Wed, 02 Sep 2020 16:33:18 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/Bengio12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/jmlr/MesnilDGRBGLMDWVCB12,
  author       = {Mesnil, Gr{\'{e}}goire and
                  Dauphin, Yann N. and
                  Glorot, Xavier and
                  Rifai, Salah and
                  Bengio, Yoshua and
                  Goodfellow, Ian J. and
                  Lavoie, Erick and
                  Muller, Xavier and
                  Desjardins, Guillaume and
                  Warde{-}Farley, David and
                  Vincent, Pascal and
                  Courville, Aaron C. and
                  Bergstra, James},
  editor       = {Guyon, Isabelle and
                  Dror, Gideon and
                  Lemaire, Vincent and
                  Taylor, Graham W. and
                  Silver, Daniel L.},
  title        = {Unsupervised and Transfer Learning Challenge: a Deep Learning Approach},
  booktitle    = {Unsupervised and Transfer Learning - Workshop held at {ICML} 2011,
                  Bellevue, Washington, USA, July 2, 2011},
  series       = {{JMLR} Proceedings},
  volume       = {27},
  pages        = {97--110},
  publisher    = {JMLR.org},
  year         = {2012},
  url          = {http://proceedings.mlr.press/v27/mesnil12a.html},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/MesnilDGRBGLMDWVCB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/jmlr/BordesGWB12,
  author       = {Bordes, Antoine and
                  Glorot, Xavier and
                  Weston, Jason and
                  Bengio, Yoshua},
  editor       = {Lawrence, Neil D. and
                  Girolami, Mark A.},
  title        = {Joint Learning of Words and Meaning Representations for Open-Text
                  Semantic Parsing},
  booktitle    = {Proceedings of the Fifteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2012, La Palma, Canary Islands,
                  Spain, April 21-23, 2012},
  series       = {{JMLR} Proceedings},
  volume       = {22},
  pages        = {127--135},
  publisher    = {JMLR.org},
  year         = {2012},
  url          = {http://proceedings.mlr.press/v22/bordes12.html},
  timestamp    = {Wed, 29 May 2019 08:41:44 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/BordesGWB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Same author and (up to capitalisation) title as the CoRR record
% DBLP:journals/corr/abs-1206-5533 in this file (presumably its arXiv preprint; confirm).
@incollection{DBLP:series/lncs/Bengio12,
  author       = {Bengio, Yoshua},
  editor       = {Montavon, Gr{\'{e}}goire and
                  Orr, Genevieve B. and
                  M{\"{u}}ller, Klaus{-}Robert},
  title        = {Practical Recommendations for Gradient-Based Training of Deep Architectures},
  booktitle    = {Neural Networks: Tricks of the Trade - Second Edition},
  series       = {Lecture Notes in Computer Science},
  volume       = {7700},
  pages        = {437--478},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-35289-8\_26},
  doi          = {10.1007/978-3-642-35289-8\_26},
  timestamp    = {Wed, 25 Sep 2019 17:41:07 +0200},
  biburl       = {https://dblp.org/rec/series/lncs/Bengio12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1201-3382,
  author       = {Goodfellow, Ian J. and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {Spike-and-Slab Sparse Coding for Unsupervised Feature Discovery},
  journal      = {CoRR},
  volume       = {abs/1201.3382},
  year         = {2012},
  url          = {http://arxiv.org/abs/1201.3382},
  eprinttype   = {arXiv},
  eprint       = {1201.3382},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1201-3382.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1203-2990,
  author       = {Bengio, Yoshua},
  title        = {Evolving Culture vs Local Minima},
  journal      = {CoRR},
  volume       = {abs/1203.2990},
  year         = {2012},
  url          = {http://arxiv.org/abs/1203.2990},
  eprinttype   = {arXiv},
  eprint       = {1203.2990},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1203-2990.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun Boltzmann is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-1203-4416,
  author       = {Desjardins, Guillaume and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {On Training Deep {Boltzmann} Machines},
  journal      = {CoRR},
  volume       = {abs/1203.4416},
  year         = {2012},
  url          = {http://arxiv.org/abs/1203.4416},
  eprinttype   = {arXiv},
  eprint       = {1203.4416},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1203-4416.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1206-5533,
  author       = {Yoshua Bengio},
  title        = {Practical recommendations for gradient-based training of deep architectures},
  journal      = {CoRR},
  volume       = {abs/1206.5533},
  year         = {2012},
  url          = {http://arxiv.org/abs/1206.5533},
  eprinttype    = {arXiv},
  eprint       = {1206.5533},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1206-5533.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1206-5538,
  author       = {Yoshua Bengio and
                  Aaron C. Courville and
                  Pascal Vincent},
  title        = {Unsupervised Feature Learning and Deep Learning: {A} Review and New
                  Perspectives},
  journal      = {CoRR},
  volume       = {abs/1206.5538},
  year         = {2012},
  url          = {http://arxiv.org/abs/1206.5538},
  eprinttype    = {arXiv},
  eprint       = {1206.5538},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1206-5538.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1207-0057,
  author       = {Yoshua Bengio and
                  Guillaume Alain and
                  Salah Rifai},
  title        = {Implicit Density Estimation by Local Moment Matching to Sample from
                  Auto-Encoders},
  journal      = {CoRR},
  volume       = {abs/1207.0057},
  year         = {2012},
  url          = {http://arxiv.org/abs/1207.0057},
  eprinttype    = {arXiv},
  eprint       = {1207.0057},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1207-0057.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1207-4404,
  author       = {Yoshua Bengio and
                  Gr{\'{e}}goire Mesnil and
                  Yann N. Dauphin and
                  Salah Rifai},
  title        = {Better Mixing via Deep Representations},
  journal      = {CoRR},
  volume       = {abs/1207.4404},
  year         = {2012},
  url          = {http://arxiv.org/abs/1207.4404},
  eprinttype    = {arXiv},
  eprint       = {1207.4404},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1207-4404.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1209-0521,
  author       = {Olivier Delalleau and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Efficient {EM} Training of {Gaussian} Mixtures with Missing Data},
  journal      = {CoRR},
  volume       = {abs/1209.0521},
  year         = {2012},
  url          = {http://arxiv.org/abs/1209.0521},
  eprinttype    = {arXiv},
  eprint       = {1209.0521},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1209-0521.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1210-5474,
  author       = {Guillaume Desjardins and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Disentangling Factors of Variation via Generative Entangling},
  journal      = {CoRR},
  volume       = {abs/1210.5474},
  year         = {2012},
  url          = {http://arxiv.org/abs/1210.5474},
  eprinttype    = {arXiv},
  eprint       = {1210.5474},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1210-5474.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1211-5063,
  author       = {Razvan Pascanu and
                  Tom{\'{a}}s Mikolov and
                  Yoshua Bengio},
  title        = {Understanding the exploding gradient problem},
  journal      = {CoRR},
  volume       = {abs/1211.5063},
  year         = {2012},
  url          = {http://arxiv.org/abs/1211.5063},
  eprinttype    = {arXiv},
  eprint       = {1211.5063},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1211-5063.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1211-5590,
  author       = {Fr{\'{e}}d{\'{e}}ric Bastien and
                  Pascal Lamblin and
                  Razvan Pascanu and
                  James Bergstra and
                  Ian J. Goodfellow and
                  Arnaud Bergeron and
                  Nicolas Bouchard and
                  David Warde{-}Farley and
                  Yoshua Bengio},
  title        = {Theano: new features and speed improvements},
  journal      = {CoRR},
  volume       = {abs/1211.5590},
  year         = {2012},
  url          = {http://arxiv.org/abs/1211.5590},
  eprinttype    = {arXiv},
  eprint       = {1211.5590},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1211-5590.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1211-5687,
  author       = {Heng Luo and
                  Pierre Luc Carrier and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Texture Modeling with Convolutional Spike-and-Slab {RBMs} and Deep Extensions},
  journal      = {CoRR},
  volume       = {abs/1211.5687},
  year         = {2012},
  url          = {http://arxiv.org/abs/1211.5687},
  eprinttype    = {arXiv},
  eprint       = {1211.5687},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1211-5687.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1212-0901,
  author       = {Yoshua Bengio and
                  Nicolas Boulanger{-}Lewandowski and
                  Razvan Pascanu},
  title        = {Advances in Optimizing Recurrent Networks},
  journal      = {CoRR},
  volume       = {abs/1212.0901},
  year         = {2012},
  url          = {http://arxiv.org/abs/1212.0901},
  eprinttype    = {arXiv},
  eprint       = {1212.0901},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1212-0901.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1212-1936,
  author       = {Nicolas Boulanger{-}Lewandowski and
                  Yoshua Bengio and
                  Pascal Vincent},
  title        = {High-dimensional sequence transduction},
  journal      = {CoRR},
  volume       = {abs/1212.1936},
  year         = {2012},
  url          = {http://arxiv.org/abs/1212.1936},
  eprinttype    = {arXiv},
  eprint       = {1212.1936},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1212-1936.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1212-2686,
  author       = {Ian J. Goodfellow and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {Joint Training of Deep {Boltzmann} Machines},
  journal      = {CoRR},
  volume       = {abs/1212.2686},
  year         = {2012},
  url          = {http://arxiv.org/abs/1212.2686},
  eprinttype    = {arXiv},
  eprint       = {1212.2686},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1212-2686.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/BergstraBL11,
  author       = {James Bergstra and
                  Yoshua Bengio and
                  J{\'{e}}r{\^{o}}me Louradour},
  title        = {Suitability of {V1} Energy Models for Object Classification},
  journal      = {Neural Comput.},
  volume       = {23},
  number       = {3},
  pages        = {774--790},
  year         = {2011},
  url          = {https://doi.org/10.1162/NECO\_a\_00084},
  doi          = {10.1162/NECO\_A\_00084},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/BergstraBL11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/BreuleuxBV11,
  author       = {Olivier Breuleux and
                  Yoshua Bengio and
                  Pascal Vincent},
  title        = {Quickly Generating Representative Samples from an {RBM}-Derived Process},
  journal      = {Neural Comput.},
  volume       = {23},
  number       = {8},
  pages        = {2058--2073},
  year         = {2011},
  url          = {https://doi.org/10.1162/NECO\_a\_00158},
  doi          = {10.1162/NECO\_A\_00158},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/BreuleuxBV11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tomccap/MandelPEBASM11,
  author       = {Michael I. Mandel and
                  Razvan Pascanu and
                  Douglas Eck and
                  Yoshua Bengio and
                  Luca Maria Aiello and
                  Rossano Schifanella and
                  Filippo Menczer},
  title        = {Contextual tag inference},
  journal      = {{ACM} Trans. Multim. Comput. Commun. Appl.},
  volume       = {7},
  number       = {Supplement},
  pages        = {32},
  year         = {2011},
  url          = {https://doi.org/10.1145/2037676.2037689},
  doi          = {10.1145/2037676.2037689},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tomccap/MandelPEBASM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/BordesWCB11,
  author       = {Antoine Bordes and
                  Jason Weston and
                  Ronan Collobert and
                  Yoshua Bengio},
  editor       = {Wolfram Burgard and
                  Dan Roth},
  title        = {Learning Structured Embeddings of Knowledge Bases},
  booktitle    = {Proceedings of the Twenty-Fifth {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2011, San Francisco, California, USA, August 7-11, 2011},
  pages        = {301--306},
  publisher    = {{AAAI} Press},
  year         = {2011},
  url          = {https://doi.org/10.1609/aaai.v25i1.7917},
  doi          = {10.1609/AAAI.V25I1.7917},
  timestamp    = {Mon, 04 Sep 2023 16:05:54 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/BordesWCB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/alt/BengioD11,
  author       = {Yoshua Bengio and
                  Olivier Delalleau},
  editor       = {Jyrki Kivinen and
                  Csaba Szepesv{\'{a}}ri and
                  Esko Ukkonen and
                  Thomas Zeugmann},
  title        = {On the Expressive Power of Deep Architectures},
  booktitle    = {Algorithmic Learning Theory - 22nd International Conference, {ALT}
                  2011, Espoo, Finland, October 5-7, 2011. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {6925},
  pages        = {18--36},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-24412-4\_3},
  doi          = {10.1007/978-3-642-24412-4\_3},
  timestamp    = {Tue, 14 May 2019 10:00:51 +0200},
  biburl       = {https://dblp.org/rec/conf/alt/BengioD11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dis/BengioD11,
  author       = {Yoshua Bengio and
                  Olivier Delalleau},
  editor       = {Tapio Elomaa and
                  Jaakko Hollm{\'{e}}n and
                  Heikki Mannila},
  title        = {On the Expressive Power of Deep Architectures},
  booktitle    = {Discovery Science - 14th International Conference, {DS} 2011, Espoo,
                  Finland, October 5-7, 2011. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {6926},
  pages        = {1},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-24477-3\_1},
  doi          = {10.1007/978-3-642-24477-3\_1},
  timestamp    = {Tue, 14 May 2019 10:00:46 +0200},
  biburl       = {https://dblp.org/rec/conf/dis/BengioD11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/GlorotBB11,
  author       = {Xavier Glorot and
                  Antoine Bordes and
                  Yoshua Bengio},
  editor       = {Lise Getoor and
                  Tobias Scheffer},
  title        = {Domain Adaptation for Large-Scale Sentiment Classification: {A} Deep
                  Learning Approach},
  booktitle    = {Proceedings of the 28th International Conference on Machine Learning,
                  {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011},
  pages        = {513--520},
  publisher    = {Omnipress},
  year         = {2011},
  url          = {https://icml.cc/2011/papers/342\_icmlpaper.pdf},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/GlorotBB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/RifaiVMGB11,
  author       = {Salah Rifai and
                  Pascal Vincent and
                  Xavier Muller and
                  Xavier Glorot and
                  Yoshua Bengio},
  editor       = {Lise Getoor and
                  Tobias Scheffer},
  title        = {Contractive Auto-Encoders: Explicit Invariance During Feature Extraction},
  booktitle    = {Proceedings of the 28th International Conference on Machine Learning,
                  {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011},
  pages        = {833--840},
  publisher    = {Omnipress},
  year         = {2011},
  url          = {https://icml.cc/2011/papers/455\_icmlpaper.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/RifaiVMGB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/DauphinGB11,
  author       = {Yann N. Dauphin and
                  Xavier Glorot and
                  Yoshua Bengio},
  editor       = {Lise Getoor and
                  Tobias Scheffer},
  title        = {Large-Scale Learning of Embeddings with Reconstruction Sampling},
  booktitle    = {Proceedings of the 28th International Conference on Machine Learning,
                  {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011},
  pages        = {945--952},
  publisher    = {Omnipress},
  year         = {2011},
  url          = {https://icml.cc/2011/papers/491\_icmlpaper.pdf},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/DauphinGB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/CourvilleBB11,
  author       = {Aaron C. Courville and
                  James Bergstra and
                  Yoshua Bengio},
  editor       = {Lise Getoor and
                  Tobias Scheffer},
  title        = {Unsupervised Models of Images by Spike-and-Slab {RBMs}},
  booktitle    = {Proceedings of the 28th International Conference on Machine Learning,
                  {ICML} 2011, Bellevue, Washington, USA, June 28 - July 2, 2011},
  pages        = {1145--1152},
  publisher    = {Omnipress},
  year         = {2011},
  url          = {https://icml.cc/2011/papers/591\_icmlpaper.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/CourvilleBB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/HamelLBE11,
  author       = {Philippe Hamel and
                  Simon Lemieux and
                  Yoshua Bengio and
                  Douglas Eck},
  editor       = {Anssi Klapuri and
                  Colby Leider},
  title        = {Temporal Pooling and Multiscale Learning for Automatic Annotation
                  and Ranking of Music Audio},
  booktitle    = {Proceedings of the 12th International Society for Music Information
                  Retrieval Conference, {ISMIR} 2011, Miami, Florida, USA, October 24-28,
                  2011},
  pages        = {729--734},
  publisher    = {University of Miami},
  year         = {2011},
  url          = {http://ismir2011.ismir.net/papers/PS6-13.pdf},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ismir/HamelLBE11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mlslp/Bengio11,
  author       = {Yoshua Bengio},
  title        = {On learning distributed representations of semantics},
  booktitle    = {2011 Symposium on Machine Learning in Speech and Language Processing,
                  {MLSLP} 2011, Bellevue, WA, USA, June 27, 2011},
  publisher    = {{ISCA}},
  year         = {2011},
  url          = {http://www.isca-speech.org/archive/mlslp\_2011/ml11\_112.html},
  timestamp    = {Tue, 16 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/mlslp/Bengio11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DelalleauB11,
  author       = {Olivier Delalleau and
                  Yoshua Bengio},
  editor       = {John Shawe{-}Taylor and
                  Richard S. Zemel and
                  Peter L. Bartlett and
                  Fernando C. N. Pereira and
                  Kilian Q. Weinberger},
  title        = {Shallow vs. Deep Sum-Product Networks},
  booktitle    = {Advances in Neural Information Processing Systems 24: 25th Annual
                  Conference on Neural Information Processing Systems 2011. Proceedings
                  of a meeting held 12-14 December 2011, Granada, Spain},
  pages        = {666--674},
  year         = {2011},
  url          = {https://proceedings.neurips.cc/paper/2011/hash/8e6b42f1644ecb1327dc03ab345e618b-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/DelalleauB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/RifaiDVBM11,
  author       = {Salah Rifai and
                  Yann N. Dauphin and
                  Pascal Vincent and
                  Yoshua Bengio and
                  Xavier Muller},
  editor       = {John Shawe{-}Taylor and
                  Richard S. Zemel and
                  Peter L. Bartlett and
                  Fernando C. N. Pereira and
                  Kilian Q. Weinberger},
  title        = {The Manifold Tangent Classifier},
  booktitle    = {Advances in Neural Information Processing Systems 24: 25th Annual
                  Conference on Neural Information Processing Systems 2011. Proceedings
                  of a meeting held 12-14 December 2011, Granada, Spain},
  pages        = {2294--2302},
  year         = {2011},
  url          = {https://proceedings.neurips.cc/paper/2011/hash/d1f44e2f09dc172978a4d3151d11d63e-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/RifaiDVBM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DesjardinsCB11,
  author       = {Guillaume Desjardins and
                  Aaron C. Courville and
                  Yoshua Bengio},
  editor       = {John Shawe{-}Taylor and
                  Richard S. Zemel and
                  Peter L. Bartlett and
                  Fernando C. N. Pereira and
                  Kilian Q. Weinberger},
  title        = {On Tracking The Partition Function},
  booktitle    = {Advances in Neural Information Processing Systems 24: 25th Annual
                  Conference on Neural Information Processing Systems 2011. Proceedings
                  of a meeting held 12-14 December 2011, Granada, Spain},
  pages        = {2501--2509},
  year         = {2011},
  url          = {https://proceedings.neurips.cc/paper/2011/hash/861dc9bd7f4e7dd3cccd534d0ae2a2e9-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DesjardinsCB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BergstraBBK11,
  author       = {James Bergstra and
                  R{\'{e}}mi Bardenet and
                  Yoshua Bengio and
                  Bal{\'{a}}zs K{\'{e}}gl},
  editor       = {John Shawe{-}Taylor and
                  Richard S. Zemel and
                  Peter L. Bartlett and
                  Fernando C. N. Pereira and
                  Kilian Q. Weinberger},
  title        = {Algorithms for Hyper-Parameter Optimization},
  booktitle    = {Advances in Neural Information Processing Systems 24: 25th Annual
                  Conference on Neural Information Processing Systems 2011. Proceedings
                  of a meeting held 12-14 December 2011, Granada, Spain},
  pages        = {2546--2554},
  year         = {2011},
  url          = {https://proceedings.neurips.cc/paper/2011/hash/86e8f7ab32cfd12577bc2619bc635690-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BergstraBBK11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/pkdd/RifaiMVMBDG11,
  author       = {Salah Rifai and
                  Gr{\'{e}}goire Mesnil and
                  Pascal Vincent and
                  Xavier Muller and
                  Yoshua Bengio and
                  Yann N. Dauphin and
                  Xavier Glorot},
  editor       = {Dimitrios Gunopulos and
                  Thomas Hofmann and
                  Donato Malerba and
                  Michalis Vazirgiannis},
  title        = {Higher Order Contractive Auto-Encoder},
  booktitle    = {Machine Learning and Knowledge Discovery in Databases - European Conference,
                  {ECML} {PKDD} 2011, Athens, Greece, September 5-9, 2011, Proceedings,
                  Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {6912},
  pages        = {645--660},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-23783-6\_41},
  doi          = {10.1007/978-3-642-23783-6\_41},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pkdd/RifaiMVMBDG11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/jmlr/Bengio11,
  author       = {Yoshua Bengio},
  editor       = {Geoffrey J. Gordon and
                  David B. Dunson and
                  Miroslav Dud{\'{\i}}k},
  title        = {Discussion of ``The Neural Autoregressive Distribution Estimator''},
  booktitle    = {Proceedings of the Fourteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2011, Fort Lauderdale, USA,
                  April 11-13, 2011},
  series       = {{JMLR} Proceedings},
  volume       = {15},
  pages        = {38--39},
  publisher    = {JMLR.org},
  year         = {2011},
  url          = {http://proceedings.mlr.press/v15/bengio11a/bengio11a.pdf},
  timestamp    = {Wed, 29 May 2019 08:41:44 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/Bengio11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/jmlr/BengioBBBBCCCEEGMLPRSS11,
  author       = {Yoshua Bengio and
                  Fr{\'{e}}d{\'{e}}ric Bastien and
                  Arnaud Bergeron and
                  Nicolas Boulanger{-}Lewandowski and
                  Thomas M. Breuel and
                  Youssouf Chherawala and
                  Moustapha Ciss{\'{e}} and
                  Myriam C{\^{o}}t{\'{e}} and
                  Dumitru Erhan and
                  Jeremy Eustache and
                  Xavier Glorot and
                  Xavier Muller and
                  Sylvain Pannetier Lebeuf and
                  Razvan Pascanu and
                  Salah Rifai and
                  Fran{\c{c}}ois Savard and
                  Guillaume Sicard},
  editor       = {Geoffrey J. Gordon and
                  David B. Dunson and
                  Miroslav Dud{\'{\i}}k},
  title        = {Deep Learners Benefit More from Out-of-Distribution Examples},
  booktitle    = {Proceedings of the Fourteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2011, Fort Lauderdale, USA,
                  April 11-13, 2011},
  series       = {{JMLR} Proceedings},
  volume       = {15},
  pages        = {164--172},
  publisher    = {JMLR.org},
  year         = {2011},
  url          = {http://proceedings.mlr.press/v15/bengio11b/bengio11b.pdf},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/BengioBBBBCCCEEGMLPRSS11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/jmlr/CourvilleBB11,
  author       = {Aaron C. Courville and
                  James Bergstra and
                  Yoshua Bengio},
  editor       = {Geoffrey J. Gordon and
                  David B. Dunson and
                  Miroslav Dud{\'{\i}}k},
  title        = {A Spike and Slab Restricted {Boltzmann} Machine},
  booktitle    = {Proceedings of the Fourteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2011, Fort Lauderdale, USA,
                  April 11-13, 2011},
  series       = {{JMLR} Proceedings},
  volume       = {15},
  pages        = {233--241},
  publisher    = {JMLR.org},
  year         = {2011},
  url          = {http://proceedings.mlr.press/v15/courville11a/courville11a.pdf},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/CourvilleBB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/jmlr/GlorotBB11,
  author       = {Xavier Glorot and
                  Antoine Bordes and
                  Yoshua Bengio},
  editor       = {Geoffrey J. Gordon and
                  David B. Dunson and
                  Miroslav Dud{\'{\i}}k},
  title        = {Deep Sparse Rectifier Neural Networks},
  booktitle    = {Proceedings of the Fourteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2011, Fort Lauderdale, USA,
                  April 11-13, 2011},
  series       = {{JMLR} Proceedings},
  volume       = {15},
  pages        = {315--323},
  publisher    = {JMLR.org},
  year         = {2011},
  url          = {http://proceedings.mlr.press/v15/glorot11a/glorot11a.pdf},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/GlorotBB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1103-2832,
  author       = {Michael I. Mandel and
                  Razvan Pascanu and
                  Hugo Larochelle and
                  Yoshua Bengio},
  title        = {Autotagging music with conditional restricted {Boltzmann} machines},
  journal      = {CoRR},
  volume       = {abs/1103.2832},
  year         = {2011},
  url          = {http://arxiv.org/abs/1103.2832},
  eprinttype    = {arXiv},
  eprint       = {1103.2832},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1103-2832.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1104-3250,
  author       = {Salah Rifai and
                  Xavier Glorot and
                  Yoshua Bengio and
                  Pascal Vincent},
  title        = {Adding noise to the input of a model trained with a regularized objective},
  journal      = {CoRR},
  volume       = {abs/1104.3250},
  year         = {2011},
  url          = {http://arxiv.org/abs/1104.3250},
  eprinttype    = {arXiv},
  eprint       = {1104.3250},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1104-3250.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1104-4153,
  author       = {Salah Rifai and
                  Xavier Muller and
                  Xavier Glorot and
                  Gr{\'{e}}goire Mesnil and
                  Yoshua Bengio and
                  Pascal Vincent},
  title        = {Learning invariant features through local space contraction},
  journal      = {CoRR},
  volume       = {abs/1104.4153},
  year         = {2011},
  url          = {http://arxiv.org/abs/1104.4153},
  eprinttype    = {arXiv},
  eprint       = {1104.4153},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1104-4153.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1107-3663,
  author       = {Antoine Bordes and
                  Xavier Glorot and
                  Jason Weston and
                  Yoshua Bengio},
  title        = {Towards Open-Text Semantic Parsing via Multi-Task Learning of Structured
                  Embeddings},
  journal      = {CoRR},
  volume       = {abs/1107.3663},
  year         = {2011},
  url          = {http://arxiv.org/abs/1107.3663},
  eprinttype    = {arXiv},
  eprint       = {1107.3663},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1107-3663.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1109-6638,
  author       = {James Bergstra and
                  Aaron C. Courville and
                  Yoshua Bengio},
  title        = {The Statistical Inefficiency of Sparse Coding for Images (or, One
                  {Gabor} to Rule them All)},
  journal      = {CoRR},
  volume       = {abs/1109.6638},
  year         = {2011},
  url          = {http://arxiv.org/abs/1109.6638},
  eprinttype    = {arXiv},
  eprint       = {1109.6638},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1109-6638.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ci/BengioDS10,
  author       = {Yoshua Bengio and
                  Olivier Delalleau and
                  Clarence Simard},
  title        = {Decision trees do not generalize to new variations},
  journal      = {Comput. Intell.},
  volume       = {26},
  number       = {4},
  pages        = {449--467},
  year         = {2010},
  url          = {https://doi.org/10.1111/j.1467-8640.2010.00366.x},
  doi          = {10.1111/J.1467-8640.2010.00366.X},
  timestamp    = {Sun, 15 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ci/BengioDS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jcns/RivestKB10,
  author       = {Fran{\c{c}}ois Rivest and
                  John Kalaska and
                  Yoshua Bengio},
  title        = {Alternative time representation in dopamine models},
  journal      = {J. Comput. Neurosci.},
  volume       = {28},
  number       = {1},
  pages        = {107--130},
  year         = {2010},
  url          = {https://doi.org/10.1007/s10827-009-0191-1},
  doi          = {10.1007/S10827-009-0191-1},
  timestamp    = {Thu, 16 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jcns/RivestKB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/ErhanBCMVB10,
  author       = {Erhan, Dumitru and
                  Bengio, Yoshua and
                  Courville, Aaron C. and
                  Manzagol, Pierre{-}Antoine and
                  Vincent, Pascal and
                  Bengio, Samy},
  title        = {Why Does Unsupervised Pre-training Help Deep Learning?},
  journal      = {J. Mach. Learn. Res.},
  volume       = {11},
  pages        = {625--660},
  year         = {2010},
  url          = {https://dl.acm.org/doi/10.5555/1756006.1756025},
  doi          = {10.5555/1756006.1756025},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/ErhanBCMVB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/VincentLLBM10,
  author       = {Vincent, Pascal and
                  Larochelle, Hugo and
                  Lajoie, Isabelle and
                  Bengio, Yoshua and
                  Manzagol, Pierre{-}Antoine},
  title        = {Stacked Denoising Autoencoders: Learning Useful Representations in
                  a Deep Network with a Local Denoising Criterion},
  journal      = {J. Mach. Learn. Res.},
  volume       = {11},
  pages        = {3371--3408},
  year         = {2010},
  url          = {https://dl.acm.org/doi/10.5555/1756006.1953039},
  doi          = {10.5555/1756006.1953039},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/VincentLLBM10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The surname is the compound "Le Roux"; comma form stops BibTeX from treating "Le" as a given name.
@article{DBLP:journals/neco/RouxB10,
  author       = {Le Roux, Nicolas and
                  Bengio, Yoshua},
  title        = {Deep Belief Networks Are Compact Universal Approximators},
  journal      = {Neural Comput.},
  volume       = {22},
  number       = {8},
  pages        = {2192--2207},
  year         = {2010},
  url          = {https://doi.org/10.1162/neco.2010.08-09-1081},
  doi          = {10.1162/NECO.2010.08-09-1081},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/RouxB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Boltzmann" is a proper noun: braced so sentence-casing styles keep its capital.
@article{DBLP:journals/neco/LarochelleBT10,
  author       = {Larochelle, Hugo and
                  Bengio, Yoshua and
                  Turian, Joseph P.},
  title        = {Tractable Multivariate Binary Density Estimation and the Restricted
                  {Boltzmann} Forest},
  journal      = {Neural Comput.},
  volume       = {22},
  number       = {9},
  pages        = {2285--2307},
  year         = {2010},
  url          = {https://doi.org/10.1162/NECO\_a\_00014},
  doi          = {10.1162/NECO\_A\_00014},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/LarochelleBT10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Publisher is the Association for Computational Linguistics (ACL), not "Computer Linguistics".
@inproceedings{DBLP:conf/acl/TurianRB10,
  author       = {Turian, Joseph P. and
                  Ratinov, Lev{-}Arie and
                  Bengio, Yoshua},
  editor       = {Hajic, Jan and
                  Carberry, Sandra and
                  Clark, Stephen},
  title        = {Word Representations: {A} Simple and General Method for Semi-Supervised
                  Learning},
  booktitle    = {{ACL} 2010, Proceedings of the 48th Annual Meeting of the Association
                  for Computational Linguistics, July 11-16, 2010, Uppsala, Sweden},
  pages        = {384--394},
  publisher    = {The Association for Computational Linguistics},
  year         = {2010},
  url          = {https://aclanthology.org/P10-1040/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/TurianRB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ismir/MandelEB10,
  author       = {Mandel, Michael I. and
                  Eck, Douglas and
                  Bengio, Yoshua},
  editor       = {Downie, J. Stephen and
                  Veltkamp, Remco C.},
  title        = {Learning Tags that Vary Within a Song},
  booktitle    = {Proceedings of the 11th International Society for Music Information
                  Retrieval Conference, {ISMIR} 2010, Utrecht, Netherlands, August 9-13,
                  2010},
  pages        = {399--404},
  publisher    = {International Society for Music Information Retrieval},
  year         = {2010},
  url          = {http://ismir2010.ismir.net/proceedings/ismir2010-68.pdf},
  timestamp    = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ismir/MandelEB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Python" is a proper noun: braced like the acronyms so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/scipy/BergstraBBLPDTWB10,
  author       = {Bergstra, James and
                  Breuleux, Olivier and
                  Bastien, Fr{\'{e}}d{\'{e}}ric and
                  Lamblin, Pascal and
                  Pascanu, Razvan and
                  Desjardins, Guillaume and
                  Turian, Joseph P. and
                  Warde{-}Farley, David and
                  Bengio, Yoshua},
  editor       = {van der Walt, St{\'{e}}fan and
                  Millman, Jarrod},
  title        = {Theano: {A} {CPU} and {GPU} Math Compiler in {Python}},
  booktitle    = {Proceedings of the 9th Python in Science Conference 2010 (SciPy 2010),
                  Austin, Texas, June 28 - July 3, 2010},
  pages        = {18--24},
  publisher    = {scipy.org},
  year         = {2010},
  url          = {https://doi.org/10.25080/Majora-92bf1922-003},
  doi          = {10.25080/MAJORA-92BF1922-003},
  timestamp    = {Tue, 16 May 2023 17:03:08 +0200},
  biburl       = {https://dblp.org/rec/conf/scipy/BergstraBBLPDTWB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Markov", "Monte Carlo" and "Boltzmann" are proper nouns: braced so sentence-casing styles keep their capitals.
@inproceedings{DBLP:journals/jmlr/DesjardinsCBVD10,
  author       = {Desjardins, Guillaume and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Vincent, Pascal and
                  Delalleau, Olivier},
  editor       = {Teh, Yee Whye and
                  Titterington, D. Mike},
  title        = {Tempered {Markov} Chain {Monte Carlo} for training of Restricted {Boltzmann}
                  Machines},
  booktitle    = {Proceedings of the Thirteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2010, Chia Laguna Resort, Sardinia,
                  Italy, May 13-15, 2010},
  series       = {{JMLR} Proceedings},
  volume       = {9},
  pages        = {145--152},
  publisher    = {JMLR.org},
  year         = {2010},
  url          = {http://proceedings.mlr.press/v9/desjardins10a.html},
  timestamp    = {Wed, 29 May 2019 08:41:44 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/DesjardinsCBVD10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/jmlr/ErhanCBV10,
  author       = {Erhan, Dumitru and
                  Courville, Aaron C. and
                  Bengio, Yoshua and
                  Vincent, Pascal},
  editor       = {Teh, Yee Whye and
                  Titterington, D. Mike},
  title        = {Why Does Unsupervised Pre-training Help Deep Learning?},
  booktitle    = {Proceedings of the Thirteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2010, Chia Laguna Resort, Sardinia,
                  Italy, May 13-15, 2010},
  series       = {{JMLR} Proceedings},
  volume       = {9},
  pages        = {201--208},
  publisher    = {JMLR.org},
  year         = {2010},
  url          = {http://proceedings.mlr.press/v9/erhan10a.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/ErhanCBV10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:journals/jmlr/GlorotB10,
  author       = {Glorot, Xavier and
                  Bengio, Yoshua},
  editor       = {Teh, Yee Whye and
                  Titterington, D. Mike},
  title        = {Understanding the difficulty of training deep feedforward neural networks},
  booktitle    = {Proceedings of the Thirteenth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2010, Chia Laguna Resort, Sardinia,
                  Italy, May 13-15, 2010},
  series       = {{JMLR} Proceedings},
  volume       = {9},
  pages        = {249--256},
  publisher    = {JMLR.org},
  year         = {2010},
  url          = {http://proceedings.mlr.press/v9/glorot10a.html},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/GlorotB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Pannetier Lebeuf" is entered as a compound surname in comma form so BibTeX does not
% read "Pannetier" as a given name. NOTE(review): confirm the surname split with the paper.
@article{DBLP:journals/corr/abs-1009-3589,
  author       = {Bastien, Fr{\'{e}}d{\'{e}}ric and
                  Bengio, Yoshua and
                  Bergeron, Arnaud and
                  Boulanger{-}Lewandowski, Nicolas and
                  Breuel, Thomas M. and
                  Chherawala, Youssouf and
                  Ciss{\'{e}}, Moustapha and
                  C{\^{o}}t{\'{e}}, Myriam and
                  Erhan, Dumitru and
                  Eustache, Jeremy and
                  Glorot, Xavier and
                  Muller, Xavier and
                  Pannetier Lebeuf, Sylvain and
                  Pascanu, Razvan and
                  Rifai, Salah and
                  Savard, Fran{\c{c}}ois and
                  Sicard, Guillaume},
  title        = {Deep Self-Taught Learning for Handwritten Character Recognition},
  journal      = {CoRR},
  volume       = {abs/1009.3589},
  year         = {2010},
  url          = {http://arxiv.org/abs/1009.3589},
  eprinttype   = {arXiv},
  eprint       = {1009.3589},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1009-3589.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The acronym "RBMs" is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-1012-3476,
  author       = {Desjardins, Guillaume and
                  Courville, Aaron C. and
                  Bengio, Yoshua},
  title        = {Adaptive Parallel Tempering for Stochastic Maximum Likelihood Learning
                  of {RBMs}},
  journal      = {CoRR},
  volume       = {abs/1012.3476},
  year         = {2010},
  url          = {http://arxiv.org/abs/1012.3476},
  eprinttype   = {arXiv},
  eprint       = {1012.3476},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1012-3476.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ftml/Bengio09,
  author       = {Bengio, Yoshua},
  title        = {Learning Deep Architectures for {AI}},
  journal      = {Found. Trends Mach. Learn.},
  volume       = {2},
  number       = {1},
  pages        = {1--127},
  year         = {2009},
  url          = {https://doi.org/10.1561/2200000006},
  doi          = {10.1561/2200000006},
  timestamp    = {Thu, 18 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ftml/Bengio09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/LarochelleBLL09,
  author       = {Larochelle, Hugo and
                  Bengio, Yoshua and
                  Louradour, J{\'{e}}r{\^{o}}me and
                  Lamblin, Pascal},
  title        = {Exploring Strategies for Training Deep Neural Networks},
  journal      = {J. Mach. Learn. Res.},
  volume       = {10},
  pages        = {1--40},
  year         = {2009},
  url          = {https://dl.acm.org/doi/10.5555/1577069.1577070},
  doi          = {10.5555/1577069.1577070},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/LarochelleBLL09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/DugasBBNG09,
  author       = {Dugas, Charles and
                  Bengio, Yoshua and
                  B{\'{e}}lisle, Fran{\c{c}}ois and
                  Nadeau, Claude and
                  Garcia, Ren{\'{e}}},
  title        = {Incorporating Functional Knowledge in Neural Networks},
  journal      = {J. Mach. Learn. Res.},
  volume       = {10},
  pages        = {1239--1262},
  year         = {2009},
  url          = {https://dl.acm.org/doi/10.5555/1577069.1577111},
  doi          = {10.5555/1577069.1577111},
  timestamp    = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/DugasBBNG09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/BengioD09,
  author       = {Bengio, Yoshua and
                  Delalleau, Olivier},
  title        = {Justifying and Generalizing Contrastive Divergence},
  journal      = {Neural Comput.},
  volume       = {21},
  number       = {6},
  pages        = {1601--1621},
  year         = {2009},
  url          = {https://doi.org/10.1162/neco.2008.11-07-647},
  doi          = {10.1162/NECO.2008.11-07-647},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/BengioD09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Pareto" is a proper noun: braced so sentence-casing styles keep its capital.
@article{DBLP:journals/tnn/CarreauB09,
  author       = {Carreau, Julie and
                  Bengio, Yoshua},
  title        = {A Hybrid {Pareto} Mixture for Conditional Asymmetric Fat-Tailed Distributions},
  journal      = {{IEEE} Trans. Neural Networks},
  volume       = {20},
  number       = {7},
  pages        = {1087--1101},
  year         = {2009},
  url          = {https://doi.org/10.1109/TNN.2009.2016339},
  doi          = {10.1109/TNN.2009.2016339},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tnn/CarreauB09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/YuSLHB09,
  author       = {Yu, Kai and
                  Salakhutdinov, Ruslan and
                  LeCun, Yann and
                  Hinton, Geoffrey E. and
                  Bengio, Yoshua},
  editor       = {Danyluk, Andrea Pohoreckyj and
                  Bottou, L{\'{e}}on and
                  Littman, Michael L.},
  title        = {Workshop summary: Workshop on learning feature hierarchies},
  booktitle    = {Proceedings of the 26th Annual International Conference on Machine
                  Learning, {ICML} 2009, Montreal, Quebec, Canada, June 14-18, 2009},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {382},
  pages        = {5},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1553374.1553543},
  doi          = {10.1145/1553374.1553543},
  timestamp    = {Tue, 06 Nov 2018 16:58:29 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/YuSLHB09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/BengioLCW09,
  author       = {Bengio, Yoshua and
                  Louradour, J{\'{e}}r{\^{o}}me and
                  Collobert, Ronan and
                  Weston, Jason},
  editor       = {Danyluk, Andrea Pohoreckyj and
                  Bottou, L{\'{e}}on and
                  Littman, Michael L.},
  title        = {Curriculum learning},
  booktitle    = {Proceedings of the 26th Annual International Conference on Machine
                  Learning, {ICML} 2009, Montreal, Quebec, Canada, June 14-18, 2009},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {382},
  pages        = {41--48},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1553374.1553380},
  doi          = {10.1145/1553374.1553380},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/BengioLCW09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The society is the "Association for Computational Linguistics"; booktitle now agrees with the publisher field.
@inproceedings{DBLP:conf/naacl/TurianBB09,
  author       = {Turian, Joseph P. and
                  Bergstra, James and
                  Bengio, Yoshua},
  title        = {Quadratic Features and Deep Architectures for Chunking},
  booktitle    = {Human Language Technologies: Conference of the North American Chapter
                  of the Association for Computational Linguistics, Proceedings, May
                  31 - June 5, 2009, Boulder, Colorado, USA, Short Papers},
  pages        = {245--248},
  publisher    = {The Association for Computational Linguistics},
  year         = {2009},
  url          = {https://aclanthology.org/N09-2062/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/TurianBB09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BergstraB09,
  author       = {Bergstra, James and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  Schuurmans, Dale and
                  Lafferty, John D. and
                  Williams, Christopher K. I. and
                  Culotta, Aron},
  title        = {Slow, Decorrelated Features for Pretraining Complex Cell-like Networks},
  booktitle    = {Advances in Neural Information Processing Systems 22: 23rd Annual
                  Conference on Neural Information Processing Systems 2009. Proceedings
                  of a meeting held 7-10 December 2009, Vancouver, British Columbia,
                  Canada},
  pages        = {99--107},
  publisher    = {Curran Associates, Inc.},
  year         = {2009},
  url          = {https://proceedings.neurips.cc/paper/2009/hash/043c3d7e489c69b48737cc0c92d0f3a2-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BergstraB09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/CourvilleEB09,
  author       = {Courville, Aaron C. and
                  Eck, Douglas and
                  Bengio, Yoshua},
  editor       = {Bengio, Yoshua and
                  Schuurmans, Dale and
                  Lafferty, John D. and
                  Williams, Christopher K. I. and
                  Culotta, Aron},
  title        = {An Infinite Factor Model Hierarchy Via a Noisy-Or Mechanism},
  booktitle    = {Advances in Neural Information Processing Systems 22: 23rd Annual
                  Conference on Neural Information Processing Systems 2009. Proceedings
                  of a meeting held 7-10 December 2009, Vancouver, British Columbia,
                  Canada},
  pages        = {405--413},
  publisher    = {Curran Associates, Inc.},
  year         = {2009},
  url          = {https://proceedings.neurips.cc/paper/2009/hash/1e6e0a04d20f50967c64dac2d639a577-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/CourvilleEB09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Editor surname is "Van Dyk"; comma form stops BibTeX from treating "Van" as a given name.
@inproceedings{DBLP:journals/jmlr/ErhanMBBV09,
  author       = {Erhan, Dumitru and
                  Manzagol, Pierre{-}Antoine and
                  Bengio, Yoshua and
                  Bengio, Samy and
                  Vincent, Pascal},
  editor       = {Van Dyk, David A. and
                  Welling, Max},
  title        = {The Difficulty of Training Deep Architectures and the Effect of Unsupervised
                  Pre-Training},
  booktitle    = {Proceedings of the Twelfth International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2009, Clearwater Beach, Florida,
                  USA, April 16-18, 2009},
  series       = {{JMLR} Proceedings},
  volume       = {5},
  pages        = {153--160},
  publisher    = {JMLR.org},
  year         = {2009},
  url          = {http://proceedings.mlr.press/v5/erhan09a.html},
  timestamp    = {Wed, 29 May 2019 08:41:44 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/ErhanMBBV09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/nips/2008,
  editor       = {Koller, Daphne and
                  Schuurmans, Dale and
                  Bengio, Yoshua and
                  Bottou, L{\'{e}}on},
  title        = {Advances in Neural Information Processing Systems 21, Proceedings
                  of the Twenty-Second Annual Conference on Neural Information Processing
                  Systems, Vancouver, British Columbia, Canada, December 8-11, 2008},
  publisher    = {Curran Associates, Inc.},
  year         = {2009},
  url          = {https://proceedings.neurips.cc/paper/2008},
  timestamp    = {Mon, 16 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/2008.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@proceedings{DBLP:conf/nips/2009,
  editor       = {Bengio, Yoshua and
                  Schuurmans, Dale and
                  Lafferty, John D. and
                  Williams, Christopher K. I. and
                  Culotta, Aron},
  title        = {Advances in Neural Information Processing Systems 22: 23rd Annual
                  Conference on Neural Information Processing Systems 2009. Proceedings
                  of a meeting held 7-10 December 2009, Vancouver, British Columbia,
                  Canada},
  publisher    = {Curran Associates, Inc.},
  year         = {2009},
  url          = {https://proceedings.neurips.cc/paper/2009},
  isbn         = {9781615679119},
  timestamp    = {Mon, 16 May 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/2009.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The surname is the compound "Le Roux" (comma form keeps it whole); "Boltzmann" is braced
% so sentence-casing styles keep its capital.
@article{DBLP:journals/neco/RouxB08,
  author       = {Le Roux, Nicolas and
                  Bengio, Yoshua},
  title        = {Representational Power of Restricted {Boltzmann} Machines and Deep Belief
                  Networks},
  journal      = {Neural Comput.},
  volume       = {20},
  number       = {6},
  pages        = {1631--1649},
  year         = {2008},
  url          = {https://doi.org/10.1162/neco.2008.04-07-510},
  doi          = {10.1162/NECO.2008.04-07-510},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/RouxB08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/scholarpedia/Bengio08,
  author       = {Bengio, Yoshua},
  title        = {Neural net language models},
  journal      = {Scholarpedia},
  volume       = {3},
  number       = {1},
  pages        = {3881},
  year         = {2008},
  url          = {https://doi.org/10.4249/scholarpedia.3881},
  doi          = {10.4249/SCHOLARPEDIA.3881},
  timestamp    = {Thu, 23 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/scholarpedia/Bengio08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnn/BengioS08,
  author       = {Bengio, Yoshua and
                  Senecal, Jean{-}S{\'{e}}bastien},
  title        = {Adaptive Importance Sampling to Accelerate Training of a Neural Probabilistic
                  Language Model},
  journal      = {{IEEE} Trans. Neural Networks},
  volume       = {19},
  number       = {4},
  pages        = {713--722},
  year         = {2008},
  url          = {https://doi.org/10.1109/TNN.2007.912312},
  doi          = {10.1109/TNN.2007.912312},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tnn/BengioS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/LarochelleEB08,
  author       = {Larochelle, Hugo and
                  Erhan, Dumitru and
                  Bengio, Yoshua},
  editor       = {Fox, Dieter and
                  Gomes, Carla P.},
  title        = {Zero-data Learning of New Tasks},
  booktitle    = {Proceedings of the Twenty-Third {AAAI} Conference on Artificial Intelligence,
                  {AAAI} 2008, Chicago, Illinois, USA, July 13-17, 2008},
  pages        = {646--651},
  publisher    = {{AAAI} Press},
  year         = {2008},
  url          = {http://www.aaai.org/Library/AAAI/2008/aaai08-103.php},
  timestamp    = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/LarochelleEB08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Boltzmann" is a proper noun: braced so sentence-casing styles keep its capital.
% The booktitle brace group now wraps only the acronym ICML, not the opening parenthesis.
@inproceedings{DBLP:conf/icml/LarochelleB08,
  author       = {Larochelle, Hugo and
                  Bengio, Yoshua},
  editor       = {Cohen, William W. and
                  McCallum, Andrew and
                  Roweis, Sam T.},
  title        = {Classification using discriminative restricted {Boltzmann} machines},
  booktitle    = {Machine Learning, Proceedings of the Twenty-Fifth International Conference
                  ({ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {307},
  pages        = {536--543},
  publisher    = {{ACM}},
  year         = {2008},
  url          = {https://doi.org/10.1145/1390156.1390224},
  doi          = {10.1145/1390156.1390224},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/LarochelleB08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/VincentLBM08,
  author       = {Vincent, Pascal and
                  Larochelle, Hugo and
                  Bengio, Yoshua and
                  Manzagol, Pierre{-}Antoine},
  editor       = {Cohen, William W. and
                  McCallum, Andrew and
                  Roweis, Sam T.},
  title        = {Extracting and composing robust features with denoising autoencoders},
  booktitle    = {Machine Learning, Proceedings of the Twenty-Fifth International Conference
                  ({ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {307},
  pages        = {1096--1103},
  publisher    = {{ACM}},
  year         = {2008},
  url          = {https://doi.org/10.1145/1390156.1390294},
  doi          = {10.1145/1390156.1390294},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/VincentLBM08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The exported URL had each query separator HTML-escaped as "&#38;"; restored to a plain
% ampersand, written "\&" as elsewhere in this file.
@article{DBLP:journals/jcp/ChapadosB07,
  author       = {Chapados, Nicolas and
                  Bengio, Yoshua},
  title        = {Noisy {K} Best-Paths for Approximate Dynamic Programming with Application
                  to Portfolio Optimization},
  journal      = {J. Comput.},
  volume       = {2},
  number       = {1},
  pages        = {12--19},
  year         = {2007},
  url          = {http://www.jcomputers.us/index.php?m=content\&c=index\&a=show\&catid=72\&id=877},
  doi          = {10.4304/JCP.2.1.12-19},
  timestamp    = {Thu, 25 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jcp/ChapadosB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LarochelleECBB07,
  author       = {Larochelle, Hugo and
                  Erhan, Dumitru and
                  Courville, Aaron C. and
                  Bergstra, James and
                  Bengio, Yoshua},
  editor       = {Ghahramani, Zoubin},
  title        = {An empirical evaluation of deep architectures on problems with many
                  factors of variation},
  booktitle    = {Machine Learning, Proceedings of the Twenty-Fourth International Conference
                  ({ICML} 2007), Corvallis, Oregon, USA, June 20-24, 2007},
  series       = {{ACM} International Conference Proceeding Series},
  volume       = {227},
  pages        = {473--480},
  publisher    = {{ACM}},
  year         = {2007},
  url          = {https://doi.org/10.1145/1273496.1273556},
  doi          = {10.1145/1273496.1273556},
  timestamp    = {Wed, 28 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/LarochelleECBB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Gaussian" derives from a proper name: braced so sentence-casing styles keep its capital.
@inproceedings{DBLP:conf/nips/ChapadosB07,
  author       = {Chapados, Nicolas and
                  Bengio, Yoshua},
  editor       = {Platt, John C. and
                  Koller, Daphne and
                  Singer, Yoram and
                  Roweis, Sam T.},
  title        = {Augmented Functional Time Series Representation and Forecasting with
                  {Gaussian} Processes},
  booktitle    = {Advances in Neural Information Processing Systems 20, Proceedings
                  of the Twenty-First Annual Conference on Neural Information Processing
                  Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages        = {265--272},
  publisher    = {Curran Associates, Inc.},
  year         = {2007},
  url          = {https://proceedings.neurips.cc/paper/2007/hash/81e74d678581a3bb7a720b019f4f1a93-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/ChapadosB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The surname is the compound "Le Roux" (comma form keeps it whole); "2-D" is braced so
% sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/nips/RouxBLJK07,
  author       = {Le Roux, Nicolas and
                  Bengio, Yoshua and
                  Lamblin, Pascal and
                  Joliveau, Marc and
                  K{\'{e}}gl, Bal{\'{a}}zs},
  editor       = {Platt, John C. and
                  Koller, Daphne and
                  Singer, Yoram and
                  Roweis, Sam T.},
  title        = {Learning the {2-D} Topology of Images},
  booktitle    = {Advances in Neural Information Processing Systems 20, Proceedings
                  of the Twenty-First Annual Conference on Neural Information Processing
                  Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages        = {841--848},
  publisher    = {Curran Associates, Inc.},
  year         = {2007},
  url          = {https://proceedings.neurips.cc/paper/2007/hash/7fa732b517cbed14a48843d74526c11a-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/RouxBLJK07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The surname is the compound "Le Roux"; comma form stops BibTeX from treating "Le" as a given name.
@inproceedings{DBLP:conf/nips/RouxMB07,
  author       = {Le Roux, Nicolas and
                  Manzagol, Pierre{-}Antoine and
                  Bengio, Yoshua},
  editor       = {Platt, John C. and
                  Koller, Daphne and
                  Singer, Yoram and
                  Roweis, Sam T.},
  title        = {Topmoumoute Online Natural Gradient Algorithm},
  booktitle    = {Advances in Neural Information Processing Systems 20, Proceedings
                  of the Twenty-First Annual Conference on Neural Information Processing
                  Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages        = {849--856},
  publisher    = {Curran Associates, Inc.},
  year         = {2007},
  url          = {https://proceedings.neurips.cc/paper/2007/hash/9f61408e3afb633e50cdf1b20de6f466-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/RouxMB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Pareto" is a proper noun: braced so sentence-casing styles keep its capital.
@inproceedings{DBLP:journals/jmlr/CarreauB07,
  author       = {Carreau, Julie and
                  Bengio, Yoshua},
  editor       = {Meila, Marina and
                  Shen, Xiaotong},
  title        = {A Hybrid {Pareto} Model for Conditional Density Estimation of Asymmetric
                  Fat-Tail Data},
  booktitle    = {Proceedings of the Eleventh International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2007, San Juan, Puerto Rico,
                  March 21-24, 2007},
  series       = {{JMLR} Proceedings},
  volume       = {2},
  pages        = {51--58},
  publisher    = {JMLR.org},
  year         = {2007},
  url          = {http://proceedings.mlr.press/v2/carreau07a.html},
  timestamp    = {Wed, 29 May 2019 08:41:44 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/CarreauB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Le Roux" is a two-word surname; the comma form stops BibTeX from reading "Le" as a given name.
@inproceedings{DBLP:journals/jmlr/RouxB07,
  author       = {Le Roux, Nicolas and
                  Yoshua Bengio},
  editor       = {Marina Meila and
                  Xiaotong Shen},
  title        = {Continuous Neural Networks},
  booktitle    = {Proceedings of the Eleventh International Conference on Artificial
                  Intelligence and Statistics, {AISTATS} 2007, San Juan, Puerto Rico,
                  March 21-24, 2007},
  series       = {{JMLR} Proceedings},
  volume       = {2},
  pages        = {404--411},
  publisher    = {JMLR.org},
  year         = {2007},
  url          = {http://proceedings.mlr.press/v2/leroux07a.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/RouxB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jcisd/ErhanLYB06,
  author    = {Erhan, Dumitru and
               L'Heureux, Pierre{-}Jean and
               Yue, Shi Yi and
               Bengio, Yoshua},
  title     = {Collaborative Filtering on a Family of Biological Targets},
  journal   = {J. Chem. Inf. Model.},
  volume    = 46,
  number    = 2,
  pages     = {626--635},
  year      = 2006,
  url       = {https://doi.org/10.1021/ci050367t},
  doi       = {10.1021/CI050367T},
  timestamp = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/jcisd/ErhanLYB06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/BengioML06,
  author    = {Bengio, Yoshua and
               Monperrus, Martin and
               Larochelle, Hugo},
  title     = {Nonlocal Estimation of Manifold Structure},
  journal   = {Neural Comput.},
  volume    = 18,
  number    = 10,
  pages     = {2509--2528},
  year      = 2006,
  url       = {https://doi.org/10.1162/neco.2006.18.10.2509},
  doi       = {10.1162/NECO.2006.18.10.2509},
  timestamp = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/neco/BengioML06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ai/ChapadosB06,
  author    = {Chapados, Nicolas and
               Bengio, Yoshua},
  editor    = {Lamontagne, Luc and
               Marchand, Mario},
  title     = {The \emph{K} Best-Paths Approach to Approximate Dynamic Programming
               with Application to Portfolio Optimization},
  booktitle = {Advances in Artificial Intelligence, 19th Conference of the Canadian
               Society for Computational Studies of Intelligence, Canadian {AI} 2006,
               Qu{\'{e}}bec City, Qu{\'{e}}bec, Canada, June 7-9, 2006,
               Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = 4013,
  pages     = {491--502},
  publisher = {Springer},
  year      = 2006,
  url       = {https://doi.org/10.1007/11766247\_42},
  doi       = {10.1007/11766247\_42},
  timestamp = {Thu, 28 Sep 2023 12:27:07 +0200},
  biburl    = {https://dblp.org/rec/conf/ai/ChapadosB06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioLPL06,
  author    = {Bengio, Yoshua and
               Lamblin, Pascal and
               Popovici, Dan and
               Larochelle, Hugo},
  editor    = {Sch{\"{o}}lkopf, Bernhard and
               Platt, John C. and
               Hofmann, Thomas},
  title     = {Greedy Layer-Wise Training of Deep Networks},
  booktitle = {Advances in Neural Information Processing Systems 19, Proceedings
               of the Twentieth Annual Conference on Neural Information Processing
               Systems, Vancouver, British Columbia, Canada, December 4-7, 2006},
  pages     = {153--160},
  publisher = {{MIT} Press},
  year      = 2006,
  url       = {https://proceedings.neurips.cc/paper/2006/hash/5da713a690c067105aeb2fae32403405-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/BengioLPL06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@incollection{DBLP:books/mit/06/GrandvaletB06,
  author    = {Grandvalet, Yves and
               Bengio, Yoshua},
  editor    = {Chapelle, Olivier and
               Sch{\"{o}}lkopf, Bernhard and
               Zien, Alexander},
  title     = {Entropy Regularization},
  booktitle = {Semi-Supervised Learning},
  pages     = {151--168},
  publisher = {The {MIT} Press},
  year      = 2006,
  url       = {https://doi.org/10.7551/mitpress/9780262033589.003.0009},
  doi       = {10.7551/MITPRESS/9780262033589.003.0009},
  timestamp = {Mon, 16 Sep 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/books/mit/06/GrandvaletB06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "Le Roux" is a two-word surname; the comma form stops BibTeX from reading "Le" as a given name.
@incollection{DBLP:books/mit/06/BengioDR06,
  author       = {Yoshua Bengio and
                  Olivier Delalleau and
                  Le Roux, Nicolas},
  editor       = {Olivier Chapelle and
                  Bernhard Sch{\"{o}}lkopf and
                  Alexander Zien},
  title        = {Label Propagation and Quadratic Criterion},
  booktitle    = {Semi-Supervised Learning},
  pages        = {192--216},
  publisher    = {The {MIT} Press},
  year         = {2006},
  url          = {https://doi.org/10.7551/mitpress/9780262033589.003.0011},
  doi          = {10.7551/MITPRESS/9780262033589.003.0011},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/mit/06/BengioDR06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Le Roux" is a two-word surname; the comma form stops BibTeX from reading "Le" as a given name.
@incollection{DBLP:books/mit/06/DelalleauBR06,
  author       = {Olivier Delalleau and
                  Yoshua Bengio and
                  Le Roux, Nicolas},
  editor       = {Olivier Chapelle and
                  Bernhard Sch{\"{o}}lkopf and
                  Alexander Zien},
  title        = {Large-Scale Algorithms},
  booktitle    = {Semi-Supervised Learning},
  pages        = {332--341},
  publisher    = {The {MIT} Press},
  year         = {2006},
  url          = {https://doi.org/10.7551/mitpress/9780262033589.003.0018},
  doi          = {10.7551/MITPRESS/9780262033589.003.0018},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/books/mit/06/DelalleauBR06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Le Roux" is a two-word surname; the comma form stops BibTeX from reading "Le" as a given name.
@incollection{DBLP:books/sp/06/BengioDRPVO06,
  author       = {Yoshua Bengio and
                  Olivier Delalleau and
                  Le Roux, Nicolas and
                  Jean{-}Fran{\c{c}}ois Paiement and
                  Pascal Vincent and
                  Marie Ouimet},
  editor       = {Isabelle Guyon and
                  Masoud Nikravesh and
                  Steve R. Gunn and
                  Lotfi A. Zadeh},
  title        = {Spectral Dimensionality Reduction},
  booktitle    = {Feature Extraction - Foundations and Applications},
  series       = {Studies in Fuzziness and Soft Computing},
  volume       = {207},
  pages        = {519--550},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/978-3-540-35488-8\_28},
  doi          = {10.1007/978-3-540-35488-8\_28},
  timestamp    = {Fri, 26 Jul 2019 12:50:23 +0200},
  biburl       = {https://dblp.org/rec/books/sp/06/BengioDRPVO06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Le Roux" is a two-word surname; the comma form stops BibTeX from reading "Le" as a given name.
@inproceedings{DBLP:conf/aistats/DelalleauBR05,
  author       = {Olivier Delalleau and
                  Yoshua Bengio and
                  Le Roux, Nicolas},
  editor       = {Robert G. Cowell and
                  Zoubin Ghahramani},
  title        = {Efficient Non-Parametric Function Induction in Semi-Supervised Learning},
  booktitle    = {Proceedings of the Tenth International Workshop on Artificial Intelligence
                  and Statistics, {AISTATS} 2005, Bridgetown, Barbados, January 6-8,
                  2005},
  publisher    = {Society for Artificial Intelligence and Statistics},
  year         = {2005},
  url          = {http://www.gatsby.ucl.ac.uk/aistats/fullpapers/204.pdf},
  timestamp    = {Wed, 06 May 2015 20:30:46 +0200},
  biburl       = {https://dblp.org/rec/conf/aistats/DelalleauBR05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/MorinB05,
  author    = {Morin, Frederic and
               Bengio, Yoshua},
  editor    = {Cowell, Robert G. and
               Ghahramani, Zoubin},
  title     = {Hierarchical Probabilistic Neural Network Language Model},
  booktitle = {Proceedings of the Tenth International Workshop on Artificial Intelligence
               and Statistics, {AISTATS} 2005, Bridgetown, Barbados, January 6-8,
               2005},
  publisher = {Society for Artificial Intelligence and Statistics},
  year      = 2005,
  url       = {http://www.gatsby.ucl.ac.uk/aistats/fullpapers/208.pdf},
  timestamp = {Wed, 06 May 2015 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aistats/MorinB05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/OuimetB05,
  author    = {Ouimet, Marie and
               Bengio, Yoshua},
  editor    = {Cowell, Robert G. and
               Ghahramani, Zoubin},
  title     = {Greedy Spectral Embedding},
  booktitle = {Proceedings of the Tenth International Workshop on Artificial Intelligence
               and Statistics, {AISTATS} 2005, Bridgetown, Barbados, January 6-8,
               2005},
  publisher = {Society for Artificial Intelligence and Statistics},
  year      = 2005,
  url       = {http://www.gatsby.ucl.ac.uk/aistats/fullpapers/209.pdf},
  timestamp = {Wed, 06 May 2015 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aistats/OuimetB05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cfap/GrandvaletB05,
  author    = {Grandvalet, Yves and
               Bengio, Yoshua},
  editor    = {Denis, Fran{\c{c}}ois},
  title     = {Semi-supervised Learning by Entropy Minimization},
  booktitle = {Actes de {CAP} 05, Conf{\'{e}}rence francophone sur l'apprentissage
               automatique - 2005, Nice, France, du 31 mai au 3 juin 2005},
  pages     = {281--296},
  publisher = {{PUG}},
  year      = 2005,
  timestamp = {Wed, 29 Jun 2005 08:39:22 +0200},
  biburl    = {https://dblp.org/rec/conf/cfap/GrandvaletB05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "Le Roux" is a two-word surname; the comma form stops BibTeX from reading "Le" as a given name.
@inproceedings{DBLP:conf/nips/BengioDR05,
  author       = {Yoshua Bengio and
                  Olivier Delalleau and
                  Le Roux, Nicolas},
  title        = {The Curse of Highly Variable Functions for Local Kernel Machines},
  booktitle    = {Advances in Neural Information Processing Systems 18 [Neural Information
                  Processing Systems, {NIPS} 2005, December 5-8, 2005, Vancouver, British
                  Columbia, Canada]},
  pages        = {107--114},
  year         = {2005},
  url          = {https://proceedings.neurips.cc/paper/2005/hash/663772ea088360f95bac3dc7ffb841be-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BengioDR05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun Parzen is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/nips/BengioLV05,
  author       = {Yoshua Bengio and
                  Hugo Larochelle and
                  Pascal Vincent},
  title        = {Non-Local Manifold {Parzen} Windows},
  booktitle    = {Advances in Neural Information Processing Systems 18 [Neural Information
                  Processing Systems, {NIPS} 2005, December 5-8, 2005, Vancouver, British
                  Columbia, Canada]},
  pages        = {115--122},
  year         = {2005},
  url          = {https://proceedings.neurips.cc/paper/2005/hash/17eb7ecc4c38e4705361cccd903ad8c6-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BengioLV05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% "Le Roux" is a two-word surname; the comma form stops BibTeX from reading "Le" as a given name.
@inproceedings{DBLP:conf/nips/BengioRVDM05,
  author       = {Yoshua Bengio and
                  Le Roux, Nicolas and
                  Pascal Vincent and
                  Olivier Delalleau and
                  Patrice Marcotte},
  title        = {Convex Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 18 [Neural Information
                  Processing Systems, {NIPS} 2005, December 5-8, 2005, Vancouver, British
                  Columbia, Canada]},
  pages        = {123--130},
  year         = {2005},
  url          = {https://proceedings.neurips.cc/paper/2005/hash/0fc170ecbb8ff1afb2c6de48ea5343e7-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BengioRVDM05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jcamd/LHeureuxCBDY04,
  author    = {L'Heureux, Pierre{-}Jean and
               Carreau, Julie and
               Bengio, Yoshua and
               Delalleau, Olivier and
               Yue, Shi Yi},
  title     = {Locally Linear Embedding for dimensionality reduction in {QSAR}},
  journal   = {J. Comput. Aided Mol. Des.},
  volume    = 18,
  number    = 7,
  pages     = {475--482},
  year      = 2004,
  url       = {https://doi.org/10.1007/s10822-004-5319-9},
  doi       = {10.1007/S10822-004-5319-9},
  timestamp = {Thu, 16 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jcamd/LHeureuxCBDY04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/BengioG04,
  author    = {Bengio, Yoshua and
               Grandvalet, Yves},
  title     = {No Unbiased Estimator of the Variance of K-Fold Cross-Validation},
  journal   = {J. Mach. Learn. Res.},
  volume    = 5,
  pages     = {1089--1105},
  year      = 2004,
  url       = {http://jmlr.org/papers/volume5/grandvalet04a/grandvalet04a.pdf},
  timestamp = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/BengioG04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "Le Roux" is a two-word surname; the comma form stops BibTeX from reading "Le" as a given name.
@article{DBLP:journals/neco/BengioDRPVO04,
  author       = {Yoshua Bengio and
                  Olivier Delalleau and
                  Le Roux, Nicolas and
                  Jean{-}Fran{\c{c}}ois Paiement and
                  Pascal Vincent and
                  Marie Ouimet},
  title        = {Learning Eigenfunctions Links Spectral Embedding and Kernel {PCA}},
  journal      = {Neural Comput.},
  volume       = {16},
  number       = {10},
  pages        = {2197--2219},
  year         = {2004},
  url          = {https://doi.org/10.1162/0899766041732396},
  doi          = {10.1162/0899766041732396},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/BengioDRPVO04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/BhattacharyaGB04,
  author    = {Bhattacharya, Indrajit and
               Getoor, Lise and
               Bengio, Yoshua},
  editor    = {Scott, Donia and
               Daelemans, Walter and
               Walker, Marilyn A.},
  title     = {Unsupervised Sense Disambiguation Using Bilingual Probabilistic Models},
  booktitle = {Proceedings of the 42nd Annual Meeting of the Association for Computational
               Linguistics, 21-26 July, 2004, Barcelona, Spain},
  pages     = {287--294},
  publisher = {{ACL}},
  year      = 2004,
  url       = {https://aclanthology.org/P04-1037/},
  doi       = {10.3115/1218955.1218992},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/BhattacharyaGB04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioM04,
  author    = {Bengio, Yoshua and
               Monperrus, Martin},
  title     = {Non-Local Manifold Tangent Learning},
  booktitle = {Advances in Neural Information Processing Systems 17 [Neural Information
               Processing Systems, {NIPS} 2004, December 13-18, 2004, Vancouver,
               British Columbia, Canada]},
  pages     = {129--136},
  year      = 2004,
  url       = {https://proceedings.neurips.cc/paper/2004/hash/0b7e926154c1274e8b602ff0d7c133d7-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/BengioM04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GrandvaletB04,
  author    = {Grandvalet, Yves and
               Bengio, Yoshua},
  title     = {Semi-supervised Learning by Entropy Minimization},
  booktitle = {Advances in Neural Information Processing Systems 17 [Neural Information
               Processing Systems, {NIPS} 2004, December 13-18, 2004, Vancouver,
               British Columbia, Canada]},
  pages     = {529--536},
  year      = 2004,
  url       = {https://proceedings.neurips.cc/paper/2004/hash/96f2b50b5d3613adf9c27049b2a888c7-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/GrandvaletB04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/RivestBK04,
  author    = {Rivest, Fran{\c{c}}ois and
               Bengio, Yoshua and
               Kalaska, John},
  title     = {Brain Inspired Reinforcement Learning},
  booktitle = {Advances in Neural Information Processing Systems 17 [Neural Information
               Processing Systems, {NIPS} 2004, December 13-18, 2004, Vancouver,
               British Columbia, Canada]},
  pages     = {1129--1136},
  year      = 2004,
  url       = {https://proceedings.neurips.cc/paper/2004/hash/d37b3ca37106b2bfdeaa12647e3bb1c9-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/RivestBK04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/taln/BoufadenBL04,
  author    = {Boufaden, Narj{\`{e}}s and
               Bengio, Yoshua and
               Lapalme, Guy},
  editor    = {Blache, Philippe and
               Nguyen, No{\"{e}}l and
               Chenfour, Nouredine and
               Rajouani, Abdenbi},
  title     = {Approche statistique pour le rep{\'{e}}rage de mots informatifs
               dans les textes oraux},
  booktitle = {Actes de la 11{\`{e}}me conf{\'{e}}rence sur le Traitement Automatique
               des Langues Naturelles. Articles longs, {TALN} 2004, F{\`{e}}s, Maroc,
               April 2004},
  pages     = {249--258},
  publisher = {{ATALA}},
  year      = 2004,
  url       = {https://aclanthology.org/2004.jeptalnrecital-long.26/},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/taln/BoufadenBL04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijprai/CollobertB03,
  author    = {Collobert, Ronan and
               Bengio, Yoshua and
               Bengio, Samy},
  title     = {Scaling Large Learning Problems with Hard Parallel Mixtures},
  journal   = {Int. J. Pattern Recognit. Artif. Intell.},
  volume    = 17,
  number    = 3,
  pages     = {349--365},
  year      = 2003,
  url       = {https://doi.org/10.1142/S0218001403002411},
  doi       = {10.1142/S0218001403002411},
  timestamp = {Mon, 11 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijprai/CollobertB03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/BengioDVJ03,
  author    = {Bengio, Yoshua and
               Ducharme, R{\'{e}}jean and
               Vincent, Pascal and
               Janvin, Christian},
  title     = {A Neural Probabilistic Language Model},
  journal   = {J. Mach. Learn. Res.},
  volume    = 3,
  pages     = {1137--1155},
  year      = 2003,
  url       = {http://jmlr.org/papers/v3/bengio03a.html},
  timestamp = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/BengioDVJ03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jmlr/BengioC03,
  author    = {Bengio, Yoshua and
               Chapados, Nicolas},
  title     = {Extensions to Metric-Based Model Selection},
  journal   = {J. Mach. Learn. Res.},
  volume    = 3,
  pages     = {1209--1227},
  year      = 2003,
  url       = {http://jmlr.org/papers/v3/bengio03b.html},
  timestamp = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/BengioC03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/NadeauB03,
  author    = {Nadeau, Claude and
               Bengio, Yoshua},
  title     = {Inference for the Generalization Error},
  journal   = {Mach. Learn.},
  volume    = 52,
  number    = 3,
  pages     = {239--281},
  year      = 2003,
  url       = {https://doi.org/10.1023/A:1024068626366},
  doi       = {10.1023/A:1024068626366},
  timestamp = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ml/NadeauB03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnn/GhosnB03,
  author    = {Ghosn, Joumana and
               Bengio, Yoshua},
  title     = {Bias learning, knowledge sharing},
  journal   = {{IEEE} Trans. Neural Networks},
  volume    = 14,
  number    = 4,
  pages     = {748--765},
  year      = 2003,
  url       = {https://doi.org/10.1109/TNN.2003.810608},
  doi       = {10.1109/TNN.2003.810608},
  timestamp = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/tnn/GhosnB03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/BengioS03,
  author    = {Bengio, Yoshua and
               Senecal, Jean{-}S{\'{e}}bastien},
  editor    = {Bishop, Christopher M. and
               Frey, Brendan J.},
  title     = {Quick Training of Probabilistic Neural Nets by Importance Sampling},
  booktitle = {Proceedings of the Ninth International Workshop on Artificial Intelligence
               and Statistics, {AISTATS} 2003, Key West, Florida, USA, January 3-6,
               2003},
  publisher = {Society for Artificial Intelligence and Statistics},
  year      = 2003,
  url       = {http://research.microsoft.com/en-us/um/cambridge/events/aistats2003/proceedings/164.pdf},
  timestamp = {Wed, 06 May 2015 20:33:21 +0200},
  biburl    = {https://dblp.org/rec/conf/aistats/BengioS03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% "Le Roux" is a two-word surname, so it is given in comma form; the acronyms and the
% algorithm name Isomap in the title are brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/nips/BengioPVDRO03,
  author       = {Yoshua Bengio and
                  Jean{-}Fran{\c{c}}ois Paiement and
                  Pascal Vincent and
                  Olivier Delalleau and
                  Le Roux, Nicolas and
                  Marie Ouimet},
  editor       = {Sebastian Thrun and
                  Lawrence K. Saul and
                  Bernhard Sch{\"{o}}lkopf},
  title        = {Out-of-Sample Extensions for {LLE}, {Isomap}, {MDS}, Eigenmaps, and Spectral
                  Clustering},
  booktitle    = {Advances in Neural Information Processing Systems 16 [Neural Information
                  Processing Systems, {NIPS} 2003, December 8-13, 2003, Vancouver and
                  Whistler, British Columbia, Canada]},
  pages        = {177--184},
  publisher    = {{MIT} Press},
  year         = {2003},
  url          = {https://proceedings.neurips.cc/paper/2003/hash/cf05968255451bdefe3c5bc64d550517-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BengioPVDRO03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioG03,
  author    = {Bengio, Yoshua and
               Grandvalet, Yves},
  editor    = {Thrun, Sebastian and
               Saul, Lawrence K. and
               Sch{\"{o}}lkopf, Bernhard},
  title     = {No Unbiased Estimator of the Variance of K-Fold Cross-Validation},
  booktitle = {Advances in Neural Information Processing Systems 16 [Neural Information
               Processing Systems, {NIPS} 2003, December 8-13, 2003, Vancouver and
               Whistler, British Columbia, Canada]},
  pages     = {513--520},
  publisher = {{MIT} Press},
  year      = 2003,
  url       = {https://proceedings.neurips.cc/paper/2003/hash/e82c4b19b8151ddc25d4d93baf7b908f-Abstract.html},
  timestamp = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/BengioG03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/BengioS02,
  author    = {Bengio, Yoshua and
               Schuurmans, Dale},
  title     = {Guest Introduction: Special Issue on New Methods for Model Selection
               and Model Combination},
  journal   = {Mach. Learn.},
  volume    = 48,
  number    = {1-3},
  pages     = {5--7},
  year      = 2002,
  url       = {https://doi.org/10.1023/A:1013921901994},
  doi       = {10.1023/A:1013921901994},
  timestamp = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ml/BengioS02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/ChapelleVB02,
  author    = {Chapelle, Olivier and
               Vapnik, Vladimir and
               Bengio, Yoshua},
  title     = {Model Selection for Small Sample Regression},
  journal   = {Mach. Learn.},
  volume    = 48,
  number    = {1-3},
  pages     = {9--23},
  year      = 2002,
  url       = {https://doi.org/10.1023/A:1013943418833},
  doi       = {10.1023/A:1013943418833},
  timestamp = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ml/ChapelleVB02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ml/VincentB02,
  author    = {Vincent, Pascal and
               Bengio, Yoshua},
  title     = {Kernel Matching Pursuit},
  journal   = {Mach. Learn.},
  volume    = 48,
  number    = {1-3},
  pages     = {165--187},
  year      = 2002,
  url       = {https://doi.org/10.1023/A:1013955821559},
  doi       = {10.1023/A:1013955821559},
  timestamp = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/ml/VincentB02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The acronym SVMs is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/neco/CollobertBB02,
  author       = {Ronan Collobert and
                  Samy Bengio and
                  Yoshua Bengio},
  title        = {A Parallel Mixture of {SVMs} for Very Large Scale Problems},
  journal      = {Neural Comput.},
  volume       = {14},
  number       = {5},
  pages        = {1105--1114},
  year         = {2002},
  url          = {https://doi.org/10.1162/089976602753633402},
  doi          = {10.1162/089976602753633402},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/CollobertBB02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/TakeuchiBK02,
  author    = {Takeuchi, Ichiro and
               Bengio, Yoshua and
               Kanamori, Takafumi},
  title     = {Robust Regression with Asymmetric Heavy-Tail Noise Distributions},
  journal   = {Neural Comput.},
  volume    = 14,
  number    = 10,
  pages     = {2469--2496},
  year      = 2002,
  url       = {https://doi.org/10.1162/08997660260293300},
  doi       = {10.1162/08997660260293300},
  timestamp = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/neco/TakeuchiBK02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun Parzen is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/nips/VincentB02,
  author       = {Pascal Vincent and
                  Yoshua Bengio},
  editor       = {Suzanna Becker and
                  Sebastian Thrun and
                  Klaus Obermayer},
  title        = {Manifold {Parzen} Windows},
  booktitle    = {Advances in Neural Information Processing Systems 15 [Neural Information
                  Processing Systems, {NIPS} 2002, December 9-14, 2002, Vancouver, British
                  Columbia, Canada]},
  pages        = {825--832},
  publisher    = {{MIT} Press},
  year         = {2002},
  url          = {https://proceedings.neurips.cc/paper/2002/hash/2d969e2cee8cfa07ce7ca0bb13c7a36d-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/VincentB02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nnsp/BengioC02,
  author    = {Bengio, Yoshua and
               Chapados, Nicolas},
  title     = {Metric-based model selection for time-series forecasting},
  booktitle = {Proceedings of the 12th {IEEE} Workshop on Neural Networks for Signal
               Processing, {NNSP} 2002, Martigny, Valais, Switzerland, September
               4-6, 2002},
  pages     = {13--22},
  publisher = {{IEEE}},
  year      = 2002,
  url       = {https://doi.org/10.1109/NNSP.2002.1030013},
  doi       = {10.1109/NNSP.2002.1030013},
  timestamp = {Wed, 16 Oct 2019 14:14:54 +0200},
  biburl    = {https://dblp.org/rec/conf/nnsp/BengioC02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/svm/CollobertBB02,
  author    = {Collobert, Ronan and
               Bengio, Yoshua and
               Bengio, Samy},
  editor    = {Lee, Seong{-}Whan and
               Verri, Alessandro},
  title     = {Scaling Large Learning Problems with Hard Parallel Mixtures},
  booktitle = {Pattern Recognition with Support Vector Machines, First International
               Workshop, {SVM} 2002, Niagara Falls, Canada, August 10, 2002, Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = 2388,
  pages     = {8--23},
  publisher = {Springer},
  year      = 2002,
  url       = {https://doi.org/10.1007/3-540-45665-1\_2},
  doi       = {10.1007/3-540-45665-1\_2},
  timestamp = {Tue, 14 May 2019 10:00:52 +0200},
  biburl    = {https://dblp.org/rec/conf/svm/CollobertBB02.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/taln/BoufadenLB02,
  author       = {Narj{\`{e}}s Boufaden and
                  Guy Lapalme and
                  Yoshua Bengio},
  editor       = {Jean{-}Marie Pierrel},
  title        = {Segmentation en th{\`{e}}mes de conversations t{\'{e}}l{\'{e}}phoniques
                  : traitement en amont pour l'extraction d'information},
  booktitle    = {Actes de la 9{\`{e}}me conf{\'{e}}rence sur le Traitement Automatique
                  des Langues Naturelles. Posters, {TALN} 2002, Nancy, France, June
                  2002},
  pages        = {376--381},
  publisher    = {{ATALA}},
  year         = {2002},
  url          = {https://aclanthology.org/2002.jeptalnrecital-poster.10/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/taln/BoufadenLB02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnn/BengioLD01,
  author       = {Yoshua Bengio and
                  Vincent{-}Philippe Lauzon and
                  R{\'{e}}jean Ducharme},
  title        = {Experiments on the application of {IOHMMs} to model financial returns
                  series},
  journal      = {{IEEE} Trans. Neural Networks},
  volume       = {12},
  number       = {1},
  pages        = {113--123},
  year         = {2001},
  url          = {https://doi.org/10.1109/72.896800},
  doi          = {10.1109/72.896800},
  timestamp    = {Sat, 30 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tnn/BengioLD01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnn/ChapadosB01,
  author       = {Nicolas Chapados and
                  Yoshua Bengio},
  title        = {Cost functions and model combination for {VaR}-based asset allocation
                  using neural networks},
  journal      = {{IEEE} Trans. Neural Networks},
  volume       = {12},
  number       = {4},
  pages        = {890--906},
  year         = {2001},
  url          = {https://doi.org/10.1109/72.935098},
  doi          = {10.1109/72.935098},
  timestamp    = {Sat, 30 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tnn/ChapadosB01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/CollobertBB01,
  author       = {Ronan Collobert and
                  Samy Bengio and
                  Yoshua Bengio},
  editor       = {Thomas G. Dietterich and
                  Suzanna Becker and
                  Zoubin Ghahramani},
  title        = {A Parallel Mixture of {SVMs} for Very Large Scale Problems},
  booktitle    = {Advances in Neural Information Processing Systems 14 [Neural Information
                  Processing Systems: Natural and Synthetic, {NIPS} 2001, December 3-8,
                  2001, Vancouver, British Columbia, Canada]},
  pages        = {633--640},
  publisher    = {{MIT} Press},
  year         = {2001},
  url          = {https://proceedings.neurips.cc/paper/2001/hash/36ac8e558ac7690b6f44e2cb5ef93322-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/CollobertBB01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/VincentB01,
  author       = {Pascal Vincent and
                  Yoshua Bengio},
  editor       = {Thomas G. Dietterich and
                  Suzanna Becker and
                  Zoubin Ghahramani},
  title        = {K-Local Hyperplane and Convex Distance Nearest Neighbor Algorithms},
  booktitle    = {Advances in Neural Information Processing Systems 14 [Neural Information
                  Processing Systems: Natural and Synthetic, {NIPS} 2001, December 3-8,
                  2001, Vancouver, British Columbia, Canada]},
  pages        = {985--992},
  publisher    = {{MIT} Press},
  year         = {2001},
  url          = {https://proceedings.neurips.cc/paper/2001/hash/1359aa933b48b754a2f54adb688bfa77-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/VincentB01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/ChapadosBVGDTM01,
  author       = {Nicolas Chapados and
                  Yoshua Bengio and
                  Pascal Vincent and
                  Joumana Ghosn and
                  Charles Dugas and
                  Ichiro Takeuchi and
                  Linyan Meng},
  editor       = {Thomas G. Dietterich and
                  Suzanna Becker and
                  Zoubin Ghahramani},
  title        = {Estimating Car Insurance Premia: {A} Case Study in High-Dimensional
                  Data Inference},
  booktitle    = {Advances in Neural Information Processing Systems 14 [Neural Information
                  Processing Systems: Natural and Synthetic, {NIPS} 2001, December 3-8,
                  2001, Vancouver, British Columbia, Canada]},
  pages        = {1369--1376},
  publisher    = {{MIT} Press},
  year         = {2001},
  url          = {https://proceedings.neurips.cc/paper/2001/hash/2d405b367158e3f12d7c1e31a96b3af3-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/ChapadosBVGDTM01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nlprs/BoufadenLB01,
  author       = {Narj{\`{e}}s Boufaden and
                  Guy Lapalme and
                  Yoshua Bengio},
  title        = {Topic Segmentation: {A} First Stage to Dialog-Based Information Extraction},
  booktitle    = {Proceedings of the Sixth Natural Language Processing Pacific Rim Symposium,
                  November 27-30, 2001, Hitotsubashi Memorial Hall, National Center
                  of Sciences, Tokyo, Japan},
  pages        = {273--279},
  year         = {2001},
  url          = {http://www.afnlp.org/nlprs2001/pdf/0097-01.pdf},
  timestamp    = {Thu, 04 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nlprs/BoufadenLB01.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/SchwenkB00,
  author       = {Holger Schwenk and
                  Yoshua Bengio},
  title        = {Boosting Neural Networks},
  journal      = {Neural Comput.},
  volume       = {12},
  number       = {8},
  pages        = {1869--1887},
  year         = {2000},
  url          = {https://doi.org/10.1162/089976600300015178},
  doi          = {10.1162/089976600300015178},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/SchwenkB00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/Bengio00,
  author       = {Yoshua Bengio},
  title        = {Gradient-Based Optimization of Hyperparameters},
  journal      = {Neural Comput.},
  volume       = {12},
  number       = {8},
  pages        = {1889--1900},
  year         = {2000},
  url          = {https://doi.org/10.1162/089976600300015187},
  doi          = {10.1162/089976600300015187},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/Bengio00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnn/BengioB00,
  author       = {Samy Bengio and
                  Yoshua Bengio},
  title        = {Taking on the curse of dimensionality in joint distributions using
                  neural networks},
  journal      = {{IEEE} Trans. Neural Networks},
  volume       = {11},
  number       = {3},
  pages        = {550--557},
  year         = {2000},
  url          = {https://doi.org/10.1109/72.846725},
  doi          = {10.1109/72.846725},
  timestamp    = {Sat, 30 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tnn/BengioB00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnn/GhosnB00,
  author       = {Joumana Ghosn and
                  Yoshua Bengio},
  title        = {Bias Learning, Knowledge Sharing},
  booktitle    = {Proceedings of the {IEEE-INNS-ENNS} International Joint Conference
                  on Neural Networks, {IJCNN} 2000, Neural Computing: New Challenges
                  and Perspectives for the New Millennium, Como, Italy, July 24-27,
                  2000, Volume 1},
  pages        = {9--14},
  publisher    = {{IEEE} Computer Society},
  year         = {2000},
  url          = {https://doi.org/10.1109/IJCNN.2000.857806},
  doi          = {10.1109/IJCNN.2000.857806},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcnn/GhosnB00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnn/Bengio00a,
  author       = {Yoshua Bengio},
  title        = {Probabilistic Neural Network Models for Sequential Data},
  booktitle    = {Proceedings of the {IEEE-INNS-ENNS} International Joint Conference
                  on Neural Networks, {IJCNN} 2000, Neural Computing: New Challenges
                  and Perspectives for the New Millennium, Como, Italy, July 24-27,
                  2000, Volume 5},
  pages        = {79--84},
  publisher    = {{IEEE} Computer Society},
  year         = {2000},
  url          = {https://doi.org/10.1109/IJCNN.2000.861438},
  doi          = {10.1109/IJCNN.2000.861438},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcnn/Bengio00a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnn/VincentB00,
  author       = {Pascal Vincent and
                  Yoshua Bengio},
  title        = {A Neural Support Vector Network Architecture with Adaptive Kernels},
  booktitle    = {Proceedings of the {IEEE-INNS-ENNS} International Joint Conference
                  on Neural Networks, {IJCNN} 2000, Neural Computing: New Challenges
                  and Perspectives for the New Millennium, Como, Italy, July 24-27,
                  2000, Volume 5},
  pages        = {187--192},
  publisher    = {{IEEE} Computer Society},
  year         = {2000},
  url          = {https://doi.org/10.1109/IJCNN.2000.861455},
  doi          = {10.1109/IJCNN.2000.861455},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcnn/VincentB00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcnn/Bengio00,
  author       = {Yoshua Bengio},
  title        = {Continuous Optimization of Hyper-Parameters},
  booktitle    = {Proceedings of the {IEEE-INNS-ENNS} International Joint Conference
                  on Neural Networks, {IJCNN} 2000, Neural Computing: New Challenges
                  and Perspectives for the New Millennium, Como, Italy, July 24-27,
                  2000, Volume 1},
  pages        = {305--310},
  publisher    = {{IEEE} Computer Society},
  year         = {2000},
  url          = {https://doi.org/10.1109/IJCNN.2000.857853},
  doi          = {10.1109/IJCNN.2000.857853},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/ijcnn/Bengio00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/DugasBBNG00,
  author       = {Charles Dugas and
                  Yoshua Bengio and
                  Fran{\c{c}}ois B{\'{e}}lisle and
                  Claude Nadeau and
                  Ren{\'{e}} Garcia},
  editor       = {Todd K. Leen and
                  Thomas G. Dietterich and
                  Volker Tresp},
  title        = {Incorporating Second-Order Functional Knowledge for Better Option
                  Pricing},
  booktitle    = {Advances in Neural Information Processing Systems 13, Papers from
                  Neural Information Processing Systems {(NIPS)} 2000, Denver, CO, {USA}},
  pages        = {472--478},
  publisher    = {{MIT} Press},
  year         = {2000},
  url          = {https://proceedings.neurips.cc/paper/2000/hash/44968aece94f667e4095002d140b5896-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/DugasBBNG00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioDV00,
  author       = {Yoshua Bengio and
                  R{\'{e}}jean Ducharme and
                  Pascal Vincent},
  editor       = {Todd K. Leen and
                  Thomas G. Dietterich and
                  Volker Tresp},
  title        = {A Neural Probabilistic Language Model},
  booktitle    = {Advances in Neural Information Processing Systems 13, Papers from
                  Neural Information Processing Systems {(NIPS)} 2000, Denver, CO, {USA}},
  pages        = {932--938},
  publisher    = {{MIT} Press},
  year         = {2000},
  url          = {https://proceedings.neurips.cc/paper/2000/hash/728f206c2a01bf572b5940d7d9a8fa4c-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BengioDV00.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/BengioBRB99,
  author       = {Samy Bengio and
                  Yoshua Bengio and
                  Jacques Robert and
                  Gilles B{\'{e}}langer},
  title        = {Stochastic Learning of Strategic Equilibria for Auctions},
  journal      = {Neural Comput.},
  volume       = {11},
  number       = {5},
  pages        = {1199--1209},
  year         = {1999},
  url          = {https://doi.org/10.1162/089976699300016412},
  doi          = {10.1162/089976699300016412},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/BengioBRB99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dcc/PigeonB99,
  author       = {Steven Pigeon and
                  Yoshua Bengio},
  title        = {Binary Pseudowavelets and Applications to Bilevel Image Processing},
  booktitle    = {Data Compression Conference, {DCC} 1999, Snowbird, Utah, USA, March
                  29-31, 1999},
  pages        = {364--373},
  publisher    = {{IEEE} Computer Society},
  year         = {1999},
  url          = {https://doi.org/10.1109/DCC.1999.755686},
  doi          = {10.1109/DCC.1999.755686},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/dcc/PigeonB99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/NadeauB99,
  author       = {Claude Nadeau and
                  Yoshua Bengio},
  editor       = {Sara A. Solla and
                  Todd K. Leen and
                  Klaus{-}Robert M{\"{u}}ller},
  title        = {Inference for the Generalization Error},
  booktitle    = {Advances in Neural Information Processing Systems 12, {[NIPS} Conference,
                  Denver, Colorado, USA, November 29 - December 4, 1999]},
  pages        = {307--313},
  publisher    = {The {MIT} Press},
  year         = {1999},
  url          = {http://papers.nips.cc/paper/1661-inference-for-the-generalization-error},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/NadeauB99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioB99,
  author       = {Yoshua Bengio and
                  Samy Bengio},
  editor       = {Sara A. Solla and
                  Todd K. Leen and
                  Klaus{-}Robert M{\"{u}}ller},
  title        = {Modeling High-Dimensional Discrete Data with Multi-Layer Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 12, {[NIPS} Conference,
                  Denver, Colorado, USA, November 29 - December 4, 1999]},
  pages        = {400--406},
  publisher    = {The {MIT} Press},
  year         = {1999},
  url          = {http://papers.nips.cc/paper/1679-modeling-high-dimensional-discrete-data-with-multi-layer-neural-networks},
  timestamp    = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BengioB99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/shape/CunHBB99,
  author       = {Yann LeCun and
                  Patrick Haffner and
                  L{\'{e}}on Bottou and
                  Yoshua Bengio},
  editor       = {David A. Forsyth and
                  Joseph L. Mundy and
                  Vito Di Ges{\`{u}} and
                  Roberto Cipolla},
  title        = {Object Recognition with Gradient-Based Learning},
  booktitle    = {Shape, Contour and Grouping in Computer Vision},
  series       = {Lecture Notes in Computer Science},
  volume       = {1681},
  pages        = {319--345},
  publisher    = {Springer},
  year         = {1999},
  url          = {https://doi.org/10.1007/3-540-46805-6\_19},
  doi          = {10.1007/3-540-46805-6\_19},
  timestamp    = {Tue, 14 May 2019 10:00:35 +0200},
  biburl       = {https://dblp.org/rec/conf/shape/CunHBB99.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cai/BengioGGLS98,
  author       = {Yoshua Bengio and
                  Francois Gingras and
                  Bernard Goulard and
                  Jean{-}Marc Lina and
                  Keith Scott},
  title        = {Gaussian Mixture Densities for Classification of Nuclear Power Plant
                  Data},
  journal      = {Comput. Artif. Intell.},
  volume       = {17},
  number       = {2-3},
  pages        = {189--209},
  year         = {1998},
  url          = {http://www.cai.sk/ojs/index.php/cai/article/view/637},
  timestamp    = {Mon, 14 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/cai/BengioGGLS98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jei/BottouHHSBL98,
  author       = {L{\'{e}}on Bottou and
                  Patrick Haffner and
                  Paul G. Howard and
                  Patrice Y. Simard and
                  Yoshua Bengio and
                  Yann LeCun},
  title        = {High quality document image compression with {``DjVu''}},
  journal      = {J. Electronic Imaging},
  volume       = {7},
  number       = {3},
  pages        = {410--425},
  year         = {1998},
  url          = {https://doi.org/10.1117/1.482609},
  doi          = {10.1117/1.482609},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jei/BottouHHSBL98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pieee/LeCunBBH98,
  author       = {Yann LeCun and
                  L{\'{e}}on Bottou and
                  Yoshua Bengio and
                  Patrick Haffner},
  title        = {Gradient-based learning applied to document recognition},
  journal      = {Proc. {IEEE}},
  volume       = {86},
  number       = {11},
  pages        = {2278--2324},
  year         = {1998},
  url          = {https://doi.org/10.1109/5.726791},
  doi          = {10.1109/5.726791},
  timestamp    = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/pieee/LeCunBBH98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/adl/HaffnerBHSBC98,
  author       = {Patrick Haffner and
                  L{\'{e}}on Bottou and
                  Paul G. Howard and
                  Patrice Y. Simard and
                  Yoshua Bengio and
                  Yann LeCun},
  title        = {Browsing through High Quality Document Images with {DjVu}},
  booktitle    = {Proceedings of the {IEEE} Forum on Research and Technology Advances
                  in Digital Libraries, {IEEE} {ADL} '98, Santa Barbara, California,
                  USA, April 22-24, 1998},
  pages        = {309--318},
  publisher    = {{IEEE} Computer Society},
  year         = {1998},
  url          = {https://doi.org/10.1109/ADL.1998.670431},
  doi          = {10.1109/ADL.1998.670431},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/adl/HaffnerBHSBC98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dcc/BottouHB98,
  author       = {L{\'{e}}on Bottou and
                  Paul G. Howard and
                  Yoshua Bengio},
  title        = {The {Z-Coder} Adaptive Binary Coder},
  booktitle    = {Data Compression Conference, {DCC} 1998, Snowbird, Utah, USA, March
                  30 - April 1, 1998},
  pages        = {13--22},
  publisher    = {{IEEE} Computer Society},
  year         = {1998},
  url          = {https://doi.org/10.1109/DCC.1998.672124},
  doi          = {10.1109/DCC.1998.672124},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/dcc/BottouHB98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/dcc/PigeonB98,
  author       = {Steven Pigeon and
                  Yoshua Bengio},
  title        = {A Memory-Efficient Adaptive {Huffman} Coding Algorithm for Very Large
                  Sets of Symbols},
  booktitle    = {Data Compression Conference, {DCC} 1998, Snowbird, Utah, USA, March
                  30 - April 1, 1998},
  pages        = {568},
  publisher    = {{IEEE} Computer Society},
  year         = {1998},
  url          = {https://doi.org/10.1109/DCC.1998.672310},
  doi          = {10.1109/DCC.1998.672310},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/dcc/PigeonB98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/miip/BonnevilleMBS98,
  author       = {Martin Bonneville and
                  Jean Meunier and
                  Yoshua Bengio and
                  Jean{-}Paul Soucy},
  editor       = {Kenneth M. Hanson},
  title        = {Support vector machines for improving the classification of brain
                  {PET} images},
  booktitle    = {Medical Imaging 1998: Image Processing, San Diego, CA, United States,
                  21-26 February 1998},
  series       = {{SPIE} Proceedings},
  volume       = {3338},
  publisher    = {{SPIE}},
  year         = {1998},
  url          = {https://doi.org/10.1117/12.310900},
  doi          = {10.1117/12.310900},
  timestamp    = {Wed, 25 Jul 2018 18:08:09 +0200},
  biburl       = {https://dblp.org/rec/conf/miip/BonnevilleMBS98.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijns/Bengio97,
  author       = {Yoshua Bengio},
  title        = {Using a Financial Training Criterion Rather than a Prediction Criterion},
  journal      = {Int. J. Neural Syst.},
  volume       = {8},
  number       = {4},
  pages        = {433--443},
  year         = {1997},
  url          = {https://doi.org/10.1142/S0129065797000422},
  doi          = {10.1142/S0129065797000422},
  timestamp    = {Sun, 02 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijns/Bengio97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cvpr/BottouBL97,
  author       = {L{\'{e}}on Bottou and
                  Yoshua Bengio and
                  Yann LeCun},
  title        = {Global Training of Document Processing Systems Using Graph Transformer
                  Networks},
  booktitle    = {1997 Conference on Computer Vision and Pattern Recognition {(CVPR}
                  '97), June 17-19, 1997, San Juan, Puerto Rico},
  pages        = {489--494},
  publisher    = {{IEEE} Computer Society},
  year         = {1997},
  url          = {https://doi.org/10.1109/CVPR.1997.609370},
  doi          = {10.1109/CVPR.1997.609370},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/cvpr/BottouBL97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icann/SchwenkB97,
  author       = {Holger Schwenk and
                  Yoshua Bengio},
  editor       = {Wulfram Gerstner and
                  Alain Germond and
                  Martin Hasler and
                  Jean{-}Daniel Nicoud},
  title        = {{AdaBoosting} Neural Networks: Application to on-line Character Recognition},
  booktitle    = {Artificial Neural Networks - {ICANN} '97, 7th International Conference,
                  Lausanne, Switzerland, October 8-10, 1997, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {1327},
  pages        = {967--972},
  publisher    = {Springer},
  year         = {1997},
  url          = {https://doi.org/10.1007/BFb0020278},
  doi          = {10.1007/BFB0020278},
  timestamp    = {Tue, 14 May 2019 10:00:49 +0200},
  biburl       = {https://dblp.org/rec/conf/icann/SchwenkB97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icassp/LeCunBB97,
  author       = {Yann LeCun and
                  L{\'{e}}on Bottou and
                  Yoshua Bengio},
  title        = {Reading checks with multilayer graph transformer networks},
  booktitle    = {1997 {IEEE} International Conference on Acoustics, Speech, and Signal
                  Processing, {ICASSP} '97, Munich, Germany, April 21-24, 1997},
  pages        = {151--154},
  publisher    = {{IEEE} Computer Society},
  year         = {1997},
  url          = {https://doi.org/10.1109/ICASSP.1997.599580},
  doi          = {10.1109/ICASSP.1997.599580},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icassp/LeCunBB97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/RahimBL97,
  author       = {Mazin Rahim and
                  Yoshua Bengio and
                  Yann LeCun},
  editor       = {George Kokkinakis and
                  Nikos Fakotakis and
                  Evangelos Dermatas},
  title        = {Discriminative feature and model design for automatic speech recognition},
  booktitle    = {Fifth European Conference on Speech Communication and Technology,
                  {EUROSPEECH} 1997, Rhodes, Greece, September 22-25, 1997},
  pages        = {75--78},
  publisher    = {{ISCA}},
  year         = {1997},
  url          = {https://doi.org/10.21437/Eurospeech.1997-46},
  doi          = {10.21437/EUROSPEECH.1997-46},
  timestamp    = {Sun, 02 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/interspeech/RahimBL97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioBIS97,
  author       = {Yoshua Bengio and
                  Samy Bengio and
                  Jean{-}Fran{\c{c}}ois Isabelle and
                  Yoram Singer},
  editor       = {Michael I. Jordan and
                  Michael J. Kearns and
                  Sara A. Solla},
  title        = {Shared Context Probabilistic Transducers},
  booktitle    = {Advances in Neural Information Processing Systems 10, {[NIPS} Conference,
                  Denver, Colorado, USA, 1997]},
  pages        = {409--415},
  publisher    = {The {MIT} Press},
  year         = {1997},
  url          = {http://papers.nips.cc/paper/1379-shared-context-probabilistic-transducers},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BengioBIS97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SchwenkB97,
  author       = {Holger Schwenk and
                  Yoshua Bengio},
  editor       = {Michael I. Jordan and
                  Michael J. Kearns and
                  Sara A. Solla},
  title        = {Training Methods for Adaptive Boosting of Neural Networks},
  booktitle    = {Advances in Neural Information Processing Systems 10, {[NIPS} Conference,
                  Denver, Colorado, USA, 1997]},
  pages        = {647--653},
  publisher    = {The {MIT} Press},
  year         = {1997},
  url          = {http://papers.nips.cc/paper/1335-training-methods-for-adaptive-boosting-of-neural-networks},
  timestamp    = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/SchwenkB97.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnn/BengioF96,
  author       = {Yoshua Bengio and
                  Paolo Frasconi},
  title        = {Input-output {HMMs} for sequence processing},
  journal      = {{IEEE} Trans. Neural Networks},
  volume       = {7},
  number       = {5},
  pages        = {1231--1249},
  year         = {1996},
  url          = {https://doi.org/10.1109/72.536317},
  doi          = {10.1109/72.536317},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tnn/BengioF96.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/GhosnB96,
  author       = {Joumana Ghosn and
                  Yoshua Bengio},
  editor       = {Michael Mozer and
                  Michael I. Jordan and
                  Thomas Petsche},
  title        = {Multi-Task Learning for Stock Selection},
  booktitle    = {Advances in Neural Information Processing Systems 9, NIPS, Denver,
                  CO, USA, December 2-5, 1996},
  pages        = {946--952},
  publisher    = {{MIT} Press},
  year         = {1996},
  url          = {http://papers.nips.cc/paper/1221-multi-task-learning-for-stock-selection},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/GhosnB96.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/jair/BengioF95,
  author       = {Yoshua Bengio and
                  Paolo Frasconi},
  title        = {Diffusion of Context and Credit Information in {Markovian} Models},
  journal      = {J. Artif. Intell. Res.},
  volume       = {3},
  pages        = {249--270},
  year         = {1995},
  url          = {https://doi.org/10.1613/jair.233},
  doi          = {10.1613/JAIR.233},
  timestamp    = {Mon, 21 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jair/BengioF95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/neco/BengioLNB95,
  author       = {Yoshua Bengio and
                  Yann LeCun and
                  Craig R. Nohl and
                  Christopher J. C. Burges},
  title        = {{LeRec}: a {NN/HMM} hybrid for on-line handwriting recognition},
  journal      = {Neural Comput.},
  volume       = {7},
  number       = {6},
  pages        = {1289--1303},
  year         = {1995},
  url          = {https://doi.org/10.1162/neco.1995.7.6.1289},
  doi          = {10.1162/NECO.1995.7.6.1289},
  timestamp    = {Tue, 01 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/neco/BengioLNB95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/npl/BengioBC95,
  author       = {Samy Bengio and
                  Yoshua Bengio and
                  Jocelyn Cloutier},
  title        = {On the search for new learning rules for {ANNs}},
  journal      = {Neural Process. Lett.},
  volume       = {2},
  number       = {4},
  pages        = {26--30},
  year         = {1995},
  url          = {https://doi.org/10.1007/BF02279935},
  doi          = {10.1007/BF02279935},
  timestamp    = {Thu, 09 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/npl/BengioBC95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioG95,
  author       = {Yoshua Bengio and
                  Francois Gingras},
  editor       = {David S. Touretzky and
                  Michael Mozer and
                  Michael E. Hasselmo},
  title        = {Recurrent Neural Networks for Missing or Asynchronous Data},
  booktitle    = {Advances in Neural Information Processing Systems 8, {NIPS}, Denver,
                  CO, USA, November 27-30, 1995},
  pages        = {395--401},
  publisher    = {{MIT} Press},
  year         = {1995},
  url          = {http://papers.nips.cc/paper/1126-recurrent-neural-networks-for-missing-or-asynchronous-data},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BengioG95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/HihiB95,
  author       = {El Hihi, Salah and
                  Yoshua Bengio},
  editor       = {David S. Touretzky and
                  Michael Mozer and
                  Michael E. Hasselmo},
  title        = {Hierarchical Recurrent Neural Networks for Long-Term Dependencies},
  booktitle    = {Advances in Neural Information Processing Systems 8, {NIPS}, Denver,
                  CO, USA, November 27-30, 1995},
  pages        = {493--499},
  publisher    = {{MIT} Press},
  year         = {1995},
  url          = {http://papers.nips.cc/paper/1102-hierarchical-recurrent-neural-networks-for-long-term-dependencies},
  timestamp    = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/HihiB95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Same authors, title and year as DBLP:journals/jair/BengioF95 (the JAIR record); presumably the same work.
@article{DBLP:journals/corr/BengioF95,
  author       = {Yoshua Bengio and
                  Paolo Frasconi},
  title        = {Diffusion of Context and Credit Information in {Markovian} Models},
  journal      = {CoRR},
  volume       = {abs/cs/9510101},
  year         = {1995},
  url          = {http://arxiv.org/abs/cs/9510101},
  eprinttype   = {arXiv},
  eprint       = {cs/9510101},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/BengioF95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tnn/BengioSF94,
  author    = {Bengio, Yoshua and
               Simard, Patrice Y. and
               Frasconi, Paolo},
  title     = {Learning long-term dependencies with gradient descent is difficult},
  journal   = {{IEEE} Trans. Neural Networks},
  volume    = {5},
  number    = {2},
  pages     = {157--166},
  year      = {1994},
  doi       = {10.1109/72.279181},
  url       = {https://doi.org/10.1109/72.279181},
  timestamp = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/tnn/BengioSF94.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icec/BengioBC94,
  author    = {Bengio, Samy and
               Bengio, Yoshua and
               Cloutier, Jocelyn},
  title     = {Use of Genetic Programming for the Search of a New Learning Rule
               for Neural Networks},
  booktitle = {Proceedings of the First {IEEE} Conference on Evolutionary
               Computation, {IEEE} World Congress on Computational Intelligence,
               Orlando, Florida, USA, June 27-29, 1994},
  pages     = {324--327},
  publisher = {{IEEE}},
  year      = {1994},
  doi       = {10.1109/ICEC.1994.349932},
  url       = {https://doi.org/10.1109/ICEC.1994.349932},
  timestamp = {Wed, 16 Oct 2019 14:14:52 +0200},
  biburl    = {https://dblp.org/rec/conf/icec/BengioBC94.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icpr/LeCunB94,
  author       = {Yann LeCun and
                  Yoshua Bengio},
  title        = {Word-level training of a handwritten word recognizer based on convolutional
                  neural networks},
  booktitle    = {12th {IAPR} International Conference on Pattern Recognition, Conference
                  {B:} Pattern Recognition and Neural Networks, {ICPR} 1994, Jerusalem,
                  Israel, 9-13 October, 1994, Volume 2},
  pages        = {88--92},
  publisher    = {{IEEE}},
  year         = {1994},
  url          = {https://doi.org/10.1109/ICPR.1994.576881},
  doi          = {10.1109/ICPR.1994.576881},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpr/LeCunB94.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icpr/FrasconiB94,
  author       = {Paolo Frasconi and
                  Yoshua Bengio},
  title        = {An {EM} approach to grammatical inference: input/output {HMMs}},
  booktitle    = {12th {IAPR} International Conference on Pattern Recognition, Conference
                  {B:} Pattern Recognition and Neural Networks, {ICPR} 1994, Jerusalem,
                  Israel, 9-13 October, 1994, Volume 2},
  pages        = {289--294},
  publisher    = {{IEEE}},
  year         = {1994},
  url          = {https://doi.org/10.1109/ICPR.1994.576922},
  doi          = {10.1109/ICPR.1994.576922},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpr/FrasconiB94.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icpr/BengioL94,
  author       = {Yoshua Bengio and
                  Yann LeCun},
  title        = {Word normalization for online handwritten word recognition},
  booktitle    = {12th {IAPR} International Conference on Pattern Recognition, Conference
                  {B:} Pattern Recognition and Neural Networks, {ICPR} 1994, Jerusalem,
                  Israel, 9-13 October, 1994, Volume 2},
  pages        = {409--413},
  publisher    = {{IEEE}},
  year         = {1994},
  url          = {https://doi.org/10.1109/ICPR.1994.576966},
  doi          = {10.1109/ICPR.1994.576966},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpr/BengioL94.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioF94,
  author    = {Bengio, Yoshua and
               Frasconi, Paolo},
  editor    = {Tesauro, Gerald and
               Touretzky, David S. and
               Leen, Todd K.},
  title     = {An Input Output {HMM} Architecture},
  booktitle = {Advances in Neural Information Processing Systems 7,
               {[NIPS} Conference, Denver, Colorado, USA, 1994]},
  pages     = {427--434},
  publisher = {{MIT} Press},
  year      = {1994},
  url       = {http://papers.nips.cc/paper/964-an-input-output-hmm-architecture},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/BengioF94.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/BengioF94a,
  author       = {Yoshua Bengio and
                  Paolo Frasconi},
  editor       = {Gerald Tesauro and
                  David S. Touretzky and
                  Todd K. Leen},
  title        = {Diffusion of Credit in {Markovian} Models},
  booktitle    = {Advances in Neural Information Processing Systems 7, {[NIPS} Conference,
                  Denver, Colorado, USA, 1994]},
  pages        = {553--560},
  publisher    = {{MIT} Press},
  year         = {1994},
  url          = {http://papers.nips.cc/paper/919-diffusion-of-credit-in-markovian-models},
  timestamp    = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BengioF94a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BottouB94,
  author    = {Bottou, L{\'{e}}on and
               Bengio, Yoshua},
  editor    = {Tesauro, Gerald and
               Touretzky, David S. and
               Leen, Todd K.},
  title     = {Convergence Properties of the K-Means Algorithms},
  booktitle = {Advances in Neural Information Processing Systems 7,
               {[NIPS} Conference, Denver, Colorado, USA, 1994]},
  pages     = {585--592},
  publisher = {{MIT} Press},
  year      = {1994},
  url       = {http://papers.nips.cc/paper/989-convergence-properties-of-the-k-means-algorithms},
  timestamp = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/BottouB94.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/ijprai/Bengio93,
  author    = {Bengio, Yoshua},
  title     = {A Connectionist Approach to Speech Recognition},
  journal   = {Int. J. Pattern Recognit. Artif. Intell.},
  volume    = {7},
  number    = {4},
  pages     = {647--667},
  year      = {1993},
  doi       = {10.1142/S0218001493000327},
  url       = {https://doi.org/10.1142/S0218001493000327},
  timestamp = {Mon, 11 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ijprai/Bengio93.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icnn/BengioFS93,
  author       = {Yoshua Bengio and
                  Paolo Frasconi and
                  Patrice Y. Simard},
  title        = {The problem of learning long-term dependencies in recurrent networks},
  booktitle    = {Proceedings of International Conference on Neural Networks (ICNN'93),
                  San Francisco, CA, USA, March 28 - April 1, 1993},
  pages        = {1183--1188},
  publisher    = {{IEEE}},
  year         = {1993},
  url          = {https://doi.org/10.1109/ICNN.1993.298725},
  doi          = {10.1109/ICNN.1993.298725},
  timestamp    = {Wed, 04 Sep 2019 08:33:25 +0200},
  biburl       = {https://dblp.org/rec/conf/icnn/BengioFS93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioF93,
  author    = {Bengio, Yoshua and
               Frasconi, Paolo},
  editor    = {Cowan, Jack D. and
               Tesauro, Gerald and
               Alspector, Joshua},
  title     = {Credit Assignment through Time: Alternatives to Backpropagation},
  booktitle = {Advances in Neural Information Processing Systems 6,
               [7th {NIPS} Conference, Denver, Colorado, USA, 1993]},
  pages     = {75--82},
  publisher = {Morgan Kaufmann},
  year      = {1993},
  url       = {http://papers.nips.cc/paper/724-credit-assignment-through-time-alternatives-to-backpropagation},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/BengioF93.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/BengioCH93,
  author       = {Yoshua Bengio and
                  Yann LeCun and
                  Donnie Henderson},
  editor       = {Jack D. Cowan and
                  Gerald Tesauro and
                  Joshua Alspector},
  title        = {Globally Trained Handwritten Word Recognizer Using Spatial Representation,
                  Convolutional Neural Networks, and Hidden {Markov} Models},
  booktitle    = {Advances in Neural Information Processing Systems 6, [7th {NIPS} Conference,
                  Denver, Colorado, USA, 1993]},
  pages        = {937--944},
  publisher    = {Morgan Kaufmann},
  year         = {1993},
  url          = {http://papers.nips.cc/paper/819-globally-trained-handwritten-word-recognizer-using-spatial-representation-convolutional-neural-networks-and-hidden-markov-models},
  timestamp    = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/BengioCH93.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/prl/BengioMG92,
  author    = {Bengio, Yoshua and
               de Mori, Renato and
               Gori, Marco},
  title     = {Learning the dynamic nature of speech with back-propagation for sequences},
  journal   = {Pattern Recognit. Lett.},
  volume    = {13},
  number    = {5},
  pages     = {375--385},
  year      = {1992},
  doi       = {10.1016/0167-8655(92)90035-X},
  url       = {https://doi.org/10.1016/0167-8655(92)90035-X},
  timestamp = {Sat, 22 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/prl/BengioMG92.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and title as DBLP:conf/interspeech/BengioMFK91 (EUROSPEECH 1991); presumably the journal version of that paper.
@article{DBLP:journals/speech/BengioMFK92,
  author    = {Bengio, Yoshua and
               de Mori, Renato and
               Flammia, Giovanni and
               Kompe, Ralf},
  title     = {Phonetically motivated acoustic parameters for continuous speech
               recognition using artificial neural networks},
  journal   = {Speech Commun.},
  volume    = {11},
  number    = {2-3},
  pages     = {261--271},
  year      = {1992},
  doi       = {10.1016/0167-6393(92)90020-8},
  url       = {https://doi.org/10.1016/0167-6393(92)90020-8},
  timestamp = {Sat, 22 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/speech/BengioMFK92.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tnn/BengioMFK92,
  author       = {Yoshua Bengio and
                  Renato de Mori and
                  Giovanni Flammia and
                  Ralf Kompe},
  title        = {Global optimization of a neural network-hidden {Markov} model hybrid},
  journal      = {{IEEE} Trans. Neural Networks},
  volume       = {3},
  number       = {2},
  pages        = {252--259},
  year         = {1992},
  url          = {https://doi.org/10.1109/72.125866},
  doi          = {10.1109/72.125866},
  timestamp    = {Wed, 14 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tnn/BengioMFK92.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Same authors and title as DBLP:journals/speech/BengioMFK92 (Speech Commun. 1992); presumably the conference version of that article.
@inproceedings{DBLP:conf/interspeech/BengioMFK91,
  author    = {Bengio, Yoshua and
               de Mori, Renato and
               Flammia, Giovanni and
               Kompe, Ralf},
  title     = {Phonetically motivated acoustic parameters for continuous speech
               recognition using artificial neural networks},
  booktitle = {Second European Conference on Speech Communication and
               Technology, {EUROSPEECH} 1991, Genova, Italy, September 24-26, 1991},
  pages     = {551--554},
  publisher = {{ISCA}},
  year      = {1991},
  doi       = {10.21437/EUROSPEECH.1991-137},
  url       = {https://doi.org/10.21437/Eurospeech.1991-137},
  timestamp = {Sun, 02 Jul 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/BengioMFK91.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/BengioMFK91a,
  author    = {Bengio, Yoshua and
               de Mori, Renato and
               Flammia, Giovanni and
               Kompe, Ralf},
  title     = {A comparative study on hybrid acoustic phonetic decoders based
               on artificial neural networks},
  booktitle = {Second European Conference on Speech Communication and
               Technology, {EUROSPEECH} 1991, Genova, Italy, September 24-26, 1991},
  pages     = {1007--1010},
  publisher = {{ISCA}},
  year      = {1991},
  doi       = {10.21437/EUROSPEECH.1991-241},
  url       = {https://doi.org/10.21437/Eurospeech.1991-241},
  timestamp = {Sun, 02 Jul 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/interspeech/BengioMFK91a.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/BengioMFK91,
  author       = {Yoshua Bengio and
                  Renato de Mori and
                  Giovanni Flammia and
                  Ralf Kompe},
  editor       = {John E. Moody and
                  Stephen Jose Hanson and
                  Richard Lippmann},
  title        = {Neural Network - {Gaussian} Mixture Hybrid for Speech Recognition or
                  Density Estimation},
  booktitle    = {Advances in Neural Information Processing Systems 4, {[NIPS} Conference,
                  Denver, Colorado, USA, December 2-5, 1991]},
  pages        = {175--182},
  publisher    = {Morgan Kaufmann},
  year         = {1991},
  url          = {http://papers.nips.cc/paper/521-neural-network-gaussian-mixture-hybrid-for-speech-recognition-or-density-estimation},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BengioMFK91.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/bioinformatics/BengioP90,
  author    = {Bengio, Yoshua and
               Pouliot, Yannick},
  title     = {Efficient recognition of immunoglobulin domains from amino acid
               sequences using a neural network},
  journal   = {Comput. Appl. Biosci.},
  volume    = {6},
  number    = {4},
  pages     = {319--324},
  year      = {1990},
  doi       = {10.1093/BIOINFORMATICS/6.4.319},
  url       = {https://doi.org/10.1093/bioinformatics/6.4.319},
  timestamp = {Fri, 15 May 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/bioinformatics/BengioP90.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/speech/CosiBM90,
  author    = {Cosi, Piero and
               Bengio, Yoshua and
               de Mori, Renato},
  title     = {Phonetically-based multi-layered neural networks for vowel classification},
  journal   = {Speech Commun.},
  volume    = {9},
  number    = {1},
  pages     = {15--29},
  year      = {1990},
  doi       = {10.1016/0167-6393(90)90041-7},
  url       = {https://doi.org/10.1016/0167-6393(90)90041-7},
  timestamp = {Sat, 22 Feb 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/speech/CosiBM90.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/BengioCMN90,
  author       = {Yoshua Bengio and
                  R{\'{e}}gis Cardin and
                  Renato de Mori and
                  Yves Normandin},
  title        = {A hybrid coder for hidden {Markov} models using a recurrent neural network},
  booktitle    = {1990 International Conference on Acoustics, Speech, and Signal Processing,
                  {ICASSP} '90, Albuquerque, New Mexico, USA, April 3-6, 1990},
  pages        = {537--540},
  publisher    = {{IEEE}},
  year         = {1990},
  url          = {https://doi.org/10.1109/ICASSP.1990.115768},
  doi          = {10.1109/ICASSP.1990.115768},
  timestamp    = {Mon, 09 Aug 2021 14:54:02 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BengioCMN90.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/cacm/BengioCMM89,
  author    = {Bengio, Yoshua and
               Cardin, R{\'{e}}gis and
               de Mori, Renato and
               Merlo, Ettore},
  title     = {Programmable Execution of Multi-Layered Networks for Automatic
               Speech Recognition},
  journal   = {Commun. {ACM}},
  volume    = {32},
  number    = {2},
  pages     = {195--199},
  year      = {1989},
  doi       = {10.1145/63342.63345},
  url       = {https://doi.org/10.1145/63342.63345},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/cacm/BengioCMM89.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/BengioCCM89,
  author       = {Yoshua Bengio and
                  R{\'{e}}gis Cardin and
                  Piero Cosi and
                  Renato de Mori},
  title        = {Speech coding with multi-layer networks},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing,
                  {ICASSP} '89, Glasgow, Scotland, May 23-26, 1989},
  pages        = {164--167},
  publisher    = {{IEEE}},
  year         = {1989},
  url          = {https://doi.org/10.1109/ICASSP.1989.266389},
  doi          = {10.1109/ICASSP.1989.266389},
  timestamp    = {Mon, 09 Aug 2021 14:54:02 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BengioCCM89.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/ijcai/MoriBC89,
  author    = {de Mori, Renato and
               Bengio, Yoshua and
               Cosi, Piero},
  editor    = {Sridharan, N. S.},
  title     = {On the Generalization Capability of Multi-Layered Networks in
               the Extraction of Speech Properties},
  booktitle = {Proceedings of the 11th International Joint Conference on
               Artificial Intelligence. Detroit, MI, USA, August 1989},
  pages     = {1531--1536},
  publisher = {Morgan Kaufmann},
  year      = {1989},
  url       = {http://ijcai.org/Proceedings/89-2/Papers/108.pdf},
  timestamp = {Tue, 20 Aug 2019 16:17:51 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcai/MoriBC89.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nato/BengioCCMM89,
  author       = {Yoshua Bengio and
                  R{\'{e}}gis Cardin and
                  Piero Cosi and
                  Renato de Mori and
                  Ettore Merlo},
  editor       = {Fran{\c{c}}oise Fogelman{-}Souli{\'{e}} and
                  Jeanny H{\'{e}}rault},
  title        = {Speech coding with multilayer networks},
  booktitle    = {Neurocomputing - Algorithms, Architectures and Applications, Proceedings
                  of the {NATO} Advanced Research Workshop on Neurocomputing Algorithms,
                  Architectures and Applications, Les Arcs, France, February 27 - March
                  3, 1989},
  series       = {{NATO} {ASI} Series},
  volume       = {68},
  pages        = {207--216},
  publisher    = {Springer},
  year         = {1989},
  url          = {https://doi.org/10.1007/978-3-642-76153-9\_26},
  doi          = {10.1007/978-3-642-76153-9\_26},
  timestamp    = {Sat, 18 Apr 2020 18:05:29 +0200},
  biburl       = {https://dblp.org/rec/conf/nato/BengioCCMM89.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioMC89,
  author    = {Bengio, Yoshua and
               de Mori, Renato and
               Cardin, R{\'{e}}gis},
  editor    = {Touretzky, David S.},
  title     = {Speaker Independent Speech Recognition with Neural Networks and
               Speech Knowledge},
  booktitle = {Advances in Neural Information Processing Systems 2,
               {[NIPS} Conference, Denver, Colorado, USA, November 27-30, 1989]},
  pages     = {218--225},
  publisher = {Morgan Kaufmann},
  year      = {1989},
  url       = {http://papers.nips.cc/paper/273-speaker-independent-speech-recognition-with-neural-networks-and-speech-knowledge},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/BengioMC89.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/BengioBPA89,
  author    = {Bengio, Yoshua and
               Bengio, Samy and
               Pouliot, Yannick and
               Agin, Patrick},
  editor    = {Touretzky, David S.},
  title     = {A Neural Network to Detect Homologies in Proteins},
  booktitle = {Advances in Neural Information Processing Systems 2,
               {[NIPS} Conference, Denver, Colorado, USA, November 27-30, 1989]},
  pages     = {423--430},
  publisher = {Morgan Kaufmann},
  year      = {1989},
  url       = {http://papers.nips.cc/paper/214-a-neural-network-to-detect-homologies-in-proteins},
  timestamp = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/BengioBPA89.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/MoriBC88,
  author    = {de Mori, Renato and
               Bengio, Yoshua and
               Cardin, R{\'{e}}gis},
  editor    = {Shrobe, Howard E. and
               Mitchell, Tom M. and
               Smith, Reid G.},
  title     = {Data-Driven Execution of Multi-Layered Networks for Automatic
               Speech Recognition},
  booktitle = {Proceedings of the 7th National Conference on Artificial
               Intelligence, St. Paul, MN, USA, August 21-26, 1988},
  pages     = {734--738},
  publisher = {{AAAI} Press / The {MIT} Press},
  year      = {1988},
  url       = {http://www.aaai.org/Library/AAAI/1988/aaai88-130.php},
  timestamp = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/MoriBC88.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icassp/BengioM88,
  author       = {Yoshua Bengio and
                  Renato de Mori},
  title        = {Use of neural networks for the recognition of place of articulation},
  booktitle    = {{IEEE} International Conference on Acoustics, Speech, and Signal Processing,
                  {ICASSP} '88, New York, New York, USA, April 11-14, 1988},
  pages        = {103--106},
  publisher    = {{IEEE}},
  year         = {1988},
  url          = {https://doi.org/10.1109/ICASSP.1988.196522},
  doi          = {10.1109/ICASSP.1988.196522},
  timestamp    = {Mon, 09 Aug 2021 14:54:02 +0200},
  biburl       = {https://dblp.org/rec/conf/icassp/BengioM88.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/BengioCMC88,
  author    = {Bengio, Yoshua and
               Cardin, R{\'{e}}gis and
               de Mori, Renato and
               Cosi, Piero},
  editor    = {Touretzky, David S.},
  title     = {Use of Multi-Layered Networks for Coding Speech with Phonetic Features},
  booktitle = {Advances in Neural Information Processing Systems 1,
               {[NIPS} Conference, Denver, Colorado, USA, 1988]},
  pages     = {224--231},
  publisher = {Morgan Kaufmann},
  year      = {1988},
  url       = {http://papers.nips.cc/paper/113-use-of-multi-layered-networks-for-coding-speech-with-phonetic-features},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/BengioCMC88.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics