BibTeX records: Edouard Grave

download as .bib file

@article{DBLP:journals/jmlr/IzacardLLHPSDJRG23,
  author       = {Izacard, Gautier and
                  Lewis, Patrick S. H. and
                  Lomeli, Maria and
                  Hosseini, Lucas and
                  Petroni, Fabio and
                  Schick, Timo and
                  Dwivedi{-}Yu, Jane and
                  Joulin, Armand and
                  Riedel, Sebastian and
                  Grave, Edouard},
  title        = {{Atlas}: Few-shot Learning with Retrieval Augmented Language Models},
  journal      = {Journal of Machine Learning Research},
  volume       = {24},
  pages        = {251:1--251:43},
  year         = {2023},
  url          = {http://jmlr.org/papers/v24/23-0037.html},
  timestamp    = {Thu, 19 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/IzacardLLHPSDJRG23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/natmi/PetroniBPLIHDLSBMJGR23,
  author       = {Petroni, Fabio and
                  Broscheit, Samuel and
                  Piktus, Aleksandra and
                  Lewis, Patrick S. H. and
                  Izacard, Gautier and
                  Hosseini, Lucas and
                  Dwivedi{-}Yu, Jane and
                  Lomeli, Maria and
                  Schick, Timo and
                  Bevilacqua, Michele and
                  Mazar{\'{e}}, Pierre{-}Emmanuel and
                  Joulin, Armand and
                  Grave, Edouard and
                  Riedel, Sebastian},
  title        = {Improving {Wikipedia} Verifiability with {AI}},
  journal      = {Nature Machine Intelligence},
  volume       = {5},
  number       = {10},
  pages        = {1142--1148},
  year         = {2023},
  url          = {https://doi.org/10.1038/s42256-023-00726-1},
  doi          = {10.1038/S42256-023-00726-1},
  timestamp    = {Sat, 13 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/natmi/PetroniBPLIHDLSBMJGR23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pami/TouvronBCCEGIJSVJ23,
  author       = {Touvron, Hugo and
                  Bojanowski, Piotr and
                  Caron, Mathilde and
                  Cord, Matthieu and
                  El{-}Nouby, Alaaeldin and
                  Grave, Edouard and
                  Izacard, Gautier and
                  Joulin, Armand and
                  Synnaeve, Gabriel and
                  Verbeek, Jakob and
                  J{\'{e}}gou, Herv{\'{e}}},
  title        = {{ResMLP}: Feedforward Networks for Image Classification With Data-Efficient
                  Training},
  journal      = {{IEEE} Transactions on Pattern Analysis and Machine Intelligence},
  volume       = {45},
  number       = {4},
  pages        = {5314--5321},
  year         = {2023},
  url          = {https://doi.org/10.1109/TPAMI.2022.3206148},
  doi          = {10.1109/TPAMI.2022.3206148},
  timestamp    = {Tue, 28 Mar 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pami/TouvronBCCEGIJSVJ23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/SchickYJPLIYNG023,
  author       = {Schick, Timo and
                  Yu, Jane A. and
                  Jiang, Zhengbao and
                  Petroni, Fabio and
                  Lewis, Patrick S. H. and
                  Izacard, Gautier and
                  You, Qingfei and
                  Nalmpantis, Christoforos and
                  Grave, Edouard and
                  Riedel, Sebastian},
  title        = {{PEER:} {A} Collaborative Language Model},
  booktitle    = {The Eleventh International Conference on Learning Representations,
                  {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher    = {OpenReview.net},
  year         = {2023},
  url          = {https://openreview.net/pdf?id=KbYevcLjnc},
  timestamp    = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/SchickYJPLIYNG023.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2302-07842,
  author       = {Mialon, Gr{\'{e}}goire and
                  Dess{\`{\i}}, Roberto and
                  Lomeli, Maria and
                  Nalmpantis, Christoforos and
                  Pasunuru, Ramakanth and
                  Raileanu, Roberta and
                  Rozi{\`{e}}re, Baptiste and
                  Schick, Timo and
                  Dwivedi{-}Yu, Jane and
                  Celikyilmaz, Asli and
                  Grave, Edouard and
                  LeCun, Yann and
                  Scialom, Thomas},
  title        = {Augmented Language Models: A Survey},
  journal      = {CoRR},
  volume       = {abs/2302.07842},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.07842},
  doi          = {10.48550/ARXIV.2302.07842},
  eprinttype   = {arXiv},
  eprint       = {2302.07842},
  timestamp    = {Mon, 20 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-07842.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2302-13971,
  author       = {Touvron, Hugo and
                  Lavril, Thibaut and
                  Izacard, Gautier and
                  Martinet, Xavier and
                  Lachaux, Marie{-}Anne and
                  Lacroix, Timoth{\'{e}}e and
                  Rozi{\`{e}}re, Baptiste and
                  Goyal, Naman and
                  Hambro, Eric and
                  Azhar, Faisal and
                  Rodriguez, Aur{\'{e}}lien and
                  Joulin, Armand and
                  Grave, Edouard and
                  Lample, Guillaume},
  title        = {{LLaMA}: Open and Efficient Foundation Language Models},
  journal      = {CoRR},
  volume       = {abs/2302.13971},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.13971},
  doi          = {10.48550/ARXIV.2302.13971},
  eprinttype   = {arXiv},
  eprint       = {2302.13971},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-13971.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2311-13581,
  author       = {Monea, Giovanni and
                  Joulin, Armand and
                  Grave, Edouard},
  title        = {{PaSS}: Parallel Speculative Sampling},
  journal      = {CoRR},
  volume       = {abs/2311.13581},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.13581},
  doi          = {10.48550/ARXIV.2311.13581},
  eprinttype   = {arXiv},
  eprint       = {2311.13581},
  timestamp    = {Thu, 30 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-13581.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tmlr/IzacardCHRBJG22,
  author       = {Izacard, Gautier and
                  Caron, Mathilde and
                  Hosseini, Lucas and
                  Riedel, Sebastian and
                  Bojanowski, Piotr and
                  Joulin, Armand and
                  Grave, Edouard},
  title        = {Unsupervised Dense Information Retrieval with Contrastive Learning},
  journal      = {Transactions on Machine Learning Research},
  volume       = {2022},
  year         = {2022},
  url          = {https://openreview.net/forum?id=jKN1pXi7b0},
  timestamp    = {Fri, 19 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tmlr/IzacardCHRBJG22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/KahnPLXHCT0GASL22,
  author       = {Kahn, Jacob D. and
                  Pratap, Vineel and
                  Likhomanenko, Tatiana and
                  Xu, Qiantong and
                  Hannun, Awni Y. and
                  Cai, Jeff and
                  Tomasello, Paden and
                  Lee, Ann and
                  Grave, Edouard and
                  Avidov, Gilad and
                  Steiner, Benoit and
                  Liptchinsky, Vitaliy and
                  Synnaeve, Gabriel and
                  Collobert, Ronan},
  editor       = {Chaudhuri, Kamalika and
                  Jegelka, Stefanie and
                  Song, Le and
                  Szepesv{\'{a}}ri, Csaba and
                  Niu, Gang and
                  Sabato, Sivan},
  title        = {Flashlight: Enabling Innovation in Tools for Machine Learning},
  booktitle    = {International Conference on Machine Learning, {ICML} 2022, 17-23 July
                  2022, Baltimore, Maryland, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {162},
  pages        = {10557--10574},
  publisher    = {{PMLR}},
  year         = {2022},
  url          = {https://proceedings.mlr.press/v162/kahn22a.html},
  timestamp    = {Tue, 12 Jul 2022 17:36:52 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KahnPLXHCT0GASL22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2201-12465,
  author       = {Kahn, Jacob and
                  Pratap, Vineel and
                  Likhomanenko, Tatiana and
                  Xu, Qiantong and
                  Hannun, Awni Y. and
                  Cai, Jeff and
                  Tomasello, Paden and
                  Lee, Ann and
                  Grave, Edouard and
                  Avidov, Gilad and
                  Steiner, Benoit and
                  Liptchinsky, Vitaliy and
                  Synnaeve, Gabriel and
                  Collobert, Ronan},
  title        = {Flashlight: Enabling Innovation in Tools for Machine Learning},
  journal      = {CoRR},
  volume       = {abs/2201.12465},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.12465},
  eprinttype   = {arXiv},
  eprint       = {2201.12465},
  timestamp    = {Tue, 05 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-12465.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2207-06220,
  author       = {Petroni, Fabio and
                  Broscheit, Samuel and
                  Piktus, Aleksandra and
                  Lewis, Patrick S. H. and
                  Izacard, Gautier and
                  Hosseini, Lucas and
                  Dwivedi{-}Yu, Jane and
                  Lomeli, Maria and
                  Schick, Timo and
                  Mazar{\'{e}}, Pierre{-}Emmanuel and
                  Joulin, Armand and
                  Grave, Edouard and
                  Riedel, Sebastian},
  title        = {Improving {Wikipedia} Verifiability with {AI}},
  journal      = {CoRR},
  volume       = {abs/2207.06220},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2207.06220},
  doi          = {10.48550/ARXIV.2207.06220},
  eprinttype   = {arXiv},
  eprint       = {2207.06220},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2207-06220.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2208-03299,
  author       = {Izacard, Gautier and
                  Lewis, Patrick S. H. and
                  Lomeli, Maria and
                  Hosseini, Lucas and
                  Petroni, Fabio and
                  Schick, Timo and
                  Dwivedi{-}Yu, Jane and
                  Joulin, Armand and
                  Riedel, Sebastian and
                  Grave, Edouard},
  title        = {Few-shot Learning with Retrieval Augmented Language Models},
  journal      = {CoRR},
  volume       = {abs/2208.03299},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.03299},
  doi          = {10.48550/ARXIV.2208.03299},
  eprinttype   = {arXiv},
  eprint       = {2208.03299},
  timestamp    = {Wed, 25 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-03299.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2208-11663,
  author       = {Schick, Timo and
                  Dwivedi{-}Yu, Jane and
                  Jiang, Zhengbao and
                  Petroni, Fabio and
                  Lewis, Patrick S. H. and
                  Izacard, Gautier and
                  You, Qingfei and
                  Nalmpantis, Christoforos and
                  Grave, Edouard and
                  Riedel, Sebastian},
  title        = {{PEER:} {A} Collaborative Language Model},
  journal      = {CoRR},
  volume       = {abs/2208.11663},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.11663},
  doi          = {10.48550/ARXIV.2208.11663},
  eprinttype   = {arXiv},
  eprint       = {2208.11663},
  timestamp    = {Wed, 25 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-11663.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2209-13331,
  author       = {Dwivedi{-}Yu, Jane and
                  Schick, Timo and
                  Jiang, Zhengbao and
                  Lomeli, Maria and
                  Lewis, Patrick S. H. and
                  Izacard, Gautier and
                  Grave, Edouard and
                  Riedel, Sebastian and
                  Petroni, Fabio},
  title        = {{EditEval}: An Instruction-Based Benchmark for Text Improvements},
  journal      = {CoRR},
  volume       = {abs/2209.13331},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.13331},
  doi          = {10.48550/ARXIV.2209.13331},
  eprinttype   = {arXiv},
  eprint       = {2209.13331},
  timestamp    = {Wed, 25 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-13331.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SchwenkWEGJF20,
  author       = {Schwenk, Holger and
                  Wenzek, Guillaume and
                  Edunov, Sergey and
                  Grave, Edouard and
                  Joulin, Armand and
                  Fan, Angela},
  editor       = {Zong, Chengqing and
                  Xia, Fei and
                  Li, Wenjie and
                  Navigli, Roberto},
  title        = {{CCMatrix}: Mining Billions of High-Quality Parallel Sentences on the
                  Web},
  booktitle    = {Proceedings of the 59th Annual Meeting of the Association for Computational
                  Linguistics and the 11th International Joint Conference on Natural
                  Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
                  Event, August 1-6, 2021},
  pages        = {6490--6500},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.acl-long.507},
  doi          = {10.18653/V1/2021.ACL-LONG.507},
  timestamp    = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SchwenkWEGJF20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/eacl/IzacardG21,
  author       = {Izacard, Gautier and
                  Grave, Edouard},
  editor       = {Merlo, Paola and
                  Tiedemann, J{\"{o}}rg and
                  Tsarfaty, Reut},
  title        = {Leveraging Passage Retrieval with Generative Models for Open Domain
                  Question Answering},
  booktitle    = {Proceedings of the 16th Conference of the European Chapter of the
                  Association for Computational Linguistics: Main Volume, {EACL} 2021,
                  Online, April 19 - 23, 2021},
  pages        = {874--880},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.eacl-main.74},
  doi          = {10.18653/V1/2021.EACL-MAIN.74},
  timestamp    = {Thu, 20 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/eacl/IzacardG21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/IzacardG21,
  author       = {Izacard, Gautier and
                  Grave, Edouard},
  title        = {Distilling Knowledge from Reader to Retriever for Question Answering},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=NTEz-6wysdb},
  timestamp    = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/IzacardG21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/StockFGGGJJ21,
  author       = {Stock, Pierre and
                  Fan, Angela and
                  Graham, Benjamin and
                  Grave, Edouard and
                  Gribonval, R{\'{e}}mi and
                  J{\'{e}}gou, Herv{\'{e}} and
                  Joulin, Armand},
  title        = {Training with Quantization Noise for Extreme Model Compression},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=dV19Yyi1fS3},
  timestamp    = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/StockFGGGJJ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/DuGGCCASC21,
  author       = {Du, Jingfei and
                  Grave, Edouard and
                  Gunel, Beliz and
                  Chaudhary, Vishrav and
                  Celebi, Onur and
                  Auli, Michael and
                  Stoyanov, Veselin and
                  Conneau, Alexis},
  editor       = {Toutanova, Kristina and
                  Rumshisky, Anna and
                  Zettlemoyer, Luke and
                  Hakkani{-}T{\"{u}}r, Dilek and
                  Beltagy, Iz and
                  Bethard, Steven and
                  Cotterell, Ryan and
                  Chakraborty, Tanmoy and
                  Zhou, Yichao},
  title        = {Self-training Improves Pre-training for Natural Language Understanding},
  booktitle    = {Proceedings of the 2021 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL-HLT} 2021, Online, June 6-11, 2021},
  pages        = {5408--5418},
  publisher    = {Association for Computational Linguistics},
  year         = {2021},
  url          = {https://doi.org/10.18653/v1/2021.naacl-main.426},
  doi          = {10.18653/V1/2021.NAACL-MAIN.426},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/DuGGCCASC21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2101-00133,
  author       = {Min, Sewon and
                  Boyd{-}Graber, Jordan L. and
                  Alberti, Chris and
                  Chen, Danqi and
                  Choi, Eunsol and
                  Collins, Michael and
                  Guu, Kelvin and
                  Hajishirzi, Hannaneh and
                  Lee, Kenton and
                  Palomaki, Jennimaria and
                  Raffel, Colin and
                  Roberts, Adam and
                  Kwiatkowski, Tom and
                  Lewis, Patrick S. H. and
                  Wu, Yuxiang and
                  K{\"{u}}ttler, Heinrich and
                  Liu, Linqing and
                  Minervini, Pasquale and
                  Stenetorp, Pontus and
                  Riedel, Sebastian and
                  Yang, Sohee and
                  Seo, Minjoon and
                  Izacard, Gautier and
                  Petroni, Fabio and
                  Hosseini, Lucas and
                  De Cao, Nicola and
                  Grave, Edouard and
                  Yamada, Ikuya and
                  Shimaoka, Sonse and
                  Suzuki, Masatoshi and
                  Miyawaki, Shumpei and
                  Sato, Shun and
                  Takahashi, Ryo and
                  Suzuki, Jun and
                  Fajcik, Martin and
                  Docekal, Martin and
                  Ondrej, Karel and
                  Smrz, Pavel and
                  Cheng, Hao and
                  Shen, Yelong and
                  Liu, Xiaodong and
                  He, Pengcheng and
                  Chen, Weizhu and
                  Gao, Jianfeng and
                  Oguz, Barlas and
                  Chen, Xilun and
                  Karpukhin, Vladimir and
                  Peshterliev, Stan and
                  Okhonko, Dmytro and
                  Schlichtkrull, Michael Sejr and
                  Gupta, Sonal and
                  Mehdad, Yashar and
                  Yih, Wen{-}tau},
  title        = {{NeurIPS} 2020 {EfficientQA} Competition: Systems, Analyses and Lessons
                  Learned},
  journal      = {CoRR},
  volume       = {abs/2101.00133},
  year         = {2021},
  url          = {https://arxiv.org/abs/2101.00133},
  eprinttype   = {arXiv},
  eprint       = {2101.00133},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2101-00133.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-03404,
  author       = {Touvron, Hugo and
                  Bojanowski, Piotr and
                  Caron, Mathilde and
                  Cord, Matthieu and
                  El{-}Nouby, Alaaeldin and
                  Grave, Edouard and
                  Joulin, Armand and
                  Synnaeve, Gabriel and
                  Verbeek, Jakob and
                  J{\'{e}}gou, Herv{\'{e}}},
  title        = {{ResMLP}: Feedforward Networks for Image Classification with Data-Efficient
                  Training},
  journal      = {CoRR},
  volume       = {abs/2105.03404},
  year         = {2021},
  url          = {https://arxiv.org/abs/2105.03404},
  eprinttype   = {arXiv},
  eprint       = {2105.03404},
  timestamp    = {Fri, 14 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2105-03404.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-09118,
  author       = {Izacard, Gautier and
                  Caron, Mathilde and
                  Hosseini, Lucas and
                  Riedel, Sebastian and
                  Bojanowski, Piotr and
                  Joulin, Armand and
                  Grave, Edouard},
  title        = {Towards Unsupervised Dense Information Retrieval with Contrastive
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2112.09118},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.09118},
  eprinttype   = {arXiv},
  eprint       = {2112.09118},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-09118.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-09924,
  author       = {Piktus, Aleksandra and
                  Petroni, Fabio and
                  Karpukhin, Vladimir and
                  Okhonko, Dmytro and
                  Broscheit, Samuel and
                  Izacard, Gautier and
                  Lewis, Patrick S. H. and
                  Oguz, Barlas and
                  Grave, Edouard and
                  Yih, Wen{-}tau and
                  Riedel, Sebastian},
  title        = {The Web Is Your Oyster -- Knowledge-Intensive {NLP} against a Very
                  Large Web Corpus},
  journal      = {CoRR},
  volume       = {abs/2112.09924},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.09924},
  eprinttype   = {arXiv},
  eprint       = {2112.09924},
  timestamp    = {Wed, 25 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-09924.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-10740,
  author       = {El{-}Nouby, Alaaeldin and
                  Izacard, Gautier and
                  Touvron, Hugo and
                  Laptev, Ivan and
                  J{\'{e}}gou, Herv{\'{e}} and
                  Grave, Edouard},
  title        = {Are Large-scale Datasets Necessary for Self-Supervised Pre-training?},
  journal      = {CoRR},
  volume       = {abs/2112.10740},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.10740},
  eprinttype   = {arXiv},
  eprint       = {2112.10740},
  timestamp    = {Tue, 04 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-10740.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/ConneauKGCWGGOZ20,
  author       = {Conneau, Alexis and
                  Khandelwal, Kartikay and
                  Goyal, Naman and
                  Chaudhary, Vishrav and
                  Wenzek, Guillaume and
                  Guzm{\'{a}}n, Francisco and
                  Grave, Edouard and
                  Ott, Myle and
                  Zettlemoyer, Luke and
                  Stoyanov, Veselin},
  editor       = {Jurafsky, Dan and
                  Chai, Joyce and
                  Schluter, Natalie and
                  Tetreault, Joel R.},
  title        = {Unsupervised Cross-lingual Representation Learning at Scale},
  booktitle    = {Proceedings of the 58th Annual Meeting of the Association for Computational
                  Linguistics, {ACL} 2020, Online, July 5-10, 2020},
  pages        = {8440--8451},
  publisher    = {Association for Computational Linguistics},
  year         = {2020},
  url          = {https://doi.org/10.18653/v1/2020.acl-main.747},
  doi          = {10.18653/V1/2020.ACL-MAIN.747},
  timestamp    = {Wed, 16 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/ConneauKGCWGGOZ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/ElbayadGGA20,
  author       = {Elbayad, Maha and
                  Gu, Jiatao and
                  Grave, Edouard and
                  Auli, Michael},
  title        = {Depth-Adaptive Transformer},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=SJg7KhVKPH},
  timestamp    = {Thu, 07 May 2020 17:11:47 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ElbayadGGA20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/FanGJ20,
  author       = {Fan, Angela and
                  Grave, Edouard and
                  Joulin, Armand},
  title        = {Reducing Transformer Depth on Demand with Structured Dropout},
  booktitle    = {8th International Conference on Learning Representations, {ICLR} 2020,
                  Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher    = {OpenReview.net},
  year         = {2020},
  url          = {https://openreview.net/forum?id=SylO2yStDr},
  timestamp    = {Thu, 07 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/FanGJ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/WenzekLCCGJG20,
  author       = {Wenzek, Guillaume and
                  Lachaux, Marie{-}Anne and
                  Conneau, Alexis and
                  Chaudhary, Vishrav and
                  Guzm{\'{a}}n, Francisco and
                  Joulin, Armand and
                  Grave, Edouard},
  editor       = {Calzolari, Nicoletta and
                  B{\'{e}}chet, Fr{\'{e}}d{\'{e}}ric and
                  Blache, Philippe and
                  Choukri, Khalid and
                  Cieri, Christopher and
                  Declerck, Thierry and
                  Goggi, Sara and
                  Isahara, Hitoshi and
                  Maegaard, Bente and
                  Mariani, Joseph and
                  Mazo, H{\'{e}}l{\`{e}}ne and
                  Moreno, Asunci{\'{o}}n and
                  Odijk, Jan and
                  Piperidis, Stelios},
  title        = {{CCNet}: Extracting High Quality Monolingual Datasets from Web Crawl
                  Data},
  booktitle    = {Proceedings of The 12th Language Resources and Evaluation Conference,
                  {LREC} 2020, Marseille, France, May 11-16, 2020},
  pages        = {4003--4012},
  publisher    = {European Language Resources Association},
  year         = {2020},
  url          = {https://aclanthology.org/2020.lrec-1.494/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/lrec/WenzekLCCGJG20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/MinBACC0GHLPRRK20,
  author       = {Min, Sewon and
                  Boyd{-}Graber, Jordan L. and
                  Alberti, Chris and
                  Chen, Danqi and
                  Choi, Eunsol and
                  Collins, Michael and
                  Guu, Kelvin and
                  Hajishirzi, Hannaneh and
                  Lee, Kenton and
                  Palomaki, Jennimaria and
                  Raffel, Colin and
                  Roberts, Adam and
                  Kwiatkowski, Tom and
                  Lewis, Patrick S. H. and
                  Wu, Yuxiang and
                  K{\"{u}}ttler, Heinrich and
                  Liu, Linqing and
                  Minervini, Pasquale and
                  Stenetorp, Pontus and
                  Riedel, Sebastian and
                  Yang, Sohee and
                  Seo, Minjoon and
                  Izacard, Gautier and
                  Petroni, Fabio and
                  Hosseini, Lucas and
                  De Cao, Nicola and
                  Grave, Edouard and
                  Yamada, Ikuya and
                  Shimaoka, Sonse and
                  Suzuki, Masatoshi and
                  Miyawaki, Shumpei and
                  Sato, Shun and
                  Takahashi, Ryo and
                  Suzuki, Jun and
                  Fajcik, Martin and
                  Docekal, Martin and
                  Ondrej, Karel and
                  Smrz, Pavel and
                  Cheng, Hao and
                  Shen, Yelong and
                  Liu, Xiaodong and
                  He, Pengcheng and
                  Chen, Weizhu and
                  Gao, Jianfeng and
                  Oguz, Barlas and
                  Chen, Xilun and
                  Karpukhin, Vladimir and
                  Peshterliev, Stan and
                  Okhonko, Dmytro and
                  Schlichtkrull, Michael Sejr and
                  Gupta, Sonal and
                  Mehdad, Yashar and
                  Yih, Wen{-}tau},
  editor       = {Escalante, Hugo Jair and
                  Hofmann, Katja},
  title        = {{NeurIPS} 2020 {EfficientQA} Competition: Systems, Analyses and Lessons
                  Learned},
  booktitle    = {{NeurIPS} 2020 Competition and Demonstration Track, 6-12 December 2020,
                  Virtual Event / Vancouver, BC, Canada},
  series       = {Proceedings of Machine Learning Research},
  volume       = {133},
  pages        = {86--111},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v133/min21a.html},
  timestamp    = {Thu, 11 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/MinBACC0GHLPRRK20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2002-09402,
  author       = {Fan, Angela and
                  Lavril, Thibaut and
                  Grave, Edouard and
                  Joulin, Armand and
                  Sukhbaatar, Sainbayar},
  title        = {Accessing Higher-level Representations in Sequential Transformers
                  with Feedback Memory},
  journal      = {CoRR},
  volume       = {abs/2002.09402},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.09402},
  eprinttype   = {arXiv},
  eprint       = {2002.09402},
  timestamp    = {Mon, 02 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-09402.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-07320,
  author       = {Fan, Angela and
                  Stock, Pierre and
                  Graham, Benjamin and
                  Grave, Edouard and
                  Gribonval, R{\'{e}}mi and
                  J{\'{e}}gou, Herv{\'{e}} and
                  Joulin, Armand},
  title        = {Training with Quantization Noise for Extreme Model Compression},
  journal      = {CoRR},
  volume       = {abs/2004.07320},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.07320},
  eprinttype   = {arXiv},
  eprint       = {2004.07320},
  timestamp    = {Wed, 22 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-07320.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-01282,
  author       = {Izacard, Gautier and
                  Grave, Edouard},
  title        = {Leveraging Passage Retrieval with Generative Models for Open Domain
                  Question Answering},
  journal      = {CoRR},
  volume       = {abs/2007.01282},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.01282},
  eprinttype   = {arXiv},
  eprint       = {2007.01282},
  timestamp    = {Mon, 06 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-01282.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-02194,
  author       = {Du, Jingfei and
                  Grave, Edouard and
                  Gunel, Beliz and
                  Chaudhary, Vishrav and
                  Celebi, Onur and
                  Auli, Michael and
                  Stoyanov, Ves and
                  Conneau, Alexis},
  title        = {Self-training Improves Pre-training for Natural Language Understanding},
  journal      = {CoRR},
  volume       = {abs/2010.02194},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.02194},
  eprinttype   = {arXiv},
  eprint       = {2010.02194},
  timestamp    = {Mon, 12 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-02194.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2010-11125,
  author       = {Fan, Angela and
                  Bhosale, Shruti and
                  Schwenk, Holger and
                  Ma, Zhiyi and
                  El{-}Kishky, Ahmed and
                  Goyal, Siddharth and
                  Baines, Mandeep and
                  Celebi, Onur and
                  Wenzek, Guillaume and
                  Chaudhary, Vishrav and
                  Goyal, Naman and
                  Birch, Tom and
                  Liptchinsky, Vitaliy and
                  Edunov, Sergey and
                  Grave, Edouard and
                  Auli, Michael and
                  Joulin, Armand},
  title        = {Beyond {English}-Centric Multilingual Machine Translation},
  journal      = {CoRR},
  volume       = {abs/2010.11125},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.11125},
  eprinttype   = {arXiv},
  eprint       = {2010.11125},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-11125.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-04584,
  author       = {Izacard, Gautier and
                  Grave, Edouard},
  title        = {Distilling Knowledge from Reader to Retriever for Question Answering},
  journal      = {CoRR},
  volume       = {abs/2012.04584},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.04584},
  eprinttype   = {arXiv},
  eprint       = {2012.04584},
  timestamp    = {Wed, 09 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-04584.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-15156,
  author       = {Izacard, Gautier and
                  Petroni, Fabio and
                  Hosseini, Lucas and
                  De Cao, Nicola and
                  Riedel, Sebastian and
                  Grave, Edouard},
  title        = {A Memory Efficient Baseline for Open Domain Question Answering},
  journal      = {CoRR},
  volume       = {abs/2012.15156},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.15156},
  eprinttype   = {arXiv},
  eprint       = {2012.15156},
  timestamp    = {Fri, 08 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-15156.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/SukhbaatarGBJ19,
  author       = {Sukhbaatar, Sainbayar and
                  Grave, Edouard and
                  Bojanowski, Piotr and
                  Joulin, Armand},
  editor       = {Korhonen, Anna and
                  Traum, David R. and
                  M{\`{a}}rquez, Llu{\'{\i}}s},
  title        = {Adaptive Attention Span in Transformers},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {331--335},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1032},
  doi          = {10.18653/V1/P19-1032},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/SukhbaatarGBJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/GraveSBJ19,
  author       = {Grave, Edouard and
                  Sukhbaatar, Sainbayar and
                  Bojanowski, Piotr and
                  Joulin, Armand},
  editor       = {Korhonen, Anna and
                  Traum, David R. and
                  M{\`{a}}rquez, Llu{\'{\i}}s},
  title        = {Training Hybrid Language Models by Marginalizing over Segmentations},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {1477--1482},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1143},
  doi          = {10.18653/V1/P19-1143},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/GraveSBJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acl/WangHXPMPKTHYJC19,
  author       = {Wang, Alex and
                  Hula, Jan and
                  Xia, Patrick and
                  Pappagari, Raghavendra and
                  McCoy, R. Thomas and
                  Patel, Roma and
                  Kim, Najoung and
                  Tenney, Ian and
                  Huang, Yinghui and
                  Yu, Katherin and
                  Jin, Shuning and
                  Chen, Berlin and
                  Van Durme, Benjamin and
                  Grave, Edouard and
                  Pavlick, Ellie and
                  Bowman, Samuel R.},
  editor       = {Korhonen, Anna and
                  Traum, David R. and
                  M{\`{a}}rquez, Llu{\'{\i}}s},
  title        = {Can You Tell Me How to Get Past {Sesame Street}? {Sentence}-Level
                  Pretraining Beyond Language Modeling},
  booktitle    = {Proceedings of the 57th Conference of the Association for Computational
                  Linguistics, {ACL} 2019, Florence, Italy, July 28 - August 2, 2019,
                  Volume 1: Long Papers},
  pages        = {4465--4476},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/p19-1439},
  doi          = {10.18653/V1/P19-1439},
  timestamp    = {Thu, 23 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/acl/WangHXPMPKTHYJC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/GraveJB19,
  author       = {Grave, Edouard and
                  Joulin, Armand and
                  Berthet, Quentin},
  editor       = {Chaudhuri, Kamalika and
                  Sugiyama, Masashi},
  title        = {Unsupervised Alignment of Embeddings with {Wasserstein} {Procrustes}},
  booktitle    = {The 22nd International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2019, 16-18 April 2019, Naha, Okinawa, Japan},
  series       = {Proceedings of Machine Learning Research},
  volume       = {89},
  pages        = {1880--1890},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {https://proceedings.mlr.press/v89/grave19a.html},
  timestamp    = {Fri, 07 Jun 2019 09:03:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aistats/GraveJB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/CzarnowskaRGCC19,
  author       = {Czarnowska, Paula and
                  Ruder, Sebastian and
                  Grave, Edouard and
                  Cotterell, Ryan and
                  Copestake, Ann A.},
  editor       = {Inui, Kentaro and
                  Jiang, Jing and
                  Ng, Vincent and
                  Wan, Xiaojun},
  title        = {Don't Forget the Long Tail! {A} Comprehensive Analysis of Morphological
                  Generalization in Bilingual Lexicon Induction},
  booktitle    = {Proceedings of the 2019 Conference on Empirical Methods in Natural
                  Language Processing and the 9th International Joint Conference on
                  Natural Language Processing, {EMNLP-IJCNLP} 2019, Hong Kong, China,
                  November 3-7, 2019},
  pages        = {974--983},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/D19-1090},
  doi          = {10.18653/V1/D19-1090},
  timestamp    = {Thu, 07 Apr 2022 09:14:07 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/CzarnowskaRGCC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/AlauxGCJ19,
  author       = {Alaux, Jean and
                  Grave, Edouard and
                  Cuturi, Marco and
                  Joulin, Armand},
  title        = {Unsupervised Hyper-alignment for Multilingual Word Embeddings},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=HJe62s09tX},
  timestamp    = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/AlauxGCJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/EdizelPBFGS19,
  author       = {Edizel, Bora and
                  Piktus, Aleksandra and
                  Bojanowski, Piotr and
                  Ferreira, Rui and
                  Grave, Edouard and
                  Silvestri, Fabrizio},
  editor       = {Burstein, Jill and
                  Doran, Christy and
                  Solorio, Thamar},
  title        = {Misspelling Oblivious Word Embeddings},
  booktitle    = {Proceedings of the 2019 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL-HLT} 2019, Minneapolis, MN, USA, June 2-7, 2019, Volume 1 (Long
                  and Short Papers)},
  pages        = {3226--3234},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/n19-1326},
  doi          = {10.18653/V1/N19-1326},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/EdizelPBFGS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-07799,
  author       = {Sukhbaatar, Sainbayar and
                  Grave, Edouard and
                  Bojanowski, Piotr and
                  Joulin, Armand},
  title        = {Adaptive Attention Span in Transformers},
  journal      = {CoRR},
  volume       = {abs/1905.07799},
  year         = {2019},
  url          = {https://arxiv.org/abs/1905.07799},
  eprinttype   = {arXiv},
  eprint       = {1905.07799},
  timestamp    = {Tue, 28 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-07799.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1905-09755,
  author       = {Edizel, Bora and
                  Piktus, Aleksandra and
                  Bojanowski, Piotr and
                  Ferreira, Rui and
                  Grave, Edouard and
                  Silvestri, Fabrizio},
  title        = {Misspelling Oblivious Word Embeddings},
  journal      = {CoRR},
  volume       = {abs/1905.09755},
  year         = {2019},
  url          = {https://arxiv.org/abs/1905.09755},
  eprinttype   = {arXiv},
  eprint       = {1905.09755},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-09755.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1907-01470,
  author       = {Sukhbaatar, Sainbayar and
                  Grave, Edouard and
                  Lample, Guillaume and
                  J{\'{e}}gou, Herv{\'{e}} and
                  Joulin, Armand},
  title        = {Augmenting Self-attention with Persistent Memory},
  journal      = {CoRR},
  volume       = {abs/1907.01470},
  year         = {2019},
  url          = {https://arxiv.org/abs/1907.01470},
  eprinttype   = {arXiv},
  eprint       = {1907.01470},
  timestamp    = {Wed, 24 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1907-01470.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-02855,
  author       = {Czarnowska, Paula and
                  Ruder, Sebastian and
                  Grave, Edouard and
                  Cotterell, Ryan and
                  Copestake, Ann A.},
  title        = {Don't Forget the Long Tail! {A} Comprehensive Analysis of Morphological
                  Generalization in Bilingual Lexicon Induction},
  journal      = {CoRR},
  volume       = {abs/1909.02855},
  year         = {2019},
  url          = {https://arxiv.org/abs/1909.02855},
  eprinttype   = {arXiv},
  eprint       = {1909.02855},
  timestamp    = {Mon, 16 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-02855.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1909-11556,
  author       = {Fan, Angela and
                  Grave, Edouard and
                  Joulin, Armand},
  title        = {Reducing Transformer Depth on Demand with Structured Dropout},
  journal      = {CoRR},
  volume       = {abs/1909.11556},
  year         = {2019},
  url          = {https://arxiv.org/abs/1909.11556},
  eprinttype   = {arXiv},
  eprint       = {1909.11556},
  timestamp    = {Fri, 27 Sep 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1909-11556.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-06241,
  author       = {Bojanowski, Piotr and
                  Celebi, Onur and
                  Mikolov, Tom{\'{a}}s and
                  Grave, Edouard and
                  Joulin, Armand},
  title        = {Updating Pre-trained Word Vectors and Text Classifiers using Monolingual
                  Alignment},
  journal      = {CoRR},
  volume       = {abs/1910.06241},
  year         = {2019},
  url          = {https://arxiv.org/abs/1910.06241},
  eprinttype   = {arXiv},
  eprint       = {1910.06241},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-06241.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-10073,
  author       = {Elbayad, Maha and
                  Gu, Jiatao and
                  Grave, Edouard and
                  Auli, Michael},
  title        = {Depth-Adaptive Transformer},
  journal      = {CoRR},
  volume       = {abs/1910.10073},
  year         = {2019},
  url          = {https://arxiv.org/abs/1910.10073},
  eprinttype   = {arXiv},
  eprint       = {1910.10073},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-10073.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1911-00359,
  author       = {Wenzek, Guillaume and
                  Lachaux, Marie{-}Anne and
                  Conneau, Alexis and
                  Chaudhary, Vishrav and
                  Guzm{\'{a}}n, Francisco and
                  Joulin, Armand and
                  Grave, Edouard},
  title        = {{CCNet}: Extracting High Quality Monolingual Datasets from Web Crawl
                  Data},
  journal      = {CoRR},
  volume       = {abs/1911.00359},
  year         = {2019},
  url          = {https://arxiv.org/abs/1911.00359},
  eprinttype   = {arXiv},
  eprint       = {1911.00359},
  timestamp    = {Mon, 11 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-00359.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1911-02116,
  author       = {Conneau, Alexis and
                  Khandelwal, Kartikay and
                  Goyal, Naman and
                  Chaudhary, Vishrav and
                  Wenzek, Guillaume and
                  Guzm{\'{a}}n, Francisco and
                  Grave, Edouard and
                  Ott, Myle and
                  Zettlemoyer, Luke and
                  Stoyanov, Veselin},
  title        = {Unsupervised Cross-lingual Representation Learning at Scale},
  journal      = {CoRR},
  volume       = {abs/1911.02116},
  year         = {2019},
  url          = {https://arxiv.org/abs/1911.02116},
  eprinttype   = {arXiv},
  eprint       = {1911.02116},
  timestamp    = {Mon, 11 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-02116.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1911-04944,
  author       = {Schwenk, Holger and
                  Wenzek, Guillaume and
                  Edunov, Sergey and
                  Grave, Edouard and
                  Joulin, Armand},
  title        = {{CCMatrix}: Mining Billions of High-Quality Parallel Sentences on the
                  {WEB}},
  journal      = {CoRR},
  volume       = {abs/1911.04944},
  year         = {2019},
  url          = {https://arxiv.org/abs/1911.04944},
  eprinttype   = {arXiv},
  eprint       = {1911.04944},
  timestamp    = {Mon, 02 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-04944.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1911-08460,
  author       = {Synnaeve, Gabriel and
                  Xu, Qiantong and
                  Kahn, Jacob and
                  Grave, Edouard and
                  Likhomanenko, Tatiana and
                  Pratap, Vineel and
                  Sriram, Anuroop and
                  Liptchinsky, Vitaliy and
                  Collobert, Ronan},
  title        = {End-to-end {ASR}: from Supervised to Semi-Supervised Learning with
                  Modern Architectures},
  journal      = {CoRR},
  volume       = {abs/1911.08460},
  year         = {2019},
  url          = {https://arxiv.org/abs/1911.08460},
  eprinttype   = {arXiv},
  eprint       = {1911.08460},
  timestamp    = {Tue, 03 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-08460.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/KielaGJM18,
  author       = {Kiela, Douwe and
                  Grave, Edouard and
                  Joulin, Armand and
                  Mikolov, Tom{\'{a}}s},
  editor       = {McIlraith, Sheila A. and
                  Weinberger, Kilian Q.},
  title        = {Efficient Large-Scale Multi-Modal Classification},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  (AAAI-18), the 30th Innovative Applications of Artificial Intelligence
                  (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {5198--5204},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11945},
  doi          = {10.1609/AAAI.V32I1.11945},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/KielaGJM18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/JoulinBMJG18,
  author       = {Joulin, Armand and
                  Bojanowski, Piotr and
                  Mikolov, Tom{\'{a}}s and
                  J{\'{e}}gou, Herv{\'{e}} and
                  Grave, Edouard},
  editor       = {Riloff, Ellen and
                  Chiang, David and
                  Hockenmaier, Julia and
                  Tsujii, Jun'ichi},
  title        = {Loss in Translation: Learning Bilingual Word Mapping with a Retrieval
                  Criterion},
  booktitle    = {Proceedings of the 2018 Conference on Empirical Methods in Natural
                  Language Processing, Brussels, Belgium, October 31 - November 4, 2018},
  pages        = {2979--2984},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/d18-1330},
  doi          = {10.18653/V1/D18-1330},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/JoulinBMJG18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/GraveBGJM18,
  author       = {Grave, Edouard and
                  Bojanowski, Piotr and
                  Gupta, Prakhar and
                  Joulin, Armand and
                  Mikolov, Tom{\'{a}}s},
  editor       = {Calzolari, Nicoletta and
                  Choukri, Khalid and
                  Cieri, Christopher and
                  Declerck, Thierry and
                  Goggi, Sara and
                  Hasida, K{\^{o}}iti and
                  Isahara, Hitoshi and
                  Maegaard, Bente and
                  Mariani, Joseph and
                  Mazo, H{\'{e}}l{\`{e}}ne and
                  Moreno, Asunci{\'{o}}n and
                  Odijk, Jan and
                  Piperidis, Stelios and
                  Tokunaga, Takenobu},
  title        = {Learning Word Vectors for 157 Languages},
  booktitle    = {Proceedings of the Eleventh International Conference on Language Resources
                  and Evaluation, {LREC} 2018, Miyazaki, Japan, May 7-12, 2018},
  publisher    = {European Language Resources Association {(ELRA)}},
  year         = {2018},
  url          = {http://www.lrec-conf.org/proceedings/lrec2018/summaries/627.html},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/lrec/GraveBGJM18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/lrec/MikolovGBPJ18,
  author       = {Mikolov, Tom{\'{a}}s and
                  Grave, Edouard and
                  Bojanowski, Piotr and
                  Puhrsch, Christian and
                  Joulin, Armand},
  editor       = {Calzolari, Nicoletta and
                  Choukri, Khalid and
                  Cieri, Christopher and
                  Declerck, Thierry and
                  Goggi, Sara and
                  Hasida, K{\^{o}}iti and
                  Isahara, Hitoshi and
                  Maegaard, Bente and
                  Mariani, Joseph and
                  Mazo, H{\'{e}}l{\`{e}}ne and
                  Moreno, Asunci{\'{o}}n and
                  Odijk, Jan and
                  Piperidis, Stelios and
                  Tokunaga, Takenobu},
  title        = {Advances in Pre-Training Distributed Word Representations},
  booktitle    = {Proceedings of the Eleventh International Conference on Language Resources
                  and Evaluation, {LREC} 2018, Miyazaki, Japan, May 7-12, 2018},
  publisher    = {European Language Resources Association {(ELRA)}},
  year         = {2018},
  url          = {http://www.lrec-conf.org/proceedings/lrec2018/summaries/721.html},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/lrec/MikolovGBPJ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/GulordavaBGLB18,
  author       = {Gulordava, Kristina and
                  Bojanowski, Piotr and
                  Grave, Edouard and
                  Linzen, Tal and
                  Baroni, Marco},
  editor       = {Walker, Marilyn A. and
                  Ji, Heng and
                  Stent, Amanda},
  title        = {Colorless Green Recurrent Networks Dream Hierarchically},
  booktitle    = {Proceedings of the 2018 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL-HLT} 2018, New Orleans, Louisiana, USA, June 1-6, 2018, Volume
                  1 (Long Papers)},
  pages        = {1195--1205},
  publisher    = {Association for Computational Linguistics},
  year         = {2018},
  url          = {https://doi.org/10.18653/v1/n18-1108},
  doi          = {10.18653/V1/N18-1108},
  timestamp    = {Mon, 26 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/GulordavaBGLB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-02892,
  author       = {Kiela, Douwe and
                  Grave, Edouard and
                  Joulin, Armand and
                  Mikolov, Tom{\'{a}}s},
  title        = {Efficient Large-Scale Multi-Modal Classification},
  journal      = {CoRR},
  volume       = {abs/1802.02892},
  year         = {2018},
  url          = {https://arxiv.org/abs/1802.02892},
  eprinttype   = {arXiv},
  eprint       = {1802.02892},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-02892.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1802-06893,
  author       = {Grave, Edouard and
                  Bojanowski, Piotr and
                  Gupta, Prakhar and
                  Joulin, Armand and
                  Mikolov, Tom{\'{a}}s},
  title        = {Learning Word Vectors for 157 Languages},
  journal      = {CoRR},
  volume       = {abs/1802.06893},
  year         = {2018},
  url          = {https://arxiv.org/abs/1802.06893},
  eprinttype   = {arXiv},
  eprint       = {1802.06893},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1802-06893.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1803-11138,
  author       = {Gulordava, Kristina and
                  Bojanowski, Piotr and
                  Grave, Edouard and
                  Linzen, Tal and
                  Baroni, Marco},
  title        = {Colorless green recurrent networks dream hierarchically},
  journal      = {CoRR},
  volume       = {abs/1803.11138},
  year         = {2018},
  url          = {https://arxiv.org/abs/1803.11138},
  eprinttype   = {arXiv},
  eprint       = {1803.11138},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1803-11138.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-07705,
  author       = {Bakhtin, Anton and
                  Szlam, Arthur and
                  Ranzato, Marc'Aurelio and
                  Grave, Edouard},
  title        = {Lightweight Adaptive Mixture of Neural and N-gram Language Models},
  journal      = {CoRR},
  volume       = {abs/1804.07705},
  year         = {2018},
  url          = {https://arxiv.org/abs/1804.07705},
  eprinttype   = {arXiv},
  eprint       = {1804.07705},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-07705.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1804-07745,
  author       = {Joulin, Armand and
                  Bojanowski, Piotr and
                  Mikolov, Tom{\'{a}}s and
                  Grave, Edouard},
  title        = {Improving Supervised Bilingual Mapping of Word Embeddings},
  journal      = {CoRR},
  volume       = {abs/1804.07745},
  year         = {2018},
  url          = {https://arxiv.org/abs/1804.07745},
  eprinttype   = {arXiv},
  eprint       = {1804.07745},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1804-07745.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1805-11222,
  author       = {Grave, Edouard and
                  Joulin, Armand and
                  Berthet, Quentin},
  title        = {Unsupervised Alignment of Embeddings with {Wasserstein} {Procrustes}},
  journal      = {CoRR},
  volume       = {abs/1805.11222},
  year         = {2018},
  url          = {https://arxiv.org/abs/1805.11222},
  eprinttype   = {arXiv},
  eprint       = {1805.11222},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1805-11222.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-01124,
  author       = {Alaux, Jean and
                  Grave, Edouard and
                  Cuturi, Marco and
                  Joulin, Armand},
  title        = {Unsupervised Hyperalignment for Multilingual Word Embeddings},
  journal      = {CoRR},
  volume       = {abs/1811.01124},
  year         = {2018},
  url          = {https://arxiv.org/abs/1811.01124},
  eprinttype   = {arXiv},
  eprint       = {1811.01124},
  timestamp    = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-01124.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1812.10860 (2018).
% {Van Durme} is braced so BibTeX treats the two-word surname as one unit
% (unbraced, "First Last" parsing would take only "Durme" as the last name).
% {ELMo} is braced so sentence-casing styles keep its mixed capitalisation.
@article{DBLP:journals/corr/abs-1812-10860,
  author       = {Samuel R. Bowman and
                  Ellie Pavlick and
                  Edouard Grave and
                  Benjamin {Van Durme} and
                  Alex Wang and
                  Jan Hula and
                  Patrick Xia and
                  Raghavendra Pappagari and
                  R. Thomas McCoy and
                  Roma Patel and
                  Najoung Kim and
                  Ian Tenney and
                  Yinghui Huang and
                  Katherin Yu and
                  Shuning Jin and
                  Berlin Chen},
  title        = {Looking for {ELMo}'s friends: Sentence-Level Pretraining Beyond Language
                  Modeling},
  journal      = {CoRR},
  volume       = {abs/1812.10860},
  year         = {2018},
  url          = {http://arxiv.org/abs/1812.10860},
  eprinttype   = {arXiv},
  eprint       = {1812.10860},
  timestamp    = {Thu, 23 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1812-10860.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (J. Biomed. Informatics 69, 2017); the file also holds a CoRR
% record with the same wording of the title: DBLP:journals/corr/ZhangGSE16.
@article{DBLP:journals/jbi/ZhangGSE17,
  author       = {Shaodian Zhang and Edouard Grave and
                  Elizabeth Sklar and No{\'{e}}mie Elhadad},
  title        = {Longitudinal analysis of discussion topics in an online breast cancer community
                  using convolutional neural networks},
  journal      = {J. Biomed. Informatics},
  volume       = {69},
  pages        = {1--9},
  year         = {2017},
  url          = {https://doi.org/10.1016/j.jbi.2017.03.012},
  doi          = {10.1016/J.JBI.2017.03.012},
  timestamp    = {Fri, 21 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/jbi/ZhangGSE17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (TACL 5, 2017).
% The underscores in url/doi are stored unescaped: these fields are typeset
% verbatim (biblatex, \url), where a backslash-escaped underscore would end up
% literally in the link and break DOI resolution.
@article{DBLP:journals/tacl/BojanowskiGJM17,
  author       = {Piotr Bojanowski and
                  Edouard Grave and
                  Armand Joulin and
                  Tom{\'{a}}s Mikolov},
  title        = {Enriching Word Vectors with Subword Information},
  journal      = {Trans. Assoc. Comput. Linguistics},
  volume       = {5},
  pages        = {135--146},
  year         = {2017},
  url          = {https://doi.org/10.1162/tacl_a_00051},
  doi          = {10.1162/TACL_A_00051},
  timestamp    = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tacl/BojanowskiGJM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper (2017); the file also holds a CoRR record with the same title
% and authors: DBLP:journals/corr/abs-1710-10881.
@inproceedings{DBLP:conf/akbc/JoulinGBNM17,
  author       = {Armand Joulin and Edouard Grave and Piotr Bojanowski and
                  Maximilian Nickel and Tom{\'{a}}s Mikolov},
  title        = {Fast Linear Model for Knowledge Graph Embeddings},
  booktitle    = {6th Workshop on Automated Knowledge Base Construction, AKBC@NIPS 2017, Long Beach,
                  California, USA, December 8, 2017},
  publisher    = {OpenReview.net},
  year         = {2017},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/akbc/JoulinGBNM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EACL 2017 paper (Volume 2: Short Papers); the file also holds a CoRR record with
% the same title and authors: DBLP:journals/corr/JoulinGBM16.
@inproceedings{DBLP:conf/eacl/GraveMJB17,
  author       = {Armand Joulin and Edouard Grave and
                  Piotr Bojanowski and Tom{\'{a}}s Mikolov},
  editor       = {Mirella Lapata and Phil Blunsom and Alexander Koller},
  title        = {Bag of Tricks for Efficient Text Classification},
  booktitle    = {Proceedings of the 15th Conference of the European Chapter of the Association
                  for Computational Linguistics, {EACL} 2017, Valencia, Spain, April 3-7, 2017,
                  Volume 2: Short Papers},
  pages        = {427--431},
  publisher    = {Association for Computational Linguistics},
  year         = {2017},
  url          = {https://doi.org/10.18653/v1/e17-2068},
  doi          = {10.18653/V1/E17-2068},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/eacl/GraveMJB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 paper; the file also holds a CoRR record with the same title and
% authors: DBLP:journals/corr/GraveJU16.
@inproceedings{DBLP:conf/iclr/GraveJU17,
  author       = {Edouard Grave and Armand Joulin and Nicolas Usunier},
  title        = {Improving Neural Language Models with a Continuous Cache},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon,
                  France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=B184E5qee},
  timestamp    = {Thu, 25 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/GraveJU17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2017 paper; the file also holds a CoRR record with the same title and
% authors: DBLP:journals/corr/JerniteGJM16.
@inproceedings{DBLP:conf/iclr/JerniteGJM17,
  author       = {Yacine Jernite and Edouard Grave and
                  Armand Joulin and Tom{\'{a}}s Mikolov},
  title        = {Variable Computation in Recurrent Neural Networks},
  booktitle    = {5th International Conference on Learning Representations, {ICLR} 2017, Toulon,
                  France, April 24-26, 2017, Conference Track Proceedings},
  publisher    = {OpenReview.net},
  year         = {2017},
  url          = {https://openreview.net/forum?id=S1LVSrcge},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iclr/JerniteGJM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2017 paper (PMLR 70). {Parseval} is braced so the proper noun stays
% capitalised under styles that sentence-case titles.
@inproceedings{DBLP:conf/icml/CisseBGDU17,
  author       = {Moustapha Ciss{\'{e}} and
                  Piotr Bojanowski and
                  Edouard Grave and
                  Yann N. Dauphin and
                  Nicolas Usunier},
  editor       = {Doina Precup and
                  Yee Whye Teh},
  title        = {{Parseval} Networks: Improving Robustness to Adversarial Examples},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {854--863},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {http://proceedings.mlr.press/v70/cisse17a.html},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/CisseBGDU17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2017 paper (PMLR 70). {GPUs} is braced so the acronym is not lowercased
% by styles that sentence-case titles.
@inproceedings{DBLP:conf/icml/GraveJCGJ17,
  author       = {Edouard Grave and
                  Armand Joulin and
                  Moustapha Ciss{\'{e}} and
                  David Grangier and
                  Herv{\'{e}} J{\'{e}}gou},
  editor       = {Doina Precup and
                  Yee Whye Teh},
  title        = {Efficient softmax approximation for {GPUs}},
  booktitle    = {Proceedings of the 34th International Conference on Machine Learning,
                  {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series       = {Proceedings of Machine Learning Research},
  volume       = {70},
  pages        = {1302--1310},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {http://proceedings.mlr.press/v70/grave17a.html},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/GraveJCGJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS (NIPS) 2017 paper; the file also holds a CoRR record with the same title
% and authors: DBLP:journals/corr/abs-1711-02604.
@inproceedings{DBLP:conf/nips/GraveCJ17,
  author       = {Edouard Grave and Moustapha Ciss{\'{e}} and Armand Joulin},
  editor       = {Isabelle Guyon and Ulrike von Luxburg and Samy Bengio and
                  Hanna M. Wallach and Rob Fergus and S. V. N. Vishwanathan and
                  Roman Garnett},
  title        = {Unbounded cache model for online language modeling with open vocabulary},
  booktitle    = {Advances in Neural Information Processing Systems 30: Annual Conference on
                  Neural Information Processing Systems 2017, December 4-9, 2017, Long Beach,
                  CA, {USA}},
  pages        = {6042--6052},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/f44ee263952e65b3610b8ba51229d1f9-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/GraveCJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1704.08847 (2017). {Parseval} is braced so the proper noun
% stays capitalised under styles that sentence-case titles.
@article{DBLP:journals/corr/CisseBGDU17,
  author       = {Moustapha Ciss{\'{e}} and
                  Piotr Bojanowski and
                  Edouard Grave and
                  Yann N. Dauphin and
                  Nicolas Usunier},
  title        = {{Parseval} Networks: Improving Robustness to Adversarial Examples},
  journal      = {CoRR},
  volume       = {abs/1704.08847},
  year         = {2017},
  url          = {http://arxiv.org/abs/1704.08847},
  eprinttype   = {arXiv},
  eprint       = {1704.08847},
  timestamp    = {Mon, 22 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/CisseBGDU17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1710.10881 (2017); same title and authors as
% DBLP:conf/akbc/JoulinGBNM17.
@article{DBLP:journals/corr/abs-1710-10881,
  author       = {Armand Joulin and Edouard Grave and Piotr Bojanowski and
                  Maximilian Nickel and Tom{\'{a}}s Mikolov},
  title        = {Fast Linear Model for Knowledge Graph Embeddings},
  journal      = {CoRR},
  volume       = {abs/1710.10881},
  year         = {2017},
  url          = {http://arxiv.org/abs/1710.10881},
  eprinttype   = {arXiv},
  eprint       = {1710.10881},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1710-10881.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1711.02604 (2017); same title and authors as
% DBLP:conf/nips/GraveCJ17.
@article{DBLP:journals/corr/abs-1711-02604,
  author       = {Edouard Grave and Moustapha Ciss{\'{e}} and Armand Joulin},
  title        = {Unbounded cache model for online language modeling with open vocabulary},
  journal      = {CoRR},
  volume       = {abs/1711.02604},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.02604},
  eprinttype   = {arXiv},
  eprint       = {1711.02604},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-02604.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1712.09405 (2017).
@article{DBLP:journals/corr/abs-1712-09405,
  author       = {Tom{\'{a}}s Mikolov and Edouard Grave and Piotr Bojanowski and
                  Christian Puhrsch and Armand Joulin},
  title        = {Advances in Pre-Training Distributed Word Representations},
  journal      = {CoRR},
  volume       = {abs/1712.09405},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.09405},
  eprinttype   = {arXiv},
  eprint       = {1712.09405},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-09405.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1603.08458 (2016).
% The last author's given name carries its accent, matching the spelling used
% for the same person in the other entries of this file.
@article{DBLP:journals/corr/ZhangGSE16,
  author       = {Shaodian Zhang and
                  Edouard Grave and
                  Elizabeth Sklar and
                  No{\'{e}}mie Elhadad},
  title        = {Longitudinal Analysis of Discussion Topics in an Online Breast Cancer
                  Community using Convolutional Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1603.08458},
  year         = {2016},
  url          = {http://arxiv.org/abs/1603.08458},
  eprinttype   = {arXiv},
  eprint       = {1603.08458},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/ZhangGSE16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1607.01759 (2016); same title and authors as
% DBLP:conf/eacl/GraveMJB17.
@article{DBLP:journals/corr/JoulinGBM16,
  author       = {Armand Joulin and Edouard Grave and
                  Piotr Bojanowski and Tom{\'{a}}s Mikolov},
  title        = {Bag of Tricks for Efficient Text Classification},
  journal      = {CoRR},
  volume       = {abs/1607.01759},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.01759},
  eprinttype   = {arXiv},
  eprint       = {1607.01759},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/JoulinGBM16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1607.04606 (2016); same title and authors as
% DBLP:journals/tacl/BojanowskiGJM17.
@article{DBLP:journals/corr/BojanowskiGJM16,
  author       = {Piotr Bojanowski and Edouard Grave and
                  Armand Joulin and Tom{\'{a}}s Mikolov},
  title        = {Enriching Word Vectors with Subword Information},
  journal      = {CoRR},
  volume       = {abs/1607.04606},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.04606},
  eprinttype   = {arXiv},
  eprint       = {1607.04606},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/BojanowskiGJM16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1609.04309 (2016). {GPUs} is braced so the acronym is not
% lowercased by styles that sentence-case titles.
@article{DBLP:journals/corr/GraveJCGJ16,
  author       = {Edouard Grave and
                  Armand Joulin and
                  Moustapha Ciss{\'{e}} and
                  David Grangier and
                  Herv{\'{e}} J{\'{e}}gou},
  title        = {Efficient softmax approximation for {GPUs}},
  journal      = {CoRR},
  volume       = {abs/1609.04309},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.04309},
  eprinttype   = {arXiv},
  eprint       = {1609.04309},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GraveJCGJ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1611.06188 (2016); same title and authors as
% DBLP:conf/iclr/JerniteGJM17.
@article{DBLP:journals/corr/JerniteGJM16,
  author       = {Yacine Jernite and Edouard Grave and
                  Armand Joulin and Tom{\'{a}}s Mikolov},
  title        = {Variable Computation in Recurrent Neural Networks},
  journal      = {CoRR},
  volume       = {abs/1611.06188},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.06188},
  eprinttype   = {arXiv},
  eprint       = {1611.06188},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/JerniteGJM16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1612.03651 (2016). {FastText.zip} is braced so its mixed
% capitalisation survives styles that sentence-case titles.
@article{DBLP:journals/corr/JoulinGBDJM16,
  author       = {Armand Joulin and
                  Edouard Grave and
                  Piotr Bojanowski and
                  Matthijs Douze and
                  Herv{\'{e}} J{\'{e}}gou and
                  Tom{\'{a}}s Mikolov},
  title        = {{FastText.zip}: Compressing text classification models},
  journal      = {CoRR},
  volume       = {abs/1612.03651},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.03651},
  eprinttype   = {arXiv},
  eprint       = {1612.03651},
  timestamp    = {Mon, 28 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/JoulinGBDJM16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1612.04426 (2016); same title and authors as
% DBLP:conf/iclr/GraveJU17.
@article{DBLP:journals/corr/GraveJU16,
  author       = {Edouard Grave and Armand Joulin and Nicolas Usunier},
  title        = {Improving Neural Language Models with a Continuous Cache},
  journal      = {CoRR},
  volume       = {abs/1612.04426},
  year         = {2016},
  url          = {http://arxiv.org/abs/1612.04426},
  eprinttype   = {arXiv},
  eprint       = {1612.04426},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GraveJU16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article (J. Biomed. Informatics 58, 2015).
@article{DBLP:journals/jbi/PivovarovPGAWE15,
  author       = {Rimma Pivovarov and Adler J. Perotte and Edouard Grave and
                  John Angiolillo and Chris H. Wiggins and No{\'{e}}mie Elhadad},
  title        = {Learning probabilistic phenotypes from heterogeneous {EHR} data},
  journal      = {J. Biomed. Informatics},
  volume       = {58},
  pages        = {156--165},
  year         = {2015},
  url          = {https://doi.org/10.1016/j.jbi.2015.10.001},
  doi          = {10.1016/J.JBI.2015.10.001},
  timestamp    = {Wed, 17 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jbi/PivovarovPGAWE15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL 2015 long paper. The publisher name is spelled "Computational" (not
% "Computer") Linguistics, matching the booktitle of this entry and the
% publisher field of DBLP:conf/eacl/GraveMJB17.
@inproceedings{DBLP:conf/acl/GraveE15,
  author       = {Edouard Grave and
                  No{\'{e}}mie Elhadad},
  title        = {A convex and feature-rich discriminative approach to dependency grammar
                  induction},
  booktitle    = {Proceedings of the 53rd Annual Meeting of the Association for Computational
                  Linguistics and the 7th International Joint Conference on Natural
                  Language Processing of the Asian Federation of Natural Language Processing,
                  {ACL} 2015, July 26-31, 2015, Beijing, China, Volume 1: Long Papers},
  pages        = {1375--1384},
  publisher    = {Association for Computational Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.3115/v1/p15-1133},
  doi          = {10.3115/V1/P15-1133},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acl/GraveE15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2015 paper; the file also holds a CoRR record with the same authors:
% DBLP:journals/corr/BojanowskiLGBLP15.
@inproceedings{DBLP:conf/iccv/BojanowskiLGBLP15,
  author       = {Piotr Bojanowski and R{\'{e}}mi Lajugie and Edouard Grave and
                  Francis R. Bach and Ivan Laptev and Jean Ponce and
                  Cordelia Schmid},
  title        = {Weakly-Supervised Alignment of Video with Text},
  booktitle    = {2015 {IEEE} International Conference on Computer Vision, {ICCV} 2015, Santiago,
                  Chile, December 7-13, 2015},
  pages        = {4462--4470},
  publisher    = {{IEEE} Computer Society},
  year         = {2015},
  url          = {https://doi.org/10.1109/ICCV.2015.507},
  doi          = {10.1109/ICCV.2015.507},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iccv/BojanowskiLGBLP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1505.06027 (2015); same authors as
% DBLP:conf/iccv/BojanowskiLGBLP15 (the titles differ only in the capitalisation
% of "With").
@article{DBLP:journals/corr/BojanowskiLGBLP15,
  author       = {Piotr Bojanowski and R{\'{e}}mi Lajugie and Edouard Grave and
                  Francis R. Bach and Ivan Laptev and Jean Ponce and
                  Cordelia Schmid},
  title        = {Weakly-Supervised Alignment of Video With Text},
  journal      = {CoRR},
  volume       = {abs/1505.06027},
  year         = {2015},
  url          = {http://arxiv.org/abs/1505.06027},
  eprinttype   = {arXiv},
  eprint       = {1505.06027},
  timestamp    = {Tue, 02 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/BojanowskiLGBLP15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% PhD thesis (2014); the title gives the English wording followed by the French
% one in parentheses. {Markovian} is braced so the eponym stays capitalised
% under styles that sentence-case titles.
@phdthesis{DBLP:phd/hal/Grave14,
  author       = {Edouard Grave},
  title        = {A {Markovian} approach to distributional semantics. (Une approche Markovienne
                  {\`{a}} la s{\'{e}}mantique distributionnelle)},
  school       = {Pierre and Marie Curie University, Paris, France},
  year         = {2014},
  url          = {https://tel.archives-ouvertes.fr/tel-00940575},
  timestamp    = {Tue, 21 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/phd/hal/Grave14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% COLING 2014 technical paper. {Markovian} is braced so the eponym stays
% capitalised under styles that sentence-case titles.
@inproceedings{DBLP:conf/coling/GraveOB14,
  author       = {Edouard Grave and
                  Guillaume Obozinski and
                  Francis R. Bach},
  editor       = {Jan Hajic and
                  Junichi Tsujii},
  title        = {A {Markovian} approach to distributional semantics with application
                  to semantic compositionality},
  booktitle    = {{COLING} 2014, 25th International Conference on Computational Linguistics,
                  Proceedings of the Conference: Technical Papers, August 23-29, 2014,
                  Dublin, Ireland},
  pages        = {1447--1456},
  publisher    = {{ACL}},
  year         = {2014},
  url          = {https://aclanthology.org/C14-1137/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/coling/GraveOB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% EMNLP 2014 paper, single author.
@inproceedings{DBLP:conf/emnlp/Grave14,
  author       = {Edouard Grave},
  editor       = {Alessandro Moschitti and Bo Pang and Walter Daelemans},
  title        = {A convex relaxation for weakly supervised relation extraction},
  booktitle    = {Proceedings of the 2014 Conference on Empirical Methods in Natural Language
                  Processing, {EMNLP} 2014, October 25-29, 2014, Doha, Qatar, {A} meeting of
                  SIGDAT, a Special Interest Group of the {ACL}},
  pages        = {1580--1590},
  publisher    = {{ACL}},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/d14-1166},
  doi          = {10.3115/V1/D14-1166},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/Grave14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoNLL 2013 paper. {Markov} is braced so the proper noun stays capitalised
% under styles that sentence-case titles; {CoNLL} is braced in the booktitle
% like the conference acronyms in the other entries of this file.
@inproceedings{DBLP:conf/conll/GraveOB13,
  author       = {Edouard Grave and
                  Guillaume Obozinski and
                  Francis R. Bach},
  editor       = {Julia Hockenmaier and
                  Sebastian Riedel},
  title        = {Hidden {Markov} tree models for semantic class induction},
  booktitle    = {Proceedings of the Seventeenth Conference on Computational Natural
                  Language Learning, {CoNLL} 2013, Sofia, Bulgaria, August 8-9, 2013},
  pages        = {94--103},
  publisher    = {{ACL}},
  year         = {2013},
  url          = {https://aclanthology.org/W13-3511/},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/conll/GraveOB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1312.4092 (2013). {Markov} is braced so the proper noun
% stays capitalised under styles that sentence-case titles.
@article{DBLP:journals/corr/GraveOB13,
  author       = {Edouard Grave and
                  Guillaume Obozinski and
                  Francis R. Bach},
  title        = {Domain adaptation for sequence labeling using hidden {Markov} models},
  journal      = {CoRR},
  volume       = {abs/1312.4092},
  year         = {2013},
  url          = {http://arxiv.org/abs/1312.4092},
  eprinttype   = {arXiv},
  eprint       = {1312.4092},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GraveOB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS (NIPS) 2011 paper; the file also holds a CoRR record with the same title
% and authors: DBLP:journals/corr/abs-1109-1990.
% {Lasso} is braced so the method name keeps its capital under styles that
% sentence-case titles.
@inproceedings{DBLP:conf/nips/GraveOB11,
  author       = {Edouard Grave and
                  Guillaume Obozinski and
                  Francis R. Bach},
  editor       = {John Shawe{-}Taylor and
                  Richard S. Zemel and
                  Peter L. Bartlett and
                  Fernando C. N. Pereira and
                  Kilian Q. Weinberger},
  title        = {Trace {Lasso}: a trace norm regularization for correlated designs},
  booktitle    = {Advances in Neural Information Processing Systems 24: 25th Annual
                  Conference on Neural Information Processing Systems 2011. Proceedings
                  of a meeting held 12-14 December 2011, Granada, Spain},
  pages        = {2187--2195},
  year         = {2011},
  url          = {https://proceedings.neurips.cc/paper/2011/hash/33ceb07bf4eeb3da587e268d663aba1a-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/GraveOB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% CoRR/arXiv record 1109.1990 (2011); same title and authors as
% DBLP:conf/nips/GraveOB11.
% {Lasso} is braced so the method name keeps its capital under styles that
% sentence-case titles.
@article{DBLP:journals/corr/abs-1109-1990,
  author       = {Edouard Grave and
                  Guillaume Obozinski and
                  Francis R. Bach},
  title        = {Trace {Lasso}: a trace norm regularization for correlated designs},
  journal      = {CoRR},
  volume       = {abs/1109.1990},
  year         = {2011},
  url          = {http://arxiv.org/abs/1109.1990},
  eprinttype   = {arXiv},
  eprint       = {1109.1990},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1109-1990.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics