BibTeX records: Martin Jaggi

download as .bib file

@inproceedings{DBLP:conf/aaai/KossonFJ24,
  author     = {Kosson, Atli and Fan, Dongyang and Jaggi, Martin},
  editor     = {Wooldridge, Michael J. and Dy, Jennifer G. and Natarajan, Sriraam},
  title      = {Ghost Noise for Regularizing Deep Neural Networks},
  booktitle  = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024,
                Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence,
                {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial
                Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  pages      = {13274--13282},
  publisher  = {{AAAI} Press},
  year       = {2024},
  url        = {https://doi.org/10.1609/aaai.v38i12.29228},
  doi        = {10.1609/AAAI.V38I12.29228},
  timestamp  = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/KossonFJ24.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-02622,
  author     = {Pagliardini, Matteo and Mohtashami, Amirkeivan and Fleuret, Fran{\c{c}}ois and
                Jaggi, Martin},
  title      = {{DenseFormer}: Enhancing Information Flow in Transformers via Depth Weighted
                Averaging},
  journal    = {CoRR},
  volume     = {abs/2402.02622},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.02622},
  doi        = {10.48550/ARXIV.2402.02622},
  eprinttype = {arXiv},
  eprint     = {2402.02622},
  timestamp  = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-02622.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-02933,
  author     = {Swamy, Vinitra and Blackwell, Julian and Frej, Jibril and Jaggi, Martin and
                K{\"{a}}ser, Tanja},
  title      = {{InterpretCC}: Conditional Computation for Inherently Interpretable Neural
                Networks},
  journal    = {CoRR},
  volume     = {abs/2402.02933},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.02933},
  doi        = {10.48550/ARXIV.2402.02933},
  eprinttype = {arXiv},
  eprint     = {2402.02933},
  timestamp  = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-02933.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-04161,
  author     = {Makkuva, Ashok Vardhan and Bondaschi, Marco and Girish, Adway and
                Nagle, Alliot and Jaggi, Martin and Kim, Hyeji and Gastpar, Michael},
  title      = {Attention with {Markov}: {A} Framework for Principled Analysis of Transformers
                via {Markov} Chains},
  journal    = {CoRR},
  volume     = {abs/2402.04161},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.04161},
  doi        = {10.48550/ARXIV.2402.04161},
  eprinttype = {arXiv},
  eprint     = {2402.04161},
  timestamp  = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-04161.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2402-13089,
  author     = {Fan, Dongyang and Messmer, Bettina and Jaggi, Martin},
  title      = {Towards an empirical understanding of {MoE} design choices},
  journal    = {CoRR},
  volume     = {abs/2402.13089},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.13089},
  doi        = {10.48550/ARXIV.2402.13089},
  eprinttype = {arXiv},
  eprint     = {2402.13089},
  timestamp  = {Thu, 21 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-13089.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/npjdm/HeitmannGDDSGBCPMCRSLJGHHFBBHBB23,
  author     = {Heitmann, Julien and
                Glangetas, Alban and
                Doenz, Jonathan and
                Dervaux, Juliane and
                Shama, Deeksha M. and
                Garcia, Daniel Hinjos and
                Benissa, Mohamed Rida and
                Cantais, Aymeric and
                Perez, Alexandre and
                M{\"{u}}ller, Daniel and
                Chavdarova, Tatjana and
                Ruchonnet{-}Metrailler, Isabelle and
                Siebert, Johan N. and
                Lacroix, Laurence and
                Jaggi, Martin and
                Gervaix, Alain and
                Hartley, Mary{-}Anne and
                Hugon, Florence and
                Fassbind, Derrick and
                Barro, Makura and
                Bediang, Georges and
                Hafidi, N. E. L. and
                Bouskraoui, M. and
                Ba, Idrissa},
  title      = {{DeepBreath} - automated detection of respiratory pathology from lung
                auscultation in 572 pediatric outpatients across 5 countries},
  journal    = {npj Digit. Medicine},
  volume     = {6},
  year       = {2023},
  url        = {https://doi.org/10.1038/s41746-023-00838-3},
  doi        = {10.1038/S41746-023-00838-3},
  timestamp  = {Wed, 24 Jan 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/npjdm/HeitmannGDDSGBCPMCRSLJGHHFBBHBB23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/acl/BlinovaZJEB23,
  author     = {Blinova, Sofia and Zhou, Xinyu and Jaggi, Martin and Eickhoff, Carsten and
                Bahrainian, Seyed Ali},
  editor     = {Rogers, Anna and Boyd{-}Graber, Jordan L. and Okazaki, Naoaki},
  title      = {{SIMSUM:} Document-level Text Simplification via Simultaneous Summarization},
  booktitle  = {Proceedings of the 61st Annual Meeting of the Association for Computational
                Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada, July 9-14,
                2023},
  pages      = {9927--9944},
  publisher  = {Association for Computational Linguistics},
  year       = {2023},
  url        = {https://doi.org/10.18653/v1/2023.acl-long.552},
  doi        = {10.18653/V1/2023.ACL-LONG.552},
  timestamp  = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/BlinovaZJEB23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/colt/VladareanDJF23,
  author     = {Vladarean, Maria{-}Luiza and Doikov, Nikita and Jaggi, Martin and
                Flammarion, Nicolas},
  editor     = {Neu, Gergely and Rosasco, Lorenzo},
  title      = {Linearization Algorithms for Fully Composite Optimization},
  booktitle  = {The Thirty Sixth Annual Conference on Learning Theory, {COLT} 2023, 12-15 July
                2023, Bangalore, India},
  series     = {Proceedings of Machine Learning Research},
  volume     = {195},
  pages      = {3669--3695},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v195/vladarean23a.html},
  timestamp  = {Wed, 06 Sep 2023 17:49:05 +0200},
  biburl     = {https://dblp.org/rec/conf/colt/VladareanDJF23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/PagliardiniJFK23,
  author     = {Pagliardini, Matteo and Jaggi, Martin and Fleuret, Fran{\c{c}}ois and
                Karimireddy, Sai Praneeth},
  title      = {Agree to Disagree: Diversity through Disagreement for Better Transferability},
  booktitle  = {The Eleventh International Conference on Learning Representations, {ICLR} 2023,
                Kigali, Rwanda, May 1-5, 2023},
  publisher  = {OpenReview.net},
  year       = {2023},
  url        = {https://openreview.net/pdf?id=K7CbYQbyYhY},
  timestamp  = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/PagliardiniJFK23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/DoikovCJ23,
  author     = {Doikov, Nikita and Chayti, El Mahdi and Jaggi, Martin},
  editor     = {Krause, Andreas and Brunskill, Emma and Cho, Kyunghyun and
                Engelhardt, Barbara and Sabato, Sivan and Scarlett, Jonathan},
  title      = {Second-Order Optimization with Lazy {Hessians}},
  booktitle  = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023,
                Honolulu, Hawaii, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {8138--8161},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/doikov23a.html},
  timestamp  = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/DoikovCJ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/MohtashamiJS23,
  author     = {Mohtashami, Amirkeivan and Jaggi, Martin and Stich, Sebastian U.},
  editor     = {Krause, Andreas and Brunskill, Emma and Cho, Kyunghyun and
                Engelhardt, Barbara and Sabato, Sivan and Scarlett, Jonathan},
  title      = {Special Properties of Gradient Descent with Large Learning Rates},
  booktitle  = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023,
                Honolulu, Hawaii, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {202},
  pages      = {25082--25104},
  publisher  = {{PMLR}},
  year       = {2023},
  url        = {https://proceedings.mlr.press/v202/mohtashami23a.html},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/MohtashamiJS23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/FanMJ23,
  author     = {Fan, Dongyang and Mendler{-}D{\"{u}}nner, Celestine and Jaggi, Martin},
  editor     = {Oh, Alice and Naumann, Tristan and Globerson, Amir and Saenko, Kate and
                Hardt, Moritz and Levine, Sergey},
  title      = {Collaborative Learning via Prediction Consensus},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on
                Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA,
                December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/065e259a1d2d955e63b99aac6a3a3081-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/FanMJ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/KossonJ23,
  author     = {Kosson, Atli and Jaggi, Martin},
  editor     = {Oh, Alice and Naumann, Tristan and Globerson, Amir and Saenko, Kate and
                Hardt, Moritz and Levine, Sergey},
  title      = {Multiplication-Free Transformer Training via Piecewise Affine Operations},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on
                Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA,
                December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/19df21cd4931bd0caaa4d8480e9a59cd-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/KossonJ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/MohtashamiJ23,
  author     = {Mohtashami, Amirkeivan and Jaggi, Martin},
  editor     = {Oh, Alice and Naumann, Tristan and Globerson, Amir and Saenko, Kate and
                Hardt, Moritz and Levine, Sergey},
  title      = {Random-Access Infinite Context Length for Transformers},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on
                Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA,
                December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/ab05dc8bf36a9f66edbff6992ec86f56-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/MohtashamiJ23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/PagliardiniPJF23,
  author     = {Pagliardini, Matteo and Paliotta, Daniele and Jaggi, Martin and
                Fleuret, Fran{\c{c}}ois},
  editor     = {Oh, Alice and Naumann, Tristan and Globerson, Amir and Saenko, Kate and
                Hardt, Moritz and Levine, Sergey},
  title      = {Fast Attention Over Long Sequences With Dynamic Sparse Flash Attention},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on
                Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA,
                December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/bc222e8153a49c1b30a1b8ba96b35117-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/PagliardiniPJF23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/SwamySFBVJKH23,
  author     = {Swamy, Vinitra and Satayeva, Malika and Frej, Jibril and Bossy, Thierry and
                Vogels, Thijs and Jaggi, Martin and K{\"{a}}ser, Tanja and
                Hartley, Mary{-}Anne},
  editor     = {Oh, Alice and Naumann, Tristan and Globerson, Amir and Saenko, Kate and
                Hardt, Moritz and Levine, Sergey},
  title      = {{MultiModN} - Multimodal, Multi-Task, Interpretable Modular Networks},
  booktitle  = {Advances in Neural Information Processing Systems 36: Annual Conference on
                Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA,
                December 10 - 16, 2023},
  year       = {2023},
  url        = {http://papers.nips.cc/paper\_files/paper/2023/hash/5951641ad71b0052cf776f9b71f18932-Abstract-Conference.html},
  timestamp  = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/SwamySFBVJKH23.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2301-02151,
  author     = {Vogels, Thijs and Hendrikx, Hadrien and Jaggi, Martin},
  title      = {Beyond spectral gap (extended): The role of the topology in decentralized
                learning},
  journal    = {CoRR},
  volume     = {abs/2301.02151},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.02151},
  doi        = {10.48550/ARXIV.2301.02151},
  eprinttype = {arXiv},
  eprint     = {2301.02151},
  timestamp  = {Tue, 10 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-02151.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2302-11962,
  author     = {Chayti, El Mahdi and Doikov, Nikita and Jaggi, Martin},
  title      = {Unified Convergence Theory of Stochastic and Variance-Reduced Cubic {Newton}
                Methods},
  journal    = {CoRR},
  volume     = {abs/2302.11962},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.11962},
  doi        = {10.48550/ARXIV.2302.11962},
  eprinttype = {arXiv},
  eprint     = {2302.11962},
  timestamp  = {Tue, 28 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-11962.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2302-12808,
  author     = {Vladarean, Maria{-}Luiza and Doikov, Nikita and Jaggi, Martin and
                Flammarion, Nicolas},
  title      = {Linearization Algorithms for Fully Composite Optimization},
  journal    = {CoRR},
  volume     = {abs/2302.12808},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.12808},
  doi        = {10.48550/ARXIV.2302.12808},
  eprinttype = {arXiv},
  eprint     = {2302.12808},
  timestamp  = {Tue, 28 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-12808.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-16300,
  author     = {Mohtashami, Amirkeivan and Jaggi, Martin},
  title      = {Landmark Attention: Random-Access Infinite Context Length for Transformers},
  journal    = {CoRR},
  volume     = {abs/2305.16300},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.16300},
  doi        = {10.48550/ARXIV.2305.16300},
  eprinttype = {arXiv},
  eprint     = {2305.16300},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-16300.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-17190,
  author     = {Kosson, Atli and Jaggi, Martin},
  title      = {Hardware-Efficient Transformer Training via Piecewise Affine Operations},
  journal    = {CoRR},
  volume     = {abs/2305.17190},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.17190},
  doi        = {10.48550/ARXIV.2305.17190},
  eprinttype = {arXiv},
  eprint     = {2305.17190},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-17190.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-17205,
  author     = {Kosson, Atli and Fan, Dongyang and Jaggi, Martin},
  title      = {Ghost Noise for Regularizing Deep Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2305.17205},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.17205},
  doi        = {10.48550/ARXIV.2305.17205},
  eprinttype = {arXiv},
  eprint     = {2305.17205},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-17205.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-17212,
  author     = {Kosson, Atli and Messmer, Bettina and Jaggi, Martin},
  title      = {Rotational Optimizers: Simple {\&} Robust {DNN} Training},
  journal    = {CoRR},
  volume     = {abs/2305.17212},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.17212},
  doi        = {10.48550/ARXIV.2305.17212},
  eprinttype = {arXiv},
  eprint     = {2305.17212},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-17212.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-18497,
  author     = {Fan, Dongyang and Mendler{-}D{\"{u}}nner, Celestine and Jaggi, Martin},
  title      = {Collaborative Learning via Prediction Consensus},
  journal    = {CoRR},
  volume     = {abs/2305.18497},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.18497},
  doi        = {10.48550/ARXIV.2305.18497},
  eprinttype = {arXiv},
  eprint     = {2305.18497},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-18497.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2305-19259,
  author     = {Koloskova, Anastasia and Doikov, Nikita and Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Shuffle {SGD} is Always Better than {SGD:} Improved Analysis of {SGD} with
                Arbitrary Data Orders},
  journal    = {CoRR},
  volume     = {abs/2305.19259},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.19259},
  doi        = {10.48550/ARXIV.2305.19259},
  eprinttype = {arXiv},
  eprint     = {2305.19259},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-19259.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2306-01160,
  author     = {Pagliardini, Matteo and Paliotta, Daniele and Jaggi, Martin and
                Fleuret, Fran{\c{c}}ois},
  title      = {Faster Causal Attention Over Large Sequences Through Sparse Flash Attention},
  journal    = {CoRR},
  volume     = {abs/2306.01160},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.01160},
  doi        = {10.48550/ARXIV.2306.01160},
  eprinttype = {arXiv},
  eprint     = {2306.01160},
  timestamp  = {Mon, 12 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-01160.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2306-08393,
  author     = {Werner, Mariel A. and He, Lie and Karimireddy, Sai Praneeth and
                Jordan, Michael I. and Jaggi, Martin},
  title      = {Provably Personalized and Robust Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2306.08393},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.08393},
  doi        = {10.48550/ARXIV.2306.08393},
  eprinttype = {arXiv},
  eprint     = {2306.08393},
  timestamp  = {Sun, 18 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-08393.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2307-06966,
  author     = {Adilova, Linara and Fischer, Asja and Jaggi, Martin},
  title      = {Layerwise Linear Mode Connectivity},
  journal    = {CoRR},
  volume     = {abs/2307.06966},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.06966},
  doi        = {10.48550/ARXIV.2307.06966},
  eprinttype = {arXiv},
  eprint     = {2307.06966},
  timestamp  = {Mon, 24 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-06966.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2309-14118,
  author     = {Swamy, Vinitra and Satayeva, Malika and Frej, Jibril and Bossy, Thierry and
                Vogels, Thijs and Jaggi, Martin and K{\"{a}}ser, Tanja and
                Hartley, Mary{-}Anne},
  title      = {{MultiModN} - Multimodal, Multi-Task, Interpretable Modular Networks},
  journal    = {CoRR},
  volume     = {abs/2309.14118},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.14118},
  doi        = {10.48550/ARXIV.2309.14118},
  eprinttype = {arXiv},
  eprint     = {2309.14118},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-14118.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2310-10845,
  author     = {Mohtashami, Amirkeivan and Pagliardini, Matteo and Jaggi, Martin},
  title      = {{CoTFormer}: More Tokens With Attention Make Up For Less Depth},
  journal    = {CoRR},
  volume     = {abs/2310.10845},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.10845},
  doi        = {10.48550/ARXIV.2310.10845},
  eprinttype = {arXiv},
  eprint     = {2310.10845},
  timestamp  = {Thu, 26 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-10845.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2310-13033,
  author     = {Makkuva, Ashok Vardhan and Bondaschi, Marco and Vogels, Thijs and
                Jaggi, Martin and Kim, Hyeji and Gastpar, Michael C.},
  title      = {{LASER:} Linear Compression in Wireless Distributed Optimization},
  journal    = {CoRR},
  volume     = {abs/2310.13033},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.13033},
  doi        = {10.48550/ARXIV.2310.13033},
  eprinttype = {arXiv},
  eprint     = {2310.13033},
  timestamp  = {Fri, 27 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-13033.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2310-15389,
  author     = {Fan, Simin and Jaggi, Martin},
  title      = {Irreducible Curriculum for Language Model Pretraining},
  journal    = {CoRR},
  volume     = {abs/2310.15389},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.15389},
  doi        = {10.48550/ARXIV.2310.15389},
  eprinttype = {arXiv},
  eprint     = {2310.15389},
  timestamp  = {Tue, 31 Oct 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-15389.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2310-15393,
  author     = {Fan, Simin and Pagliardini, Matteo and Jaggi, Martin},
  title      = {{DoGE}: Domain Reweighting with Generalization Estimation},
  journal    = {CoRR},
  volume     = {abs/2310.15393},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.15393},
  doi        = {10.48550/ARXIV.2310.15393},
  eprinttype = {arXiv},
  eprint     = {2310.15393},
  timestamp  = {Tue, 31 Oct 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-15393.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2311-06724,
  author     = {Bahrainian, Seyed Ali and Jaggi, Martin and Eickhoff, Carsten},
  title      = {Controllable Topic-Focused Abstractive Summarization},
  journal    = {CoRR},
  volume     = {abs/2311.06724},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.06724},
  doi        = {10.48550/ARXIV.2311.06724},
  eprinttype = {arXiv},
  eprint     = {2311.06724},
  timestamp  = {Wed, 15 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-06724.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2311-16079,
  author     = {Chen, Zeming and
                Hern{\'{a}}ndez{-}Cano, Alejandro and
                Romanou, Angelika and
                Bonnet, Antoine and
                Matoba, Kyle and
                Salvi, Francesco and
                Pagliardini, Matteo and
                Fan, Simin and
                K{\"{o}}pf, Andreas and
                Mohtashami, Amirkeivan and
                Sallinen, Alexandre and
                Sakhaeirad, Alireza and
                Swamy, Vinitra and
                Krawczuk, Igor and
                Bayazit, Deniz and
                Marmet, Axel and
                Montariol, Syrielle and
                Hartley, Mary{-}Anne and
                Jaggi, Martin and
                Bosselut, Antoine},
  title      = {{MEDITRON-70B:} Scaling Medical Pretraining for Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2311.16079},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.16079},
  doi        = {10.48550/ARXIV.2311.16079},
  eprinttype = {arXiv},
  eprint     = {2311.16079},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-16079.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aaai/DandiBJ22,
  author     = {Dandi, Yatin and Barba, Luis and Jaggi, Martin},
  title      = {Implicit Gradient Alignment in Distributed and Federated Learning},
  booktitle  = {Thirty-Sixth {AAAI} Conference on Artificial Intelligence, {AAAI} 2022,
                Thirty-Fourth Conference on Innovative Applications of Artificial Intelligence,
                {IAAI} 2022, The Twelfth Symposium on Educational Advances in Artificial
                Intelligence, {EAAI} 2022, Virtual Event, February 22 - March 1, 2022},
  pages      = {6454--6462},
  publisher  = {{AAAI} Press},
  year       = {2022},
  url        = {https://doi.org/10.1609/aaai.v36i6.20597},
  doi        = {10.1609/AAAI.V36I6.20597},
  timestamp  = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl     = {https://dblp.org/rec/conf/aaai/DandiBJ22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aistats/MohtashamiJS22,
  author     = {Mohtashami, Amirkeivan and Jaggi, Martin and Stich, Sebastian U.},
  editor     = {Camps{-}Valls, Gustau and Ruiz, Francisco J. R. and Valera, Isabel},
  title      = {Masked Training of Neural Networks with Partial Gradients},
  booktitle  = {International Conference on Artificial Intelligence and Statistics, {AISTATS}
                2022, 28-30 March 2022, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {151},
  pages      = {5876--5890},
  publisher  = {{PMLR}},
  year       = {2022},
  url        = {https://proceedings.mlr.press/v151/mohtashami22a.html},
  timestamp  = {Sat, 30 Sep 2023 09:34:08 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/MohtashamiJS22.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2022 conference paper (OpenReview).
@inproceedings{DBLP:conf/iclr/KarimireddyHJ22,
  author    = {Karimireddy, Sai Praneeth and
               He, Lie and
               Jaggi, Martin},
  title     = {Byzantine-Robust Learning on Heterogeneous Datasets via Bucketing},
  booktitle = {The Tenth International Conference on Learning Representations, {ICLR}
               2022, Virtual Event, April 25-29, 2022},
  publisher = {OpenReview.net},
  year      = {2022},
  url       = {https://openreview.net/forum?id=jXKKDEi5vJt},
  timestamp = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/KarimireddyHJ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NAACL 2022 conference version; the arXiv preprint of the same work is
% DBLP:journals/corr/abs-2205-08184.
% The last editor is given in "Last, First" form so the compound surname is not split.
@inproceedings{DBLP:conf/naacl/MoiseevDAJ22,
  author       = {Fedor Moiseev and
                  Zhe Dong and
                  Enrique Alfonseca and
                  Martin Jaggi},
  editor       = {Marine Carpuat and
                  Marie{-}Catherine de Marneffe and
                  Meza Ru{\'{\i}}z, Iv{\'{a}}n Vladimir},
  title        = {{SKILL:} Structured Knowledge Infusion for Large Language Models},
  booktitle    = {Proceedings of the 2022 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL} 2022, Seattle, WA, United States, July 10-15, 2022},
  pages        = {1581--1588},
  publisher    = {Association for Computational Linguistics},
  year         = {2022},
  url          = {https://doi.org/10.18653/v1/2022.naacl-main.113},
  doi          = {10.18653/V1/2022.NAACL-MAIN.113},
  timestamp    = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/MoiseevDAJ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 conference version; the arXiv preprint of the same work is
% DBLP:journals/corr/abs-2206-08307.
@inproceedings{DBLP:conf/nips/KoloskovaSJ22,
  author       = {Anastasia Koloskova and
                  Sebastian U. Stich and
                  Martin Jaggi},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Sharper Convergence Guarantees for Asynchronous {SGD} for Distributed
                  and Federated Learning},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/6db3ea527f53682657b3d6b02a841340-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/KoloskovaSJ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 (Datasets and Benchmarks) version; the arXiv preprint of the same
% work is DBLP:journals/corr/abs-2210-04620.
% The first author's compound surname is braced so it is kept as one unit.
@inproceedings{DBLP:conf/nips/TerrailACGHLMMM22,
  author       = {{Ogier du Terrail}, Jean and
                  Samy{-}Safwan Ayed and
                  Edwige Cyffers and
                  Felix Grimberg and
                  Chaoyang He and
                  Regis Loeb and
                  Paul Mangold and
                  Tanguy Marchand and
                  Othmane Marfoq and
                  Erum Mushtaq and
                  Boris Muzellec and
                  Constantin Philippenko and
                  Santiago Silva and
                  Maria Telenczuk and
                  Shadi Albarqouni and
                  Salman Avestimehr and
                  Aur{\'{e}}lien Bellet and
                  Aymeric Dieuleveut and
                  Martin Jaggi and
                  Sai Praneeth Karimireddy and
                  Marco Lorenzi and
                  Giovanni Neglia and
                  Marc Tommasi and
                  Mathieu Andreux},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {{FLamby}: Datasets and Benchmarks for Cross-Silo Federated Learning
                  in Realistic Healthcare Settings},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/232eee8ef411a0a316efa298d7be3c2b-Abstract-Datasets\_and\_Benchmarks.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/TerrailACGHLMMM22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2022 conference version; the arXiv preprint of the same work is
% DBLP:journals/corr/abs-2206-03093.
@inproceedings{DBLP:conf/nips/VogelsHJ22,
  author       = {Thijs Vogels and
                  Hadrien Hendrikx and
                  Martin Jaggi},
  editor       = {Sanmi Koyejo and
                  Shakir Mohamed and
                  Alekh Agarwal and
                  Danielle Belgrave and
                  Kyunghyun Cho and
                  Alice Oh},
  title        = {Beyond spectral gap: the role of the topology in decentralized learning},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper\_files/paper/2022/hash/61162d94822d468ee6e92803340f2040-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/VogelsHJ22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.01545 (CoRR).
@article{DBLP:journals/corr/abs-2202-01545,
  author     = {He, Lie and
                Karimireddy, Sai Praneeth and
                Jaggi, Martin},
  title      = {Byzantine-Robust Decentralized Learning via Self-Centered Clipping},
  journal    = {CoRR},
  volume     = {abs/2202.01545},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.01545},
  eprinttype = {arXiv},
  eprint     = {2202.01545},
  timestamp  = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-01545.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.01838 (CoRR).
@article{DBLP:journals/corr/abs-2202-01838,
  author     = {Mohtashami, Amirkeivan and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Characterizing {\&} Finding Good Data Orderings for Fast Convergence
                of Sequential Gradient Methods},
  journal    = {CoRR},
  volume     = {abs/2202.01838},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.01838},
  eprinttype = {arXiv},
  eprint     = {2202.01838},
  timestamp  = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-01838.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.04414 (CoRR).
@article{DBLP:journals/corr/abs-2202-04414,
  author     = {Pagliardini, Matteo and
                Jaggi, Martin and
                Fleuret, Fran{\c{c}}ois and
                Karimireddy, Sai Praneeth},
  title      = {Agree to Disagree: Diversity through Disagreement for Better Transferability},
  journal    = {CoRR},
  volume     = {abs/2202.04414},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.04414},
  eprinttype = {arXiv},
  eprint     = {2202.04414},
  timestamp  = {Fri, 18 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-04414.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2202.05737 (CoRR).
@article{DBLP:journals/corr/abs-2202-05737,
  author     = {Pagliardini, Matteo and
                Manunza, Gilberto and
                Jaggi, Martin and
                Jordan, Michael I. and
                Chavdarova, Tatjana},
  title      = {Improving Generalization via Uncertainty Driven Perturbations},
  journal    = {CoRR},
  volume     = {abs/2202.05737},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.05737},
  eprinttype = {arXiv},
  eprint     = {2202.05737},
  timestamp  = {Fri, 18 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-05737.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2204.06477 (CoRR).
@article{DBLP:journals/corr/abs-2204-06477,
  author     = {Dandi, Yatin and
                Koloskova, Anastasia and
                Jaggi, Martin and
                Stich, Sebastian U.},
  title      = {Data-heterogeneity-aware Mixing for Decentralized Learning},
  journal    = {CoRR},
  volume     = {abs/2204.06477},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.06477},
  doi        = {10.48550/ARXIV.2204.06477},
  eprinttype = {arXiv},
  eprint     = {2204.06477},
  timestamp  = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-06477.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.08184 (CoRR); the NAACL 2022 conference version of the
% same work is DBLP:conf/naacl/MoiseevDAJ22.
@article{DBLP:journals/corr/abs-2205-08184,
  author     = {Moiseev, Fedor and
                Dong, Zhe and
                Alfonseca, Enrique and
                Jaggi, Martin},
  title      = {{SKILL:} Structured Knowledge Infusion for Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2205.08184},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.08184},
  doi        = {10.48550/ARXIV.2205.08184},
  eprinttype = {arXiv},
  eprint     = {2205.08184},
  timestamp  = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-08184.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.15142 (CoRR).
@article{DBLP:journals/corr/abs-2205-15142,
  author     = {Mohtashami, Amirkeivan and
                Jaggi, Martin and
                Stich, Sebastian U.},
  title      = {On Avoiding Local Minima Using Gradient Descent With Large Learning
                Rates},
  journal    = {CoRR},
  volume     = {abs/2205.15142},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.15142},
  doi        = {10.48550/ARXIV.2205.15142},
  eprinttype = {arXiv},
  eprint     = {2205.15142},
  timestamp  = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-15142.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.03093 (CoRR); the NeurIPS 2022 conference version of the
% same work is DBLP:conf/nips/VogelsHJ22.
@article{DBLP:journals/corr/abs-2206-03093,
  author     = {Vogels, Thijs and
                Hendrikx, Hadrien and
                Jaggi, Martin},
  title      = {Beyond spectral gap: The role of the topology in decentralized learning},
  journal    = {CoRR},
  volume     = {abs/2206.03093},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.03093},
  doi        = {10.48550/ARXIV.2206.03093},
  eprinttype = {arXiv},
  eprint     = {2206.03093},
  timestamp  = {Tue, 14 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-03093.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.08307 (CoRR); the NeurIPS 2022 conference version of the
% same work is DBLP:conf/nips/KoloskovaSJ22.
@article{DBLP:journals/corr/abs-2206-08307,
  author     = {Koloskova, Anastasia and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Sharper Convergence Guarantees for Asynchronous {SGD} for Distributed
                and Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2206.08307},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.08307},
  doi        = {10.48550/ARXIV.2206.08307},
  eprinttype = {arXiv},
  eprint     = {2206.08307},
  timestamp  = {Tue, 21 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-08307.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.04620 (CoRR); the NeurIPS 2022 version of the same work is
% DBLP:conf/nips/TerrailACGHLMMM22.
% The first author's compound surname is braced so it is kept as one unit.
@article{DBLP:journals/corr/abs-2210-04620,
  author       = {{Ogier du Terrail}, Jean and
                  Samy{-}Safwan Ayed and
                  Edwige Cyffers and
                  Felix Grimberg and
                  Chaoyang He and
                  Regis Loeb and
                  Paul Mangold and
                  Tanguy Marchand and
                  Othmane Marfoq and
                  Erum Mushtaq and
                  Boris Muzellec and
                  Constantin Philippenko and
                  Santiago Silva and
                  Maria Telenczuk and
                  Shadi Albarqouni and
                  Salman Avestimehr and
                  Aur{\'{e}}lien Bellet and
                  Aymeric Dieuleveut and
                  Martin Jaggi and
                  Sai Praneeth Karimireddy and
                  Marco Lorenzi and
                  Giovanni Neglia and
                  Marc Tommasi and
                  Mathieu Andreux},
  title        = {{FLamby}: Datasets and Benchmarks for Cross-Silo Federated Learning
                  in Realistic Healthcare Settings},
  journal      = {CoRR},
  volume       = {abs/2210.04620},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.04620},
  doi          = {10.48550/ARXIV.2210.04620},
  eprinttype   = {arXiv},
  eprint       = {2210.04620},
  timestamp    = {Wed, 22 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-04620.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.06637 (CoRR).
@article{DBLP:journals/corr/abs-2211-06637,
  author       = {C{\'{e}}cile Trottet and
                  Thijs Vogels and
                  Martin Jaggi and
                  Mary{-}Anne Hartley},
  title        = {Modular Clinical Decision Support Networks ({MoDN}) - Updatable, Interpretable,
                  and Portable Predictions for Evolving Clinical Environments},
  journal      = {CoRR},
  volume       = {abs/2211.06637},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2211.06637},
  doi          = {10.48550/ARXIV.2211.06637},
  eprinttype   = {arXiv},
  eprint       = {2211.06637},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2211-06637.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.10737 (CoRR).
@article{DBLP:journals/corr/abs-2211-10737,
  author     = {Harma, Simla Burcu and
                S{\"{o}}nmez, Canberk and
                Falsafi, Babak and
                Jaggi, Martin and
                Oh, Yunho},
  title      = {Accuracy Boosters: Epoch-Driven Mixed-Mantissa Block Floating-Point
                for {DNN} Training},
  journal    = {CoRR},
  volume     = {abs/2211.10737},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.10737},
  doi        = {10.48550/ARXIV.2211.10737},
  eprinttype = {arXiv},
  eprint     = {2211.10737},
  timestamp  = {Thu, 24 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-10737.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.10943 (CoRR).
@article{DBLP:journals/corr/abs-2211-10943,
  author     = {Berdoz, Fr{\'{e}}d{\'{e}}ric and
                Singh, Abhishek and
                Jaggi, Martin and
                Raskar, Ramesh},
  title      = {Scalable Collaborative Learning via Representation Sharing},
  journal    = {CoRR},
  volume     = {abs/2211.10943},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.10943},
  doi        = {10.48550/ARXIV.2211.10943},
  eprinttype = {arXiv},
  eprint     = {2211.10943},
  timestamp  = {Thu, 24 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-10943.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.00781 (CoRR).
@article{DBLP:journals/corr/abs-2212-00781,
  author       = {Nikita Doikov and
                  El Mahdi Chayti and
                  Martin Jaggi},
  title        = {Second-order optimization with lazy {Hessians}},
  journal      = {CoRR},
  volume       = {abs/2212.00781},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.00781},
  doi          = {10.48550/ARXIV.2212.00781},
  eprinttype   = {arXiv},
  eprint       = {2212.00781},
  timestamp    = {Thu, 08 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-00781.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 14, issue 1-2, 2021.
% "El Rouayheb" is given in "Last, First" form so the compound surname is not split.
@article{DBLP:journals/ftml/KairouzMABBBBCC21,
  author       = {Peter Kairouz and
                  H. Brendan McMahan and
                  Brendan Avent and
                  Aur{\'{e}}lien Bellet and
                  Mehdi Bennis and
                  Arjun Nitin Bhagoji and
                  Kallista A. Bonawitz and
                  Zachary Charles and
                  Graham Cormode and
                  Rachel Cummings and
                  Rafael G. L. D'Oliveira and
                  Hubert Eichner and
                  El Rouayheb, Salim and
                  David Evans and
                  Josh Gardner and
                  Zachary Garrett and
                  Adri{\`{a}} Gasc{\'{o}}n and
                  Badih Ghazi and
                  Phillip B. Gibbons and
                  Marco Gruteser and
                  Za{\"{\i}}d Harchaoui and
                  Chaoyang He and
                  Lie He and
                  Zhouyuan Huo and
                  Ben Hutchinson and
                  Justin Hsu and
                  Martin Jaggi and
                  Tara Javidi and
                  Gauri Joshi and
                  Mikhail Khodak and
                  Jakub Kone{\v{c}}n{\'y} and
                  Aleksandra Korolova and
                  Farinaz Koushanfar and
                  Sanmi Koyejo and
                  Tancr{\`{e}}de Lepoint and
                  Yang Liu and
                  Prateek Mittal and
                  Mehryar Mohri and
                  Richard Nock and
                  Ayfer {\"{O}}zg{\"{u}}r and
                  Rasmus Pagh and
                  Hang Qi and
                  Daniel Ramage and
                  Ramesh Raskar and
                  Mariana Raykova and
                  Dawn Song and
                  Weikang Song and
                  Sebastian U. Stich and
                  Ziteng Sun and
                  Ananda Theertha Suresh and
                  Florian Tram{\`{e}}r and
                  Praneeth Vepakomma and
                  Jianyu Wang and
                  Li Xiong and
                  Zheng Xu and
                  Qiang Yang and
                  Felix X. Yu and
                  Han Yu and
                  Sen Zhao},
  title        = {Advances and Open Problems in Federated Learning},
  journal      = {Foundations and Trends in Machine Learning},
  volume       = {14},
  number       = {1-2},
  pages        = {1--210},
  year         = {2021},
  url          = {https://doi.org/10.1561/2200000083},
  doi          = {10.1561/2200000083},
  timestamp    = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ftml/KairouzMABBBBCC21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, volume 36, issue 1, 2021.
@article{DBLP:journals/oms/MaJCST21,
  author       = {Chenxin Ma and
                  Martin Jaggi and
                  Frank E. Curtis and
                  Nathan Srebro and
                  Martin Tak{\'{a}}{\v{c}}},
  title        = {An accelerated communication-efficient primal-dual optimization framework
                  for structured machine learning},
  journal      = {Optimization Methods and Software},
  volume       = {36},
  number       = {1},
  pages        = {20--44},
  year         = {2021},
  url          = {https://doi.org/10.1080/10556788.2019.1650361},
  doi          = {10.1080/10556788.2019.1650361},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/oms/MaJCST21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ACL/IJCNLP 2021 long paper. The key suffix 20 does not match the 2021
% publication year; it is kept unchanged because it is the citation key.
@inproceedings{DBLP:conf/acl/MaoGCJK20,
  author    = {Mao, Zhuoyuan and
               Gupta, Prakhar and
               Chu, Chenhui and
               Jaggi, Martin and
               Kurohashi, Sadao},
  editor    = {Zong, Chengqing and
               Xia, Fei and
               Li, Wenjie and
               Navigli, Roberto},
  title     = {Lightweight Cross-Lingual Sentence Representation Learning},
  booktitle = {Proceedings of the 59th Annual Meeting of the Association for Computational
               Linguistics and the 11th International Joint Conference on Natural
               Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
               Event, August 1-6, 2021},
  pages     = {2902--2913},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.226},
  doi       = {10.18653/V1/2021.ACL-LONG.226},
  timestamp = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/MaoGCJK20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ACL/IJCNLP 2021 long paper. The key suffix 20 does not match the 2021
% publication year; it is kept unchanged because it is the citation key.
@inproceedings{DBLP:conf/acl/GuptaJ20,
  author    = {Gupta, Prakhar and
               Jaggi, Martin},
  editor    = {Zong, Chengqing and
               Xia, Fei and
               Li, Wenjie and
               Navigli, Roberto},
  title     = {Obtaining Better Static Word Embeddings Using Contextual Embedding
               Models},
  booktitle = {Proceedings of the 59th Annual Meeting of the Association for Computational
               Linguistics and the 11th International Joint Conference on Natural
               Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual
               Event, August 1-6, 2021},
  pages     = {5241--5253},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.acl-long.408},
  doi       = {10.18653/V1/2021.ACL-LONG.408},
  timestamp = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/GuptaJ20.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2021 conference paper (PMLR volume 130).
% The first author is given in "Last, First" form so the compound surname
% (compare the PMLR URL slug below) is not split.
@inproceedings{DBLP:conf/aistats/GhadikolaeiSJ21,
  author       = {Shokri Ghadikolaei, Hossein and
                  Sebastian U. Stich and
                  Martin Jaggi},
  editor       = {Arindam Banerjee and
                  Kenji Fukumizu},
  title        = {{LENA:} Communication-Efficient Distributed Learning with Self-Triggered
                  Gradient Uploads},
  booktitle    = {The 24th International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2021, April 13-15, 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {130},
  pages        = {3943--3951},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {http://proceedings.mlr.press/v130/shokri-ghadikolaei21a.html},
  timestamp    = {Wed, 14 Apr 2021 16:51:37 +0200},
  biburl       = {https://dblp.org/rec/conf/aistats/GhadikolaeiSJ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2021 conference paper (PMLR volume 130).
@inproceedings{DBLP:conf/aistats/StichMJ21,
  author    = {Stich, Sebastian U. and
               Mohtashami, Amirkeivan and
               Jaggi, Martin},
  editor    = {Banerjee, Arindam and
               Fukumizu, Kenji},
  title     = {Critical Parameters for Scalable Distributed Learning with Large Batches
               and Asynchronous Updates},
  booktitle = {The 24th International Conference on Artificial Intelligence and Statistics,
               {AISTATS} 2021, April 13-15, 2021, Virtual Event},
  series    = {Proceedings of Machine Learning Research},
  volume    = {130},
  pages     = {4042--4050},
  publisher = {{PMLR}},
  year      = {2021},
  url       = {http://proceedings.mlr.press/v130/stich21a.html},
  timestamp = {Wed, 14 Apr 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aistats/StichMJ21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2021 conference paper (PMLR volume 130).
@inproceedings{DBLP:conf/aistats/KovalevKJRS21,
  author    = {Kovalev, Dmitry and
               Koloskova, Anastasia and
               Jaggi, Martin and
               Richt{\'{a}}rik, Peter and
               Stich, Sebastian U.},
  editor    = {Banerjee, Arindam and
               Fukumizu, Kenji},
  title     = {A Linearly Convergent Algorithm for Decentralized Optimization: Sending
               Less Bits for Free!},
  booktitle = {The 24th International Conference on Artificial Intelligence and Statistics,
               {AISTATS} 2021, April 13-15, 2021, Virtual Event},
  series    = {Proceedings of Machine Learning Research},
  volume    = {130},
  pages     = {4087--4095},
  publisher = {{PMLR}},
  year      = {2021},
  url       = {http://proceedings.mlr.press/v130/kovalev21a.html},
  timestamp = {Wed, 14 Apr 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aistats/KovalevKJRS21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Findings of EMNLP 2021 paper.
@inproceedings{DBLP:conf/emnlp/BahrainianJE21,
  author    = {Bahrainian, Seyed Ali and
               Jaggi, Martin and
               Eickhoff, Carsten},
  editor    = {Moens, Marie{-}Francine and
               Huang, Xuanjing and
               Specia, Lucia and
               Yih, Scott Wen{-}tau},
  title     = {Self-Supervised Neural Topic Modeling},
  booktitle = {Findings of the Association for Computational Linguistics: {EMNLP}
               2021, Virtual Event / Punta Cana, Dominican Republic, 16-20 November,
               2021},
  pages     = {3341--3350},
  publisher = {Association for Computational Linguistics},
  year      = {2021},
  url       = {https://doi.org/10.18653/v1/2021.findings-emnlp.284},
  doi       = {10.18653/V1/2021.FINDINGS-EMNLP.284},
  timestamp = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl    = {https://dblp.org/rec/conf/emnlp/BahrainianJE21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% HiPC 2021 conference paper (IEEE).
@inproceedings{DBLP:conf/hipc/WszolaJP21,
  author    = {Wszola, Eliza and
               Jaggi, Martin and
               P{\"{u}}schel, Markus},
  title     = {Faster Parallel Training of Word Embeddings},
  booktitle = {28th {IEEE} International Conference on High Performance Computing,
               Data, and Analytics, HiPC 2021, Bengaluru, India, December 17-20,
               2021},
  pages     = {31--41},
  publisher = {{IEEE}},
  year      = {2021},
  url       = {https://doi.org/10.1109/HiPC53243.2021.00017},
  doi       = {10.1109/HIPC53243.2021.00017},
  timestamp = {Mon, 31 Jan 2022 09:34:30 +0100},
  biburl    = {https://dblp.org/rec/conf/hipc/WszolaJP21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2021 conference paper (IEEE).
@inproceedings{DBLP:conf/iccv/YukselSJC21,
  author    = {Y{\"{u}}ksel, Oguz Kaan and
               Stich, Sebastian U. and
               Jaggi, Martin and
               Chavdarova, Tatjana},
  title     = {Semantic Perturbations with Normalizing Flows for Improved Generalization},
  booktitle = {2021 {IEEE/CVF} International Conference on Computer Vision, {ICCV}
               2021, Montreal, QC, Canada, October 10-17, 2021},
  pages     = {6599--6609},
  publisher = {{IEEE}},
  year      = {2021},
  url       = {https://doi.org/10.1109/ICCV48922.2021.00655},
  doi       = {10.1109/ICCV48922.2021.00655},
  timestamp = {Fri, 11 Mar 2022 10:01:27 +0100},
  biburl    = {https://dblp.org/rec/conf/iccv/YukselSJC21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 conference paper (OpenReview).
@inproceedings{DBLP:conf/iclr/ChavdarovaPSFJ21,
  author       = {Tatjana Chavdarova and
                  Matteo Pagliardini and
                  Sebastian U. Stich and
                  Fran{\c{c}}ois Fleuret and
                  Martin Jaggi},
  title        = {Taming {GANs} with Lookahead-Minmax},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=ZW0yXJyNmoG},
  timestamp    = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/ChavdarovaPSFJ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 conference paper (OpenReview).
@inproceedings{DBLP:conf/iclr/LeeATJ21,
  author    = {Lee, Namhoon and
               Ajanthan, Thalaiyasingam and
               Torr, Philip H. S. and
               Jaggi, Martin},
  title     = {Understanding the effects of data parallelism and sparsity on neural
               network training},
  booktitle = {9th International Conference on Learning Representations, {ICLR} 2021,
               Virtual Event, Austria, May 3-7, 2021},
  publisher = {OpenReview.net},
  year      = {2021},
  url       = {https://openreview.net/forum?id=rsogjAnYs4z},
  timestamp = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/LeeATJ21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 conference paper (PMLR volume 139).
@inproceedings{DBLP:conf/icml/Cherubin0J21,
  author    = {Cherubin, Giovanni and
               Chatzikokolakis, Konstantinos and
               Jaggi, Martin},
  editor    = {Meila, Marina and
               Zhang, Tong},
  title     = {Exact Optimization of Conformal Predictors via Incremental and Decremental
               Learning},
  booktitle = {Proceedings of the 38th International Conference on Machine Learning,
               {ICML} 2021, 18-24 July 2021, Virtual Event},
  series    = {Proceedings of Machine Learning Research},
  volume    = {139},
  pages     = {1836--1845},
  publisher = {{PMLR}},
  year      = {2021},
  url       = {http://proceedings.mlr.press/v139/cherubin21a.html},
  timestamp = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/Cherubin0J21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 conference paper (PMLR volume 139).
@inproceedings{DBLP:conf/icml/KarimireddyHJ21,
  author       = {Sai Praneeth Karimireddy and
                  Lie He and
                  Martin Jaggi},
  editor       = {Marina Meila and
                  Tong Zhang},
  title        = {Learning from History for {Byzantine} Robust Optimization},
  booktitle    = {Proceedings of the 38th International Conference on Machine Learning,
                  {ICML} 2021, 18-24 July 2021, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {139},
  pages        = {5311--5319},
  publisher    = {{PMLR}},
  year         = {2021},
  url          = {http://proceedings.mlr.press/v139/karimireddy21a.html},
  timestamp    = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KarimireddyHJ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/00010KJS21,
  author     = {Kong, Lingjing and
                Lin, Tao and
                Koloskova, Anastasia and
                Jaggi, Martin and
                Stich, Sebastian U.},
  title      = {Consensus Control for Decentralized Deep Learning},
  editor     = {Meila, Marina and
                Zhang, Tong},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning,
                {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {5686--5696},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/kong21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/00010KJS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/0004KSJ21,
  author     = {Lin, Tao and
                Karimireddy, Sai Praneeth and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Quasi-global Momentum: Accelerating Decentralized Deep Learning on
                Heterogeneous Data},
  editor     = {Meila, Marina and
                Zhang, Tong},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning,
                {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {6654--6665},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {http://proceedings.mlr.press/v139/lin21c.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/0004KSJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/micro/DrumondCZYFJ21,
  author     = {Drumond, Mario and
                Coulon, Louis and
                Zarandi, Arash Pourhabibi and
                Y{\"{u}}z{\"{u}}g{\"{u}}ler, Ahmet Caner and
                Falsafi, Babak and
                Jaggi, Martin},
  title      = {Equinox: Training (for Free) on a Custom Inference Accelerator},
  booktitle  = {{MICRO} '21: 54th Annual {IEEE/ACM} International Symposium on Microarchitecture,
                Virtual Event, Greece, October 18-22, 2021},
  pages      = {421--433},
  publisher  = {{ACM}},
  year       = {2021},
  doi        = {10.1145/3466752.3480057},
  url        = {https://doi.org/10.1145/3466752.3480057},
  timestamp  = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/micro/DrumondCZYFJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mobisys/MakhmutovaKFMJC21,
  author     = {Makhmutova, Mariko and
                Kainkaryam, Raghu and
                Ferreira, Marta and
                Min, Jae and
                Jaggi, Martin and
                Clay, Ieuan},
  title      = {Prediction of self-reported depression scores using person-generated
                health data from a virtual 1-year mental health observational study},
  booktitle  = {DigiBiom@MobiSys '21: Proceedings of the 2021 Workshop on Future of
                Digital Biomarkers, Virtual Event, Wisconsin, USA, 25 June, 2021},
  pages      = {4--11},
  publisher  = {{ACM}},
  year       = {2021},
  doi        = {10.1145/3469266.3469878},
  url        = {https://doi.org/10.1145/3469266.3469878},
  timestamp  = {Mon, 26 Jul 2021 11:37:29 +0200},
  biburl     = {https://dblp.org/rec/conf/mobisys/MakhmutovaKFMJC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% RelaySum is brace-protected so sentence-casing styles do not turn it into Relaysum.
% Editor surname is the compound Wortman Vaughan; the comma form keeps it in one piece.
@inproceedings{DBLP:conf/nips/VogelsHKKLSJ21,
  author     = {Vogels, Thijs and
                He, Lie and
                Koloskova, Anastasia and
                Karimireddy, Sai Praneeth and
                Lin, Tao and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {{RelaySum} for Decentralized Deep Learning on Heterogeneous Data},
  editor     = {Ranzato, Marc'Aurelio and
                Beygelzimer, Alina and
                Dauphin, Yann N. and
                Liang, Percy and
                Wortman Vaughan, Jennifer},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference
                on Neural Information Processing Systems 2021, NeurIPS 2021, December
                6-14, 2021, virtual},
  pages      = {28004--28015},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/ebbdfea212e3a756a1fded7b35578525-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/VogelsHKKLSJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Editor surname is the compound Wortman Vaughan; the comma form keeps it in one piece
% (First-Last order would parse Wortman as a given name).
@inproceedings{DBLP:conf/nips/KarimireddyJKMR21,
  author     = {Karimireddy, Sai Praneeth and
                Jaggi, Martin and
                Kale, Satyen and
                Mohri, Mehryar and
                Reddi, Sashank J. and
                Stich, Sebastian U. and
                Suresh, Ananda Theertha},
  title      = {Breaking the centralized barrier for cross-device federated learning},
  editor     = {Ranzato, Marc'Aurelio and
                Beygelzimer, Alina and
                Dauphin, Yann N. and
                Liang, Percy and
                Wortman Vaughan, Jennifer},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference
                on Neural Information Processing Systems 2021, NeurIPS 2021, December
                6-14, 2021, virtual},
  pages      = {28663--28676},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/f0e6be4ce76ccfa73c5a540d992d0756-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/KarimireddyJKMR21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-03236,
  author     = {Cherubin, Giovanni and
                Chatzikokolakis, Konstantinos and
                Jaggi, Martin},
  title      = {Exact Optimization of Conformal Predictors via Incremental and Decremental
                Learning},
  journal    = {CoRR},
  volume     = {abs/2102.03236},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2102.03236},
  url        = {https://arxiv.org/abs/2102.03236},
  timestamp  = {Wed, 10 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-03236.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-04761,
  author     = {Lin, Tao and
                Karimireddy, Sai Praneeth and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Quasi-Global Momentum: Accelerating Decentralized Deep Learning on
                Heterogeneous Data},
  journal    = {CoRR},
  volume     = {abs/2102.04761},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2102.04761},
  url        = {https://arxiv.org/abs/2102.04761},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-04761.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2102-04828,
  author     = {Kong, Lingjing and
                Lin, Tao and
                Koloskova, Anastasia and
                Jaggi, Martin and
                Stich, Sebastian U.},
  title      = {Consensus Control for Decentralized Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2102.04828},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2102.04828},
  url        = {https://arxiv.org/abs/2102.04828},
  timestamp  = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-04828.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2103-02351,
  author     = {Stich, Sebastian U. and
                Mohtashami, Amirkeivan and
                Jaggi, Martin},
  title      = {Critical Parameters for Scalable Distributed Learning with Large Batches
                and Asynchronous Updates},
  journal    = {CoRR},
  volume     = {abs/2103.02351},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2103.02351},
  url        = {https://arxiv.org/abs/2103.02351},
  timestamp  = {Thu, 04 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-02351.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IoT is brace-protected so sentence-casing styles keep its mixed case.
% Two authors carry compound Spanish surnames (two family names each); the comma form
% keeps both words in the Last part instead of folding the first one into the given names.
@article{DBLP:journals/corr/abs-2104-09994,
  author     = {Rey, Valerian and
                S{\'{a}}nchez S{\'{a}}nchez, Pedro Miguel and
                Huertas Celdr{\'{a}}n, Alberto and
                Bovet, G{\'{e}}r{\^{o}}me and
                Jaggi, Martin},
  title      = {Federated Learning for Malware Detection in {IoT} Devices},
  journal    = {CoRR},
  volume     = {abs/2104.09994},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2104.09994},
  url        = {https://arxiv.org/abs/2104.09994},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-09994.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2105-13856,
  author     = {Mao, Zhuoyuan and
                Gupta, Prakhar and
                Chu, Chenhui and
                Jaggi, Martin and
                Kurohashi, Sadao},
  title      = {Lightweight Cross-Lingual Sentence Representation Learning},
  journal    = {CoRR},
  volume     = {abs/2105.13856},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2105.13856},
  url        = {https://arxiv.org/abs/2105.13856},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-13856.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-04302,
  author     = {Gupta, Prakhar and
                Jaggi, Martin},
  title      = {Obtaining Better Static Word Embeddings Using Contextual Embedding
                Models},
  journal    = {CoRR},
  volume     = {abs/2106.04302},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2106.04302},
  url        = {https://arxiv.org/abs/2106.04302},
  timestamp  = {Fri, 11 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-04302.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-08895,
  author     = {Mohtashami, Amirkeivan and
                Jaggi, Martin and
                Stich, Sebastian U.},
  title      = {Simultaneous Training of Partially Masked Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2106.08895},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2106.08895},
  url        = {https://arxiv.org/abs/2106.08895},
  timestamp  = {Tue, 29 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-08895.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2106-13897,
  author     = {Dandi, Yatin and
                Barba, Luis and
                Jaggi, Martin},
  title      = {Implicit Gradient Alignment in Distributed and Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2106.13897},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2106.13897},
  url        = {https://arxiv.org/abs/2106.13897},
  timestamp  = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-13897.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% IFedAvg is brace-protected so sentence-casing styles do not turn it into Ifedavg.
@article{DBLP:journals/corr/abs-2107-06580,
  author     = {Roschewitz, David and
                Hartley, Mary{-}Anne and
                Corinzia, Luca and
                Jaggi, Martin},
  title      = {{IFedAvg}: Interpretable Data-Interoperability for Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2107.06580},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2107.06580},
  url        = {https://arxiv.org/abs/2107.06580},
  timestamp  = {Wed, 21 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-06580.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% The surname of Blaise Aguera y Arcas is braced as one unit: in First-Last order the
% lowercase y is parsed as a von particle, which leaves only Arcas as the last name.
% The acute accent in Konecny now uses the same inner-brace form as every other accent here.
@article{DBLP:journals/corr/abs-2107-06917,
  author     = {Wang, Jianyu and
                Charles, Zachary and
                Xu, Zheng and
                Joshi, Gauri and
                McMahan, H. Brendan and
                {Ag{\"{u}}era y Arcas}, Blaise and
                Al{-}Shedivat, Maruan and
                Andrew, Galen and
                Avestimehr, Salman and
                Daly, Katharine and
                Data, Deepesh and
                Diggavi, Suhas N. and
                Eichner, Hubert and
                Gadhikar, Advait and
                Garrett, Zachary and
                Girgis, Antonious M. and
                Hanzely, Filip and
                Hard, Andrew and
                He, Chaoyang and
                Horv{\'{a}}th, Samuel and
                Huo, Zhouyuan and
                Ingerman, Alex and
                Jaggi, Martin and
                Javidi, Tara and
                Kairouz, Peter and
                Kale, Satyen and
                Karimireddy, Sai Praneeth and
                Kone{\v{c}}n{\'{y}}, Jakub and
                Koyejo, Sanmi and
                Li, Tian and
                Liu, Luyang and
                Mohri, Mehryar and
                Qi, Hang and
                Reddi, Sashank J. and
                Richt{\'{a}}rik, Peter and
                Singhal, Karan and
                Smith, Virginia and
                Soltanolkotabi, Mahdi and
                Song, Weikang and
                Suresh, Ananda Theertha and
                Stich, Sebastian U. and
                Talwalkar, Ameet and
                Wang, Hongyi and
                Woodworth, Blake E. and
                Wu, Shanshan and
                Yu, Felix X. and
                Yuan, Honglin and
                Zaheer, Manzil and
                Zhang, Mi and
                Zhang, Tong and
                Zheng, Chunxiang and
                Zhu, Chen and
                Zhu, Wennan},
  title      = {A Field Guide to Federated Optimization},
  journal    = {CoRR},
  volume     = {abs/2107.06917},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2107.06917},
  url        = {https://arxiv.org/abs/2107.06917},
  timestamp  = {Wed, 06 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-06917.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2108-07958,
  author     = {Y{\"{u}}ksel, Oguz Kaan and
                Stich, Sebastian U. and
                Jaggi, Martin and
                Chavdarova, Tatjana},
  title      = {Semantic Perturbations with Normalizing Flows for Improved Generalization},
  journal    = {CoRR},
  volume     = {abs/2108.07958},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2108.07958},
  url        = {https://arxiv.org/abs/2108.07958},
  timestamp  = {Mon, 23 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-07958.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2109-02388,
  author     = {Bischoff, Sebastian and
                G{\"{u}}nnemann, Stephan and
                Jaggi, Martin and
                Stich, Sebastian U.},
  title      = {On Second-order Optimization Methods for Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2109.02388},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2109.02388},
  url        = {https://arxiv.org/abs/2109.02388},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-02388.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% RelaySum is brace-protected so sentence-casing styles do not turn it into Relaysum.
@article{DBLP:journals/corr/abs-2110-04175,
  author     = {Vogels, Thijs and
                He, Lie and
                Koloskova, Anastasia and
                Lin, Tao and
                Karimireddy, Sai Praneeth and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {{RelaySum} for Decentralized Deep Learning on Heterogeneous Data},
  journal    = {CoRR},
  volume     = {abs/2110.04175},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.04175},
  url        = {https://arxiv.org/abs/2110.04175},
  timestamp  = {Thu, 21 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-04175.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2110-06978,
  author     = {Beaussart, Martin and
                Grimberg, Felix and
                Hartley, Mary{-}Anne and
                Jaggi, Martin},
  title      = {{WAFFLE:} Weighted Averaging for Personalized Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2110.06978},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.06978},
  url        = {https://arxiv.org/abs/2110.06978},
  timestamp  = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-06978.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2110-12946,
  author     = {Grimberg, Felix and
                Hartley, Mary{-}Anne and
                Karimireddy, Sai Praneeth and
                Jaggi, Martin},
  title      = {Optimal Model Averaging: Towards Personalized Collaborative Learning},
  journal    = {CoRR},
  volume     = {abs/2110.12946},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.12946},
  url        = {https://arxiv.org/abs/2110.12946},
  timestamp  = {Thu, 28 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-12946.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2111-05968,
  author     = {Chayti, El Mahdi and
                Karimireddy, Sai Praneeth and
                Stich, Sebastian U. and
                Flammarion, Nicolas and
                Jaggi, Martin},
  title      = {Linear Speedup in Personalized Collaborative Learning},
  journal    = {CoRR},
  volume     = {abs/2111.05968},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2111.05968},
  url        = {https://arxiv.org/abs/2111.05968},
  timestamp  = {Tue, 16 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-05968.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2111-08546,
  author     = {Swamy, Vinitra and
                Romanou, Angelika and
                Jaggi, Martin},
  title      = {Interpreting Language Models Through Knowledge Graph Extraction},
  journal    = {CoRR},
  volume     = {abs/2111.08546},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2111.08546},
  url        = {https://arxiv.org/abs/2111.08546},
  timestamp  = {Mon, 22 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-08546.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-08798,
  author     = {Liu, Futong and
                Lin, Tao and
                Jaggi, Martin},
  title      = {Understanding Memorization from the Perspective of Optimization via
                Efficient Influence Estimation},
  journal    = {CoRR},
  volume     = {abs/2112.08798},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2112.08798},
  url        = {https://arxiv.org/abs/2112.08798},
  timestamp  = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2112-08798.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Frank-Wolfe (a proper-noun algorithm name) is brace-protected so sentence-casing
% styles keep both capitals.
@inproceedings{DBLP:conf/aistats/PedregosaNAJ20,
  author     = {Pedregosa, Fabian and
                N{\'{e}}giar, Geoffrey and
                Askari, Armin and
                Jaggi, Martin},
  title      = {Linearly Convergent {Frank-Wolfe} without Line-Search},
  editor     = {Chiappa, Silvia and
                Calandra, Roberto},
  booktitle  = {The 23rd International Conference on Artificial Intelligence and Statistics,
                {AISTATS} 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]},
  series     = {Proceedings of Machine Learning Research},
  volume     = {108},
  pages      = {1--10},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v108/pedregosa20a.html},
  timestamp  = {Mon, 29 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/PedregosaNAJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/SinghHDJ20,
  author     = {Singh, Sidak Pal and
                Hug, Andreas and
                Dieuleveut, Aymeric and
                Jaggi, Martin},
  title      = {Context Mover's Distance {\&} Barycenters: Optimal Transport of
                Contexts for Building Representations},
  editor     = {Chiappa, Silvia and
                Calandra, Roberto},
  booktitle  = {The 23rd International Conference on Artificial Intelligence and Statistics,
                {AISTATS} 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]},
  series     = {Proceedings of Machine Learning Research},
  volume     = {108},
  pages      = {3437--3449},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v108/singh20a.html},
  timestamp  = {Mon, 29 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/SinghHDJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/emnlp/ZhaoLMJS20,
  author     = {Zhao, Mengjie and
                Lin, Tao and
                Mi, Fei and
                Jaggi, Martin and
                Sch{\"{u}}tze, Hinrich},
  title      = {Masking as an Efficient Alternative to Finetuning for Pretrained Language
                Models},
  editor     = {Webber, Bonnie and
                Cohn, Trevor and
                He, Yulan and
                Liu, Yang},
  booktitle  = {Proceedings of the 2020 Conference on Empirical Methods in Natural
                Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages      = {2226--2241},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  doi        = {10.18653/V1/2020.EMNLP-MAIN.174},
  url        = {https://doi.org/10.18653/v1/2020.emnlp-main.174},
  timestamp  = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ZhaoLMJS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/CordonnierLJ20,
  author     = {Cordonnier, Jean{-}Baptiste and
                Loukas, Andreas and
                Jaggi, Martin},
  title      = {On the Relationship between Self-Attention and Convolutional Layers},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=HJlnC1rKPB},
  timestamp  = {Thu, 07 May 2020 17:11:47 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/CordonnierLJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/KoloskovaLSJ20,
  author     = {Koloskova, Anastasia and
                Lin, Tao and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Decentralized Deep Learning with Arbitrary Communication Compression},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=SkgGCkrKvH},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/KoloskovaLSJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/LinSBDJ20,
  author     = {Lin, Tao and
                Stich, Sebastian U. and
                Barba, Luis and
                Dmitriev, Daniil and
                Jaggi, Martin},
  title      = {Dynamic Model Pruning with Feedback},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=SJem8lSFwB},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/LinSBDJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/LinSPJ20,
  author     = {Lin, Tao and
                Stich, Sebastian U. and
                Patel, Kumar Kshitij and
                Jaggi, Martin},
  title      = {Don't Use Large Mini-batches, Use Local {SGD}},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=B1eyO1BFPr},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/LinSPJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/YuSJMS20,
  author     = {Yu, Kaicheng and
                Sciuto, Christian and
                Jaggi, Martin and
                Musat, Claudiu and
                Salzmann, Mathieu},
  title      = {Evaluating The Search Phase of Neural Architecture Search},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020,
                Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=H1loF2NFwr},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/YuSJMS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/KoloskovaLBJS20,
  author     = {Koloskova, Anastasia and
                Loizou, Nicolas and
                Boreiri, Sadra and
                Jaggi, Martin and
                Stich, Sebastian U.},
  title      = {A Unified Theory of Decentralized {SGD} with Changing Topology and
                Local Updates},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning,
                {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {5381--5393},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/koloskova20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/KoloskovaLBJS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/LinKSJ20,
  author     = {Lin, Tao and
                Kong, Lingjing and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Extrapolation for Large-batch Training in Deep Learning},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning,
                {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {6094--6104},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/lin20b.html},
  timestamp  = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LinKSJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/SivaprasadMVJF20,
  author     = {Sivaprasad, Prabhu Teja and
                Mai, Florian and
                Vogels, Thijs and
                Jaggi, Martin and
                Fleuret, Fran{\c{c}}ois},
  title      = {Optimizer Benchmarking Needs to Account for Hyperparameter Tuning},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning,
                {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {9036--9045},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {http://proceedings.mlr.press/v119/sivaprasad20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/SivaprasadMVJF20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% doi and url hold the raw identifier with a plain underscore: these fields are typeset
% verbatim by url-aware styles and biblatex, where a backslash-escaped underscore would
% end up inside the link target and break it.
@inproceedings{DBLP:conf/miccai/GrimbergHJK20,
  author     = {Grimberg, Felix and
                Hartley, Mary{-}Anne and
                Jaggi, Martin and
                Karimireddy, Sai Praneeth},
  title      = {Weight Erosion: An Update Aggregation Scheme for Personalized Collaborative
                Machine Learning},
  editor     = {Albarqouni, Shadi and
                Bakas, Spyridon and
                Kamnitsas, Konstantinos and
                Cardoso, M. Jorge and
                Landman, Bennett A. and
                Li, Wenqi and
                Milletari, Fausto and
                Rieke, Nicola and
                Roth, Holger and
                Xu, Daguang and
                Xu, Ziyue},
  booktitle  = {Domain Adaptation and Representation Transfer, and Distributed and
                Collaborative Learning - Second {MICCAI} Workshop, {DART} 2020, and
                First {MICCAI} Workshop, {DCL} 2020, Held in Conjunction with {MICCAI}
                2020, Lima, Peru, October 4-8, 2020, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {12444},
  pages      = {160--169},
  publisher  = {Springer},
  year       = {2020},
  doi        = {10.1007/978-3-030-60548-3_16},
  url        = {https://doi.org/10.1007/978-3-030-60548-3_16},
  timestamp  = {Tue, 19 Jul 2022 10:23:16 +0200},
  biburl     = {https://dblp.org/rec/conf/miccai/GrimbergHJK20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/LinKSJ20,
  author       = {Lin, Tao and
                  Kong, Lingjing and
                  Stich, Sebastian U. and
                  Jaggi, Martin},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Ensemble Distillation for Robust Model Fusion in Federated Learning},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, NeurIPS 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/18df51b97ccd68128e994804f3eccc87-Abstract.html},
  timestamp    = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/LinKSJ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/SinghJ20,
  author       = {Singh, Sidak Pal and
                  Jaggi, Martin},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Model Fusion via Optimal Transport},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, NeurIPS 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/fb2697869f56484404c8ceee2985b01d-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/SinghJ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/VogelsKJ20,
  author       = {Vogels, Thijs and
                  Karimireddy, Sai Praneeth and
                  Jaggi, Martin},
  editor       = {Larochelle, Hugo and
                  Ranzato, Marc'Aurelio and
                  Hadsell, Raia and
                  Balcan, Maria{-}Florina and
                  Lin, Hsuan{-}Tien},
  title        = {Practical Low-Rank Communication Compression in Decentralized Deep
                  Learning},
  booktitle    = {Advances in Neural Information Processing Systems 33: Annual Conference
                  on Neural Information Processing Systems 2020, NeurIPS 2020, December
                  6-12, 2020, virtual},
  year         = {2020},
  url          = {https://proceedings.neurips.cc/paper/2020/hash/a376802c0811f1b9088828288eb0d3f0-Abstract.html},
  timestamp    = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/VogelsKJ20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-10422,
  author       = {Koloskova, Anastasia and
                  Loizou, Nicolas and
                  Boreiri, Sadra and
                  Jaggi, Martin and
                  Stich, Sebastian U.},
  title        = {A Unified Theory of Decentralized {SGD} with Changing Topology and
                  Local Updates},
  journal      = {CoRR},
  volume       = {abs/2003.10422},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.10422},
  eprinttype   = {arXiv},
  eprint       = {2003.10422},
  timestamp    = {Tue, 24 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-10422.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-11316,
  author       = {Lee, Namhoon and
                  Torr, Philip H. S. and
                  Jaggi, Martin},
  title        = {Data Parallelism in Training Sparse Neural Networks},
  journal      = {CoRR},
  volume       = {abs/2003.11316},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.11316},
  eprinttype   = {arXiv},
  eprint       = {2003.11316},
  timestamp    = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-11316.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2004-12406,
  author       = {Zhao, Mengjie and
                  Lin, Tao and
                  Jaggi, Martin and
                  Sch{\"{u}}tze, Hinrich},
  title        = {Masking as an Efficient Alternative to Finetuning for Pretrained Language
                  Models},
  journal      = {CoRR},
  volume       = {abs/2004.12406},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.12406},
  eprinttype   = {arXiv},
  eprint       = {2004.12406},
  timestamp    = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-12406.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-04747,
  author       = {Lie He and
                  Sai Praneeth Karimireddy and
                  Martin Jaggi},
  title        = {Secure {Byzantine}-Robust Machine Learning},
  journal      = {CoRR},
  volume       = {abs/2006.04747},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.04747},
  eprinttype   = {arXiv},
  eprint       = {2006.04747},
  timestamp    = {Fri, 12 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-04747.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-05720,
  author       = {Lin, Tao and
                  Kong, Lingjing and
                  Stich, Sebastian U. and
                  Jaggi, Martin},
  title        = {Extrapolation for Large-batch Training in Deep Learning},
  journal      = {CoRR},
  volume       = {abs/2006.05720},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.05720},
  eprinttype   = {arXiv},
  eprint       = {2006.05720},
  timestamp    = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-05720.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-07242,
  author       = {Lin, Tao and
                  Kong, Lingjing and
                  Stich, Sebastian U. and
                  Jaggi, Martin},
  title        = {Ensemble Distillation for Robust Model Fusion in Federated Learning},
  journal      = {CoRR},
  volume       = {abs/2006.07242},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.07242},
  eprinttype   = {arXiv},
  eprint       = {2006.07242},
  timestamp    = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-07242.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-07253,
  author       = {Lin, Tao and
                  Stich, Sebastian U. and
                  Barba, Luis and
                  Dmitriev, Daniil and
                  Jaggi, Martin},
  title        = {Dynamic Model Pruning with Feedback},
  journal      = {CoRR},
  volume       = {abs/2006.07253},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.07253},
  eprinttype   = {arXiv},
  eprint       = {2006.07253},
  timestamp    = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-07253.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-09365,
  author       = {He, Lie and
                  Karimireddy, Sai Praneeth and
                  Jaggi, Martin},
  title        = {Byzantine-Robust Learning on Heterogeneous Datasets via Resampling},
  journal      = {CoRR},
  volume       = {abs/2006.09365},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.09365},
  eprinttype   = {arXiv},
  eprint       = {2006.09365},
  timestamp    = {Wed, 17 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-09365.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-14567,
  author       = {Tatjana Chavdarova and
                  Matteo Pagliardini and
                  Martin Jaggi and
                  Fran{\c{c}}ois Fleuret},
  title        = {Taming {GANs} with Lookahead},
  journal      = {CoRR},
  volume       = {abs/2006.14567},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.14567},
  eprinttype   = {arXiv},
  eprint       = {2006.14567},
  timestamp    = {Thu, 02 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-14567.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-16362,
  author       = {Cordonnier, Jean{-}Baptiste and
                  Loukas, Andreas and
                  Jaggi, Martin},
  title        = {Multi-Head Attention: Collaborate Instead of Concatenate},
  journal      = {CoRR},
  volume       = {abs/2006.16362},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.16362},
  eprinttype   = {arXiv},
  eprint       = {2006.16362},
  timestamp    = {Thu, 02 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-16362.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-01425,
  author       = {Thijs Vogels and
                  Sai Praneeth Karimireddy and
                  Martin Jaggi},
  title        = {{PowerGossip}: Practical Low-Rank Communication Compression in Decentralized
                  Deep Learning},
  journal      = {CoRR},
  volume       = {abs/2008.01425},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.01425},
  eprinttype   = {arXiv},
  eprint       = {2008.01425},
  timestamp    = {Fri, 07 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-01425.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2008-03606,
  author       = {Karimireddy, Sai Praneeth and
                  Jaggi, Martin and
                  Kale, Satyen and
                  Mohri, Mehryar and
                  Reddi, Sashank J. and
                  Stich, Sebastian U. and
                  Suresh, Ananda Theertha},
  title        = {Mime: Mimicking Centralized Stochastic Algorithms in Federated Learning},
  journal      = {CoRR},
  volume       = {abs/2008.03606},
  year         = {2020},
  url          = {https://arxiv.org/abs/2008.03606},
  eprinttype   = {arXiv},
  eprint       = {2008.03606},
  timestamp    = {Fri, 14 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2008-03606.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2009-09271,
  author       = {Eghlidi, Negar Foroutan and
                  Jaggi, Martin},
  title        = {Sparse Communication for Training Deep Networks},
  journal      = {CoRR},
  volume       = {abs/2009.09271},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.09271},
  eprinttype   = {arXiv},
  eprint       = {2009.09271},
  timestamp    = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-09271.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2011-01697,
  author       = {Kovalev, Dmitry and
                  Koloskova, Anastasia and
                  Jaggi, Martin and
                  Richt{\'{a}}rik, Peter and
                  Stich, Sebastian U.},
  title        = {A Linearly Convergent Algorithm for Decentralized Optimization: Sending
                  Less Bits for Free!},
  journal      = {CoRR},
  volume       = {abs/2011.01697},
  year         = {2020},
  url          = {https://arxiv.org/abs/2011.01697},
  eprinttype   = {arXiv},
  eprint       = {2011.01697},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2011-01697.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2012-10333,
  author       = {Sai Praneeth Karimireddy and
                  Lie He and
                  Martin Jaggi},
  title        = {Learning from History for {Byzantine} Robust Optimization},
  journal      = {CoRR},
  volume       = {abs/2012.10333},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.10333},
  eprinttype   = {arXiv},
  eprint       = {2012.10333},
  timestamp    = {Mon, 04 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-10333.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/mfc/LangovoyGJ19,
  author       = {Mikhail A. Langovoy and
                  Akhilesh Gotmare and
                  Martin Jaggi},
  title        = {Unsupervised robust nonparametric learning of hidden community properties},
  journal      = {Mathematical Foundations of Computing},
  volume       = {2},
  number       = {2},
  pages        = {127--147},
  year         = {2019},
  url          = {https://doi.org/10.3934/mfc.2019010},
  doi          = {10.3934/MFC.2019010},
  timestamp    = {Tue, 14 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/mfc/LangovoyGJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aistats/KarimireddyKSJ19,
  author       = {Karimireddy, Sai Praneeth and
                  Koloskova, Anastasia and
                  Stich, Sebastian U. and
                  Jaggi, Martin},
  editor       = {Chaudhuri, Kamalika and
                  Sugiyama, Masashi},
  title        = {Efficient Greedy Coordinate Descent for Composite Problems},
  booktitle    = {The 22nd International Conference on Artificial Intelligence and Statistics,
                  {AISTATS} 2019, 16-18 April 2019, Naha, Okinawa, Japan},
  series       = {Proceedings of Machine Learning Research},
  volume       = {89},
  pages        = {2887--2896},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v89/karimireddy19a.html},
  timestamp    = {Fri, 07 Jun 2019 09:03:47 +0200},
  biburl       = {https://dblp.org/rec/conf/aistats/KarimireddyKSJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/hipc/WszolaMJP19,
  author       = {Wszola, Eliza and
                  Mendler{-}D{\"{u}}nner, Celestine and
                  Jaggi, Martin and
                  P{\"{u}}schel, Markus},
  title        = {On Linear Learning with Manycore Processors},
  booktitle    = {26th {IEEE} International Conference on High Performance Computing,
                  Data, and Analytics, HiPC 2019, Hyderabad, India, December 17-20,
                  2019},
  pages        = {184--194},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/HiPC.2019.00032},
  doi          = {10.1109/HIPC.2019.00032},
  timestamp    = {Thu, 20 Feb 2020 16:19:46 +0100},
  biburl       = {https://dblp.org/rec/conf/hipc/WszolaMJP19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/SinghHDJ19,
  author       = {Singh, Sidak Pal and
                  Hug, Andreas and
                  Dieuleveut, Aymeric and
                  Jaggi, Martin},
  title        = {Context Mover's Distance {\&} Barycenters: Optimal transport of
                  contexts for building representations},
  booktitle    = {Deep Generative Models for Highly Structured Data, {ICLR} 2019 Workshop,
                  New Orleans, Louisiana, United States, May 6, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=rygiEL8FOV},
  timestamp    = {Thu, 25 Jul 2019 16:26:32 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/SinghHDJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/BenyahiaYBJDSM19,
  author       = {Benyahia, Yassine and
                  Yu, Kaicheng and
                  Bennani{-}Smires, Kamil and
                  Jaggi, Martin and
                  Davison, Anthony C. and
                  Salzmann, Mathieu and
                  Musat, Claudiu},
  editor       = {Chaudhuri, Kamalika and
                  Salakhutdinov, Ruslan},
  title        = {Overcoming Multi-model Forgetting},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {594--603},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/benyahia19a.html},
  timestamp    = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/BenyahiaYBJDSM19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/KarimireddyRSJ19,
  author       = {Sai Praneeth Karimireddy and
                  Quentin Rebjock and
                  Sebastian U. Stich and
                  Martin Jaggi},
  editor       = {Kamalika Chaudhuri and
                  Ruslan Salakhutdinov},
  title        = {Error Feedback Fixes {SignSGD} and other Gradient Compression Schemes},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {3252--3261},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/karimireddy19a.html},
  timestamp    = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KarimireddyRSJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/KoloskovaSJ19,
  author       = {Koloskova, Anastasia and
                  Stich, Sebastian U. and
                  Jaggi, Martin},
  editor       = {Chaudhuri, Kamalika and
                  Salakhutdinov, Ruslan},
  title        = {Decentralized Stochastic Optimization and Gossip Algorithms with Compressed
                  Communication},
  booktitle    = {Proceedings of the 36th International Conference on Machine Learning,
                  {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {97},
  pages        = {3478--3487},
  publisher    = {{PMLR}},
  year         = {2019},
  url          = {http://proceedings.mlr.press/v97/koloskova19a.html},
  timestamp    = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/KoloskovaSJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/interspeech/SacchiNJC19,
  author       = {Sacchi, Niccol{\`{o}} and
                  Nanchen, Alexandre and
                  Jaggi, Martin and
                  Cernak, Milos},
  editor       = {Kubin, Gernot and
                  Kacic, Zdravko},
  title        = {Open-Vocabulary Keyword Spotting with Audio and Text Embeddings},
  booktitle    = {Interspeech 2019, 20th Annual Conference of the International Speech
                  Communication Association, Graz, Austria, 15-19 September 2019},
  pages        = {3362--3366},
  publisher    = {{ISCA}},
  year         = {2019},
  url          = {https://doi.org/10.21437/Interspeech.2019-1846},
  doi          = {10.21437/INTERSPEECH.2019-1846},
  timestamp    = {Fri, 29 Jan 2021 17:41:10 +0100},
  biburl       = {https://dblp.org/rec/conf/interspeech/SacchiNJC19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/naacl/GuptaPJ19,
  author       = {Gupta, Prakhar and
                  Pagliardini, Matteo and
                  Jaggi, Martin},
  editor       = {Burstein, Jill and
                  Doran, Christy and
                  Solorio, Thamar},
  title        = {Better Word Embeddings by Disentangling Contextual n-Gram Information},
  booktitle    = {Proceedings of the 2019 Conference of the North American Chapter of
                  the Association for Computational Linguistics: Human Language Technologies,
                  {NAACL-HLT} 2019, Minneapolis, MN, USA, June 2-7, 2019, Volume 1 (Long
                  and Short Papers)},
  pages        = {933--939},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/n19-1098},
  doi          = {10.18653/V1/N19-1098},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/naacl/GuptaPJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/FranceschiDJ19,
  author       = {Franceschi, Jean{-}Yves and
                  Dieuleveut, Aymeric and
                  Jaggi, Martin},
  editor       = {Wallach, Hanna M. and
                  Larochelle, Hugo and
                  Beygelzimer, Alina and
                  d'Alch{\'{e}}{-}Buc, Florence and
                  Fox, Emily B. and
                  Garnett, Roman},
  title        = {Unsupervised Scalable Representation Learning for Multivariate Time
                  Series},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, NeurIPS 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {4652--4663},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/53c6de78244e9f528eb3e1cda69699bb-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/FranceschiDJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/nips/VogelsKJ19,
  author       = {Thijs Vogels and
                  Sai Praneeth Karimireddy and
                  Martin Jaggi},
  editor       = {Hanna M. Wallach and
                  Hugo Larochelle and
                  Alina Beygelzimer and
                  Florence d'Alch{\'{e}}{-}Buc and
                  Emily B. Fox and
                  Roman Garnett},
  title        = {{PowerSGD}: Practical Low-Rank Gradient Compression for Distributed
                  Optimization},
  booktitle    = {Advances in Neural Information Processing Systems 32: Annual Conference
                  on Neural Information Processing Systems 2019, NeurIPS 2019, December
                  8-14, 2019, Vancouver, BC, Canada},
  pages        = {14236--14245},
  year         = {2019},
  url          = {https://proceedings.neurips.cc/paper/2019/hash/d9fbed9da256e344c1fa46bb46c34c5f-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/VogelsKJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/smm4h/SchneuwlyGLCJ19,
  author       = {Arno Schneuwly and
                  Ralf Grubenmann and
                  S{\'{e}}verine Rion Logean and
                  Mark Cieliebak and
                  Martin Jaggi},
  editor       = {Davy Weissenbacher and
                  Graciela Gonzalez{-}Hernandez},
  title        = {Correlating {Twitter} Language with Community-Level Health Outcomes},
  booktitle    = {Proceedings of the Fourth Social Media Mining for Health Application
                  Workshop {\&} Shared Task, SMM4H@ACL 2019, Florence, Italy, August
                  2, 2019},
  pages        = {71--78},
  publisher    = {Association for Computational Linguistics},
  year         = {2019},
  url          = {https://doi.org/10.18653/v1/W19-3210},
  doi          = {10.18653/V1/W19-3210},
  timestamp    = {Mon, 22 Apr 2024 17:02:59 +0200},
  biburl       = {https://dblp.org/rec/conf/smm4h/SchneuwlyGLCJ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/wsdm/JosifoskiPPJ019,
  author       = {Josifoski, Martin and
                  Paskov, Ivan S. and
                  Paskov, Hristo S. and
                  Jaggi, Martin and
                  West, Robert},
  editor       = {Culpepper, J. Shane and
                  Moffat, Alistair and
                  Bennett, Paul N. and
                  Lerman, Kristina},
  title        = {Crosslingual Document Embedding as Reduced-Rank Ridge Regression},
  booktitle    = {Proceedings of the Twelfth {ACM} International Conference on Web Search
                  and Data Mining, {WSDM} 2019, Melbourne, VIC, Australia, February
                  11-15, 2019},
  pages        = {744--752},
  publisher    = {{ACM}},
  year         = {2019},
  url          = {https://doi.org/10.1145/3289600.3291023},
  doi          = {10.1145/3289600.3291023},
  timestamp    = {Sat, 30 May 2020 20:02:29 +0200},
  biburl       = {https://dblp.org/rec/conf/wsdm/JosifoskiPPJ019.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1901-09847,
  author       = {Sai Praneeth Karimireddy and
                  Quentin Rebjock and
                  Sebastian U. Stich and
                  Martin Jaggi},
  title        = {Error Feedback Fixes {SignSGD} and other Gradient Compression Schemes},
  journal      = {CoRR},
  volume       = {abs/1901.09847},
  year         = {2019},
  url          = {http://arxiv.org/abs/1901.09847},
  eprinttype   = {arXiv},
  eprint       = {1901.09847},
  timestamp    = {Sat, 02 Feb 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-09847.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1901-10738,
  author       = {Franceschi, Jean{-}Yves and
                  Dieuleveut, Aymeric and
                  Jaggi, Martin},
  title        = {Unsupervised Scalable Representation Learning for Multivariate Time
                  Series},
  journal      = {CoRR},
  volume       = {abs/1901.10738},
  year         = {2019},
  url          = {http://arxiv.org/abs/1901.10738},
  eprinttype   = {arXiv},
  eprint       = {1901.10738},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-10738.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1902-00340,
  author       = {Koloskova, Anastasia and
                  Stich, Sebastian U. and
                  Jaggi, Martin},
  title        = {Decentralized Stochastic Optimization and Gossip Algorithms with Compressed
                  Communication},
  journal      = {CoRR},
  volume       = {abs/1902.00340},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.00340},
  eprinttype   = {arXiv},
  eprint       = {1902.00340},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-00340.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1902-08142,
  author       = {Sciuto, Christian and
                  Yu, Kaicheng and
                  Jaggi, Martin and
                  Musat, Claudiu and
                  Salzmann, Mathieu},
  title        = {Evaluating the Search Phase of Neural Architecture Search},
  journal      = {CoRR},
  volume       = {abs/1902.08142},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.08142},
  eprinttype   = {arXiv},
  eprint       = {1902.08142},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-08142.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1902-08232,
  author       = {Benyahia, Yassine and
                  Yu, Kaicheng and
                  Bennani{-}Smires, Kamil and
                  Jaggi, Martin and
                  Davison, Anthony C. and
                  Salzmann, Mathieu and
                  Musat, Claudiu},
  title        = {Overcoming Multi-Model Forgetting},
  journal      = {CoRR},
  volume       = {abs/1902.08232},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.08232},
  eprinttype   = {arXiv},
  eprint       = {1902.08232},
  timestamp    = {Thu, 06 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-08232.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1902-09499,
  author       = {Matthias H{\"{u}}ser and
                  Adrian K{\"{u}}ndig and
                  Walter Karlen and
                  De Luca, Valeria and
                  Martin Jaggi},
  title        = {Forecasting intracranial hypertension using multi-scale waveform metrics},
  journal      = {CoRR},
  volume       = {abs/1902.09499},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.09499},
  eprinttype   = {arXiv},
  eprint       = {1902.09499},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-09499.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1902-09713,
  author       = {Khalil Mrini and
                  Claudiu Musat and
                  Michael Baeriswyl and
                  Martin Jaggi},
  title        = {Structure {Tree-LSTM}: Structure-aware Attentional Document Encoders},
  journal      = {CoRR},
  volume       = {abs/1902.09713},
  year         = {2019},
  url          = {http://arxiv.org/abs/1902.09713},
  eprinttype   = {arXiv},
  eprint       = {1902.09713},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-09713.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1904-03257,
  author       = {Alexander Ratner and
                  Dan Alistarh and
                  Gustavo Alonso and
                  David G. Andersen and
                  Peter Bailis and
                  Sarah Bird and
                  Nicholas Carlini and
                  Bryan Catanzaro and
                  Eric S. Chung and
                  Bill Dally and
                  Jeff Dean and
                  Inderjit S. Dhillon and
                  Alexandros G. Dimakis and
                  Pradeep Dubey and
                  Charles Elkan and
                  Grigori Fursin and
                  Gregory R. Ganger and
                  Lise Getoor and
                  Phillip B. Gibbons and
                  Garth A. Gibson and
                  Joseph E. Gonzalez and
                  Justin Gottschlich and
                  Song Han and
                  Kim M. Hazelwood and
                  Furong Huang and
                  Martin Jaggi and
                  Kevin G. Jamieson and
                  Michael I. Jordan and
                  Gauri Joshi and
                  Rania Khalaf and
                  Jason Knight and
                  Jakub Kone{\v{c}}n{\'{y}} and
                  Tim Kraska and
                  Arun Kumar and
                  Anastasios Kyrillidis and
                  Jing Li and
                  Samuel Madden and
                  H. Brendan McMahan and
                  Erik Meijer and
                  Ioannis Mitliagkas and
                  Rajat Monga and
                  Derek Gordon Murray and
                  Dimitris S. Papailiopoulos and
                  Gennady Pekhimenko and
                  Theodoros Rekatsinas and
                  Afshin Rostamizadeh and
                  Christopher R{\'{e}} and
                  De Sa, Christopher and
                  Hanie Sedghi and
                  Siddhartha Sen and
                  Virginia Smith and
                  Alex Smola and
                  Dawn Song and
                  Evan R. Sparks and
                  Ion Stoica and
                  Vivienne Sze and
                  Madeleine Udell and
                  Joaquin Vanschoren and
                  Shivaram Venkataraman and
                  Rashmi Vinayak and
                  Markus Weimer and
                  Andrew Gordon Wilson and
                  Eric P. Xing and
                  Matei Zaharia and
                  Ce Zhang and
                  Ameet Talwalkar},
  title        = {{SysML}: The New Frontier of Machine Learning Systems},
  journal      = {CoRR},
  volume       = {abs/1904.03257},
  year         = {2019},
  url          = {http://arxiv.org/abs/1904.03257},
  eprinttype   = {arXiv},
  eprint       = {1904.03257},
  timestamp    = {Fri, 11 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-03257.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1904-03922,
  author     = {Josifoski, Martin and
                Paskov, Ivan S. and
                Paskov, Hristo S. and
                Jaggi, Martin and
                West, Robert},
  title      = {Crosslingual Document Embedding as Reduced-Rank Ridge Regression},
  journal    = {CoRR},
  volume     = {abs/1904.03922},
  year       = {2019},
  url        = {http://arxiv.org/abs/1904.03922},
  eprinttype = {arXiv},
  eprint     = {1904.03922},
  timestamp  = {Thu, 25 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-03922.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1904-05033,
  author     = {Gupta, Prakhar and
                Pagliardini, Matteo and
                Jaggi, Martin},
  title      = {Better Word Embeddings by Disentangling Contextual n-Gram Information},
  journal    = {CoRR},
  volume     = {abs/1904.05033},
  year       = {2019},
  url        = {http://arxiv.org/abs/1904.05033},
  eprinttype = {arXiv},
  eprint     = {1904.05033},
  timestamp  = {Thu, 25 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-05033.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1905-00626,
  author     = {Wszola, Eliza and
                Mendler{-}D{\"{u}}nner, Celestine and
                Jaggi, Martin and
                P{\"{u}}schel, Markus},
  title      = {On Linear Learning with Manycore Processors},
  journal    = {CoRR},
  volume     = {abs/1905.00626},
  year       = {2019},
  url        = {http://arxiv.org/abs/1905.00626},
  eprinttype = {arXiv},
  eprint     = {1905.00626},
  timestamp  = {Mon, 27 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-00626.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1905-13727,
  author     = {Vogels, Thijs and
                Karimireddy, Sai Praneeth and
                Jaggi, Martin},
  title      = {{PowerSGD}: Practical Low-Rank Gradient Compression for Distributed
                Optimization},
  journal    = {CoRR},
  volume     = {abs/1905.13727},
  year       = {2019},
  url        = {http://arxiv.org/abs/1905.13727},
  eprinttype = {arXiv},
  eprint     = {1905.13727},
  timestamp  = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-13727.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1906-06465,
  author     = {Schneuwly, Arno and
                Grubenmann, Ralf and
                Logean, S{\'{e}}verine Rion and
                Cieliebak, Mark and
                Jaggi, Martin},
  title      = {Correlating {Twitter} Language with Community-Level Health Outcomes},
  journal    = {CoRR},
  volume     = {abs/1906.06465},
  year       = {2019},
  url        = {http://arxiv.org/abs/1906.06465},
  eprinttype = {arXiv},
  eprint     = {1906.06465},
  timestamp  = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-06465.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1907-09356,
  author     = {Koloskova, Anastasia and
                Lin, Tao and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Decentralized Deep Learning with Arbitrary Communication Compression},
  journal    = {CoRR},
  volume     = {abs/1907.09356},
  year       = {2019},
  url        = {http://arxiv.org/abs/1907.09356},
  eprinttype = {arXiv},
  eprint     = {1907.09356},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-09356.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1910-05653,
  author     = {Singh, Sidak Pal and
                Jaggi, Martin},
  title      = {Model Fusion via Optimal Transport},
  journal    = {CoRR},
  volume     = {abs/1910.05653},
  year       = {2019},
  url        = {http://arxiv.org/abs/1910.05653},
  eprinttype = {arXiv},
  eprint     = {1910.05653},
  timestamp  = {Wed, 16 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-05653.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1910-11758,
  author     = {Sivaprasad, Prabhu Teja and
                Mai, Florian and
                Vogels, Thijs and
                Jaggi, Martin and
                Fleuret, Fran{\c{c}}ois},
  title      = {On the Tunability of Optimizers in Deep Learning},
  journal    = {CoRR},
  volume     = {abs/1910.11758},
  year       = {2019},
  url        = {http://arxiv.org/abs/1910.11758},
  eprinttype = {arXiv},
  eprint     = {1910.11758},
  timestamp  = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-11758.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1911-03584,
  author     = {Cordonnier, Jean{-}Baptiste and
                Loukas, Andreas and
                Jaggi, Martin},
  title      = {On the Relationship between Self-Attention and Convolutional Layers},
  journal    = {CoRR},
  volume     = {abs/1911.03584},
  year       = {2019},
  url        = {http://arxiv.org/abs/1911.03584},
  eprinttype = {arXiv},
  eprint     = {1911.03584},
  timestamp  = {Sun, 01 Dec 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-03584.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1912-04977,
  author     = {Kairouz, Peter and
                McMahan, H. Brendan and
                Avent, Brendan and
                Bellet, Aur{\'{e}}lien and
                Bennis, Mehdi and
                Bhagoji, Arjun Nitin and
                Bonawitz, Kallista A. and
                Charles, Zachary and
                Cormode, Graham and
                Cummings, Rachel and
                D'Oliveira, Rafael G. L. and
                El Rouayheb, Salim and
                Evans, David and
                Gardner, Josh and
                Garrett, Zachary and
                Gasc{\'{o}}n, Adri{\`{a}} and
                Ghazi, Badih and
                Gibbons, Phillip B. and
                Gruteser, Marco and
                Harchaoui, Za{\"{\i}}d and
                He, Chaoyang and
                He, Lie and
                Huo, Zhouyuan and
                Hutchinson, Ben and
                Hsu, Justin and
                Jaggi, Martin and
                Javidi, Tara and
                Joshi, Gauri and
                Khodak, Mikhail and
                Kone{\v{c}}n{\'y}, Jakub and
                Korolova, Aleksandra and
                Koushanfar, Farinaz and
                Koyejo, Sanmi and
                Lepoint, Tancr{\`{e}}de and
                Liu, Yang and
                Mittal, Prateek and
                Mohri, Mehryar and
                Nock, Richard and
                {\"{O}}zg{\"{u}}r, Ayfer and
                Pagh, Rasmus and
                Raykova, Mariana and
                Qi, Hang and
                Ramage, Daniel and
                Raskar, Ramesh and
                Song, Dawn and
                Song, Weikang and
                Stich, Sebastian U. and
                Sun, Ziteng and
                Suresh, Ananda Theertha and
                Tram{\`{e}}r, Florian and
                Vepakomma, Praneeth and
                Wang, Jianyu and
                Xiong, Li and
                Xu, Zheng and
                Yang, Qiang and
                Yu, Felix X. and
                Yu, Han and
                Zhao, Sen},
  title      = {Advances and Open Problems in Federated Learning},
  journal    = {CoRR},
  volume     = {abs/1912.04977},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.04977},
  eprinttype = {arXiv},
  eprint     = {1912.04977},
  timestamp  = {Mon, 11 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-04977.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1912-12481,
  author     = {Sabet, Ali and
                Gupta, Prakhar and
                Cordonnier, Jean{-}Baptiste and
                West, Robert and
                Jaggi, Martin},
  title      = {Robust Cross-lingual Embeddings from Parallel Sentences},
  journal    = {CoRR},
  volume     = {abs/1912.12481},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.12481},
  eprinttype = {arXiv},
  eprint     = {1912.12481},
  timestamp  = {Fri, 03 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-12481.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/siamjo/dAspremontGJ18,
  author     = {d'Aspremont, Alexandre and
                Guzm{\'{a}}n, Crist{\'{o}}bal and
                Jaggi, Martin},
  title      = {Optimal Affine-Invariant Smooth Minimization Algorithms},
  journal    = {{SIAM} J. Optim.},
  volume     = {28},
  number     = {3},
  pages      = {2384--2405},
  year       = {2018},
  url        = {https://doi.org/10.1137/17M1116842},
  doi        = {10.1137/17M1116842},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/siamjo/dAspremontGJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aistats/KarimireddySJ18,
  author     = {Karimireddy, Sai Praneeth Reddy and
                Stich, Sebastian U. and
                Jaggi, Martin},
  editor     = {Storkey, Amos J. and
                P{\'{e}}rez{-}Cruz, Fernando},
  title      = {Adaptive balancing of gradient and update computation times using
                global geometry and approximate subproblems},
  booktitle  = {International Conference on Artificial Intelligence and Statistics,
                {AISTATS} 2018, 9-11 April 2018, Playa Blanca, Lanzarote, Canary Islands,
                Spain},
  series     = {Proceedings of Machine Learning Research},
  volume     = {84},
  pages      = {1204--1213},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v84/karimireddy18a.html},
  timestamp  = {Wed, 03 Apr 2019 18:17:22 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/KarimireddySJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/conll/Bennani-SmiresM18,
  author     = {Bennani{-}Smires, Kamil and
                Musat, Claudiu and
                Hossmann, Andreea and
                Baeriswyl, Michael and
                Jaggi, Martin},
  editor     = {Korhonen, Anna and
                Titov, Ivan},
  title      = {Simple Unsupervised Keyphrase Extraction using Sentence Embeddings},
  booktitle  = {Proceedings of the 22nd Conference on Computational Natural Language
                Learning, CoNLL 2018, Brussels, Belgium, October 31 - November 1,
                2018},
  pages      = {221--229},
  publisher  = {Association for Computational Linguistics},
  year       = {2018},
  url        = {https://doi.org/10.18653/v1/k18-1022},
  doi        = {10.18653/V1/K18-1022},
  timestamp  = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/conll/Bennani-SmiresM18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/DunnerLGBHJ18,
  author     = {D{\"{u}}nner, Celestine and
                Lucchi, Aur{\'{e}}lien and
                Gargiani, Matilde and
                Bian, An and
                Hofmann, Thomas and
                Jaggi, Martin},
  editor     = {Dy, Jennifer G. and
                Krause, Andreas},
  title      = {A Distributed Second-Order Algorithm You Can Trust},
  booktitle  = {Proceedings of the 35th International Conference on Machine Learning,
                {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                10-15, 2018},
  series     = {Proceedings of Machine Learning Research},
  volume     = {80},
  pages      = {1357--1365},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v80/duenner18a.html},
  timestamp  = {Wed, 03 Apr 2019 18:17:30 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/DunnerLGBHJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/LocatelloRKRSSJ18,
  author     = {Locatello, Francesco and
                Raj, Anant and
                Karimireddy, Sai Praneeth and
                R{\"{a}}tsch, Gunnar and
                Sch{\"{o}}lkopf, Bernhard and
                Stich, Sebastian U. and
                Jaggi, Martin},
  editor     = {Dy, Jennifer G. and
                Krause, Andreas},
  title      = {On Matching Pursuit and Coordinate Descent},
  booktitle  = {Proceedings of the 35th International Conference on Machine Learning,
                {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July
                10-15, 2018},
  series     = {Proceedings of Machine Learning Research},
  volume     = {80},
  pages      = {3204--3213},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v80/locatello18a.html},
  timestamp  = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LocatelloRKRSSJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/naacl/PagliardiniGJ18,
  author     = {Pagliardini, Matteo and
                Gupta, Prakhar and
                Jaggi, Martin},
  editor     = {Walker, Marilyn A. and
                Ji, Heng and
                Stent, Amanda},
  title      = {Unsupervised Learning of Sentence Embeddings Using Compositional n-Gram
                Features},
  booktitle  = {Proceedings of the 2018 Conference of the North American Chapter of
                the Association for Computational Linguistics: Human Language Technologies,
                {NAACL-HLT} 2018, New Orleans, Louisiana, USA, June 1-6, 2018, Volume
                1 (Long Papers)},
  pages      = {528--540},
  publisher  = {Association for Computational Linguistics},
  year       = {2018},
  url        = {https://doi.org/10.18653/v1/n18-1049},
  doi        = {10.18653/V1/N18-1049},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/PagliardiniGJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/DrumondLJF18,
  author     = {Drumond, Mario and
                Lin, Tao and
                Jaggi, Martin and
                Falsafi, Babak},
  editor     = {Bengio, Samy and
                Wallach, Hanna M. and
                Larochelle, Hugo and
                Grauman, Kristen and
                Cesa{-}Bianchi, Nicol{\`{o}} and
                Garnett, Roman},
  title      = {Training {DNNs} with Hybrid Block Floating Point},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference
                on Neural Information Processing Systems 2018, NeurIPS 2018, December
                3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {451--461},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/6a9aeddfc689c1d0e3b9ccc3ab651bc5-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/DrumondLJF18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/StichCJ18,
  author     = {Stich, Sebastian U. and
                Cordonnier, Jean{-}Baptiste and
                Jaggi, Martin},
  editor     = {Bengio, Samy and
                Wallach, Hanna M. and
                Larochelle, Hugo and
                Grauman, Kristen and
                Cesa{-}Bianchi, Nicol{\`{o}} and
                Garnett, Roman},
  title      = {Sparsified {SGD} with Memory},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference
                on Neural Information Processing Systems 2018, NeurIPS 2018, December
                3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {4452--4463},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/b440509a0106086a67bc2ea9df0a1dab-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/StichCJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/HeBJ18,
  author     = {He, Lie and
                Bian, An and
                Jaggi, Martin},
  editor     = {Bengio, Samy and
                Wallach, Hanna M. and
                Larochelle, Hugo and
                Grauman, Kristen and
                Cesa{-}Bianchi, Nicol{\`{o}} and
                Garnett, Roman},
  title      = {{COLA:} Decentralized Linear Learning},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference
                on Neural Information Processing Systems 2018, NeurIPS 2018, December
                3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {4541--4551},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/05a70454516ecd9194c293b0e415777f-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/HeBJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1801-04470,
  author     = {Bennani{-}Smires, Kamil and
                Musat, Claudiu and
                Jaggi, Martin and
                Hossmann, Andreea and
                Baeriswyl, Michael},
  title      = {{EmbedRank}: Unsupervised Keyphrase Extraction using Sentence Embeddings},
  journal    = {CoRR},
  volume     = {abs/1801.04470},
  year       = {2018},
  url        = {http://arxiv.org/abs/1801.04470},
  eprinttype = {arXiv},
  eprint     = {1801.04470},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1801-04470.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1803-09539,
  author     = {Locatello, Francesco and
                Raj, Anant and
                Karimireddy, Sai Praneeth and
                R{\"{a}}tsch, Gunnar and
                Sch{\"{o}}lkopf, Bernhard and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Revisiting First-Order Convex Optimization Over Linear Spaces},
  journal    = {CoRR},
  volume     = {abs/1803.09539},
  year       = {2018},
  url        = {http://arxiv.org/abs/1803.09539},
  eprinttype = {arXiv},
  eprint     = {1803.09539},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1803-09539.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1804-01526,
  author     = {Drumond, Mario and
                Lin, Tao and
                Jaggi, Martin and
                Falsafi, Babak},
  title      = {End-to-End {DNN} Training with Block Floating Point Arithmetic},
  journal    = {CoRR},
  volume     = {abs/1804.01526},
  year       = {2018},
  url        = {http://arxiv.org/abs/1804.01526},
  eprinttype = {arXiv},
  eprint     = {1804.01526},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1804-01526.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1806-00413,
  author     = {Karimireddy, Sai Praneeth and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Global linear convergence of {Newton's} method without strong-convexity
                or {Lipschitz} gradients},
  journal    = {CoRR},
  volume     = {abs/1806.00413},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.00413},
  eprinttype = {arXiv},
  eprint     = {1806.00413},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-00413.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1806-07569,
  author     = {D{\"{u}}nner, Celestine and
                Lucchi, Aur{\'{e}}lien and
                Gargiani, Matilde and
                Bian, An and
                Hofmann, Thomas and
                Jaggi, Martin},
  title      = {A Distributed Second-Order Algorithm You Can Trust},
  journal    = {CoRR},
  volume     = {abs/1806.07569},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.07569},
  eprinttype = {arXiv},
  eprint     = {1806.07569},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-07569.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1808-04883,
  author     = {He, Lie and
                Bian, An and
                Jaggi, Martin},
  title      = {{COLA:} Communication-Efficient Decentralized Linear Learning},
  journal    = {CoRR},
  volume     = {abs/1808.04883},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.04883},
  eprinttype = {arXiv},
  eprint     = {1808.04883},
  timestamp  = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-04883.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1808-07217,
  author     = {Lin, Tao and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Don't Use Large Mini-Batches, Use Local {SGD}},
  journal    = {CoRR},
  volume     = {abs/1808.07217},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.07217},
  eprinttype = {arXiv},
  eprint     = {1808.07217},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-07217.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1808-09663,
  author     = {Singh, Sidak Pal and
                Hug, Andreas and
                Dieuleveut, Aymeric and
                Jaggi, Martin},
  title      = {Wasserstein is all you need},
  journal    = {CoRR},
  volume     = {abs/1808.09663},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.09663},
  eprinttype = {arXiv},
  eprint     = {1808.09663},
  timestamp  = {Mon, 03 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-09663.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1809-07599,
  author     = {Stich, Sebastian U. and
                Cordonnier, Jean{-}Baptiste and
                Jaggi, Martin},
  title      = {Sparsified {SGD} with Memory},
  journal    = {CoRR},
  volume     = {abs/1809.07599},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.07599},
  eprinttype = {arXiv},
  eprint     = {1809.07599},
  timestamp  = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-07599.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1810-06999,
  author     = {Karimireddy, Sai Praneeth and
                Koloskova, Anastasia and
                Stich, Sebastian U. and
                Jaggi, Martin},
  title      = {Efficient Greedy Coordinate Descent for Composite Problems},
  journal    = {CoRR},
  volume     = {abs/1810.06999},
  year       = {2018},
  url        = {http://arxiv.org/abs/1810.06999},
  eprinttype = {arXiv},
  eprint     = {1810.06999},
  timestamp  = {Thu, 01 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-06999.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jmlr/SmithFMTJJ17,
  author     = {Smith, Virginia and
                Forte, Simone and
                Ma, Chenxin and
                Tak{\'{a}}{\v{c}}, Martin and
                Jordan, Michael I. and
                Jaggi, Martin},
  title      = {{CoCoA}: {A} General Framework for Communication-Efficient Distributed
                Optimization},
  journal    = {J. Mach. Learn. Res.},
  volume     = {18},
  pages      = {230:1--230:49},
  year       = {2017},
  url        = {http://jmlr.org/papers/v18/16-512.html},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jmlr/SmithFMTJJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/oms/MaKJSJRT17,
  author     = {Ma, Chenxin and
                Kone{\v{c}}n{\'y}, Jakub and
                Jaggi, Martin and
                Smith, Virginia and
                Jordan, Michael I. and
                Richt{\'{a}}rik, Peter and
                Tak{\'{a}}{\v{c}}, Martin},
  title      = {Distributed optimization with arbitrary local solvers},
  journal    = {Optim. Methods Softw.},
  volume     = {32},
  number     = {4},
  pages      = {813--848},
  year       = {2017},
  url        = {https://doi.org/10.1080/10556788.2016.1278445},
  doi        = {10.1080/10556788.2016.1278445},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/oms/MaKJSJRT17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tgrs/KaiserWLJHS17,
  author     = {Kaiser, Pascal and
                Wegner, Jan Dirk and
                Lucchi, Aur{\'{e}}lien and
                Jaggi, Martin and
                Hofmann, Thomas and
                Schindler, Konrad},
  title      = {Learning Aerial Image Segmentation From Online Maps},
  journal    = {{IEEE} Trans. Geosci. Remote. Sens.},
  volume     = {55},
  number     = {11},
  pages      = {6054--6068},
  year       = {2017},
  url        = {https://doi.org/10.1109/TGRS.2017.2719738},
  doi        = {10.1109/TGRS.2017.2719738},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tgrs/KaiserWLJHS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/acl/FangJA17,
  author     = {Fang, Tina and
                Jaggi, Martin and
                Argyraki, Katerina J.},
  editor     = {Ettinger, Allyson and
                Gella, Spandana and
                Labeau, Matthieu and
                Alm, Cecilia Ovesdotter and
                Carpuat, Marine and
                Dredze, Mark},
  title      = {Generating Steganographic Text with {LSTMs}},
  booktitle  = {Proceedings of the 55th Annual Meeting of the Association for Computational
                Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Student
                Research Workshop},
  pages      = {100--106},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/P17-3017},
  doi        = {10.18653/V1/P17-3017},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/FangJA17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aistats/LocatelloKTJ17,
  author     = {Locatello, Francesco and
                Khanna, Rajiv and
                Tschannen, Michael and
                Jaggi, Martin},
  editor     = {Singh, Aarti and
                Zhu, Xiaojin (Jerry)},
  title      = {A Unified Optimization View on Generalized Matching Pursuit and {Frank-Wolfe}},
  booktitle  = {Proceedings of the 20th International Conference on Artificial Intelligence
                and Statistics, {AISTATS} 2017, 20-22 April 2017, Fort Lauderdale,
                FL, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {54},
  pages      = {860--868},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v54/locatello17a.html},
  timestamp  = {Wed, 29 May 2019 08:41:44 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/LocatelloKTJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aistats/PerekrestenkoCJ17,
  author     = {Perekrestenko, Dmytro and
                Cevher, Volkan and
                Jaggi, Martin},
  editor     = {Singh, Aarti and
                Zhu, Xiaojin (Jerry)},
  title      = {Faster Coordinate Descent via Adaptive Importance Sampling},
  booktitle  = {Proceedings of the 20th International Conference on Artificial Intelligence
                and Statistics, {AISTATS} 2017, 20-22 April 2017, Fort Lauderdale,
                FL, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {54},
  pages      = {869--877},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v54/perekrestenko17a.html},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/PerekrestenkoCJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/StichRJ17,
  author     = {Stich, Sebastian U. and
                Raj, Anant and
                Jaggi, Martin},
  editor     = {Precup, Doina and
                Teh, Yee Whye},
  title      = {Approximate Steepest Coordinate Descent},
  booktitle  = {Proceedings of the 34th International Conference on Machine Learning,
                {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series     = {Proceedings of Machine Learning Research},
  volume     = {70},
  pages      = {3251--3259},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v70/stich17a.html},
  timestamp  = {Wed, 29 May 2019 08:41:45 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/StichRJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/LocatelloTRJ17,
  author       = {Francesco Locatello and
                  Michael Tschannen and
                  Gunnar R{\"{a}}tsch and
                  Martin Jaggi},
  editor       = {Isabelle Guyon and
                  Ulrike von Luxburg and
                  Samy Bengio and
                  Hanna M. Wallach and
                  Rob Fergus and
                  S. V. N. Vishwanathan and
                  Roman Garnett},
  title        = {Greedy Algorithms for Cone Constrained Optimization with
                  Convergence Guarantees},
  booktitle    = {Advances in Neural Information Processing Systems 30:
                  Annual Conference on Neural Information Processing Systems 2017,
                  December 4-9, 2017, Long Beach, CA, {USA}},
  pages        = {773--784},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/63538fe6ef330c13a05a3ed7e599d5f7-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/LocatelloTRJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/DunnerPJ17,
  author       = {Celestine D{\"{u}}nner and
                  Thomas P. Parnell and
                  Martin Jaggi},
  editor       = {Isabelle Guyon and
                  Ulrike von Luxburg and
                  Samy Bengio and
                  Hanna M. Wallach and
                  Rob Fergus and
                  S. V. N. Vishwanathan and
                  Roman Garnett},
  title        = {Efficient Use of Limited-Memory Accelerators for
                  Linear Learning on Heterogeneous Systems},
  booktitle    = {Advances in Neural Information Processing Systems 30:
                  Annual Conference on Neural Information Processing Systems 2017,
                  December 4-9, 2017, Long Beach, CA, {USA}},
  pages        = {4258--4267},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/e0f7a4d0ef9b84b83b693bbf3feb8e6e-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/DunnerPJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/StichRJ17,
  author       = {Sebastian U. Stich and
                  Anant Raj and
                  Martin Jaggi},
  editor       = {Isabelle Guyon and
                  Ulrike von Luxburg and
                  Samy Bengio and
                  Hanna M. Wallach and
                  Rob Fergus and
                  S. V. N. Vishwanathan and
                  Roman Garnett},
  title        = {Safe Adaptive Importance Sampling},
  booktitle    = {Advances in Neural Information Processing Systems 30:
                  Annual Conference on Neural Information Processing Systems 2017,
                  December 4-9, 2017, Long Beach, CA, {USA}},
  pages        = {4381--4391},
  year         = {2017},
  url          = {https://proceedings.neurips.cc/paper/2017/hash/1177967c7957072da3dc1db4ceb30e7a-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/StichRJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/www/DeriuLLSMCHJ17,
  author       = {Jan Deriu and
                  Aur{\'{e}}lien Lucchi and
                  Valeria {De Luca} and
                  Aliaksei Severyn and
                  Simon M{\"{u}}ller and
                  Mark Cieliebak and
                  Thomas Hofmann and
                  Martin Jaggi},
  editor       = {Rick Barrett and
                  Rick Cummings and
                  Eugene Agichtein and
                  Evgeniy Gabrilovich},
  title        = {Leveraging Large Amounts of Weakly Supervised Data for Multi-Language
                  Sentiment Classification},
  booktitle    = {Proceedings of the 26th International Conference on World Wide Web,
                  {WWW} 2017, Perth, Australia, April 3-7, 2017},
  pages        = {1045--1052},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {https://doi.org/10.1145/3038912.3052611},
  doi          = {10.1145/3038912.3052611},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/www/DeriuLLSMCHJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/LocatelloKTJ17,
  author       = {Francesco Locatello and
                  Rajiv Khanna and
                  Michael Tschannen and
                  Martin Jaggi},
  title        = {A Unified Optimization View on Generalized Matching Pursuit and
                  {Frank-Wolfe}},
  journal      = {CoRR},
  volume       = {abs/1702.06457},
  year         = {2017},
  url          = {http://arxiv.org/abs/1702.06457},
  eprinttype   = {arXiv},
  eprint       = {1702.06457},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LocatelloKTJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/DeriuLLSMCHJ17,
  author       = {Jan Deriu and
                  Aur{\'{e}}lien Lucchi and
                  Valeria {De Luca} and
                  Aliaksei Severyn and
                  Simon M{\"{u}}ller and
                  Mark Cieliebak and
                  Thomas Hofmann and
                  Martin Jaggi},
  title        = {Leveraging Large Amounts of Weakly Supervised Data for Multi-Language
                  Sentiment Classification},
  journal      = {CoRR},
  volume       = {abs/1703.02504},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.02504},
  eprinttype   = {arXiv},
  eprint       = {1703.02504},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/DeriuLLSMCHJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/PagliardiniGJ17,
  author       = {Matteo Pagliardini and
                  Prakhar Gupta and
                  Martin Jaggi},
  title        = {Unsupervised Learning of Sentence Embeddings using
                  Compositional n-Gram Features},
  journal      = {CoRR},
  volume       = {abs/1703.02507},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.02507},
  eprinttype   = {arXiv},
  eprint       = {1703.02507},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/PagliardiniGJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/PerekrestenkoCJ17,
  author       = {Dmytro Perekrestenko and
                  Volkan Cevher and
                  Martin Jaggi},
  title        = {Faster Coordinate Descent via
                  Adaptive Importance Sampling},
  journal      = {CoRR},
  volume       = {abs/1703.02518},
  year         = {2017},
  url          = {http://arxiv.org/abs/1703.02518},
  eprinttype   = {arXiv},
  eprint       = {1703.02518},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/PerekrestenkoCJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/FangJA17,
  author       = {Tina Fang and
                  Martin Jaggi and
                  Katerina J. Argyraki},
  title        = {Generating Steganographic Text with {LSTMs}},
  journal      = {CoRR},
  volume       = {abs/1705.10742},
  year         = {2017},
  url          = {http://arxiv.org/abs/1705.10742},
  eprinttype   = {arXiv},
  eprint       = {1705.10742},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/FangJA17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/LocatelloTRJ17,
  author       = {Francesco Locatello and
                  Michael Tschannen and
                  Gunnar R{\"{a}}tsch and
                  Martin Jaggi},
  title        = {Greedy Algorithms for Cone Constrained Optimization with
                  Convergence Guarantees},
  journal      = {CoRR},
  volume       = {abs/1705.11041},
  year         = {2017},
  url          = {http://arxiv.org/abs/1705.11041},
  eprinttype   = {arXiv},
  eprint       = {1705.11041},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LocatelloTRJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/StichRJ17,
  author       = {Sebastian U. Stich and
                  Anant Raj and
                  Martin Jaggi},
  title        = {Approximate Steepest
                  Coordinate Descent},
  journal      = {CoRR},
  volume       = {abs/1706.08427},
  year         = {2017},
  url          = {http://arxiv.org/abs/1706.08427},
  eprinttype   = {arXiv},
  eprint       = {1706.08427},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/StichRJ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/LangovoyGJS17,
  author       = {Mikhail A. Langovoy and
                  Akhilesh Gotmare and
                  Martin Jaggi and
                  Suvrit Sra},
  title        = {Unsupervised robust nonparametric learning of
                  hidden community properties},
  journal      = {CoRR},
  volume       = {abs/1707.03494},
  year         = {2017},
  url          = {http://arxiv.org/abs/1707.03494},
  eprinttype   = {arXiv},
  eprint       = {1707.03494},
  timestamp    = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/LangovoyGJS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/KaiserWLJHS17,
  author       = {Pascal Kaiser and
                  Jan Dirk Wegner and
                  Aur{\'{e}}lien Lucchi and
                  Martin Jaggi and
                  Thomas Hofmann and
                  Konrad Schindler},
  title        = {Learning Aerial Image Segmentation from
                  Online Maps},
  journal      = {CoRR},
  volume       = {abs/1707.06879},
  year         = {2017},
  url          = {http://arxiv.org/abs/1707.06879},
  eprinttype   = {arXiv},
  eprint       = {1707.06879},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KaiserWLJHS17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1708-05357,
  author       = {Celestine D{\"{u}}nner and
                  Thomas P. Parnell and
                  Martin Jaggi},
  title        = {Efficient Use of Limited-Memory Resources to
                  Accelerate Linear Learning},
  journal      = {CoRR},
  volume       = {abs/1708.05357},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.05357},
  eprinttype   = {arXiv},
  eprint       = {1708.05357},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-05357.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-02637,
  author       = {Sebastian U. Stich and
                  Anant Raj and
                  Martin Jaggi},
  title        = {Safe Adaptive
                  Importance Sampling},
  journal      = {CoRR},
  volume       = {abs/1711.02637},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.02637},
  eprinttype   = {arXiv},
  eprint       = {1711.02637},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-02637.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1711-05305,
  author       = {Chenxin Ma and
                  Martin Jaggi and
                  Frank E. Curtis and
                  Nathan Srebro and
                  Martin Tak{\'{a}}c},
  title        = {An Accelerated Communication-Efficient Primal-Dual Optimization
                  Framework for Structured Machine Learning},
  journal      = {CoRR},
  volume       = {abs/1711.05305},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.05305},
  eprinttype   = {arXiv},
  eprint       = {1711.05305},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-05305.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/clef/SprengelJKH16,
  author       = {Elias Sprengel and
                  Martin Jaggi and
                  Yannic Kilcher and
                  Thomas Hofmann},
  editor       = {Krisztian Balog and
                  Linda Cappellato and
                  Nicola Ferro and
                  Craig Macdonald},
  title        = {Audio Based Bird Species Identification using
                  Deep Learning Techniques},
  booktitle    = {Working Notes of {CLEF} 2016 -
                  Conference and Labs of the Evaluation forum,
                  {\'{E}}vora, Portugal, 5-8 September, 2016},
  series       = {{CEUR} Workshop Proceedings},
  volume       = {1609},
  pages        = {547--559},
  publisher    = {CEUR-WS.org},
  year         = {2016},
  url          = {https://ceur-ws.org/Vol-1609/16090547.pdf},
  timestamp    = {Fri, 10 Mar 2023 16:23:40 +0100},
  biburl       = {https://dblp.org/rec/conf/clef/SprengelJKH16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/DunnerFTJ16,
  author       = {Celestine D{\"{u}}nner and
                  Simone Forte and
                  Martin Tak{\'{a}}c and
                  Martin Jaggi},
  editor       = {Maria{-}Florina Balcan and
                  Kilian Q. Weinberger},
  title        = {Primal-Dual Rates and Certificates},
  booktitle    = {Proceedings of the 33rd International Conference on Machine Learning,
                  {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {48},
  pages        = {783--792},
  publisher    = {JMLR.org},
  year         = {2016},
  url          = {http://proceedings.mlr.press/v48/dunner16.html},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/DunnerFTJ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/semeval/DeriuGULLJ16,
  author       = {Jan Deriu and
                  Maurice Gonzenbach and
                  Fatih Uzdilli and
                  Aur{\'{e}}lien Lucchi and
                  Valeria {De Luca} and
                  Martin Jaggi},
  editor       = {Steven Bethard and
                  Daniel M. Cer and
                  Marine Carpuat and
                  David Jurgens and
                  Preslav Nakov and
                  Torsten Zesch},
  title        = {{SwissCheese} at {SemEval-2016} Task 4: Sentiment Classification Using
                  an Ensemble of Convolutional Neural Networks with Distant Supervision},
  booktitle    = {Proceedings of the 10th International Workshop on Semantic Evaluation,
                  SemEval@NAACL-HLT 2016, San Diego, CA, USA, June 16-17, 2016},
  pages        = {1124--1128},
  publisher    = {The Association for Computer Linguistics},
  year         = {2016},
  url          = {https://doi.org/10.18653/v1/s16-1173},
  doi          = {10.18653/V1/S16-1173},
  timestamp    = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/semeval/DeriuGULLJ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/KhannaTJ16,
  author       = {Rajiv Khanna and
                  Michael Tschannen and
                  Martin Jaggi},
  title        = {Pursuits in Structured Non-Convex
                  Matrix Factorizations},
  journal      = {CoRR},
  volume       = {abs/1602.04208},
  year         = {2016},
  url          = {http://arxiv.org/abs/1602.04208},
  eprinttype   = {arXiv},
  eprint       = {1602.04208},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KhannaTJ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/DunnerFTJ16,
  author       = {Celestine D{\"{u}}nner and
                  Simone Forte and
                  Martin Tak{\'{a}}c and
                  Martin Jaggi},
  title        = {Primal-Dual Rates and
                  Certificates},
  journal      = {CoRR},
  volume       = {abs/1602.05205},
  year         = {2016},
  url          = {http://arxiv.org/abs/1602.05205},
  eprinttype   = {arXiv},
  eprint       = {1602.05205},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/DunnerFTJ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/RajOGSJ16,
  author       = {Anant Raj and
                  Jakob Olbrich and
                  Bernd G{\"{a}}rtner and
                  Bernhard Sch{\"{o}}lkopf and
                  Martin Jaggi},
  title        = {Screening Rules for
                  Convex Problems},
  journal      = {CoRR},
  volume       = {abs/1609.07478},
  year         = {2016},
  url          = {http://arxiv.org/abs/1609.07478},
  eprinttype   = {arXiv},
  eprint       = {1609.07478},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RajOGSJ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/SmithFMTJJ16,
  author       = {Virginia Smith and
                  Simone Forte and
                  Chenxin Ma and
                  Martin Tak{\'{a}}c and
                  Michael I. Jordan and
                  Martin Jaggi},
  title        = {{CoCoA}: {A} General Framework for Communication-Efficient Distributed
                  Optimization},
  journal      = {CoRR},
  volume       = {abs/1611.02189},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.02189},
  eprinttype   = {arXiv},
  eprint       = {1611.02189},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/SmithFMTJJ16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/MaSJJRT15,
  author       = {Chenxin Ma and
                  Virginia Smith and
                  Martin Jaggi and
                  Michael I. Jordan and
                  Peter Richt{\'{a}}rik and
                  Martin Tak{\'{a}}c},
  editor       = {Francis R. Bach and
                  David M. Blei},
  title        = {Adding vs. Averaging in
                  Distributed Primal-Dual Optimization},
  booktitle    = {Proceedings of the 32nd International Conference on
                  Machine Learning, {ICML} 2015,
                  Lille, France, 6-11 July 2015},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {37},
  pages        = {1973--1982},
  publisher    = {JMLR.org},
  year         = {2015},
  url          = {http://proceedings.mlr.press/v37/mab15.html},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/MaSJJRT15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/Lacoste-JulienJ15,
  author       = {Simon Lacoste{-}Julien and
                  Martin Jaggi},
  editor       = {Corinna Cortes and
                  Neil D. Lawrence and
                  Daniel D. Lee and
                  Masashi Sugiyama and
                  Roman Garnett},
  title        = {On the Global Linear Convergence of {Frank-Wolfe} Optimization Variants},
  booktitle    = {Advances in Neural Information Processing Systems 28: Annual Conference
                  on Neural Information Processing Systems 2015, December 7-12, 2015,
                  Montreal, Quebec, Canada},
  pages        = {496--504},
  year         = {2015},
  url          = {https://proceedings.neurips.cc/paper/2015/hash/c058f544c737782deacefa532d9add4c-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/Lacoste-JulienJ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/semeval/UzdilliJEJDC15,
  author       = {Fatih Uzdilli and
                  Martin Jaggi and
                  Dominic Egger and
                  Pascal Julmy and
                  Leon Derczynski and
                  Mark Cieliebak},
  editor       = {Daniel M. Cer and
                  David Jurgens and
                  Preslav Nakov and
                  Torsten Zesch},
  title        = {{Swiss-Chocolate}: Combining Flipout Regularization and Random Forests
                  with Artificially Built Subsystems to Boost Text-Classification for
                  Sentiment},
  booktitle    = {Proceedings of the 9th International Workshop on Semantic Evaluation,
                  SemEval@NAACL-HLT 2015, Denver, Colorado, USA, June 4-5, 2015},
  pages        = {608--612},
  publisher    = {The Association for Computer Linguistics},
  year         = {2015},
  url          = {https://doi.org/10.18653/v1/s15-2101},
  doi          = {10.18653/V1/S15-2101},
  timestamp    = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/semeval/UzdilliJEJDC15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/MaSJJRT15,
  author       = {Chenxin Ma and
                  Virginia Smith and
                  Martin Jaggi and
                  Michael I. Jordan and
                  Peter Richt{\'{a}}rik and
                  Martin Tak{\'{a}}c},
  title        = {Adding vs. Averaging in
                  Distributed Primal-Dual Optimization},
  journal      = {CoRR},
  volume       = {abs/1502.03508},
  year         = {2015},
  url          = {http://arxiv.org/abs/1502.03508},
  eprinttype   = {arXiv},
  eprint       = {1502.03508},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/MaSJJRT15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/Lacoste-JulienJ15,
  author       = {Simon Lacoste{-}Julien and
                  Martin Jaggi},
  title        = {On the Global Linear Convergence of {Frank-Wolfe} Optimization Variants},
  journal      = {CoRR},
  volume       = {abs/1511.05932},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.05932},
  eprinttype   = {arXiv},
  eprint       = {1511.05932},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/Lacoste-JulienJ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/SmithFJJ15,
  author       = {Virginia Smith and
                  Simone Forte and
                  Michael I. Jordan and
                  Martin Jaggi},
  title        = {L1-Regularized Distributed Optimization:
                  {A} Communication-Efficient Primal-Dual Framework},
  journal      = {CoRR},
  volume       = {abs/1512.04011},
  year         = {2015},
  url          = {http://arxiv.org/abs/1512.04011},
  eprinttype   = {arXiv},
  eprint       = {1512.04011},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/SmithFJJ15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/MaKJSJRT15,
  author       = {Chenxin Ma and
                  Jakub Kone{\v{c}}n{\'{y}} and
                  Martin Jaggi and
                  Virginia Smith and
                  Michael I. Jordan and
                  Peter Richt{\'{a}}rik and
                  Martin Tak{\'{a}}c},
  title        = {Distributed Optimization with
                  Arbitrary Local Solvers},
  journal      = {CoRR},
  volume       = {abs/1512.04039},
  year         = {2015},
  url          = {http://arxiv.org/abs/1512.04039},
  eprinttype   = {arXiv},
  eprint       = {1512.04039},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/MaKJSJRT15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/JaggiSTTKHJ14,
  author       = {Martin Jaggi and
                  Virginia Smith and
                  Martin Tak{\'{a}}c and
                  Jonathan Terhorst and
                  Sanjay Krishnan and
                  Thomas Hofmann and
                  Michael I. Jordan},
  editor       = {Zoubin Ghahramani and
                  Max Welling and
                  Corinna Cortes and
                  Neil D. Lawrence and
                  Kilian Q. Weinberger},
  title        = {Communication-Efficient Distributed Dual Coordinate Ascent},
  booktitle    = {Advances in Neural Information Processing Systems 27: Annual Conference
                  on Neural Information Processing Systems 2014, December 8-13, 2014,
                  Montreal, Quebec, Canada},
  pages        = {3068--3076},
  year         = {2014},
  url          = {https://proceedings.neurips.cc/paper/2014/hash/894b77f805bd94d292574c38c5d628d5-Abstract.html},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/JaggiSTTKHJ14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/semeval/JaggiUC14,
  author       = {Martin Jaggi and
                  Fatih Uzdilli and
                  Mark Cieliebak},
  editor       = {Preslav Nakov and
                  Torsten Zesch},
  title        = {{Swiss-Chocolate}: Sentiment Detection using Sparse {SVMs} and Part-Of-Speech
                  n-Grams},
  booktitle    = {Proceedings of the 8th International Workshop on Semantic Evaluation,
                  SemEval@COLING 2014, Dublin, Ireland, August 23-24, 2014},
  pages        = {601--604},
  publisher    = {The Association for Computer Linguistics},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/s14-2105},
  doi          = {10.3115/V1/S14-2105},
  timestamp    = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/semeval/JaggiUC14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/JaggiSTTKHJ14,
  author       = {Martin Jaggi and
                  Virginia Smith and
                  Martin Tak{\'{a}}c and
                  Jonathan Terhorst and
                  Sanjay Krishnan and
                  Thomas Hofmann and
                  Michael I. Jordan},
  title        = {Communication-Efficient Distributed
                  Dual Coordinate Ascent},
  journal      = {CoRR},
  volume       = {abs/1409.1458},
  year         = {2014},
  url          = {http://arxiv.org/abs/1409.1458},
  eprinttype   = {arXiv},
  eprint       = {1409.1458},
  timestamp    = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/JaggiSTTKHJ14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/Lacoste-JulienJSP13,
  author       = {Simon Lacoste{-}Julien and
                  Martin Jaggi and
                  Mark Schmidt and
                  Patrick Pletscher},
  title        = {Block-Coordinate {Frank-Wolfe} Optimization for Structural {SVMs}},
  booktitle    = {Proceedings of the 30th International Conference on Machine Learning,
                  {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {28},
  pages        = {53--61},
  publisher    = {JMLR.org},
  year         = {2013},
  url          = {http://proceedings.mlr.press/v28/lacoste-julien13.html},
  timestamp    = {Thu, 23 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/Lacoste-JulienJSP13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/Jaggi13,
  author       = {Martin Jaggi},
  title        = {Revisiting {Frank-Wolfe}: Projection-Free Sparse Convex Optimization},
  booktitle    = {Proceedings of the 30th International Conference on Machine Learning,
                  {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series       = {{JMLR} Workshop and Conference Proceedings},
  volume       = {28},
  pages        = {427--435},
  publisher    = {JMLR.org},
  year         = {2013},
  url          = {http://proceedings.mlr.press/v28/jaggi13.html},
  timestamp    = {Wed, 29 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/Jaggi13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1303-1152,
  author       = {Martin Jaggi},
  title        = {An Equivalence between the Lasso and
                  Support Vector Machines},
  journal      = {CoRR},
  volume       = {abs/1303.1152},
  year         = {2013},
  url          = {http://arxiv.org/abs/1303.1152},
  eprinttype   = {arXiv},
  eprint       = {1303.1152},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1303-1152.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/jocg/GartnerJM12,
  author       = {Bernd G{\"{a}}rtner and
                  Martin Jaggi and
                  Cl{\'{e}}ment Maria},
  title        = {An Exponential Lower Bound on the Complexity of
                  Regularization Paths},
  journal      = {J. Comput. Geom.},
  volume       = {3},
  number       = {1},
  pages        = {168--195},
  year         = {2012},
  url          = {https://doi.org/10.20382/jocg.v3i1a9},
  doi          = {10.20382/JOCG.V3I1A9},
  timestamp    = {Thu, 10 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jocg/GartnerJM12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/talg/GiesenJL12,
  author       = {Joachim Giesen and
                  Martin Jaggi and
                  S{\"{o}}ren Laue},
  title        = {Approximating parameterized
                  convex optimization problems},
  journal      = {{ACM} Trans. Algorithms},
  volume       = {9},
  number       = {1},
  pages        = {10:1--10:17},
  year         = {2012},
  url          = {https://doi.org/10.1145/2390176.2390186},
  doi          = {10.1145/2390176.2390186},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/talg/GiesenJL12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/esa/GiesenJL12,
  author       = {Joachim Giesen and
                  Martin Jaggi and
                  S{\"{o}}ren Laue},
  editor       = {Leah Epstein and
                  Paolo Ferragina},
  title        = {Optimizing over the Growing Spectrahedron},
  booktitle    = {Algorithms - {ESA} 2012 - 20th Annual European Symposium,
                  Ljubljana, Slovenia, September 10-12, 2012.
                  Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {7501},
  pages        = {503--514},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-33090-2\_44},
  doi          = {10.1007/978-3-642-33090-2\_44},
  timestamp    = {Tue, 14 May 2019 10:00:54 +0200},
  biburl       = {https://dblp.org/rec/conf/esa/GiesenJL12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org},
}
% AISTATS 2012 conference paper, JMLR Proceedings volume 22.
@inproceedings{DBLP:journals/jmlr/GiesenJL12,
  author    = {Giesen, Joachim and Jaggi, Martin and Laue, S{\"{o}}ren},
  editor    = {Lawrence, Neil D. and Girolami, Mark A.},
  title     = {Regularization Paths with Guarantees for Convex Semidefinite Optimization},
  booktitle = {Proceedings of the Fifteenth International Conference on
               Artificial Intelligence and Statistics, {AISTATS} 2012,
               La Palma, Canary Islands, Spain, April 21-23, 2012},
  series    = {{JMLR} Proceedings},
  volume    = {22},
  pages     = {432--439},
  publisher = {JMLR.org},
  year      = {2012},
  url       = {http://proceedings.mlr.press/v22/giesen12.html},
  timestamp = {Wed, 29 May 2019 08:41:44 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/GiesenJL12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1207.4747, listed under CoRR.
% The proper noun and the acronym in the title are brace-protected so that
% sentence-casing bibliography styles keep their capitalisation.
@article{DBLP:journals/corr/abs-1207-4747,
  author       = {Simon Lacoste{-}Julien and
                  Martin Jaggi and
                  Mark Schmidt and
                  Patrick Pletscher},
  title        = {Stochastic Block-Coordinate {Frank-Wolfe} Optimization for Structural
                  {SVMs}},
  journal      = {CoRR},
  volume       = {abs/1207.4747},
  year         = {2012},
  url          = {http://arxiv.org/abs/1207.4747},
  eprinttype   = {arXiv},
  eprint       = {1207.4747},
  timestamp    = {Thu, 23 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1207-4747.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% PhD thesis, 2011; the school field carries both institution and location.
@phdthesis{DBLP:phd/basesearch/Jaggi11,
  author    = {Jaggi, Martin},
  title     = {Sparse Convex Optimization Methods for Machine Learning},
  school    = {{ETH} Zurich, Z{\"{u}}rich, Switzerland},
  year      = {2011},
  doi       = {10.3929/ETHZ-A-007050453},
  url       = {https://hdl.handle.net/20.500.11850/72811},
  timestamp = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/phd/basesearch/Jaggi11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1108.1170, listed under CoRR.
@article{DBLP:journals/corr/abs-1108-1170,
  author     = {Jaggi, Martin},
  title      = {Convex Optimization without Projection Steps},
  journal    = {CoRR},
  volume     = {abs/1108.1170},
  year       = {2011},
  eprint     = {1108.1170},
  eprinttype = {arXiv},
  url        = {http://arxiv.org/abs/1108.1170},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1108-1170.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% ESA 2010 conference paper (LNCS volume 6346).
% doi and url hold the raw identifier: the underscore is not TeX-escaped,
% because these fields are treated as verbatim data by url-aware styles.
@inproceedings{DBLP:conf/esa/GiesenJL10,
  author       = {Joachim Giesen and
                  Martin Jaggi and
                  S{\"{o}}ren Laue},
  editor       = {Mark de Berg and
                  Ulrich Meyer},
  title        = {Approximating Parameterized Convex Optimization Problems},
  booktitle    = {Algorithms - {ESA} 2010, 18th Annual European Symposium, Liverpool,
                  UK, September 6-8, 2010. Proceedings, Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {6346},
  pages        = {524--535},
  publisher    = {Springer},
  year         = {2010},
  url          = {https://doi.org/10.1007/978-3-642-15775-2_45},
  doi          = {10.1007/978-3-642-15775-2_45},
  timestamp    = {Tue, 14 May 2019 10:00:54 +0200},
  biburl       = {https://dblp.org/rec/conf/esa/GiesenJL10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2010 conference paper. The venue acronym in booktitle is
% brace-protected, like the acronyms in the other booktitle fields of this
% file, so that a recasing style cannot lowercase it.
@inproceedings{DBLP:conf/icml/JaggiS10,
  author       = {Martin Jaggi and
                  Marek Sulovsk{\'{y}}},
  editor       = {Johannes F{\"{u}}rnkranz and
                  Thorsten Joachims},
  title        = {A Simple Algorithm for Nuclear Norm Regularized Problems},
  booktitle    = {Proceedings of the 27th International Conference on Machine Learning
                  ({ICML-10}), June 21-24, 2010, Haifa, Israel},
  pages        = {471--478},
  publisher    = {Omnipress},
  year         = {2010},
  url          = {https://icml.cc/Conferences/2010/papers/196.pdf},
  timestamp    = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/JaggiS10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, 25th ACM Symposium on Computational Geometry, 2009.
@inproceedings{DBLP:conf/compgeom/GartnerJ09,
  author    = {G{\"{a}}rtner, Bernd and Jaggi, Martin},
  editor    = {Hershberger, John and Fogel, Efi},
  title     = {Coresets for polytope distance},
  booktitle = {Proceedings of the 25th {ACM} Symposium on Computational
               Geometry, Aarhus, Denmark, June 8-10, 2009},
  pages     = {33--42},
  publisher = {{ACM}},
  year      = {2009},
  doi       = {10.1145/1542362.1542370},
  url       = {https://doi.org/10.1145/1542362.1542370},
  timestamp = {Mon, 14 Jun 2021 16:24:56 +0200},
  biburl    = {https://dblp.org/rec/conf/compgeom/GartnerJ09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 0903.4817, listed under CoRR.
@article{DBLP:journals/corr/abs-0903-4817,
  author     = {G{\"{a}}rtner, Bernd and Giesen, Joachim and Jaggi, Martin},
  title      = {An Exponential Lower Bound on the Complexity of Regularization Paths},
  journal    = {CoRR},
  volume     = {abs/0903.4817},
  year       = {2009},
  eprint     = {0903.4817},
  eprinttype = {arXiv},
  url        = {http://arxiv.org/abs/0903.4817},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-0903-4817.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 0903.4856, listed under CoRR.
@article{DBLP:journals/corr/abs-0903-4856,
  author     = {G{\"{a}}rtner, Bernd and Giesen, Joachim and Jaggi, Martin and
                Welsch, Torsten},
  title      = {A Combinatorial Algorithm to Compute Regularization Paths},
  journal    = {CoRR},
  volume     = {abs/0903.4856},
  year       = {2009},
  eprint     = {0903.4856},
  eprinttype = {arXiv},
  url        = {http://arxiv.org/abs/0903.4856},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-0903-4856.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics