Stop the war!
Остановите войну!
for scientists:
default search action
BibTeX records: Martin Jaggi
% AAAI 2024 conference paper. An arXiv preprint with the same title and authors is recorded as DBLP:journals/corr/abs-2305-17205.
@inproceedings{DBLP:conf/aaai/KossonFJ24,
  author    = {Atli Kosson and Dongyang Fan and Martin Jaggi},
  editor    = {Michael J. Wooldridge and Jennifer G. Dy and Sriraam Natarajan},
  title     = {Ghost Noise for Regularizing Deep Neural Networks},
  booktitle = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI} 2024, Thirty-Sixth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver, Canada},
  pages     = {13274--13282},
  publisher = {{AAAI} Press},
  year      = {2024},
  url       = {https://doi.org/10.1609/aaai.v38i12.29228},
  doi       = {10.1609/AAAI.V38I12.29228},
  timestamp = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/KossonFJ24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2402.02622). The model name is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2402-02622,
  author     = {Matteo Pagliardini and Amirkeivan Mohtashami and Fran{\c{c}}ois Fleuret and Martin Jaggi},
  title      = {{DenseFormer}: Enhancing Information Flow in Transformers via Depth Weighted Averaging},
  journal    = {CoRR},
  volume     = {abs/2402.02622},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.02622},
  doi        = {10.48550/ARXIV.2402.02622},
  eprinttype = {arXiv},
  eprint     = {2402.02622},
  timestamp  = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-02622.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2402.02933). The method name is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2402-02933,
  author     = {Vinitra Swamy and Julian Blackwell and Jibril Frej and Martin Jaggi and Tanja K{\"{a}}ser},
  title      = {{InterpretCC}: Conditional Computation for Inherently Interpretable Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2402.02933},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.02933},
  doi        = {10.48550/ARXIV.2402.02933},
  eprinttype = {arXiv},
  eprint     = {2402.02933},
  timestamp  = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-02933.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2402.04161). The proper noun "Markov" is brace-protected against sentence-casing styles.
@article{DBLP:journals/corr/abs-2402-04161,
  author     = {Ashok Vardhan Makkuva and Marco Bondaschi and Adway Girish and Alliot Nagle and Martin Jaggi and Hyeji Kim and Michael Gastpar},
  title      = {Attention with {Markov}: {A} Framework for Principled Analysis of Transformers via {Markov} Chains},
  journal    = {CoRR},
  volume     = {abs/2402.04161},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.04161},
  doi        = {10.48550/ARXIV.2402.04161},
  eprinttype = {arXiv},
  eprint     = {2402.04161},
  timestamp  = {Mon, 12 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-04161.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2402.13089). The acronym "MoE" is brace-protected against sentence-casing styles.
@article{DBLP:journals/corr/abs-2402-13089,
  author     = {Dongyang Fan and Bettina Messmer and Martin Jaggi},
  title      = {Towards an empirical understanding of {MoE} design choices},
  journal    = {CoRR},
  volume     = {abs/2402.13089},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2402.13089},
  doi        = {10.48550/ARXIV.2402.13089},
  eprinttype = {arXiv},
  eprint     = {2402.13089},
  timestamp  = {Thu, 21 Mar 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2402-13089.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Journal article, npj Digital Medicine, volume 6 (2023). The journal name is stored in full and the system name is brace-protected.
@article{DBLP:journals/npjdm/HeitmannGDDSGBCPMCRSLJGHHFBBHBB23,
  author    = {Julien Heitmann and Alban Glangetas and Jonathan Doenz and Juliane Dervaux and
               Deeksha M. Shama and Daniel Hinjos Garcia and Mohamed Rida Benissa and Aymeric Cantais and
               Alexandre Perez and Daniel M{\"{u}}ller and Tatjana Chavdarova and Isabelle Ruchonnet{-}Metrailler and
               Johan N. Siebert and Laurence Lacroix and Martin Jaggi and Alain Gervaix and
               Mary{-}Anne Hartley and Florence Hugon and Derrick Fassbind and Makura Barro and
               Georges Bediang and N. E. L. Hafidi and M. Bouskraoui and Idrissa Ba},
  title     = {{DeepBreath} - automated detection of respiratory pathology from lung auscultation in 572 pediatric outpatients across 5 countries},
  journal   = {npj Digital Medicine},
  volume    = {6},
  year      = {2023},
  url       = {https://doi.org/10.1038/s41746-023-00838-3},
  doi       = {10.1038/S41746-023-00838-3},
  timestamp = {Wed, 24 Jan 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/npjdm/HeitmannGDDSGBCPMCRSLJGHHFBBHBB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ACL 2023 conference paper (Volume 1: Long Papers).
@inproceedings{DBLP:conf/acl/BlinovaZJEB23,
  author    = {Sofia Blinova and Xinyu Zhou and Martin Jaggi and Carsten Eickhoff and Seyed Ali Bahrainian},
  editor    = {Anna Rogers and Jordan L. Boyd{-}Graber and Naoaki Okazaki},
  title     = {{SIMSUM:} Document-level Text Simplification via Simultaneous Summarization},
  booktitle = {Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), {ACL} 2023, Toronto, Canada, July 9-14, 2023},
  pages     = {9927--9944},
  publisher = {Association for Computational Linguistics},
  year      = {2023},
  url       = {https://doi.org/10.18653/v1/2023.acl-long.552},
  doi       = {10.18653/V1/2023.ACL-LONG.552},
  timestamp = {Thu, 10 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/acl/BlinovaZJEB23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% COLT 2023 conference paper (PMLR volume 195). An arXiv preprint with the same title and authors is recorded as DBLP:journals/corr/abs-2302-12808.
@inproceedings{DBLP:conf/colt/VladareanDJF23,
  author    = {Maria{-}Luiza Vladarean and Nikita Doikov and Martin Jaggi and Nicolas Flammarion},
  editor    = {Gergely Neu and Lorenzo Rosasco},
  title     = {Linearization Algorithms for Fully Composite Optimization},
  booktitle = {The Thirty Sixth Annual Conference on Learning Theory, {COLT} 2023, 12-15 July 2023, Bangalore, India},
  series    = {Proceedings of Machine Learning Research},
  volume    = {195},
  pages     = {3669--3695},
  publisher = {{PMLR}},
  year      = {2023},
  url       = {https://proceedings.mlr.press/v195/vladarean23a.html},
  timestamp = {Wed, 06 Sep 2023 17:49:05 +0200},
  biburl    = {https://dblp.org/rec/conf/colt/VladareanDJF23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2023 conference paper. An arXiv preprint with the same title and authors is recorded as DBLP:journals/corr/abs-2202-04414.
@inproceedings{DBLP:conf/iclr/PagliardiniJFK23,
  author    = {Matteo Pagliardini and Martin Jaggi and Fran{\c{c}}ois Fleuret and Sai Praneeth Karimireddy},
  title     = {Agree to Disagree: Diversity through Disagreement for Better Transferability},
  booktitle = {The Eleventh International Conference on Learning Representations, {ICLR} 2023, Kigali, Rwanda, May 1-5, 2023},
  publisher = {OpenReview.net},
  year      = {2023},
  url       = {https://openreview.net/pdf?id=K7CbYQbyYhY},
  timestamp = {Fri, 30 Jun 2023 14:38:38 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/PagliardiniJFK23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2023 conference paper (PMLR volume 202). "Hessians" is brace-protected so sentence-casing styles keep the capital.
@inproceedings{DBLP:conf/icml/DoikovCJ23,
  author    = {Nikita Doikov and El Mahdi Chayti and Martin Jaggi},
  editor    = {Andreas Krause and Emma Brunskill and Kyunghyun Cho and Barbara Engelhardt and Sivan Sabato and Jonathan Scarlett},
  title     = {Second-Order Optimization with Lazy {Hessians}},
  booktitle = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {202},
  pages     = {8138--8161},
  publisher = {{PMLR}},
  year      = {2023},
  url       = {https://proceedings.mlr.press/v202/doikov23a.html},
  timestamp = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/DoikovCJ23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICML 2023 conference paper (PMLR volume 202).
@inproceedings{DBLP:conf/icml/MohtashamiJS23,
  author    = {Amirkeivan Mohtashami and Martin Jaggi and Sebastian U. Stich},
  editor    = {Andreas Krause and Emma Brunskill and Kyunghyun Cho and Barbara Engelhardt and Sivan Sabato and Jonathan Scarlett},
  title     = {Special Properties of Gradient Descent with Large Learning Rates},
  booktitle = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {202},
  pages     = {25082--25104},
  publisher = {{PMLR}},
  year      = {2023},
  url       = {https://proceedings.mlr.press/v202/mohtashami23a.html},
  timestamp = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/MohtashamiJS23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper. An arXiv preprint with the same title and authors is recorded as DBLP:journals/corr/abs-2305-18497.
@inproceedings{DBLP:conf/nips/FanMJ23,
  author    = {Dongyang Fan and Celestine Mendler{-}D{\"{u}}nner and Martin Jaggi},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {Collaborative Learning via Prediction Consensus},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/065e259a1d2d955e63b99aac6a3a3081-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/FanMJ23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper.
@inproceedings{DBLP:conf/nips/KossonJ23,
  author    = {Atli Kosson and Martin Jaggi},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {Multiplication-Free Transformer Training via Piecewise Affine Operations},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/19df21cd4931bd0caaa4d8480e9a59cd-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/KossonJ23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper.
@inproceedings{DBLP:conf/nips/MohtashamiJ23,
  author    = {Amirkeivan Mohtashami and Martin Jaggi},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {Random-Access Infinite Context Length for Transformers},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/ab05dc8bf36a9f66edbff6992ec86f56-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/MohtashamiJ23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper.
@inproceedings{DBLP:conf/nips/PagliardiniPJF23,
  author    = {Matteo Pagliardini and Daniele Paliotta and Martin Jaggi and Fran{\c{c}}ois Fleuret},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {Fast Attention Over Long Sequences With Dynamic Sparse Flash Attention},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/bc222e8153a49c1b30a1b8ba96b35117-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/PagliardiniPJF23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2023 conference paper. An arXiv preprint by the same authors is recorded as DBLP:journals/corr/abs-2309-14118.
% The system name is spelled "MultiModN" (as in that preprint record) and brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/nips/SwamySFBVJKH23,
  author    = {Vinitra Swamy and Malika Satayeva and Jibril Frej and Thierry Bossy and Thijs Vogels and Martin Jaggi and Tanja K{\"{a}}ser and Mary{-}Anne Hartley},
  editor    = {Alice Oh and Tristan Naumann and Amir Globerson and Kate Saenko and Moritz Hardt and Sergey Levine},
  title     = {{MultiModN} - Multimodal, Multi-Task, Interpretable Modular Networks},
  booktitle = {Advances in Neural Information Processing Systems 36: Annual Conference on Neural Information Processing Systems 2023, NeurIPS 2023, New Orleans, LA, USA, December 10 - 16, 2023},
  year      = {2023},
  url       = {http://papers.nips.cc/paper\_files/paper/2023/hash/5951641ad71b0052cf776f9b71f18932-Abstract-Conference.html},
  timestamp = {Fri, 01 Mar 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/SwamySFBVJKH23.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2301.02151).
@article{DBLP:journals/corr/abs-2301-02151,
  author     = {Thijs Vogels and Hadrien Hendrikx and Martin Jaggi},
  title      = {Beyond spectral gap (extended): The role of the topology in decentralized learning},
  journal    = {CoRR},
  volume     = {abs/2301.02151},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2301.02151},
  doi        = {10.48550/ARXIV.2301.02151},
  eprinttype = {arXiv},
  eprint     = {2301.02151},
  timestamp  = {Tue, 10 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2301-02151.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2302.11962). The proper noun "Newton" is brace-protected against sentence-casing styles.
@article{DBLP:journals/corr/abs-2302-11962,
  author     = {El Mahdi Chayti and Nikita Doikov and Martin Jaggi},
  title      = {Unified Convergence Theory of Stochastic and Variance-Reduced Cubic {Newton} Methods},
  journal    = {CoRR},
  volume     = {abs/2302.11962},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.11962},
  doi        = {10.48550/ARXIV.2302.11962},
  eprinttype = {arXiv},
  eprint     = {2302.11962},
  timestamp  = {Tue, 28 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-11962.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2302.12808). Same title and authors as the COLT 2023 record DBLP:conf/colt/VladareanDJF23.
@article{DBLP:journals/corr/abs-2302-12808,
  author     = {Maria{-}Luiza Vladarean and Nikita Doikov and Martin Jaggi and Nicolas Flammarion},
  title      = {Linearization Algorithms for Fully Composite Optimization},
  journal    = {CoRR},
  volume     = {abs/2302.12808},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2302.12808},
  doi        = {10.48550/ARXIV.2302.12808},
  eprinttype = {arXiv},
  eprint     = {2302.12808},
  timestamp  = {Tue, 28 Feb 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2302-12808.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2305.16300).
@article{DBLP:journals/corr/abs-2305-16300,
  author     = {Amirkeivan Mohtashami and Martin Jaggi},
  title      = {Landmark Attention: Random-Access Infinite Context Length for Transformers},
  journal    = {CoRR},
  volume     = {abs/2305.16300},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.16300},
  doi        = {10.48550/ARXIV.2305.16300},
  eprinttype = {arXiv},
  eprint     = {2305.16300},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-16300.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2305.17190).
@article{DBLP:journals/corr/abs-2305-17190,
  author     = {Atli Kosson and Martin Jaggi},
  title      = {Hardware-Efficient Transformer Training via Piecewise Affine Operations},
  journal    = {CoRR},
  volume     = {abs/2305.17190},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.17190},
  doi        = {10.48550/ARXIV.2305.17190},
  eprinttype = {arXiv},
  eprint     = {2305.17190},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-17190.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2305.17205). Same title and authors as the AAAI 2024 record DBLP:conf/aaai/KossonFJ24.
@article{DBLP:journals/corr/abs-2305-17205,
  author     = {Atli Kosson and Dongyang Fan and Martin Jaggi},
  title      = {Ghost Noise for Regularizing Deep Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2305.17205},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.17205},
  doi        = {10.48550/ARXIV.2305.17205},
  eprinttype = {arXiv},
  eprint     = {2305.17205},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-17205.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2305.17212).
@article{DBLP:journals/corr/abs-2305-17212,
  author     = {Atli Kosson and Bettina Messmer and Martin Jaggi},
  title      = {Rotational Optimizers: Simple {\&} Robust {DNN} Training},
  journal    = {CoRR},
  volume     = {abs/2305.17212},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.17212},
  doi        = {10.48550/ARXIV.2305.17212},
  eprinttype = {arXiv},
  eprint     = {2305.17212},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-17212.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2305.18497). Same title and authors as the NeurIPS 2023 record DBLP:conf/nips/FanMJ23.
@article{DBLP:journals/corr/abs-2305-18497,
  author     = {Dongyang Fan and Celestine Mendler{-}D{\"{u}}nner and Martin Jaggi},
  title      = {Collaborative Learning via Prediction Consensus},
  journal    = {CoRR},
  volume     = {abs/2305.18497},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.18497},
  doi        = {10.48550/ARXIV.2305.18497},
  eprinttype = {arXiv},
  eprint     = {2305.18497},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-18497.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2305.19259).
@article{DBLP:journals/corr/abs-2305-19259,
  author     = {Anastasia Koloskova and Nikita Doikov and Sebastian U. Stich and Martin Jaggi},
  title      = {Shuffle {SGD} is Always Better than {SGD:} Improved Analysis of {SGD} with Arbitrary Data Orders},
  journal    = {CoRR},
  volume     = {abs/2305.19259},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2305.19259},
  doi        = {10.48550/ARXIV.2305.19259},
  eprinttype = {arXiv},
  eprint     = {2305.19259},
  timestamp  = {Wed, 07 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2305-19259.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2306.01160).
@article{DBLP:journals/corr/abs-2306-01160,
  author     = {Matteo Pagliardini and Daniele Paliotta and Martin Jaggi and Fran{\c{c}}ois Fleuret},
  title      = {Faster Causal Attention Over Large Sequences Through Sparse Flash Attention},
  journal    = {CoRR},
  volume     = {abs/2306.01160},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.01160},
  doi        = {10.48550/ARXIV.2306.01160},
  eprinttype = {arXiv},
  eprint     = {2306.01160},
  timestamp  = {Mon, 12 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-01160.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2306.08393).
@article{DBLP:journals/corr/abs-2306-08393,
  author     = {Mariel A. Werner and Lie He and Sai Praneeth Karimireddy and Michael I. Jordan and Martin Jaggi},
  title      = {Provably Personalized and Robust Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2306.08393},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2306.08393},
  doi        = {10.48550/ARXIV.2306.08393},
  eprinttype = {arXiv},
  eprint     = {2306.08393},
  timestamp  = {Sun, 18 Jun 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2306-08393.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2307.06966).
@article{DBLP:journals/corr/abs-2307-06966,
  author     = {Linara Adilova and Asja Fischer and Martin Jaggi},
  title      = {Layerwise Linear Mode Connectivity},
  journal    = {CoRR},
  volume     = {abs/2307.06966},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2307.06966},
  doi        = {10.48550/ARXIV.2307.06966},
  eprinttype = {arXiv},
  eprint     = {2307.06966},
  timestamp  = {Mon, 24 Jul 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2307-06966.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2309.14118). Same authors as the NeurIPS 2023 record DBLP:conf/nips/SwamySFBVJKH23.
% The system name is brace-protected against sentence-casing styles and separated from the dash by a space.
@article{DBLP:journals/corr/abs-2309-14118,
  author     = {Vinitra Swamy and Malika Satayeva and Jibril Frej and Thierry Bossy and Thijs Vogels and Martin Jaggi and Tanja K{\"{a}}ser and Mary{-}Anne Hartley},
  title      = {{MultiModN} - Multimodal, Multi-Task, Interpretable Modular Networks},
  journal    = {CoRR},
  volume     = {abs/2309.14118},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2309.14118},
  doi        = {10.48550/ARXIV.2309.14118},
  eprinttype = {arXiv},
  eprint     = {2309.14118},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2309-14118.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2310.10845). The model name is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2310-10845,
  author     = {Amirkeivan Mohtashami and Matteo Pagliardini and Martin Jaggi},
  title      = {{CoTFormer}: More Tokens With Attention Make Up For Less Depth},
  journal    = {CoRR},
  volume     = {abs/2310.10845},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.10845},
  doi        = {10.48550/ARXIV.2310.10845},
  eprinttype = {arXiv},
  eprint     = {2310.10845},
  timestamp  = {Thu, 26 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-10845.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2310.13033).
@article{DBLP:journals/corr/abs-2310-13033,
  author     = {Ashok Vardhan Makkuva and Marco Bondaschi and Thijs Vogels and Martin Jaggi and Hyeji Kim and Michael C. Gastpar},
  title      = {{LASER:} Linear Compression in Wireless Distributed Optimization},
  journal    = {CoRR},
  volume     = {abs/2310.13033},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.13033},
  doi        = {10.48550/ARXIV.2310.13033},
  eprinttype = {arXiv},
  eprint     = {2310.13033},
  timestamp  = {Fri, 27 Oct 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-13033.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2310.15389).
@article{DBLP:journals/corr/abs-2310-15389,
  author     = {Simin Fan and Martin Jaggi},
  title      = {Irreducible Curriculum for Language Model Pretraining},
  journal    = {CoRR},
  volume     = {abs/2310.15389},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.15389},
  doi        = {10.48550/ARXIV.2310.15389},
  eprinttype = {arXiv},
  eprint     = {2310.15389},
  timestamp  = {Tue, 31 Oct 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-15389.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2310.15393). The method name is brace-protected so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2310-15393,
  author     = {Simin Fan and Matteo Pagliardini and Martin Jaggi},
  title      = {{DoGE}: Domain Reweighting with Generalization Estimation},
  journal    = {CoRR},
  volume     = {abs/2310.15393},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2310.15393},
  doi        = {10.48550/ARXIV.2310.15393},
  eprinttype = {arXiv},
  eprint     = {2310.15393},
  timestamp  = {Tue, 31 Oct 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2310-15393.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2311.06724).
@article{DBLP:journals/corr/abs-2311-06724,
  author     = {Seyed Ali Bahrainian and Martin Jaggi and Carsten Eickhoff},
  title      = {Controllable Topic-Focused Abstractive Summarization},
  journal    = {CoRR},
  volume     = {abs/2311.06724},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.06724},
  doi        = {10.48550/ARXIV.2311.06724},
  eprinttype = {arXiv},
  eprint     = {2311.06724},
  timestamp  = {Wed, 15 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-06724.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2311.16079).
@article{DBLP:journals/corr/abs-2311-16079,
  author     = {Zeming Chen and Alejandro Hern{\'{a}}ndez{-}Cano and Angelika Romanou and Antoine Bonnet and
                Kyle Matoba and Francesco Salvi and Matteo Pagliardini and Simin Fan and
                Andreas K{\"{o}}pf and Amirkeivan Mohtashami and Alexandre Sallinen and Alireza Sakhaeirad and
                Vinitra Swamy and Igor Krawczuk and Deniz Bayazit and Axel Marmet and
                Syrielle Montariol and Mary{-}Anne Hartley and Martin Jaggi and Antoine Bosselut},
  title      = {{MEDITRON-70B:} Scaling Medical Pretraining for Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2311.16079},
  year       = {2023},
  url        = {https://doi.org/10.48550/arXiv.2311.16079},
  doi        = {10.48550/ARXIV.2311.16079},
  eprinttype = {arXiv},
  eprint     = {2311.16079},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2311-16079.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% AAAI 2022 conference paper.
@inproceedings{DBLP:conf/aaai/DandiBJ22,
  author    = {Yatin Dandi and Luis Barba and Martin Jaggi},
  title     = {Implicit Gradient Alignment in Distributed and Federated Learning},
  booktitle = {Thirty-Sixth {AAAI} Conference on Artificial Intelligence, {AAAI} 2022, Thirty-Fourth Conference on Innovative Applications of Artificial Intelligence, {IAAI} 2022, The Twelfth Symposium on Educational Advances in Artificial Intelligence, {EAAI} 2022, Virtual Event, February 22 - March 1, 2022},
  pages     = {6454--6462},
  publisher = {{AAAI} Press},
  year      = {2022},
  url       = {https://doi.org/10.1609/aaai.v36i6.20597},
  doi       = {10.1609/AAAI.V36I6.20597},
  timestamp = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl    = {https://dblp.org/rec/conf/aaai/DandiBJ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% AISTATS 2022 conference paper (PMLR volume 151).
@inproceedings{DBLP:conf/aistats/MohtashamiJS22,
  author    = {Amirkeivan Mohtashami and Martin Jaggi and Sebastian U. Stich},
  editor    = {Gustau Camps{-}Valls and Francisco J. R. Ruiz and Isabel Valera},
  title     = {Masked Training of Neural Networks with Partial Gradients},
  booktitle = {International Conference on Artificial Intelligence and Statistics, {AISTATS} 2022, 28-30 March 2022, Virtual Event},
  series    = {Proceedings of Machine Learning Research},
  volume    = {151},
  pages     = {5876--5890},
  publisher = {{PMLR}},
  year      = {2022},
  url       = {https://proceedings.mlr.press/v151/mohtashami22a.html},
  timestamp = {Sat, 30 Sep 2023 09:34:08 +0200},
  biburl    = {https://dblp.org/rec/conf/aistats/MohtashamiJS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% ICLR 2022 conference paper.
@inproceedings{DBLP:conf/iclr/KarimireddyHJ22,
  author    = {Sai Praneeth Karimireddy and Lie He and Martin Jaggi},
  title     = {Byzantine-Robust Learning on Heterogeneous Datasets via Bucketing},
  booktitle = {The Tenth International Conference on Learning Representations, {ICLR} 2022, Virtual Event, April 25-29, 2022},
  publisher = {OpenReview.net},
  year      = {2022},
  url       = {https://openreview.net/forum?id=jXKKDEi5vJt},
  timestamp = {Sat, 20 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/iclr/KarimireddyHJ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NAACL 2022 conference paper. An arXiv preprint with the same title and authors is recorded as DBLP:journals/corr/abs-2205-08184.
@inproceedings{DBLP:conf/naacl/MoiseevDAJ22,
  author    = {Fedor Moiseev and Zhe Dong and Enrique Alfonseca and Martin Jaggi},
  editor    = {Marine Carpuat and Marie{-}Catherine de Marneffe and Iv{\'{a}}n Vladimir Meza Ru{\'{\i}}z},
  title     = {{SKILL:} Structured Knowledge Infusion for Large Language Models},
  booktitle = {Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, {NAACL} 2022, Seattle, WA, United States, July 10-15, 2022},
  pages     = {1581--1588},
  publisher = {Association for Computational Linguistics},
  year      = {2022},
  url       = {https://doi.org/10.18653/v1/2022.naacl-main.113},
  doi       = {10.18653/V1/2022.NAACL-MAIN.113},
  timestamp = {Mon, 01 Aug 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/naacl/MoiseevDAJ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2022 conference paper. An arXiv preprint with the same title and authors is recorded as DBLP:journals/corr/abs-2206-08307.
% Editor given names are stored in full so the bibliography style decides whether to abbreviate them.
@inproceedings{DBLP:conf/nips/KoloskovaSJ22,
  author    = {Anastasia Koloskova and Sebastian U. Stich and Martin Jaggi},
  editor    = {Sanmi Koyejo and Shakir Mohamed and Alekh Agarwal and Danielle Belgrave and Kyunghyun Cho and Alice Oh},
  title     = {Sharper Convergence Guarantees for Asynchronous {SGD} for Distributed and Federated Learning},
  booktitle = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year      = {2022},
  url       = {http://papers.nips.cc/paper\_files/paper/2022/hash/6db3ea527f53682657b3d6b02a841340-Abstract-Conference.html},
  timestamp = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/KoloskovaSJ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2022 conference paper (the url points at the Datasets and Benchmarks abstract page).
% Editor given names are stored in full; the benchmark name is brace-protected against sentence-casing styles.
@inproceedings{DBLP:conf/nips/TerrailACGHLMMM22,
  author    = {Jean Ogier du Terrail and Samy{-}Safwan Ayed and Edwige Cyffers and Felix Grimberg and
               Chaoyang He and Regis Loeb and Paul Mangold and Tanguy Marchand and
               Othmane Marfoq and Erum Mushtaq and Boris Muzellec and Constantin Philippenko and
               Santiago Silva and Maria Telenczuk and Shadi Albarqouni and Salman Avestimehr and
               Aur{\'{e}}lien Bellet and Aymeric Dieuleveut and Martin Jaggi and Sai Praneeth Karimireddy and
               Marco Lorenzi and Giovanni Neglia and Marc Tommasi and Mathieu Andreux},
  editor    = {Sanmi Koyejo and Shakir Mohamed and Alekh Agarwal and Danielle Belgrave and Kyunghyun Cho and Alice Oh},
  title     = {{FLamby}: Datasets and Benchmarks for Cross-Silo Federated Learning in Realistic Healthcare Settings},
  booktitle = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year      = {2022},
  url       = {http://papers.nips.cc/paper\_files/paper/2022/hash/232eee8ef411a0a316efa298d7be3c2b-Abstract-Datasets\_and\_Benchmarks.html},
  timestamp = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/TerrailACGHLMMM22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% NeurIPS 2022 conference paper. An arXiv preprint by the same authors with the same title (up to capitalisation) is recorded as DBLP:journals/corr/abs-2206-03093.
% Editor given names are stored in full so the bibliography style decides whether to abbreviate them.
@inproceedings{DBLP:conf/nips/VogelsHJ22,
  author    = {Thijs Vogels and Hadrien Hendrikx and Martin Jaggi},
  editor    = {Sanmi Koyejo and Shakir Mohamed and Alekh Agarwal and Danielle Belgrave and Kyunghyun Cho and Alice Oh},
  title     = {Beyond spectral gap: the role of the topology in decentralized learning},
  booktitle = {Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022},
  year      = {2022},
  url       = {http://papers.nips.cc/paper\_files/paper/2022/hash/61162d94822d468ee6e92803340f2040-Abstract-Conference.html},
  timestamp = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/VogelsHJ22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2202.01545). Carries the arXiv DOI like the other CoRR records in this file.
@article{DBLP:journals/corr/abs-2202-01545,
  author     = {Lie He and Sai Praneeth Karimireddy and Martin Jaggi},
  title      = {Byzantine-Robust Decentralized Learning via Self-Centered Clipping},
  journal    = {CoRR},
  volume     = {abs/2202.01545},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.01545},
  doi        = {10.48550/ARXIV.2202.01545},
  eprinttype = {arXiv},
  eprint     = {2202.01545},
  timestamp  = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-01545.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2202.01838). Carries the arXiv DOI like the other CoRR records in this file.
@article{DBLP:journals/corr/abs-2202-01838,
  author     = {Amirkeivan Mohtashami and Sebastian U. Stich and Martin Jaggi},
  title      = {Characterizing {\&} Finding Good Data Orderings for Fast Convergence of Sequential Gradient Methods},
  journal    = {CoRR},
  volume     = {abs/2202.01838},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.01838},
  doi        = {10.48550/ARXIV.2202.01838},
  eprinttype = {arXiv},
  eprint     = {2202.01838},
  timestamp  = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-01838.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2202.04414). Same title and authors as the ICLR 2023 record DBLP:conf/iclr/PagliardiniJFK23.
% Carries the arXiv DOI like the other CoRR records in this file.
@article{DBLP:journals/corr/abs-2202-04414,
  author     = {Matteo Pagliardini and Martin Jaggi and Fran{\c{c}}ois Fleuret and Sai Praneeth Karimireddy},
  title      = {Agree to Disagree: Diversity through Disagreement for Better Transferability},
  journal    = {CoRR},
  volume     = {abs/2202.04414},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.04414},
  doi        = {10.48550/ARXIV.2202.04414},
  eprinttype = {arXiv},
  eprint     = {2202.04414},
  timestamp  = {Fri, 18 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-04414.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2202.05737). Carries the arXiv DOI like the other CoRR records in this file.
@article{DBLP:journals/corr/abs-2202-05737,
  author     = {Matteo Pagliardini and Gilberto Manunza and Martin Jaggi and Michael I. Jordan and Tatjana Chavdarova},
  title      = {Improving Generalization via Uncertainty Driven Perturbations},
  journal    = {CoRR},
  volume     = {abs/2202.05737},
  year       = {2022},
  url        = {https://arxiv.org/abs/2202.05737},
  doi        = {10.48550/ARXIV.2202.05737},
  eprinttype = {arXiv},
  eprint     = {2202.05737},
  timestamp  = {Fri, 18 Feb 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2202-05737.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint (CoRR abs/2204.06477).
@article{DBLP:journals/corr/abs-2204-06477,
  author     = {Yatin Dandi and Anastasia Koloskova and Martin Jaggi and Sebastian U. Stich},
  title      = {Data-heterogeneity-aware Mixing for Decentralized Learning},
  journal    = {CoRR},
  volume     = {abs/2204.06477},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2204.06477},
  doi        = {10.48550/ARXIV.2204.06477},
  eprinttype = {arXiv},
  eprint     = {2204.06477},
  timestamp  = {Tue, 19 Apr 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2204-06477.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 2205.08184 (CoRR, 2022), with DOI.
@article{DBLP:journals/corr/abs-2205-08184,
  author     = {Fedor Moiseev and
                Zhe Dong and
                Enrique Alfonseca and
                Martin Jaggi},
  title      = {{SKILL:} Structured Knowledge Infusion for Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2205.08184},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.08184},
  doi        = {10.48550/ARXIV.2205.08184},
  eprinttype = {arXiv},
  eprint     = {2205.08184},
  timestamp  = {Tue, 16 Aug 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-08184.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2205.15142 (CoRR, 2022), with DOI.
@article{DBLP:journals/corr/abs-2205-15142,
  author     = {Amirkeivan Mohtashami and
                Martin Jaggi and
                Sebastian U. Stich},
  title      = {On Avoiding Local Minima Using Gradient Descent With Large Learning Rates},
  journal    = {CoRR},
  volume     = {abs/2205.15142},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2205.15142},
  doi        = {10.48550/ARXIV.2205.15142},
  eprinttype = {arXiv},
  eprint     = {2205.15142},
  timestamp  = {Wed, 01 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2205-15142.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.03093 (CoRR, 2022), with DOI.
@article{DBLP:journals/corr/abs-2206-03093,
  author     = {Thijs Vogels and
                Hadrien Hendrikx and
                Martin Jaggi},
  title      = {Beyond spectral gap: The role of the topology in decentralized learning},
  journal    = {CoRR},
  volume     = {abs/2206.03093},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.03093},
  doi        = {10.48550/ARXIV.2206.03093},
  eprinttype = {arXiv},
  eprint     = {2206.03093},
  timestamp  = {Tue, 14 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-03093.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2206.08307 (CoRR, 2022), with DOI.
@article{DBLP:journals/corr/abs-2206-08307,
  author     = {Anastasia Koloskova and
                Sebastian U. Stich and
                Martin Jaggi},
  title      = {Sharper Convergence Guarantees for Asynchronous {SGD} for Distributed and Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2206.08307},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2206.08307},
  doi        = {10.48550/ARXIV.2206.08307},
  eprinttype = {arXiv},
  eprint     = {2206.08307},
  timestamp  = {Tue, 21 Jun 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2206-08307.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2210.04620 (CoRR, 2022), with DOI.
% The first author's compound surname is braced and given in "Last, First"
% form; written as plain "First Last", BibTeX reads the lowercase "du" as a
% von-particle and splits the surname.
% {FLamby} is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2210-04620,
  author     = {{Ogier du Terrail}, Jean and
                Samy{-}Safwan Ayed and
                Edwige Cyffers and
                Felix Grimberg and
                Chaoyang He and
                Regis Loeb and
                Paul Mangold and
                Tanguy Marchand and
                Othmane Marfoq and
                Erum Mushtaq and
                Boris Muzellec and
                Constantin Philippenko and
                Santiago Silva and
                Maria Telenczuk and
                Shadi Albarqouni and
                Salman Avestimehr and
                Aur{\'{e}}lien Bellet and
                Aymeric Dieuleveut and
                Martin Jaggi and
                Sai Praneeth Karimireddy and
                Marco Lorenzi and
                Giovanni Neglia and
                Marc Tommasi and
                Mathieu Andreux},
  title      = {{FLamby}: Datasets and Benchmarks for Cross-Silo Federated Learning in Realistic Healthcare Settings},
  journal    = {CoRR},
  volume     = {abs/2210.04620},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2210.04620},
  doi        = {10.48550/ARXIV.2210.04620},
  eprinttype = {arXiv},
  eprint     = {2210.04620},
  timestamp  = {Wed, 22 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2210-04620.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.06637 (CoRR, 2022), with DOI.
% The acronym {MoDN} is braced so sentence-casing styles keep its capitalisation.
@article{DBLP:journals/corr/abs-2211-06637,
  author     = {C{\'{e}}cile Trottet and
                Thijs Vogels and
                Martin Jaggi and
                Mary{-}Anne Hartley},
  title      = {Modular Clinical Decision Support Networks ({MoDN}) - Updatable, Interpretable, and Portable Predictions for Evolving Clinical Environments},
  journal    = {CoRR},
  volume     = {abs/2211.06637},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.06637},
  doi        = {10.48550/ARXIV.2211.06637},
  eprinttype = {arXiv},
  eprint     = {2211.06637},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-06637.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.10737 (CoRR, 2022), with DOI.
@article{DBLP:journals/corr/abs-2211-10737,
  author     = {Simla Burcu Harma and
                Canberk S{\"{o}}nmez and
                Babak Falsafi and
                Martin Jaggi and
                Yunho Oh},
  title      = {Accuracy Boosters: Epoch-Driven Mixed-Mantissa Block Floating-Point for {DNN} Training},
  journal    = {CoRR},
  volume     = {abs/2211.10737},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.10737},
  doi        = {10.48550/ARXIV.2211.10737},
  eprinttype = {arXiv},
  eprint     = {2211.10737},
  timestamp  = {Thu, 24 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-10737.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2211.10943 (CoRR, 2022), with DOI.
@article{DBLP:journals/corr/abs-2211-10943,
  author     = {Fr{\'{e}}d{\'{e}}ric Berdoz and
                Abhishek Singh and
                Martin Jaggi and
                Ramesh Raskar},
  title      = {Scalable Collaborative Learning via Representation Sharing},
  journal    = {CoRR},
  volume     = {abs/2211.10943},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2211.10943},
  doi        = {10.48550/ARXIV.2211.10943},
  eprinttype = {arXiv},
  eprint     = {2211.10943},
  timestamp  = {Thu, 24 Nov 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2211-10943.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2212.00781 (CoRR, 2022), with DOI.
% {Hessians} is braced so sentence-casing styles keep its capital H.
@article{DBLP:journals/corr/abs-2212-00781,
  author     = {Nikita Doikov and
                El Mahdi Chayti and
                Martin Jaggi},
  title      = {Second-order optimization with lazy {Hessians}},
  journal    = {CoRR},
  volume     = {abs/2212.00781},
  year       = {2022},
  url        = {https://doi.org/10.48550/arXiv.2212.00781},
  doi        = {10.48550/ARXIV.2212.00781},
  eprinttype = {arXiv},
  eprint     = {2212.00781},
  timestamp  = {Thu, 08 Dec 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2212-00781.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Found. Trends Mach. Learn. 14(1--2), 2021, pp. 1--210.
% "El Rouayheb" is braced and given in "Last, First" form; as plain
% "Salim El Rouayheb", BibTeX would take "El" as part of the given name.
% The issue range uses an en-dash (--), as page ranges do.
@article{DBLP:journals/ftml/KairouzMABBBBCC21,
  author     = {Peter Kairouz and
                H. Brendan McMahan and
                Brendan Avent and
                Aur{\'{e}}lien Bellet and
                Mehdi Bennis and
                Arjun Nitin Bhagoji and
                Kallista A. Bonawitz and
                Zachary Charles and
                Graham Cormode and
                Rachel Cummings and
                Rafael G. L. D'Oliveira and
                Hubert Eichner and
                {El Rouayheb}, Salim and
                David Evans and
                Josh Gardner and
                Zachary Garrett and
                Adri{\`{a}} Gasc{\'{o}}n and
                Badih Ghazi and
                Phillip B. Gibbons and
                Marco Gruteser and
                Za{\"{\i}}d Harchaoui and
                Chaoyang He and
                Lie He and
                Zhouyuan Huo and
                Ben Hutchinson and
                Justin Hsu and
                Martin Jaggi and
                Tara Javidi and
                Gauri Joshi and
                Mikhail Khodak and
                Jakub Kone{\v{c}}n{\'y} and
                Aleksandra Korolova and
                Farinaz Koushanfar and
                Sanmi Koyejo and
                Tancr{\`{e}}de Lepoint and
                Yang Liu and
                Prateek Mittal and
                Mehryar Mohri and
                Richard Nock and
                Ayfer {\"{O}}zg{\"{u}}r and
                Rasmus Pagh and
                Hang Qi and
                Daniel Ramage and
                Ramesh Raskar and
                Mariana Raykova and
                Dawn Song and
                Weikang Song and
                Sebastian U. Stich and
                Ziteng Sun and
                Ananda Theertha Suresh and
                Florian Tram{\`{e}}r and
                Praneeth Vepakomma and
                Jianyu Wang and
                Li Xiong and
                Zheng Xu and
                Qiang Yang and
                Felix X. Yu and
                Han Yu and
                Sen Zhao},
  title      = {Advances and Open Problems in Federated Learning},
  journal    = {Found. Trends Mach. Learn.},
  volume     = {14},
  number     = {1--2},
  pages      = {1--210},
  year       = {2021},
  url        = {https://doi.org/10.1561/2200000083},
  doi        = {10.1561/2200000083},
  timestamp  = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/ftml/KairouzMABBBBCC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Optim. Methods Softw. 36(1), 2021, pp. 20--44.
% The last author's surname carries a caron on the final c (Tak{\'{a}}{\v{c}}).
@article{DBLP:journals/oms/MaJCST21,
  author     = {Chenxin Ma and
                Martin Jaggi and
                Frank E. Curtis and
                Nathan Srebro and
                Martin Tak{\'{a}}{\v{c}}},
  title      = {An accelerated communication-efficient primal-dual optimization framework for structured machine learning},
  journal    = {Optim. Methods Softw.},
  volume     = {36},
  number     = {1},
  pages      = {20--44},
  year       = {2021},
  url        = {https://doi.org/10.1080/10556788.2019.1650361},
  doi        = {10.1080/10556788.2019.1650361},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/oms/MaJCST21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL/IJCNLP 2021 (Volume 1: Long Papers), pp. 2902--2913.
@inproceedings{DBLP:conf/acl/MaoGCJK20,
  author     = {Zhuoyuan Mao and
                Prakhar Gupta and
                Chenhui Chu and
                Martin Jaggi and
                Sadao Kurohashi},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {Lightweight Cross-Lingual Sentence Representation Learning},
  booktitle  = {Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual Event, August 1-6, 2021},
  pages      = {2902--2913},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.acl-long.226},
  doi        = {10.18653/V1/2021.ACL-LONG.226},
  timestamp  = {Mon, 09 Aug 2021 16:25:37 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/MaoGCJK20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ACL/IJCNLP 2021 (Volume 1: Long Papers), pp. 5241--5253.
@inproceedings{DBLP:conf/acl/GuptaJ20,
  author     = {Prakhar Gupta and
                Martin Jaggi},
  editor     = {Chengqing Zong and
                Fei Xia and
                Wenjie Li and
                Roberto Navigli},
  title      = {Obtaining Better Static Word Embeddings Using Contextual Embedding Models},
  booktitle  = {Proceedings of the 59th Annual Meeting of the Association for Computational Linguistics and the 11th International Joint Conference on Natural Language Processing, {ACL/IJCNLP} 2021, (Volume 1: Long Papers), Virtual Event, August 1-6, 2021},
  pages      = {5241--5253},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.acl-long.408},
  doi        = {10.18653/V1/2021.ACL-LONG.408},
  timestamp  = {Mon, 09 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/acl/GuptaJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2021 paper, PMLR vol. 130, pp. 3943--3951.
% The url points at the https address of the PMLR proceedings page.
@inproceedings{DBLP:conf/aistats/GhadikolaeiSJ21,
  author     = {Hossein Shokri Ghadikolaei and
                Sebastian U. Stich and
                Martin Jaggi},
  editor     = {Arindam Banerjee and
                Kenji Fukumizu},
  title      = {{LENA:} Communication-Efficient Distributed Learning with Self-Triggered Gradient Uploads},
  booktitle  = {The 24th International Conference on Artificial Intelligence and Statistics, {AISTATS} 2021, April 13-15, 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {130},
  pages      = {3943--3951},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {https://proceedings.mlr.press/v130/shokri-ghadikolaei21a.html},
  timestamp  = {Wed, 14 Apr 2021 16:51:37 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/GhadikolaeiSJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2021 paper, PMLR vol. 130, pp. 4042--4050.
% The url points at the https address of the PMLR proceedings page.
@inproceedings{DBLP:conf/aistats/StichMJ21,
  author     = {Sebastian U. Stich and
                Amirkeivan Mohtashami and
                Martin Jaggi},
  editor     = {Arindam Banerjee and
                Kenji Fukumizu},
  title      = {Critical Parameters for Scalable Distributed Learning with Large Batches and Asynchronous Updates},
  booktitle  = {The 24th International Conference on Artificial Intelligence and Statistics, {AISTATS} 2021, April 13-15, 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {130},
  pages      = {4042--4050},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {https://proceedings.mlr.press/v130/stich21a.html},
  timestamp  = {Wed, 14 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/StichMJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2021 paper, PMLR vol. 130, pp. 4087--4095.
% The url points at the https address of the PMLR proceedings page.
@inproceedings{DBLP:conf/aistats/KovalevKJRS21,
  author     = {Dmitry Kovalev and
                Anastasia Koloskova and
                Martin Jaggi and
                Peter Richt{\'{a}}rik and
                Sebastian U. Stich},
  editor     = {Arindam Banerjee and
                Kenji Fukumizu},
  title      = {A Linearly Convergent Algorithm for Decentralized Optimization: Sending Less Bits for Free!},
  booktitle  = {The 24th International Conference on Artificial Intelligence and Statistics, {AISTATS} 2021, April 13-15, 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {130},
  pages      = {4087--4095},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {https://proceedings.mlr.press/v130/kovalev21a.html},
  timestamp  = {Wed, 14 Apr 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/KovalevKJRS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Findings of ACL: EMNLP 2021, pp. 3341--3350.
@inproceedings{DBLP:conf/emnlp/BahrainianJE21,
  author     = {Seyed Ali Bahrainian and
                Martin Jaggi and
                Carsten Eickhoff},
  editor     = {Marie{-}Francine Moens and
                Xuanjing Huang and
                Lucia Specia and
                Scott Wen{-}tau Yih},
  title      = {Self-Supervised Neural Topic Modeling},
  booktitle  = {Findings of the Association for Computational Linguistics: {EMNLP} 2021, Virtual Event / Punta Cana, Dominican Republic, 16-20 November, 2021},
  pages      = {3341--3350},
  publisher  = {Association for Computational Linguistics},
  year       = {2021},
  url        = {https://doi.org/10.18653/v1/2021.findings-emnlp.284},
  doi        = {10.18653/V1/2021.FINDINGS-EMNLP.284},
  timestamp  = {Fri, 16 Feb 2024 08:27:36 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/BahrainianJE21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% HiPC 2021 paper (IEEE), pp. 31--41.
@inproceedings{DBLP:conf/hipc/WszolaJP21,
  author     = {Eliza Wszola and
                Martin Jaggi and
                Markus P{\"{u}}schel},
  title      = {Faster Parallel Training of Word Embeddings},
  booktitle  = {28th {IEEE} International Conference on High Performance Computing, Data, and Analytics, HiPC 2021, Bengaluru, India, December 17-20, 2021},
  pages      = {31--41},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/HiPC53243.2021.00017},
  doi        = {10.1109/HIPC53243.2021.00017},
  timestamp  = {Mon, 31 Jan 2022 09:34:30 +0100},
  biburl     = {https://dblp.org/rec/conf/hipc/WszolaJP21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICCV 2021 paper (IEEE), pp. 6599--6609.
@inproceedings{DBLP:conf/iccv/YukselSJC21,
  author     = {Oguz Kaan Y{\"{u}}ksel and
                Sebastian U. Stich and
                Martin Jaggi and
                Tatjana Chavdarova},
  title      = {Semantic Perturbations with Normalizing Flows for Improved Generalization},
  booktitle  = {2021 {IEEE/CVF} International Conference on Computer Vision, {ICCV} 2021, Montreal, QC, Canada, October 10-17, 2021},
  pages      = {6599--6609},
  publisher  = {{IEEE}},
  year       = {2021},
  url        = {https://doi.org/10.1109/ICCV48922.2021.00655},
  doi        = {10.1109/ICCV48922.2021.00655},
  timestamp  = {Fri, 11 Mar 2022 10:01:27 +0100},
  biburl     = {https://dblp.org/rec/conf/iccv/YukselSJC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper (OpenReview).
% The acronym {GANs} is braced so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/iclr/ChavdarovaPSFJ21,
  author     = {Tatjana Chavdarova and
                Matteo Pagliardini and
                Sebastian U. Stich and
                Fran{\c{c}}ois Fleuret and
                Martin Jaggi},
  title      = {Taming {GANs} with Lookahead-Minmax},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=ZW0yXJyNmoG},
  timestamp  = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/ChavdarovaPSFJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 paper (OpenReview).
@inproceedings{DBLP:conf/iclr/LeeATJ21,
  author     = {Namhoon Lee and
                Thalaiyasingam Ajanthan and
                Philip H. S. Torr and
                Martin Jaggi},
  title      = {Understanding the effects of data parallelism and sparsity on neural network training},
  booktitle  = {9th International Conference on Learning Representations, {ICLR} 2021, Virtual Event, Austria, May 3-7, 2021},
  publisher  = {OpenReview.net},
  year       = {2021},
  url        = {https://openreview.net/forum?id=rsogjAnYs4z},
  timestamp  = {Wed, 23 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/LeeATJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper, PMLR vol. 139, pp. 1836--1845.
% The url points at the https address of the PMLR proceedings page.
@inproceedings{DBLP:conf/icml/Cherubin0J21,
  author     = {Giovanni Cherubin and
                Konstantinos Chatzikokolakis and
                Martin Jaggi},
  editor     = {Marina Meila and
                Tong Zhang},
  title      = {Exact Optimization of Conformal Predictors via Incremental and Decremental Learning},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {1836--1845},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {https://proceedings.mlr.press/v139/cherubin21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/Cherubin0J21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper, PMLR vol. 139, pp. 5311--5319.
% {Byzantine} is braced so sentence-casing styles keep its capital B.
% The url points at the https address of the PMLR proceedings page.
@inproceedings{DBLP:conf/icml/KarimireddyHJ21,
  author     = {Sai Praneeth Karimireddy and
                Lie He and
                Martin Jaggi},
  editor     = {Marina Meila and
                Tong Zhang},
  title      = {Learning from History for {Byzantine} Robust Optimization},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {5311--5319},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {https://proceedings.mlr.press/v139/karimireddy21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/KarimireddyHJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper, PMLR vol. 139, pp. 5686--5696.
% The url points at the https address of the PMLR proceedings page.
@inproceedings{DBLP:conf/icml/00010KJS21,
  author     = {Lingjing Kong and
                Tao Lin and
                Anastasia Koloskova and
                Martin Jaggi and
                Sebastian U. Stich},
  editor     = {Marina Meila and
                Tong Zhang},
  title      = {Consensus Control for Decentralized Deep Learning},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {5686--5696},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {https://proceedings.mlr.press/v139/kong21a.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/00010KJS21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2021 paper, PMLR vol. 139, pp. 6654--6665.
% The url points at the https address of the PMLR proceedings page.
@inproceedings{DBLP:conf/icml/0004KSJ21,
  author     = {Tao Lin and
                Sai Praneeth Karimireddy and
                Sebastian U. Stich and
                Martin Jaggi},
  editor     = {Marina Meila and
                Tong Zhang},
  title      = {Quasi-global Momentum: Accelerating Decentralized Deep Learning on Heterogeneous Data},
  booktitle  = {Proceedings of the 38th International Conference on Machine Learning, {ICML} 2021, 18-24 July 2021, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {139},
  pages      = {6654--6665},
  publisher  = {{PMLR}},
  year       = {2021},
  url        = {https://proceedings.mlr.press/v139/lin21c.html},
  timestamp  = {Wed, 25 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/0004KSJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% MICRO '21 paper (ACM), pp. 421--433.
@inproceedings{DBLP:conf/micro/DrumondCZYFJ21,
  author     = {Mario Drumond and
                Louis Coulon and
                Arash Pourhabibi Zarandi and
                Ahmet Caner Y{\"{u}}z{\"{u}}g{\"{u}}ler and
                Babak Falsafi and
                Martin Jaggi},
  title      = {Equinox: Training (for Free) on a Custom Inference Accelerator},
  booktitle  = {{MICRO} '21: 54th Annual {IEEE/ACM} International Symposium on Microarchitecture, Virtual Event, Greece, October 18-22, 2021},
  pages      = {421--433},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3466752.3480057},
  doi        = {10.1145/3466752.3480057},
  timestamp  = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/micro/DrumondCZYFJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% DigiBiom workshop at MobiSys '21 (ACM), pp. 4--11.
@inproceedings{DBLP:conf/mobisys/MakhmutovaKFMJC21,
  author     = {Mariko Makhmutova and
                Raghu Kainkaryam and
                Marta Ferreira and
                Jae Min and
                Martin Jaggi and
                Ieuan Clay},
  title      = {Prediction of self-reported depression scores using person-generated health data from a virtual 1-year mental health observational study},
  booktitle  = {DigiBiom@MobiSys '21: Proceedings of the 2021 Workshop on Future of Digital Biomarkers, Virtual Event, Wisconsin, USA, 25 June, 2021},
  pages      = {4--11},
  publisher  = {{ACM}},
  year       = {2021},
  url        = {https://doi.org/10.1145/3469266.3469878},
  doi        = {10.1145/3469266.3469878},
  timestamp  = {Mon, 26 Jul 2021 11:37:29 +0200},
  biburl     = {https://dblp.org/rec/conf/mobisys/MakhmutovaKFMJC21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper, pp. 28004--28015.
% {RelaySum} is braced so sentence-casing styles keep its internal capital.
@inproceedings{DBLP:conf/nips/VogelsHKKLSJ21,
  author     = {Thijs Vogels and
                Lie He and
                Anastasia Koloskova and
                Sai Praneeth Karimireddy and
                Tao Lin and
                Sebastian U. Stich and
                Martin Jaggi},
  editor     = {Marc'Aurelio Ranzato and
                Alina Beygelzimer and
                Yann N. Dauphin and
                Percy Liang and
                Jennifer Wortman Vaughan},
  title      = {{RelaySum} for Decentralized Deep Learning on Heterogeneous Data},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {28004--28015},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/ebbdfea212e3a756a1fded7b35578525-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/VogelsHKKLSJ21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 paper, pp. 28663--28676.
@inproceedings{DBLP:conf/nips/KarimireddyJKMR21,
  author     = {Sai Praneeth Karimireddy and
                Martin Jaggi and
                Satyen Kale and
                Mehryar Mohri and
                Sashank J. Reddi and
                Sebastian U. Stich and
                Ananda Theertha Suresh},
  editor     = {Marc'Aurelio Ranzato and
                Alina Beygelzimer and
                Yann N. Dauphin and
                Percy Liang and
                Jennifer Wortman Vaughan},
  title      = {Breaking the centralized barrier for cross-device federated learning},
  booktitle  = {Advances in Neural Information Processing Systems 34: Annual Conference on Neural Information Processing Systems 2021, NeurIPS 2021, December 6-14, 2021, virtual},
  pages      = {28663--28676},
  year       = {2021},
  url        = {https://proceedings.neurips.cc/paper/2021/hash/f0e6be4ce76ccfa73c5a540d992d0756-Abstract.html},
  timestamp  = {Tue, 03 May 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/KarimireddyJKMR21.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.03236 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2102-03236,
  author     = {Giovanni Cherubin and
                Konstantinos Chatzikokolakis and
                Martin Jaggi},
  title      = {Exact Optimization of Conformal Predictors via Incremental and Decremental Learning},
  journal    = {CoRR},
  volume     = {abs/2102.03236},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.03236},
  eprinttype = {arXiv},
  eprint     = {2102.03236},
  timestamp  = {Wed, 10 Feb 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-03236.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.04761 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2102-04761,
  author     = {Tao Lin and
                Sai Praneeth Karimireddy and
                Sebastian U. Stich and
                Martin Jaggi},
  title      = {Quasi-Global Momentum: Accelerating Decentralized Deep Learning on Heterogeneous Data},
  journal    = {CoRR},
  volume     = {abs/2102.04761},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.04761},
  eprinttype = {arXiv},
  eprint     = {2102.04761},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-04761.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2102.04828 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2102-04828,
  author     = {Lingjing Kong and
                Tao Lin and
                Anastasia Koloskova and
                Martin Jaggi and
                Sebastian U. Stich},
  title      = {Consensus Control for Decentralized Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2102.04828},
  year       = {2021},
  url        = {https://arxiv.org/abs/2102.04828},
  eprinttype = {arXiv},
  eprint     = {2102.04828},
  timestamp  = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2102-04828.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2103.02351 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2103-02351,
  author     = {Sebastian U. Stich and
                Amirkeivan Mohtashami and
                Martin Jaggi},
  title      = {Critical Parameters for Scalable Distributed Learning with Large Batches and Asynchronous Updates},
  journal    = {CoRR},
  volume     = {abs/2103.02351},
  year       = {2021},
  url        = {https://arxiv.org/abs/2103.02351},
  eprinttype = {arXiv},
  eprint     = {2103.02351},
  timestamp  = {Thu, 04 Mar 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2103-02351.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2104.09994 (CoRR, 2021).
% The acronym {IoT} is braced so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-2104-09994,
  author     = {Valerian Rey and
                Pedro Miguel S{\'{a}}nchez S{\'{a}}nchez and
                Alberto Huertas Celdr{\'{a}}n and
                G{\'{e}}r{\^{o}}me Bovet and
                Martin Jaggi},
  title      = {Federated Learning for Malware Detection in {IoT} Devices},
  journal    = {CoRR},
  volume     = {abs/2104.09994},
  year       = {2021},
  url        = {https://arxiv.org/abs/2104.09994},
  eprinttype = {arXiv},
  eprint     = {2104.09994},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2104-09994.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2105.13856 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2105-13856,
  author     = {Zhuoyuan Mao and
                Prakhar Gupta and
                Chenhui Chu and
                Martin Jaggi and
                Sadao Kurohashi},
  title      = {Lightweight Cross-Lingual Sentence Representation Learning},
  journal    = {CoRR},
  volume     = {abs/2105.13856},
  year       = {2021},
  url        = {https://arxiv.org/abs/2105.13856},
  eprinttype = {arXiv},
  eprint     = {2105.13856},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2105-13856.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.04302 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2106-04302,
  author     = {Prakhar Gupta and
                Martin Jaggi},
  title      = {Obtaining Better Static Word Embeddings Using Contextual Embedding Models},
  journal    = {CoRR},
  volume     = {abs/2106.04302},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.04302},
  eprinttype = {arXiv},
  eprint     = {2106.04302},
  timestamp  = {Fri, 11 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-04302.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.08895 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2106-08895,
  author     = {Amirkeivan Mohtashami and
                Martin Jaggi and
                Sebastian U. Stich},
  title      = {Simultaneous Training of Partially Masked Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2106.08895},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.08895},
  eprinttype = {arXiv},
  eprint     = {2106.08895},
  timestamp  = {Tue, 29 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-08895.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2106.13897 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2106-13897,
  author     = {Yatin Dandi and
                Luis Barba and
                Martin Jaggi},
  title      = {Implicit Gradient Alignment in Distributed and Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2106.13897},
  year       = {2021},
  url        = {https://arxiv.org/abs/2106.13897},
  eprinttype = {arXiv},
  eprint     = {2106.13897},
  timestamp  = {Wed, 30 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2106-13897.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2107.06580 (CoRR, 2021).
% {IFedAvg} is braced so sentence-casing styles keep its mixed capitalisation.
@article{DBLP:journals/corr/abs-2107-06580,
  author     = {David Roschewitz and
                Mary{-}Anne Hartley and
                Luca Corinzia and
                Martin Jaggi},
  title      = {{IFedAvg}: Interpretable Data-Interoperability for Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2107.06580},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.06580},
  eprinttype = {arXiv},
  eprint     = {2107.06580},
  timestamp  = {Wed, 21 Jul 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-06580.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2107.06917 (CoRR, 2021).
% The compound surname "Ag\"uera y Arcas" is braced and given in "Last, First"
% form; written as plain "First Last", BibTeX reads the lowercase "y" as a
% von-particle and splits the surname.
@article{DBLP:journals/corr/abs-2107-06917,
  author     = {Jianyu Wang and
                Zachary Charles and
                Zheng Xu and
                Gauri Joshi and
                H. Brendan McMahan and
                {Ag{\"{u}}era y Arcas}, Blaise and
                Maruan Al{-}Shedivat and
                Galen Andrew and
                Salman Avestimehr and
                Katharine Daly and
                Deepesh Data and
                Suhas N. Diggavi and
                Hubert Eichner and
                Advait Gadhikar and
                Zachary Garrett and
                Antonious M. Girgis and
                Filip Hanzely and
                Andrew Hard and
                Chaoyang He and
                Samuel Horv{\'{a}}th and
                Zhouyuan Huo and
                Alex Ingerman and
                Martin Jaggi and
                Tara Javidi and
                Peter Kairouz and
                Satyen Kale and
                Sai Praneeth Karimireddy and
                Jakub Kone{\v{c}}n{\'y} and
                Sanmi Koyejo and
                Tian Li and
                Luyang Liu and
                Mehryar Mohri and
                Hang Qi and
                Sashank J. Reddi and
                Peter Richt{\'{a}}rik and
                Karan Singhal and
                Virginia Smith and
                Mahdi Soltanolkotabi and
                Weikang Song and
                Ananda Theertha Suresh and
                Sebastian U. Stich and
                Ameet Talwalkar and
                Hongyi Wang and
                Blake E. Woodworth and
                Shanshan Wu and
                Felix X. Yu and
                Honglin Yuan and
                Manzil Zaheer and
                Mi Zhang and
                Tong Zhang and
                Chunxiang Zheng and
                Chen Zhu and
                Wennan Zhu},
  title      = {A Field Guide to Federated Optimization},
  journal    = {CoRR},
  volume     = {abs/2107.06917},
  year       = {2021},
  url        = {https://arxiv.org/abs/2107.06917},
  eprinttype = {arXiv},
  eprint     = {2107.06917},
  timestamp  = {Wed, 06 Dec 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2107-06917.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2108.07958 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2108-07958,
  author     = {Oguz Kaan Y{\"{u}}ksel and
                Sebastian U. Stich and
                Martin Jaggi and
                Tatjana Chavdarova},
  title      = {Semantic Perturbations with Normalizing Flows for Improved Generalization},
  journal    = {CoRR},
  volume     = {abs/2108.07958},
  year       = {2021},
  url        = {https://arxiv.org/abs/2108.07958},
  eprinttype = {arXiv},
  eprint     = {2108.07958},
  timestamp  = {Mon, 23 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2108-07958.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2109.02388 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2109-02388,
  author     = {Sebastian Bischoff and
                Stephan G{\"{u}}nnemann and
                Martin Jaggi and
                Sebastian U. Stich},
  title      = {On Second-order Optimization Methods for Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2109.02388},
  year       = {2021},
  url        = {https://arxiv.org/abs/2109.02388},
  eprinttype = {arXiv},
  eprint     = {2109.02388},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2109-02388.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2110.04175 (CoRR, 2021).
% {RelaySum} is braced so sentence-casing styles keep its internal capital.
@article{DBLP:journals/corr/abs-2110-04175,
  author     = {Thijs Vogels and
                Lie He and
                Anastasia Koloskova and
                Tao Lin and
                Sai Praneeth Karimireddy and
                Sebastian U. Stich and
                Martin Jaggi},
  title      = {{RelaySum} for Decentralized Deep Learning on Heterogeneous Data},
  journal    = {CoRR},
  volume     = {abs/2110.04175},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.04175},
  eprinttype = {arXiv},
  eprint     = {2110.04175},
  timestamp  = {Thu, 21 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-04175.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2110.06978 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2110-06978,
  author     = {Martin Beaussart and
                Felix Grimberg and
                Mary{-}Anne Hartley and
                Martin Jaggi},
  title      = {{WAFFLE:} Weighted Averaging for Personalized Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2110.06978},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.06978},
  eprinttype = {arXiv},
  eprint     = {2110.06978},
  timestamp  = {Fri, 22 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-06978.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2110.12946 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2110-12946,
  author     = {Felix Grimberg and
                Mary{-}Anne Hartley and
                Sai Praneeth Karimireddy and
                Martin Jaggi},
  title      = {Optimal Model Averaging: Towards Personalized Collaborative Learning},
  journal    = {CoRR},
  volume     = {abs/2110.12946},
  year       = {2021},
  url        = {https://arxiv.org/abs/2110.12946},
  eprinttype = {arXiv},
  eprint     = {2110.12946},
  timestamp  = {Thu, 28 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2110-12946.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2111.05968 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2111-05968,
  author     = {El Mahdi Chayti and
                Sai Praneeth Karimireddy and
                Sebastian U. Stich and
                Nicolas Flammarion and
                Martin Jaggi},
  title      = {Linear Speedup in Personalized Collaborative Learning},
  journal    = {CoRR},
  volume     = {abs/2111.05968},
  year       = {2021},
  url        = {https://arxiv.org/abs/2111.05968},
  eprinttype = {arXiv},
  eprint     = {2111.05968},
  timestamp  = {Tue, 16 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-05968.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 2111.08546 (CoRR, 2021).
@article{DBLP:journals/corr/abs-2111-08546,
  author     = {Vinitra Swamy and
                Angelika Romanou and
                Martin Jaggi},
  title      = {Interpreting Language Models Through Knowledge Graph Extraction},
  journal    = {CoRR},
  volume     = {abs/2111.08546},
  year       = {2021},
  url        = {https://arxiv.org/abs/2111.08546},
  eprinttype = {arXiv},
  eprint     = {2111.08546},
  timestamp  = {Mon, 22 Nov 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2111-08546.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2112-08798,
  author     = {Futong Liu and Tao Lin and Martin Jaggi},
  title      = {Understanding Memorization from the Perspective of Optimization via Efficient Influence Estimation},
  journal    = {CoRR},
  volume     = {abs/2112.08798},
  year       = {2021},
  url        = {https://arxiv.org/abs/2112.08798},
  eprinttype = {arXiv},
  eprint     = {2112.08798},
  timestamp  = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2112-08798.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aistats/PedregosaNAJ20,
  author     = {Fabian Pedregosa and Geoffrey N{\'{e}}giar and Armin Askari and Martin Jaggi},
  editor     = {Silvia Chiappa and Roberto Calandra},
  title      = {Linearly Convergent {Frank-Wolfe} without Line-Search},
  booktitle  = {The 23rd International Conference on Artificial Intelligence and Statistics, {AISTATS} 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]},
  series     = {Proceedings of Machine Learning Research},
  volume     = {108},
  pages      = {1--10},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v108/pedregosa20a.html},
  timestamp  = {Mon, 29 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/PedregosaNAJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aistats/SinghHDJ20,
  author     = {Sidak Pal Singh and Andreas Hug and Aymeric Dieuleveut and Martin Jaggi},
  editor     = {Silvia Chiappa and Roberto Calandra},
  title      = {Context Mover's Distance {\&} Barycenters: Optimal Transport of Contexts for Building Representations},
  booktitle  = {The 23rd International Conference on Artificial Intelligence and Statistics, {AISTATS} 2020, 26-28 August 2020, Online [Palermo, Sicily, Italy]},
  series     = {Proceedings of Machine Learning Research},
  volume     = {108},
  pages      = {3437--3449},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v108/singh20a.html},
  timestamp  = {Mon, 29 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/SinghHDJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/emnlp/ZhaoLMJS20,
  author     = {Mengjie Zhao and Tao Lin and Fei Mi and Martin Jaggi and Hinrich Sch{\"{u}}tze},
  editor     = {Bonnie Webber and Trevor Cohn and Yulan He and Yang Liu},
  title      = {Masking as an Efficient Alternative to Finetuning for Pretrained Language Models},
  booktitle  = {Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing, {EMNLP} 2020, Online, November 16-20, 2020},
  pages      = {2226--2241},
  publisher  = {Association for Computational Linguistics},
  year       = {2020},
  url        = {https://doi.org/10.18653/v1/2020.emnlp-main.174},
  doi        = {10.18653/V1/2020.EMNLP-MAIN.174},
  timestamp  = {Wed, 23 Mar 2022 10:11:55 +0100},
  biburl     = {https://dblp.org/rec/conf/emnlp/ZhaoLMJS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/CordonnierLJ20,
  author     = {Jean{-}Baptiste Cordonnier and Andreas Loukas and Martin Jaggi},
  title      = {On the Relationship between Self-Attention and Convolutional Layers},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=HJlnC1rKPB},
  timestamp  = {Thu, 07 May 2020 17:11:47 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/CordonnierLJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/KoloskovaLSJ20,
  author     = {Anastasia Koloskova and Tao Lin and Sebastian U. Stich and Martin Jaggi},
  title      = {Decentralized Deep Learning with Arbitrary Communication Compression},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=SkgGCkrKvH},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/KoloskovaLSJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/LinSBDJ20,
  author     = {Tao Lin and Sebastian U. Stich and Luis Barba and Daniil Dmitriev and Martin Jaggi},
  title      = {Dynamic Model Pruning with Feedback},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=SJem8lSFwB},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/LinSBDJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/LinSPJ20,
  author     = {Tao Lin and Sebastian U. Stich and Kumar Kshitij Patel and Martin Jaggi},
  title      = {Don't Use Large Mini-batches, Use Local {SGD}},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=B1eyO1BFPr},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/LinSPJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/iclr/YuSJMS20,
  author     = {Kaicheng Yu and Christian Sciuto and Martin Jaggi and Claudiu Musat and Mathieu Salzmann},
  title      = {Evaluating The Search Phase of Neural Architecture Search},
  booktitle  = {8th International Conference on Learning Representations, {ICLR} 2020, Addis Ababa, Ethiopia, April 26-30, 2020},
  publisher  = {OpenReview.net},
  year       = {2020},
  url        = {https://openreview.net/forum?id=H1loF2NFwr},
  timestamp  = {Thu, 07 May 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/YuSJMS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/KoloskovaLBJS20,
  author     = {Anastasia Koloskova and Nicolas Loizou and Sadra Boreiri and Martin Jaggi and Sebastian U. Stich},
  title      = {A Unified Theory of Decentralized {SGD} with Changing Topology and Local Updates},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {5381--5393},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v119/koloskova20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/KoloskovaLBJS20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/LinKSJ20,
  author     = {Tao Lin and Lingjing Kong and Sebastian U. Stich and Martin Jaggi},
  title      = {Extrapolation for Large-batch Training in Deep Learning},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {6094--6104},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v119/lin20b.html},
  timestamp  = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LinKSJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/SivaprasadMVJF20,
  author     = {Prabhu Teja Sivaprasad and Florian Mai and Thijs Vogels and Martin Jaggi and Fran{\c{c}}ois Fleuret},
  title      = {Optimizer Benchmarking Needs to Account for Hyperparameter Tuning},
  booktitle  = {Proceedings of the 37th International Conference on Machine Learning, {ICML} 2020, 13-18 July 2020, Virtual Event},
  series     = {Proceedings of Machine Learning Research},
  volume     = {119},
  pages      = {9036--9045},
  publisher  = {{PMLR}},
  year       = {2020},
  url        = {https://proceedings.mlr.press/v119/sivaprasad20a.html},
  timestamp  = {Tue, 15 Dec 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/icml/SivaprasadMVJF20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/miccai/GrimbergHJK20,
  author     = {Felix Grimberg and Mary{-}Anne Hartley and Martin Jaggi and Sai Praneeth Karimireddy},
  editor     = {Shadi Albarqouni and Spyridon Bakas and Konstantinos Kamnitsas and M. Jorge Cardoso and Bennett A. Landman and Wenqi Li and Fausto Milletari and Nicola Rieke and Holger Roth and Daguang Xu and Ziyue Xu},
  title      = {Weight Erosion: An Update Aggregation Scheme for Personalized Collaborative Machine Learning},
  booktitle  = {Domain Adaptation and Representation Transfer, and Distributed and Collaborative Learning - Second {MICCAI} Workshop, {DART} 2020, and First {MICCAI} Workshop, {DCL} 2020, Held in Conjunction with {MICCAI} 2020, Lima, Peru, October 4-8, 2020, Proceedings},
  series     = {Lecture Notes in Computer Science},
  volume     = {12444},
  pages      = {160--169},
  publisher  = {Springer},
  year       = {2020},
  url        = {https://doi.org/10.1007/978-3-030-60548-3_16},
  doi        = {10.1007/978-3-030-60548-3_16},
  timestamp  = {Tue, 19 Jul 2022 10:23:16 +0200},
  biburl     = {https://dblp.org/rec/conf/miccai/GrimbergHJK20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/LinKSJ20,
  author     = {Tao Lin and Lingjing Kong and Sebastian U. Stich and Martin Jaggi},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Ensemble Distillation for Robust Model Fusion in Federated Learning},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/18df51b97ccd68128e994804f3eccc87-Abstract.html},
  timestamp  = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/LinKSJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/SinghJ20,
  author     = {Sidak Pal Singh and Martin Jaggi},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Model Fusion via Optimal Transport},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/fb2697869f56484404c8ceee2985b01d-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/SinghJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/VogelsKJ20,
  author     = {Thijs Vogels and Sai Praneeth Karimireddy and Martin Jaggi},
  editor     = {Hugo Larochelle and Marc'Aurelio Ranzato and Raia Hadsell and Maria{-}Florina Balcan and Hsuan{-}Tien Lin},
  title      = {Practical Low-Rank Communication Compression in Decentralized Deep Learning},
  booktitle  = {Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual},
  year       = {2020},
  url        = {https://proceedings.neurips.cc/paper/2020/hash/a376802c0811f1b9088828288eb0d3f0-Abstract.html},
  timestamp  = {Tue, 19 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/VogelsKJ20.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Shares its title and author list with DBLP:conf/icml/KoloskovaLBJS20 (ICML 2020);
% presumably the arXiv preprint of that paper -- confirm before citing both.
@article{DBLP:journals/corr/abs-2003-10422,
  author     = {Anastasia Koloskova and Nicolas Loizou and Sadra Boreiri and Martin Jaggi and Sebastian U. Stich},
  title      = {A Unified Theory of Decentralized {SGD} with Changing Topology and Local Updates},
  journal    = {CoRR},
  volume     = {abs/2003.10422},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.10422},
  eprinttype = {arXiv},
  eprint     = {2003.10422},
  timestamp  = {Tue, 24 Mar 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-10422.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2003-11316,
  author     = {Namhoon Lee and Philip H. S. Torr and Martin Jaggi},
  title      = {Data Parallelism in Training Sparse Neural Networks},
  journal    = {CoRR},
  volume     = {abs/2003.11316},
  year       = {2020},
  url        = {https://arxiv.org/abs/2003.11316},
  eprinttype = {arXiv},
  eprint     = {2003.11316},
  timestamp  = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2003-11316.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Shares its title with DBLP:conf/emnlp/ZhaoLMJS20 (EMNLP 2020), whose author list
% additionally includes Fei Mi; presumably the arXiv preprint -- confirm before citing both.
@article{DBLP:journals/corr/abs-2004-12406,
  author     = {Mengjie Zhao and Tao Lin and Martin Jaggi and Hinrich Sch{\"{u}}tze},
  title      = {Masking as an Efficient Alternative to Finetuning for Pretrained Language Models},
  journal    = {CoRR},
  volume     = {abs/2004.12406},
  year       = {2020},
  url        = {https://arxiv.org/abs/2004.12406},
  eprinttype = {arXiv},
  eprint     = {2004.12406},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2004-12406.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2006-04747,
  author     = {Lie He and Sai Praneeth Karimireddy and Martin Jaggi},
  title      = {Secure {Byzantine}-Robust Machine Learning},
  journal    = {CoRR},
  volume     = {abs/2006.04747},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.04747},
  eprinttype = {arXiv},
  eprint     = {2006.04747},
  timestamp  = {Fri, 12 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-04747.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Shares its title and author list with DBLP:conf/icml/LinKSJ20 (ICML 2020);
% presumably the arXiv preprint of that paper -- confirm before citing both.
@article{DBLP:journals/corr/abs-2006-05720,
  author     = {Tao Lin and Lingjing Kong and Sebastian U. Stich and Martin Jaggi},
  title      = {Extrapolation for Large-batch Training in Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2006.05720},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.05720},
  eprinttype = {arXiv},
  eprint     = {2006.05720},
  timestamp  = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-05720.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Shares its title and author list with DBLP:conf/nips/LinKSJ20 (NeurIPS 2020);
% presumably the arXiv preprint of that paper -- confirm before citing both.
@article{DBLP:journals/corr/abs-2006-07242,
  author     = {Tao Lin and Lingjing Kong and Sebastian U. Stich and Martin Jaggi},
  title      = {Ensemble Distillation for Robust Model Fusion in Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2006.07242},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.07242},
  eprinttype = {arXiv},
  eprint     = {2006.07242},
  timestamp  = {Mon, 14 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-07242.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Shares its title and author list with DBLP:conf/iclr/LinSBDJ20 (ICLR 2020);
% presumably the arXiv version of that paper -- confirm before citing both.
@article{DBLP:journals/corr/abs-2006-07253,
  author     = {Tao Lin and Sebastian U. Stich and Luis Barba and Daniil Dmitriev and Martin Jaggi},
  title      = {Dynamic Model Pruning with Feedback},
  journal    = {CoRR},
  volume     = {abs/2006.07253},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.07253},
  eprinttype = {arXiv},
  eprint     = {2006.07253},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-07253.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2006-09365,
  author     = {Lie He and Sai Praneeth Karimireddy and Martin Jaggi},
  title      = {Byzantine-Robust Learning on Heterogeneous Datasets via Resampling},
  journal    = {CoRR},
  volume     = {abs/2006.09365},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.09365},
  eprinttype = {arXiv},
  eprint     = {2006.09365},
  timestamp  = {Wed, 17 Jun 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-09365.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2006-14567,
  author     = {Tatjana Chavdarova and Matteo Pagliardini and Martin Jaggi and Fran{\c{c}}ois Fleuret},
  title      = {Taming {GANs} with Lookahead},
  journal    = {CoRR},
  volume     = {abs/2006.14567},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.14567},
  eprinttype = {arXiv},
  eprint     = {2006.14567},
  timestamp  = {Thu, 02 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-14567.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2006-16362,
  author     = {Jean{-}Baptiste Cordonnier and Andreas Loukas and Martin Jaggi},
  title      = {Multi-Head Attention: Collaborate Instead of Concatenate},
  journal    = {CoRR},
  volume     = {abs/2006.16362},
  year       = {2020},
  url        = {https://arxiv.org/abs/2006.16362},
  eprinttype = {arXiv},
  eprint     = {2006.16362},
  timestamp  = {Thu, 02 Jul 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2006-16362.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors as DBLP:conf/nips/VogelsKJ20 (NeurIPS 2020), whose title matches this one
% minus the "PowerGossip:" prefix; presumably the arXiv preprint -- confirm before citing both.
@article{DBLP:journals/corr/abs-2008-01425,
  author     = {Thijs Vogels and Sai Praneeth Karimireddy and Martin Jaggi},
  title      = {{PowerGossip}: Practical Low-Rank Communication Compression in Decentralized Deep Learning},
  journal    = {CoRR},
  volume     = {abs/2008.01425},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.01425},
  eprinttype = {arXiv},
  eprint     = {2008.01425},
  timestamp  = {Fri, 07 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-01425.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2008-03606,
  author     = {Sai Praneeth Karimireddy and Martin Jaggi and Satyen Kale and Mehryar Mohri and Sashank J. Reddi and Sebastian U. Stich and Ananda Theertha Suresh},
  title      = {Mime: Mimicking Centralized Stochastic Algorithms in Federated Learning},
  journal    = {CoRR},
  volume     = {abs/2008.03606},
  year       = {2020},
  url        = {https://arxiv.org/abs/2008.03606},
  eprinttype = {arXiv},
  eprint     = {2008.03606},
  timestamp  = {Fri, 14 Aug 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2008-03606.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2009-09271,
  author     = {Negar Foroutan Eghlidi and Martin Jaggi},
  title      = {Sparse Communication for Training Deep Networks},
  journal    = {CoRR},
  volume     = {abs/2009.09271},
  year       = {2020},
  url        = {https://arxiv.org/abs/2009.09271},
  eprinttype = {arXiv},
  eprint     = {2009.09271},
  timestamp  = {Wed, 23 Sep 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2009-09271.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2011-01697,
  author     = {Dmitry Kovalev and Anastasia Koloskova and Martin Jaggi and Peter Richt{\'{a}}rik and Sebastian U. Stich},
  title      = {A Linearly Convergent Algorithm for Decentralized Optimization: Sending Less Bits for Free!},
  journal    = {CoRR},
  volume     = {abs/2011.01697},
  year       = {2020},
  url        = {https://arxiv.org/abs/2011.01697},
  eprinttype = {arXiv},
  eprint     = {2011.01697},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2011-01697.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-2012-10333,
  author     = {Sai Praneeth Karimireddy and Lie He and Martin Jaggi},
  title      = {Learning from History for {Byzantine} Robust Optimization},
  journal    = {CoRR},
  volume     = {abs/2012.10333},
  year       = {2020},
  url        = {https://arxiv.org/abs/2012.10333},
  eprinttype = {arXiv},
  eprint     = {2012.10333},
  timestamp  = {Mon, 04 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2012-10333.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/mfc/LangovoyGJ19,
  author     = {Mikhail A. Langovoy and Akhilesh Gotmare and Martin Jaggi},
  title      = {Unsupervised robust nonparametric learning of hidden community properties},
  journal    = {Mathematical Foundations of Computing},
  volume     = {2},
  number     = {2},
  pages      = {127--147},
  year       = {2019},
  url        = {https://doi.org/10.3934/mfc.2019010},
  doi        = {10.3934/MFC.2019010},
  timestamp  = {Tue, 14 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/mfc/LangovoyGJ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aistats/KarimireddyKSJ19,
  author     = {Sai Praneeth Karimireddy and Anastasia Koloskova and Sebastian U. Stich and Martin Jaggi},
  editor     = {Kamalika Chaudhuri and Masashi Sugiyama},
  title      = {Efficient Greedy Coordinate Descent for Composite Problems},
  booktitle  = {The 22nd International Conference on Artificial Intelligence and Statistics, {AISTATS} 2019, 16-18 April 2019, Naha, Okinawa, Japan},
  series     = {Proceedings of Machine Learning Research},
  volume     = {89},
  pages      = {2887--2896},
  publisher  = {{PMLR}},
  year       = {2019},
  url        = {https://proceedings.mlr.press/v89/karimireddy19a.html},
  timestamp  = {Fri, 07 Jun 2019 09:03:47 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/KarimireddyKSJ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/hipc/WszolaMJP19,
  author     = {Eliza Wszola and Celestine Mendler{-}D{\"{u}}nner and Martin Jaggi and Markus P{\"{u}}schel},
  title      = {On Linear Learning with Manycore Processors},
  booktitle  = {26th {IEEE} International Conference on High Performance Computing, Data, and Analytics, HiPC 2019, Hyderabad, India, December 17-20, 2019},
  pages      = {184--194},
  publisher  = {{IEEE}},
  year       = {2019},
  url        = {https://doi.org/10.1109/HiPC.2019.00032},
  doi        = {10.1109/HIPC.2019.00032},
  timestamp  = {Thu, 20 Feb 2020 16:19:46 +0100},
  biburl     = {https://dblp.org/rec/conf/hipc/WszolaMJP19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and (up to capitalisation) same title as DBLP:conf/aistats/SinghHDJ20
% (AISTATS 2020); presumably the workshop version of that paper -- confirm before citing both.
@inproceedings{DBLP:conf/iclr/SinghHDJ19,
  author     = {Sidak Pal Singh and Andreas Hug and Aymeric Dieuleveut and Martin Jaggi},
  title      = {Context Mover's Distance {\&} Barycenters: Optimal transport of contexts for building representations},
  booktitle  = {Deep Generative Models for Highly Structured Data, {ICLR} 2019 Workshop, New Orleans, Louisiana, United States, May 6, 2019},
  publisher  = {OpenReview.net},
  year       = {2019},
  url        = {https://openreview.net/forum?id=rygiEL8FOV},
  timestamp  = {Thu, 25 Jul 2019 16:26:32 +0200},
  biburl     = {https://dblp.org/rec/conf/iclr/SinghHDJ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/BenyahiaYBJDSM19,
  author     = {Yassine Benyahia and Kaicheng Yu and Kamil Bennani{-}Smires and Martin Jaggi and Anthony C. Davison and Mathieu Salzmann and Claudiu Musat},
  editor     = {Kamalika Chaudhuri and Ruslan Salakhutdinov},
  title      = {Overcoming Multi-model Forgetting},
  booktitle  = {Proceedings of the 36th International Conference on Machine Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {97},
  pages      = {594--603},
  publisher  = {{PMLR}},
  year       = {2019},
  url        = {https://proceedings.mlr.press/v97/benyahia19a.html},
  timestamp  = {Tue, 11 Jun 2019 15:37:38 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/BenyahiaYBJDSM19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/KarimireddyRSJ19,
  author     = {Sai Praneeth Karimireddy and Quentin Rebjock and Sebastian U. Stich and Martin Jaggi},
  editor     = {Kamalika Chaudhuri and Ruslan Salakhutdinov},
  title      = {Error Feedback Fixes {SignSGD} and other Gradient Compression Schemes},
  booktitle  = {Proceedings of the 36th International Conference on Machine Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {97},
  pages      = {3252--3261},
  publisher  = {{PMLR}},
  year       = {2019},
  url        = {https://proceedings.mlr.press/v97/karimireddy19a.html},
  timestamp  = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/KarimireddyRSJ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/KoloskovaSJ19,
  author     = {Anastasia Koloskova and Sebastian U. Stich and Martin Jaggi},
  editor     = {Kamalika Chaudhuri and Ruslan Salakhutdinov},
  title      = {Decentralized Stochastic Optimization and Gossip Algorithms with Compressed Communication},
  booktitle  = {Proceedings of the 36th International Conference on Machine Learning, {ICML} 2019, 9-15 June 2019, Long Beach, California, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {97},
  pages      = {3478--3487},
  publisher  = {{PMLR}},
  year       = {2019},
  url        = {https://proceedings.mlr.press/v97/koloskova19a.html},
  timestamp  = {Tue, 11 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/KoloskovaSJ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/interspeech/SacchiNJC19,
  author     = {Niccol{\`{o}} Sacchi and Alexandre Nanchen and Martin Jaggi and Milos Cernak},
  editor     = {Gernot Kubin and Zdravko Kacic},
  title      = {Open-Vocabulary Keyword Spotting with Audio and Text Embeddings},
  booktitle  = {Interspeech 2019, 20th Annual Conference of the International Speech Communication Association, Graz, Austria, 15-19 September 2019},
  pages      = {3362--3366},
  publisher  = {{ISCA}},
  year       = {2019},
  url        = {https://doi.org/10.21437/Interspeech.2019-1846},
  doi        = {10.21437/INTERSPEECH.2019-1846},
  timestamp  = {Fri, 29 Jan 2021 17:41:10 +0100},
  biburl     = {https://dblp.org/rec/conf/interspeech/SacchiNJC19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/naacl/GuptaPJ19,
  author     = {Prakhar Gupta and Matteo Pagliardini and Martin Jaggi},
  editor     = {Jill Burstein and Christy Doran and Thamar Solorio},
  title      = {Better Word Embeddings by Disentangling Contextual n-Gram Information},
  booktitle  = {Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, {NAACL-HLT} 2019, Minneapolis, MN, USA, June 2-7, 2019, Volume 1 (Long and Short Papers)},
  pages      = {933--939},
  publisher  = {Association for Computational Linguistics},
  year       = {2019},
  url        = {https://doi.org/10.18653/v1/n19-1098},
  doi        = {10.18653/V1/N19-1098},
  timestamp  = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/GuptaPJ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/FranceschiDJ19,
  author     = {Jean{-}Yves Franceschi and Aymeric Dieuleveut and Martin Jaggi},
  editor     = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title      = {Unsupervised Scalable Representation Learning for Multivariate Time Series},
  booktitle  = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages      = {4652--4663},
  year       = {2019},
  url        = {https://proceedings.neurips.cc/paper/2019/hash/53c6de78244e9f528eb3e1cda69699bb-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/FranceschiDJ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/VogelsKJ19,
  author     = {Thijs Vogels and Sai Praneeth Karimireddy and Martin Jaggi},
  editor     = {Hanna M. Wallach and Hugo Larochelle and Alina Beygelzimer and Florence d'Alch{\'{e}}{-}Buc and Emily B. Fox and Roman Garnett},
  title      = {{PowerSGD}: Practical Low-Rank Gradient Compression for Distributed Optimization},
  booktitle  = {Advances in Neural Information Processing Systems 32: Annual Conference on Neural Information Processing Systems 2019, NeurIPS 2019, December 8-14, 2019, Vancouver, BC, Canada},
  pages      = {14236--14245},
  year       = {2019},
  url        = {https://proceedings.neurips.cc/paper/2019/hash/d9fbed9da256e344c1fa46bb46c34c5f-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/VogelsKJ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/smm4h/SchneuwlyGLCJ19,
  author     = {Arno Schneuwly and Ralf Grubenmann and S{\'{e}}verine Rion Logean and Mark Cieliebak and Martin Jaggi},
  editor     = {Davy Weissenbacher and Graciela Gonzalez{-}Hernandez},
  title      = {Correlating {Twitter} Language with Community-Level Health Outcomes},
  booktitle  = {Proceedings of the Fourth Social Media Mining for Health Application Workshop {\&} Shared Task, SMM4H@ACL 2019, Florence, Italy, August 2, 2019},
  pages      = {71--78},
  publisher  = {Association for Computational Linguistics},
  year       = {2019},
  url        = {https://doi.org/10.18653/v1/W19-3210},
  doi        = {10.18653/V1/W19-3210},
  timestamp  = {Mon, 22 Apr 2024 17:02:59 +0200},
  biburl     = {https://dblp.org/rec/conf/smm4h/SchneuwlyGLCJ19.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/wsdm/JosifoskiPPJ019,
  author     = {Martin Josifoski and Ivan S. Paskov and Hristo S. Paskov and Martin Jaggi and Robert West},
  editor     = {J. Shane Culpepper and Alistair Moffat and Paul N. Bennett and Kristina Lerman},
  title      = {Crosslingual Document Embedding as Reduced-Rank Ridge Regression},
  booktitle  = {Proceedings of the Twelfth {ACM} International Conference on Web Search and Data Mining, {WSDM} 2019, Melbourne, VIC, Australia, February 11-15, 2019},
  pages      = {744--752},
  publisher  = {{ACM}},
  year       = {2019},
  url        = {https://doi.org/10.1145/3289600.3291023},
  doi        = {10.1145/3289600.3291023},
  timestamp  = {Sat, 30 May 2020 20:02:29 +0200},
  biburl     = {https://dblp.org/rec/conf/wsdm/JosifoskiPPJ019.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Shares its title and author list with DBLP:conf/icml/KarimireddyRSJ19 (ICML 2019);
% presumably the arXiv preprint of that paper -- confirm before citing both.
@article{DBLP:journals/corr/abs-1901-09847,
  author     = {Sai Praneeth Karimireddy and Quentin Rebjock and Sebastian U. Stich and Martin Jaggi},
  title      = {Error Feedback Fixes {SignSGD} and other Gradient Compression Schemes},
  journal    = {CoRR},
  volume     = {abs/1901.09847},
  year       = {2019},
  url        = {https://arxiv.org/abs/1901.09847},
  eprinttype = {arXiv},
  eprint     = {1901.09847},
  timestamp  = {Sat, 02 Feb 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1901-09847.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Shares its title and author list with DBLP:conf/nips/FranceschiDJ19 (NeurIPS 2019);
% presumably the arXiv preprint of that paper -- confirm before citing both.
@article{DBLP:journals/corr/abs-1901-10738,
  author     = {Jean{-}Yves Franceschi and Aymeric Dieuleveut and Martin Jaggi},
  title      = {Unsupervised Scalable Representation Learning for Multivariate Time Series},
  journal    = {CoRR},
  volume     = {abs/1901.10738},
  year       = {2019},
  url        = {https://arxiv.org/abs/1901.10738},
  eprinttype = {arXiv},
  eprint     = {1901.10738},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1901-10738.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Shares its title and author list with DBLP:conf/icml/KoloskovaSJ19 (ICML 2019);
% presumably the arXiv preprint of that paper -- confirm before citing both.
@article{DBLP:journals/corr/abs-1902-00340,
  author     = {Anastasia Koloskova and Sebastian U. Stich and Martin Jaggi},
  title      = {Decentralized Stochastic Optimization and Gossip Algorithms with Compressed Communication},
  journal    = {CoRR},
  volume     = {abs/1902.00340},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.00340},
  eprinttype = {arXiv},
  eprint     = {1902.00340},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-00340.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors (in a different order) and same title (up to capitalisation) as
% DBLP:conf/iclr/YuSJMS20 (ICLR 2020); presumably its arXiv preprint -- confirm before citing both.
@article{DBLP:journals/corr/abs-1902-08142,
  author     = {Christian Sciuto and Kaicheng Yu and Martin Jaggi and Claudiu Musat and Mathieu Salzmann},
  title      = {Evaluating the Search Phase of Neural Architecture Search},
  journal    = {CoRR},
  volume     = {abs/1902.08142},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.08142},
  eprinttype = {arXiv},
  eprint     = {1902.08142},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-08142.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Same authors and (up to capitalisation) same title as DBLP:conf/icml/BenyahiaYBJDSM19
% (ICML 2019); presumably the arXiv preprint of that paper -- confirm before citing both.
@article{DBLP:journals/corr/abs-1902-08232,
  author     = {Yassine Benyahia and Kaicheng Yu and Kamil Bennani{-}Smires and Martin Jaggi and Anthony C. Davison and Mathieu Salzmann and Claudiu Musat},
  title      = {Overcoming Multi-Model Forgetting},
  journal    = {CoRR},
  volume     = {abs/1902.08232},
  year       = {2019},
  url        = {https://arxiv.org/abs/1902.08232},
  eprinttype = {arXiv},
  eprint     = {1902.08232},
  timestamp  = {Thu, 06 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-08232.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Author: the compound surname De Luca is written in "Last, First" form so BibTeX does not parse "De" as a given name.
@article{DBLP:journals/corr/abs-1902-09499,
  author     = {Matthias H{\"{u}}ser and Adrian K{\"{u}}ndig and Walter Karlen and De Luca, Valeria and Martin Jaggi},
  title      = {Forecasting intracranial hypertension using multi-scale waveform metrics},
  journal    = {CoRR},
  volume     = {abs/1902.09499},
  year       = {2019},
  url        = {http://arxiv.org/abs/1902.09499},
  eprinttype = {arXiv},
  eprint     = {1902.09499},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-09499.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: Tree-LSTM is brace-protected so sentence-casing styles keep the acronym's capitalisation.
@article{DBLP:journals/corr/abs-1902-09713,
  author     = {Khalil Mrini and Claudiu Musat and Michael Baeriswyl and Martin Jaggi},
  title      = {Structure {Tree-LSTM}: Structure-aware Attentional Document Encoders},
  journal    = {CoRR},
  volume     = {abs/1902.09713},
  year       = {2019},
  url        = {http://arxiv.org/abs/1902.09713},
  eprinttype = {arXiv},
  eprint     = {1902.09713},
  timestamp  = {Tue, 21 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1902-09713.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: SysML is brace-protected so sentence-casing styles do not render it as "Sysml".
% Author: the compound surname De Sa is written in "Last, First" form so BibTeX does not parse "De" as a given name.
@article{DBLP:journals/corr/abs-1904-03257,
  author     = {Alexander Ratner and Dan Alistarh and Gustavo Alonso and David G. Andersen and Peter Bailis and Sarah Bird and Nicholas Carlini and Bryan Catanzaro and Eric S. Chung and Bill Dally and Jeff Dean and Inderjit S. Dhillon and Alexandros G. Dimakis and Pradeep Dubey and Charles Elkan and Grigori Fursin and Gregory R. Ganger and Lise Getoor and Phillip B. Gibbons and Garth A. Gibson and Joseph E. Gonzalez and Justin Gottschlich and Song Han and Kim M. Hazelwood and Furong Huang and Martin Jaggi and Kevin G. Jamieson and Michael I. Jordan and Gauri Joshi and Rania Khalaf and Jason Knight and Jakub Kone{\v{c}}n{\'y} and Tim Kraska and Arun Kumar and Anastasios Kyrillidis and Jing Li and Samuel Madden and H. Brendan McMahan and Erik Meijer and Ioannis Mitliagkas and Rajat Monga and Derek Gordon Murray and Dimitris S. Papailiopoulos and Gennady Pekhimenko and Theodoros Rekatsinas and Afshin Rostamizadeh and Christopher R{\'{e}} and De Sa, Christopher and Hanie Sedghi and Siddhartha Sen and Virginia Smith and Alex Smola and Dawn Song and Evan R. Sparks and Ion Stoica and Vivienne Sze and Madeleine Udell and Joaquin Vanschoren and Shivaram Venkataraman and Rashmi Vinayak and Markus Weimer and Andrew Gordon Wilson and Eric P. Xing and Matei Zaharia and Ce Zhang and Ameet Talwalkar},
  title      = {{SysML}: The New Frontier of Machine Learning Systems},
  journal    = {CoRR},
  volume     = {abs/1904.03257},
  year       = {2019},
  url        = {http://arxiv.org/abs/1904.03257},
  eprinttype = {arXiv},
  eprint     = {1904.03257},
  timestamp  = {Fri, 11 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-03257.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1904-03922,
  author     = {Martin Josifoski and Ivan S. Paskov and Hristo S. Paskov and Martin Jaggi and Robert West},
  title      = {Crosslingual Document Embedding as Reduced-Rank Ridge Regression},
  journal    = {CoRR},
  volume     = {abs/1904.03922},
  year       = {2019},
  url        = {http://arxiv.org/abs/1904.03922},
  eprinttype = {arXiv},
  eprint     = {1904.03922},
  timestamp  = {Thu, 25 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-03922.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1904-05033,
  author     = {Prakhar Gupta and Matteo Pagliardini and Martin Jaggi},
  title      = {Better Word Embeddings by Disentangling Contextual n-Gram Information},
  journal    = {CoRR},
  volume     = {abs/1904.05033},
  year       = {2019},
  url        = {http://arxiv.org/abs/1904.05033},
  eprinttype = {arXiv},
  eprint     = {1904.05033},
  timestamp  = {Thu, 25 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1904-05033.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1905-00626,
  author     = {Eliza Wszola and Celestine Mendler{-}D{\"{u}}nner and Martin Jaggi and Markus P{\"{u}}schel},
  title      = {On Linear Learning with Manycore Processors},
  journal    = {CoRR},
  volume     = {abs/1905.00626},
  year       = {2019},
  url        = {http://arxiv.org/abs/1905.00626},
  eprinttype = {arXiv},
  eprint     = {1905.00626},
  timestamp  = {Mon, 27 May 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-00626.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: PowerSGD is brace-protected so sentence-casing styles do not render it as "Powersgd".
@article{DBLP:journals/corr/abs-1905-13727,
  author     = {Thijs Vogels and Sai Praneeth Karimireddy and Martin Jaggi},
  title      = {{PowerSGD}: Practical Low-Rank Gradient Compression for Distributed Optimization},
  journal    = {CoRR},
  volume     = {abs/1905.13727},
  year       = {2019},
  url        = {http://arxiv.org/abs/1905.13727},
  eprinttype = {arXiv},
  eprint     = {1905.13727},
  timestamp  = {Mon, 03 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1905-13727.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the proper noun Twitter is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/corr/abs-1906-06465,
  author     = {Arno Schneuwly and Ralf Grubenmann and S{\'{e}}verine Rion Logean and Mark Cieliebak and Martin Jaggi},
  title      = {Correlating {Twitter} Language with Community-Level Health Outcomes},
  journal    = {CoRR},
  volume     = {abs/1906.06465},
  year       = {2019},
  url        = {http://arxiv.org/abs/1906.06465},
  eprinttype = {arXiv},
  eprint     = {1906.06465},
  timestamp  = {Thu, 27 Jun 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1906-06465.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1907-09356,
  author     = {Anastasia Koloskova and Tao Lin and Sebastian U. Stich and Martin Jaggi},
  title      = {Decentralized Deep Learning with Arbitrary Communication Compression},
  journal    = {CoRR},
  volume     = {abs/1907.09356},
  year       = {2019},
  url        = {http://arxiv.org/abs/1907.09356},
  eprinttype = {arXiv},
  eprint     = {1907.09356},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1907-09356.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1910-05653,
  author     = {Sidak Pal Singh and Martin Jaggi},
  title      = {Model Fusion via Optimal Transport},
  journal    = {CoRR},
  volume     = {abs/1910.05653},
  year       = {2019},
  url        = {http://arxiv.org/abs/1910.05653},
  eprinttype = {arXiv},
  eprint     = {1910.05653},
  timestamp  = {Wed, 16 Oct 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-05653.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1910-11758,
  author     = {Prabhu Teja Sivaprasad and Florian Mai and Thijs Vogels and Martin Jaggi and Fran{\c{c}}ois Fleuret},
  title      = {On the Tunability of Optimizers in Deep Learning},
  journal    = {CoRR},
  volume     = {abs/1910.11758},
  year       = {2019},
  url        = {http://arxiv.org/abs/1910.11758},
  eprinttype = {arXiv},
  eprint     = {1910.11758},
  timestamp  = {Thu, 31 Oct 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1910-11758.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1911-03584,
  author     = {Jean{-}Baptiste Cordonnier and Andreas Loukas and Martin Jaggi},
  title      = {On the Relationship between Self-Attention and Convolutional Layers},
  journal    = {CoRR},
  volume     = {abs/1911.03584},
  year       = {2019},
  url        = {http://arxiv.org/abs/1911.03584},
  eprinttype = {arXiv},
  eprint     = {1911.03584},
  timestamp  = {Sun, 01 Dec 2019 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1911-03584.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Author: the compound surname El Rouayheb is written in "Last, First" form so BibTeX does not parse "El" as a given name.
@article{DBLP:journals/corr/abs-1912-04977,
  author     = {Peter Kairouz and H. Brendan McMahan and Brendan Avent and Aur{\'{e}}lien Bellet and Mehdi Bennis and Arjun Nitin Bhagoji and Kallista A. Bonawitz and Zachary Charles and Graham Cormode and Rachel Cummings and Rafael G. L. D'Oliveira and El Rouayheb, Salim and David Evans and Josh Gardner and Zachary Garrett and Adri{\`{a}} Gasc{\'{o}}n and Badih Ghazi and Phillip B. Gibbons and Marco Gruteser and Za{\"{\i}}d Harchaoui and Chaoyang He and Lie He and Zhouyuan Huo and Ben Hutchinson and Justin Hsu and Martin Jaggi and Tara Javidi and Gauri Joshi and Mikhail Khodak and Jakub Kone{\v{c}}n{\'y} and Aleksandra Korolova and Farinaz Koushanfar and Sanmi Koyejo and Tancr{\`{e}}de Lepoint and Yang Liu and Prateek Mittal and Mehryar Mohri and Richard Nock and Ayfer {\"{O}}zg{\"{u}}r and Rasmus Pagh and Mariana Raykova and Hang Qi and Daniel Ramage and Ramesh Raskar and Dawn Song and Weikang Song and Sebastian U. Stich and Ziteng Sun and Ananda Theertha Suresh and Florian Tram{\`{e}}r and Praneeth Vepakomma and Jianyu Wang and Li Xiong and Zheng Xu and Qiang Yang and Felix X. Yu and Han Yu and Sen Zhao},
  title      = {Advances and Open Problems in Federated Learning},
  journal    = {CoRR},
  volume     = {abs/1912.04977},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.04977},
  eprinttype = {arXiv},
  eprint     = {1912.04977},
  timestamp  = {Mon, 11 Jul 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-04977.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1912-12481,
  author     = {Ali Sabet and Prakhar Gupta and Jean{-}Baptiste Cordonnier and Robert West and Martin Jaggi},
  title      = {Robust Cross-lingual Embeddings from Parallel Sentences},
  journal    = {CoRR},
  volume     = {abs/1912.12481},
  year       = {2019},
  url        = {http://arxiv.org/abs/1912.12481},
  eprinttype = {arXiv},
  eprint     = {1912.12481},
  timestamp  = {Fri, 03 Jan 2020 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1912-12481.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/siamjo/dAspremontGJ18,
  author     = {Alexandre d'Aspremont and Crist{\'{o}}bal Guzm{\'{a}}n and Martin Jaggi},
  title      = {Optimal Affine-Invariant Smooth Minimization Algorithms},
  journal    = {{SIAM} J. Optim.},
  volume     = {28},
  number     = {3},
  pages      = {2384--2405},
  year       = {2018},
  url        = {https://doi.org/10.1137/17M1116842},
  doi        = {10.1137/17M1116842},
  timestamp  = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/siamjo/dAspremontGJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aistats/KarimireddySJ18,
  author     = {Sai Praneeth Reddy Karimireddy and Sebastian U. Stich and Martin Jaggi},
  editor     = {Amos J. Storkey and Fernando P{\'{e}}rez{-}Cruz},
  title      = {Adaptive balancing of gradient and update computation times using global geometry and approximate subproblems},
  booktitle  = {International Conference on Artificial Intelligence and Statistics, {AISTATS} 2018, 9-11 April 2018, Playa Blanca, Lanzarote, Canary Islands, Spain},
  series     = {Proceedings of Machine Learning Research},
  volume     = {84},
  pages      = {1204--1213},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v84/karimireddy18a.html},
  timestamp  = {Wed, 03 Apr 2019 18:17:22 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/KarimireddySJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/conll/Bennani-SmiresM18,
  author     = {Kamil Bennani{-}Smires and Claudiu Musat and Andreea Hossmann and Michael Baeriswyl and Martin Jaggi},
  editor     = {Anna Korhonen and Ivan Titov},
  title      = {Simple Unsupervised Keyphrase Extraction using Sentence Embeddings},
  booktitle  = {Proceedings of the 22nd Conference on Computational Natural Language Learning, CoNLL 2018, Brussels, Belgium, October 31 - November 1, 2018},
  pages      = {221--229},
  publisher  = {Association for Computational Linguistics},
  year       = {2018},
  url        = {https://doi.org/10.18653/v1/k18-1022},
  doi        = {10.18653/V1/K18-1022},
  timestamp  = {Sun, 12 Nov 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/conll/Bennani-SmiresM18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/DunnerLGBHJ18,
  author     = {Celestine D{\"{u}}nner and Aur{\'{e}}lien Lucchi and Matilde Gargiani and An Bian and Thomas Hofmann and Martin Jaggi},
  editor     = {Jennifer G. Dy and Andreas Krause},
  title      = {A Distributed Second-Order Algorithm You Can Trust},
  booktitle  = {Proceedings of the 35th International Conference on Machine Learning, {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July 10-15, 2018},
  series     = {Proceedings of Machine Learning Research},
  volume     = {80},
  pages      = {1357--1365},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v80/duenner18a.html},
  timestamp  = {Wed, 03 Apr 2019 18:17:30 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/DunnerLGBHJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/LocatelloRKRSSJ18,
  author     = {Francesco Locatello and Anant Raj and Sai Praneeth Karimireddy and Gunnar R{\"{a}}tsch and Bernhard Sch{\"{o}}lkopf and Sebastian U. Stich and Martin Jaggi},
  editor     = {Jennifer G. Dy and Andreas Krause},
  title      = {On Matching Pursuit and Coordinate Descent},
  booktitle  = {Proceedings of the 35th International Conference on Machine Learning, {ICML} 2018, Stockholmsm{\"{a}}ssan, Stockholm, Sweden, July 10-15, 2018},
  series     = {Proceedings of Machine Learning Research},
  volume     = {80},
  pages      = {3204--3213},
  publisher  = {{PMLR}},
  year       = {2018},
  url        = {http://proceedings.mlr.press/v80/locatello18a.html},
  timestamp  = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/LocatelloRKRSSJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/naacl/PagliardiniGJ18,
  author     = {Matteo Pagliardini and Prakhar Gupta and Martin Jaggi},
  editor     = {Marilyn A. Walker and Heng Ji and Amanda Stent},
  title      = {Unsupervised Learning of Sentence Embeddings Using Compositional n-Gram Features},
  booktitle  = {Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, {NAACL-HLT} 2018, New Orleans, Louisiana, USA, June 1-6, 2018, Volume 1 (Long Papers)},
  pages      = {528--540},
  publisher  = {Association for Computational Linguistics},
  year       = {2018},
  url        = {https://doi.org/10.18653/v1/n18-1049},
  doi        = {10.18653/V1/N18-1049},
  timestamp  = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/naacl/PagliardiniGJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the acronym DNNs is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/nips/DrumondLJF18,
  author     = {Mario Drumond and Tao Lin and Martin Jaggi and Babak Falsafi},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {Training {DNNs} with Hybrid Block Floating Point},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {451--461},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/6a9aeddfc689c1d0e3b9ccc3ab651bc5-Abstract.html},
  timestamp  = {Mon, 16 May 2022 15:41:51 +0200},
  biburl     = {https://dblp.org/rec/conf/nips/DrumondLJF18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/StichCJ18,
  author     = {Sebastian U. Stich and Jean{-}Baptiste Cordonnier and Martin Jaggi},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {Sparsified {SGD} with Memory},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {4452--4463},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/b440509a0106086a67bc2ea9df0a1dab-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/StichCJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/HeBJ18,
  author     = {Lie He and An Bian and Martin Jaggi},
  editor     = {Samy Bengio and Hanna M. Wallach and Hugo Larochelle and Kristen Grauman and Nicol{\`{o}} Cesa{-}Bianchi and Roman Garnett},
  title      = {{COLA:} Decentralized Linear Learning},
  booktitle  = {Advances in Neural Information Processing Systems 31: Annual Conference on Neural Information Processing Systems 2018, NeurIPS 2018, December 3-8, 2018, Montr{\'{e}}al, Canada},
  pages      = {4541--4551},
  year       = {2018},
  url        = {https://proceedings.neurips.cc/paper/2018/hash/05a70454516ecd9194c293b0e415777f-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/HeBJ18.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: EmbedRank is brace-protected so sentence-casing styles do not render it as "Embedrank".
@article{DBLP:journals/corr/abs-1801-04470,
  author     = {Kamil Bennani{-}Smires and Claudiu Musat and Martin Jaggi and Andreea Hossmann and Michael Baeriswyl},
  title      = {{EmbedRank}: Unsupervised Keyphrase Extraction using Sentence Embeddings},
  journal    = {CoRR},
  volume     = {abs/1801.04470},
  year       = {2018},
  url        = {http://arxiv.org/abs/1801.04470},
  eprinttype = {arXiv},
  eprint     = {1801.04470},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1801-04470.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1803-09539,
  author     = {Francesco Locatello and Anant Raj and Sai Praneeth Karimireddy and Gunnar R{\"{a}}tsch and Bernhard Sch{\"{o}}lkopf and Sebastian U. Stich and Martin Jaggi},
  title      = {Revisiting First-Order Convex Optimization Over Linear Spaces},
  journal    = {CoRR},
  volume     = {abs/1803.09539},
  year       = {2018},
  url        = {http://arxiv.org/abs/1803.09539},
  eprinttype = {arXiv},
  eprint     = {1803.09539},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1803-09539.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1804-01526,
  author     = {Mario Drumond and Tao Lin and Martin Jaggi and Babak Falsafi},
  title      = {End-to-End {DNN} Training with Block Floating Point Arithmetic},
  journal    = {CoRR},
  volume     = {abs/1804.01526},
  year       = {2018},
  url        = {http://arxiv.org/abs/1804.01526},
  eprinttype = {arXiv},
  eprint     = {1804.01526},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1804-01526.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the proper nouns Newton's and Lipschitz are brace-protected so sentence-casing styles keep their capitals.
@article{DBLP:journals/corr/abs-1806-00413,
  author     = {Sai Praneeth Karimireddy and Sebastian U. Stich and Martin Jaggi},
  title      = {Global linear convergence of {Newton's} method without strong-convexity or {Lipschitz} gradients},
  journal    = {CoRR},
  volume     = {abs/1806.00413},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.00413},
  eprinttype = {arXiv},
  eprint     = {1806.00413},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-00413.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1806-07569,
  author     = {Celestine D{\"{u}}nner and Aur{\'{e}}lien Lucchi and Matilde Gargiani and An Bian and Thomas Hofmann and Martin Jaggi},
  title      = {A Distributed Second-Order Algorithm You Can Trust},
  journal    = {CoRR},
  volume     = {abs/1806.07569},
  year       = {2018},
  url        = {http://arxiv.org/abs/1806.07569},
  eprinttype = {arXiv},
  eprint     = {1806.07569},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1806-07569.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1808-04883,
  author     = {Lie He and An Bian and Martin Jaggi},
  title      = {{COLA:} Communication-Efficient Decentralized Linear Learning},
  journal    = {CoRR},
  volume     = {abs/1808.04883},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.04883},
  eprinttype = {arXiv},
  eprint     = {1808.04883},
  timestamp  = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-04883.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1808-07217,
  author     = {Tao Lin and Sebastian U. Stich and Martin Jaggi},
  title      = {Don't Use Large Mini-Batches, Use Local {SGD}},
  journal    = {CoRR},
  volume     = {abs/1808.07217},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.07217},
  eprinttype = {arXiv},
  eprint     = {1808.07217},
  timestamp  = {Tue, 01 Jun 2021 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-07217.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1808-09663,
  author     = {Sidak Pal Singh and Andreas Hug and Aymeric Dieuleveut and Martin Jaggi},
  title      = {Wasserstein is all you need},
  journal    = {CoRR},
  volume     = {abs/1808.09663},
  year       = {2018},
  url        = {http://arxiv.org/abs/1808.09663},
  eprinttype = {arXiv},
  eprint     = {1808.09663},
  timestamp  = {Mon, 03 Sep 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1808-09663.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1809-07599,
  author     = {Sebastian U. Stich and Jean{-}Baptiste Cordonnier and Martin Jaggi},
  title      = {Sparsified {SGD} with Memory},
  journal    = {CoRR},
  volume     = {abs/1809.07599},
  year       = {2018},
  url        = {http://arxiv.org/abs/1809.07599},
  eprinttype = {arXiv},
  eprint     = {1809.07599},
  timestamp  = {Fri, 05 Oct 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1809-07599.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/abs-1810-06999,
  author     = {Sai Praneeth Karimireddy and Anastasia Koloskova and Sebastian U. Stich and Martin Jaggi},
  title      = {Efficient Greedy Coordinate Descent for Composite Problems},
  journal    = {CoRR},
  volume     = {abs/1810.06999},
  year       = {2018},
  url        = {http://arxiv.org/abs/1810.06999},
  eprinttype = {arXiv},
  eprint     = {1810.06999},
  timestamp  = {Thu, 01 Nov 2018 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1810-06999.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: CoCoA is brace-protected so sentence-casing styles do not render it as "Cocoa".
@article{DBLP:journals/jmlr/SmithFMTJJ17,
  author     = {Virginia Smith and Simone Forte and Chenxin Ma and Martin Tak{\'{a}}c and Michael I. Jordan and Martin Jaggi},
  title      = {{CoCoA}: {A} General Framework for Communication-Efficient Distributed Optimization},
  journal    = {J. Mach. Learn. Res.},
  volume     = {18},
  pages      = {230:1--230:49},
  year       = {2017},
  url        = {http://jmlr.org/papers/v18/16-512.html},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/jmlr/SmithFMTJJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/oms/MaKJSJRT17,
  author     = {Chenxin Ma and Jakub Kone{\v{c}}n{\'y} and Martin Jaggi and Virginia Smith and Michael I. Jordan and Peter Richt{\'{a}}rik and Martin Tak{\'{a}}c},
  title      = {Distributed optimization with arbitrary local solvers},
  journal    = {Optim. Methods Softw.},
  volume     = {32},
  number     = {4},
  pages      = {813--848},
  year       = {2017},
  url        = {https://doi.org/10.1080/10556788.2016.1278445},
  doi        = {10.1080/10556788.2016.1278445},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/oms/MaKJSJRT17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/tgrs/KaiserWLJHS17,
  author     = {Pascal Kaiser and Jan Dirk Wegner and Aur{\'{e}}lien Lucchi and Martin Jaggi and Thomas Hofmann and Konrad Schindler},
  title      = {Learning Aerial Image Segmentation From Online Maps},
  journal    = {{IEEE} Trans. Geosci. Remote. Sens.},
  volume     = {55},
  number     = {11},
  pages      = {6054--6068},
  year       = {2017},
  url        = {https://doi.org/10.1109/TGRS.2017.2719738},
  doi        = {10.1109/TGRS.2017.2719738},
  timestamp  = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/tgrs/KaiserWLJHS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the acronym LSTMs is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/acl/FangJA17,
  author     = {Tina Fang and Martin Jaggi and Katerina J. Argyraki},
  editor     = {Allyson Ettinger and Spandana Gella and Matthieu Labeau and Cecilia Ovesdotter Alm and Marine Carpuat and Mark Dredze},
  title      = {Generating Steganographic Text with {LSTMs}},
  booktitle  = {Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics, {ACL} 2017, Vancouver, Canada, July 30 - August 4, Student Research Workshop},
  pages      = {100--106},
  publisher  = {Association for Computational Linguistics},
  year       = {2017},
  url        = {https://doi.org/10.18653/v1/P17-3017},
  doi        = {10.18653/V1/P17-3017},
  timestamp  = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/acl/FangJA17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the eponym Frank-Wolfe is brace-protected so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/aistats/LocatelloKTJ17,
  author     = {Francesco Locatello and Rajiv Khanna and Michael Tschannen and Martin Jaggi},
  editor     = {Aarti Singh and Xiaojin (Jerry) Zhu},
  title      = {A Unified Optimization View on Generalized Matching Pursuit and {Frank-Wolfe}},
  booktitle  = {Proceedings of the 20th International Conference on Artificial Intelligence and Statistics, {AISTATS} 2017, 20-22 April 2017, Fort Lauderdale, FL, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {54},
  pages      = {860--868},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v54/locatello17a.html},
  timestamp  = {Wed, 29 May 2019 08:41:44 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/LocatelloKTJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/aistats/PerekrestenkoCJ17,
  author     = {Dmytro Perekrestenko and Volkan Cevher and Martin Jaggi},
  editor     = {Aarti Singh and Xiaojin (Jerry) Zhu},
  title      = {Faster Coordinate Descent via Adaptive Importance Sampling},
  booktitle  = {Proceedings of the 20th International Conference on Artificial Intelligence and Statistics, {AISTATS} 2017, 20-22 April 2017, Fort Lauderdale, FL, {USA}},
  series     = {Proceedings of Machine Learning Research},
  volume     = {54},
  pages      = {869--877},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v54/perekrestenko17a.html},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/aistats/PerekrestenkoCJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/icml/StichRJ17,
  author     = {Sebastian U. Stich and Anant Raj and Martin Jaggi},
  editor     = {Doina Precup and Yee Whye Teh},
  title      = {Approximate Steepest Coordinate Descent},
  booktitle  = {Proceedings of the 34th International Conference on Machine Learning, {ICML} 2017, Sydney, NSW, Australia, 6-11 August 2017},
  series     = {Proceedings of Machine Learning Research},
  volume     = {70},
  pages      = {3251--3259},
  publisher  = {{PMLR}},
  year       = {2017},
  url        = {http://proceedings.mlr.press/v70/stich17a.html},
  timestamp  = {Wed, 29 May 2019 08:41:45 +0200},
  biburl     = {https://dblp.org/rec/conf/icml/StichRJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/LocatelloTRJ17,
  author     = {Francesco Locatello and Michael Tschannen and Gunnar R{\"{a}}tsch and Martin Jaggi},
  editor     = {Isabelle Guyon and Ulrike von Luxburg and Samy Bengio and Hanna M. Wallach and Rob Fergus and S. V. N. Vishwanathan and Roman Garnett},
  title      = {Greedy Algorithms for Cone Constrained Optimization with Convergence Guarantees},
  booktitle  = {Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4-9, 2017, Long Beach, CA, {USA}},
  pages      = {773--784},
  year       = {2017},
  url        = {https://proceedings.neurips.cc/paper/2017/hash/63538fe6ef330c13a05a3ed7e599d5f7-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 13:58:27 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/LocatelloTRJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/DunnerPJ17,
  author     = {Celestine D{\"{u}}nner and Thomas P. Parnell and Martin Jaggi},
  editor     = {Isabelle Guyon and Ulrike von Luxburg and Samy Bengio and Hanna M. Wallach and Rob Fergus and S. V. N. Vishwanathan and Roman Garnett},
  title      = {Efficient Use of Limited-Memory Accelerators for Linear Learning on Heterogeneous Systems},
  booktitle  = {Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4-9, 2017, Long Beach, CA, {USA}},
  pages      = {4258--4267},
  year       = {2017},
  url        = {https://proceedings.neurips.cc/paper/2017/hash/e0f7a4d0ef9b84b83b693bbf3feb8e6e-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/DunnerPJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@inproceedings{DBLP:conf/nips/StichRJ17,
  author     = {Sebastian U. Stich and Anant Raj and Martin Jaggi},
  editor     = {Isabelle Guyon and Ulrike von Luxburg and Samy Bengio and Hanna M. Wallach and Rob Fergus and S. V. N. Vishwanathan and Roman Garnett},
  title      = {Safe Adaptive Importance Sampling},
  booktitle  = {Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems 2017, December 4-9, 2017, Long Beach, CA, {USA}},
  pages      = {4381--4391},
  year       = {2017},
  url        = {https://proceedings.neurips.cc/paper/2017/hash/1177967c7957072da3dc1db4ceb30e7a-Abstract.html},
  timestamp  = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/conf/nips/StichRJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Author: the compound surname De Luca is written in "Last, First" form so BibTeX does not parse "De" as a given name.
@inproceedings{DBLP:conf/www/DeriuLLSMCHJ17,
  author     = {Jan Deriu and Aur{\'{e}}lien Lucchi and De Luca, Valeria and Aliaksei Severyn and Simon M{\"{u}}ller and Mark Cieliebak and Thomas Hofmann and Martin Jaggi},
  editor     = {Rick Barrett and Rick Cummings and Eugene Agichtein and Evgeniy Gabrilovich},
  title      = {Leveraging Large Amounts of Weakly Supervised Data for Multi-Language Sentiment Classification},
  booktitle  = {Proceedings of the 26th International Conference on World Wide Web, {WWW} 2017, Perth, Australia, April 3-7, 2017},
  pages      = {1045--1052},
  publisher  = {{ACM}},
  year       = {2017},
  url        = {https://doi.org/10.1145/3038912.3052611},
  doi        = {10.1145/3038912.3052611},
  timestamp  = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/conf/www/DeriuLLSMCHJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Title: the eponym Frank-Wolfe is brace-protected so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/LocatelloKTJ17,
  author     = {Francesco Locatello and Rajiv Khanna and Michael Tschannen and Martin Jaggi},
  title      = {A Unified Optimization View on Generalized Matching Pursuit and {Frank-Wolfe}},
  journal    = {CoRR},
  volume     = {abs/1702.06457},
  year       = {2017},
  url        = {http://arxiv.org/abs/1702.06457},
  eprinttype = {arXiv},
  eprint     = {1702.06457},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LocatelloKTJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% Author: the compound surname De Luca is written in "Last, First" form so BibTeX does not parse "De" as a given name.
@article{DBLP:journals/corr/DeriuLLSMCHJ17,
  author     = {Jan Deriu and Aur{\'{e}}lien Lucchi and De Luca, Valeria and Aliaksei Severyn and Simon M{\"{u}}ller and Mark Cieliebak and Thomas Hofmann and Martin Jaggi},
  title      = {Leveraging Large Amounts of Weakly Supervised Data for Multi-Language Sentiment Classification},
  journal    = {CoRR},
  volume     = {abs/1703.02504},
  year       = {2017},
  url        = {http://arxiv.org/abs/1703.02504},
  eprinttype = {arXiv},
  eprint     = {1703.02504},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/DeriuLLSMCHJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
@article{DBLP:journals/corr/PagliardiniGJ17,
  author     = {Matteo Pagliardini and Prakhar Gupta and Martin Jaggi},
  title      = {Unsupervised Learning of Sentence Embeddings using Compositional n-Gram Features},
  journal    = {CoRR},
  volume     = {abs/1703.02507},
  year       = {2017},
  url        = {http://arxiv.org/abs/1703.02507},
  eprinttype = {arXiv},
  eprint     = {1703.02507},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/PagliardiniGJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}
% CoRR (arXiv) record, eprint 1703.02518.
@article{DBLP:journals/corr/PerekrestenkoCJ17,
  author     = {Dmytro Perekrestenko and Volkan Cevher and Martin Jaggi},
  title      = {Faster Coordinate Descent via Adaptive Importance Sampling},
  journal    = {CoRR},
  volume     = {abs/1703.02518},
  year       = {2017},
  url        = {http://arxiv.org/abs/1703.02518},
  eprinttype = {arXiv},
  eprint     = {1703.02518},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/PerekrestenkoCJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1705.10742.
% The acronym "LSTMs" is brace-protected so that sentence-casing
% bibliography styles do not lowercase it.
@article{DBLP:journals/corr/FangJA17,
  author     = {Tina Fang and Martin Jaggi and Katerina J. Argyraki},
  title      = {Generating Steganographic Text with {LSTMs}},
  journal    = {CoRR},
  volume     = {abs/1705.10742},
  year       = {2017},
  url        = {http://arxiv.org/abs/1705.10742},
  eprinttype = {arXiv},
  eprint     = {1705.10742},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/FangJA17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1705.11041.
@article{DBLP:journals/corr/LocatelloTRJ17,
  author     = {Francesco Locatello and Michael Tschannen and Gunnar R{\"{a}}tsch and Martin Jaggi},
  title      = {Greedy Algorithms for Cone Constrained Optimization with Convergence Guarantees},
  journal    = {CoRR},
  volume     = {abs/1705.11041},
  year       = {2017},
  url        = {http://arxiv.org/abs/1705.11041},
  eprinttype = {arXiv},
  eprint     = {1705.11041},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/LocatelloTRJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1706.08427.
@article{DBLP:journals/corr/StichRJ17,
  author     = {Sebastian U. Stich and Anant Raj and Martin Jaggi},
  title      = {Approximate Steepest Coordinate Descent},
  journal    = {CoRR},
  volume     = {abs/1706.08427},
  year       = {2017},
  url        = {http://arxiv.org/abs/1706.08427},
  eprinttype = {arXiv},
  eprint     = {1706.08427},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/StichRJ17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1707.03494.
@article{DBLP:journals/corr/LangovoyGJS17,
  author     = {Mikhail A. Langovoy and Akhilesh Gotmare and Martin Jaggi and Suvrit Sra},
  title      = {Unsupervised robust nonparametric learning of hidden community properties},
  journal    = {CoRR},
  volume     = {abs/1707.03494},
  year       = {2017},
  url        = {http://arxiv.org/abs/1707.03494},
  eprinttype = {arXiv},
  eprint     = {1707.03494},
  timestamp  = {Sat, 23 Jan 2021 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/LangovoyGJS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1707.06879.
@article{DBLP:journals/corr/KaiserWLJHS17,
  author     = {Pascal Kaiser and Jan Dirk Wegner and Aur{\'{e}}lien Lucchi and Martin Jaggi and Thomas Hofmann and Konrad Schindler},
  title      = {Learning Aerial Image Segmentation from Online Maps},
  journal    = {CoRR},
  volume     = {abs/1707.06879},
  year       = {2017},
  url        = {http://arxiv.org/abs/1707.06879},
  eprinttype = {arXiv},
  eprint     = {1707.06879},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/KaiserWLJHS17.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1708.05357.
@article{DBLP:journals/corr/abs-1708-05357,
  author     = {Celestine D{\"{u}}nner and Thomas P. Parnell and Martin Jaggi},
  title      = {Efficient Use of Limited-Memory Resources to Accelerate Linear Learning},
  journal    = {CoRR},
  volume     = {abs/1708.05357},
  year       = {2017},
  url        = {http://arxiv.org/abs/1708.05357},
  eprinttype = {arXiv},
  eprint     = {1708.05357},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1708-05357.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1711.02637.
@article{DBLP:journals/corr/abs-1711-02637,
  author     = {Sebastian U. Stich and Anant Raj and Martin Jaggi},
  title      = {Safe Adaptive Importance Sampling},
  journal    = {CoRR},
  volume     = {abs/1711.02637},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.02637},
  eprinttype = {arXiv},
  eprint     = {1711.02637},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-02637.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1711.05305.
@article{DBLP:journals/corr/abs-1711-05305,
  author     = {Chenxin Ma and Martin Jaggi and Frank E. Curtis and Nathan Srebro and Martin Tak{\'{a}}c},
  title      = {An Accelerated Communication-Efficient Primal-Dual Optimization Framework for Structured Machine Learning},
  journal    = {CoRR},
  volume     = {abs/1711.05305},
  year       = {2017},
  url        = {http://arxiv.org/abs/1711.05305},
  eprinttype = {arXiv},
  eprint     = {1711.05305},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1711-05305.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CLEF 2016 working-notes paper, published in CEUR Workshop Proceedings
% volume 1609.
@inproceedings{DBLP:conf/clef/SprengelJKH16,
  author    = {Elias Sprengel and Martin Jaggi and Yannic Kilcher and Thomas Hofmann},
  editor    = {Krisztian Balog and Linda Cappellato and Nicola Ferro and Craig Macdonald},
  title     = {Audio Based Bird Species Identification using Deep Learning Techniques},
  booktitle = {Working Notes of {CLEF} 2016 - Conference and Labs of the Evaluation forum, {\'{E}}vora, Portugal, 5-8 September, 2016},
  series    = {{CEUR} Workshop Proceedings},
  volume    = {1609},
  pages     = {547--559},
  publisher = {CEUR-WS.org},
  year      = {2016},
  url       = {https://ceur-ws.org/Vol-1609/16090547.pdf},
  timestamp = {Fri, 10 Mar 2023 16:23:40 +0100},
  biburl    = {https://dblp.org/rec/conf/clef/SprengelJKH16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2016 conference paper (JMLR Workshop and Conference Proceedings,
% volume 48). A CoRR record with the same title and authors exists under
% the key DBLP:journals/corr/DunnerFTJ16.
% The ordinal in booktitle is spelled "33rd" (the scraped record read "33nd").
@inproceedings{DBLP:conf/icml/DunnerFTJ16,
  author    = {Celestine D{\"{u}}nner and Simone Forte and Martin Tak{\'{a}}c and Martin Jaggi},
  editor    = {Maria{-}Florina Balcan and Kilian Q. Weinberger},
  title     = {Primal-Dual Rates and Certificates},
  booktitle = {Proceedings of the 33rd International Conference on Machine Learning, {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {48},
  pages     = {783--792},
  publisher = {JMLR.org},
  year      = {2016},
  url       = {http://proceedings.mlr.press/v48/dunner16.html},
  timestamp = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/DunnerFTJ16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SemEval 2016 workshop paper.
% The mixed-case names "SwissCheese" and "SemEval-2016" are brace-protected
% so that sentence-casing bibliography styles keep their capitalisation.
@inproceedings{DBLP:conf/semeval/DeriuGULLJ16,
  author    = {Jan Deriu and Maurice Gonzenbach and Fatih Uzdilli and Aur{\'{e}}lien Lucchi and Valeria De Luca and Martin Jaggi},
  editor    = {Steven Bethard and Daniel M. Cer and Marine Carpuat and David Jurgens and Preslav Nakov and Torsten Zesch},
  title     = {{SwissCheese} at {SemEval-2016} Task 4: Sentiment Classification Using an Ensemble of Convolutional Neural Networks with Distant Supervision},
  booktitle = {Proceedings of the 10th International Workshop on Semantic Evaluation, SemEval@NAACL-HLT 2016, San Diego, CA, USA, June 16-17, 2016},
  pages     = {1124--1128},
  publisher = {The Association for Computer Linguistics},
  year      = {2016},
  url       = {https://doi.org/10.18653/v1/s16-1173},
  doi       = {10.18653/V1/S16-1173},
  timestamp = {Wed, 07 Dec 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/semeval/DeriuGULLJ16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1602.04208.
@article{DBLP:journals/corr/KhannaTJ16,
  author     = {Rajiv Khanna and Michael Tschannen and Martin Jaggi},
  title      = {Pursuits in Structured Non-Convex Matrix Factorizations},
  journal    = {CoRR},
  volume     = {abs/1602.04208},
  year       = {2016},
  url        = {http://arxiv.org/abs/1602.04208},
  eprinttype = {arXiv},
  eprint     = {1602.04208},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/KhannaTJ16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1602.05205. Same title and authors as the
% ICML 2016 entry DBLP:conf/icml/DunnerFTJ16.
@article{DBLP:journals/corr/DunnerFTJ16,
  author     = {Celestine D{\"{u}}nner and Simone Forte and Martin Tak{\'{a}}c and Martin Jaggi},
  title      = {Primal-Dual Rates and Certificates},
  journal    = {CoRR},
  volume     = {abs/1602.05205},
  year       = {2016},
  url        = {http://arxiv.org/abs/1602.05205},
  eprinttype = {arXiv},
  eprint     = {1602.05205},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/DunnerFTJ16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1609.07478.
@article{DBLP:journals/corr/RajOGSJ16,
  author     = {Anant Raj and Jakob Olbrich and Bernd G{\"{a}}rtner and Bernhard Sch{\"{o}}lkopf and Martin Jaggi},
  title      = {Screening Rules for Convex Problems},
  journal    = {CoRR},
  volume     = {abs/1609.07478},
  year       = {2016},
  url        = {http://arxiv.org/abs/1609.07478},
  eprinttype = {arXiv},
  eprint     = {1609.07478},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/RajOGSJ16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1611.02189.
% The mixed-case name "CoCoA" is brace-protected so that sentence-casing
% bibliography styles do not turn it into "Cocoa".
@article{DBLP:journals/corr/SmithFMTJJ16,
  author     = {Virginia Smith and Simone Forte and Chenxin Ma and Martin Tak{\'{a}}c and Michael I. Jordan and Martin Jaggi},
  title      = {{CoCoA}: {A} General Framework for Communication-Efficient Distributed Optimization},
  journal    = {CoRR},
  volume     = {abs/1611.02189},
  year       = {2016},
  url        = {http://arxiv.org/abs/1611.02189},
  eprinttype = {arXiv},
  eprint     = {1611.02189},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/SmithFMTJJ16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2015 conference paper (JMLR Workshop and Conference Proceedings,
% volume 37). A CoRR record with the same title and authors exists under
% the key DBLP:journals/corr/MaSJJRT15.
@inproceedings{DBLP:conf/icml/MaSJJRT15,
  author    = {Chenxin Ma and Virginia Smith and Martin Jaggi and Michael I. Jordan and Peter Richt{\'{a}}rik and Martin Tak{\'{a}}c},
  editor    = {Francis R. Bach and David M. Blei},
  title     = {Adding vs. Averaging in Distributed Primal-Dual Optimization},
  booktitle = {Proceedings of the 32nd International Conference on Machine Learning, {ICML} 2015, Lille, France, 6-11 July 2015},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {37},
  pages     = {1973--1982},
  publisher = {JMLR.org},
  year      = {2015},
  url       = {http://proceedings.mlr.press/v37/mab15.html},
  timestamp = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/MaSJJRT15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2015 conference paper. A CoRR record with the same title and authors
% exists under the key DBLP:journals/corr/Lacoste-JulienJ15.
% "Frank-Wolfe" is brace-protected so that sentence-casing bibliography
% styles keep the capitalisation of the proper names.
@inproceedings{DBLP:conf/nips/Lacoste-JulienJ15,
  author    = {Simon Lacoste{-}Julien and Martin Jaggi},
  editor    = {Corinna Cortes and Neil D. Lawrence and Daniel D. Lee and Masashi Sugiyama and Roman Garnett},
  title     = {On the Global Linear Convergence of {Frank-Wolfe} Optimization Variants},
  booktitle = {Advances in Neural Information Processing Systems 28: Annual Conference on Neural Information Processing Systems 2015, December 7-12, 2015, Montreal, Quebec, Canada},
  pages     = {496--504},
  year      = {2015},
  url       = {https://proceedings.neurips.cc/paper/2015/hash/c058f544c737782deacefa532d9add4c-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/Lacoste-JulienJ15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SemEval 2015 workshop paper.
% The name "Swiss-Chocolate" is brace-protected so that sentence-casing
% bibliography styles do not lowercase its second component.
@inproceedings{DBLP:conf/semeval/UzdilliJEJDC15,
  author    = {Fatih Uzdilli and Martin Jaggi and Dominic Egger and Pascal Julmy and Leon Derczynski and Mark Cieliebak},
  editor    = {Daniel M. Cer and David Jurgens and Preslav Nakov and Torsten Zesch},
  title     = {{Swiss-Chocolate}: Combining Flipout Regularization and Random Forests with Artificially Built Subsystems to Boost Text-Classification for Sentiment},
  booktitle = {Proceedings of the 9th International Workshop on Semantic Evaluation, SemEval@NAACL-HLT 2015, Denver, Colorado, USA, June 4-5, 2015},
  pages     = {608--612},
  publisher = {The Association for Computer Linguistics},
  year      = {2015},
  url       = {https://doi.org/10.18653/v1/s15-2101},
  doi       = {10.18653/V1/S15-2101},
  timestamp = {Sat, 30 Sep 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/semeval/UzdilliJEJDC15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1502.03508. Same title and authors as the
% ICML 2015 entry DBLP:conf/icml/MaSJJRT15.
@article{DBLP:journals/corr/MaSJJRT15,
  author     = {Chenxin Ma and Virginia Smith and Martin Jaggi and Michael I. Jordan and Peter Richt{\'{a}}rik and Martin Tak{\'{a}}c},
  title      = {Adding vs. Averaging in Distributed Primal-Dual Optimization},
  journal    = {CoRR},
  volume     = {abs/1502.03508},
  year       = {2015},
  url        = {http://arxiv.org/abs/1502.03508},
  eprinttype = {arXiv},
  eprint     = {1502.03508},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/MaSJJRT15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1511.05932. Same authors as the NIPS 2015
% entry DBLP:conf/nips/Lacoste-JulienJ15.
% "Frank-Wolfe" is brace-protected so that sentence-casing bibliography
% styles keep the capitalisation of the proper names.
@article{DBLP:journals/corr/Lacoste-JulienJ15,
  author     = {Simon Lacoste{-}Julien and Martin Jaggi},
  title      = {On the Global Linear Convergence of {Frank-Wolfe} Optimization Variants},
  journal    = {CoRR},
  volume     = {abs/1511.05932},
  year       = {2015},
  url        = {http://arxiv.org/abs/1511.05932},
  eprinttype = {arXiv},
  eprint     = {1511.05932},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/Lacoste-JulienJ15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1512.04011.
@article{DBLP:journals/corr/SmithFJJ15,
  author     = {Virginia Smith and Simone Forte and Michael I. Jordan and Martin Jaggi},
  title      = {L1-Regularized Distributed Optimization: {A} Communication-Efficient Primal-Dual Framework},
  journal    = {CoRR},
  volume     = {abs/1512.04011},
  year       = {2015},
  url        = {http://arxiv.org/abs/1512.04011},
  eprinttype = {arXiv},
  eprint     = {1512.04011},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/SmithFJJ15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1512.04039.
@article{DBLP:journals/corr/MaKJSJRT15,
  author     = {Chenxin Ma and Jakub Kone{\v{c}}n{\'y} and Martin Jaggi and Virginia Smith and Michael I. Jordan and Peter Richt{\'{a}}rik and Martin Tak{\'{a}}c},
  title      = {Distributed Optimization with Arbitrary Local Solvers},
  journal    = {CoRR},
  volume     = {abs/1512.04039},
  year       = {2015},
  url        = {http://arxiv.org/abs/1512.04039},
  eprinttype = {arXiv},
  eprint     = {1512.04039},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/MaKJSJRT15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% NIPS 2014 conference paper. A CoRR record with the same title and authors
% exists under the key DBLP:journals/corr/JaggiSTTKHJ14.
@inproceedings{DBLP:conf/nips/JaggiSTTKHJ14,
  author    = {Martin Jaggi and Virginia Smith and Martin Tak{\'{a}}c and Jonathan Terhorst and Sanjay Krishnan and Thomas Hofmann and Michael I. Jordan},
  editor    = {Zoubin Ghahramani and Max Welling and Corinna Cortes and Neil D. Lawrence and Kilian Q. Weinberger},
  title     = {Communication-Efficient Distributed Dual Coordinate Ascent},
  booktitle = {Advances in Neural Information Processing Systems 27: Annual Conference on Neural Information Processing Systems 2014, December 8-13 2014, Montreal, Quebec, Canada},
  pages     = {3068--3076},
  year      = {2014},
  url       = {https://proceedings.neurips.cc/paper/2014/hash/894b77f805bd94d292574c38c5d628d5-Abstract.html},
  timestamp = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/nips/JaggiSTTKHJ14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% SemEval 2014 workshop paper.
% "Swiss-Chocolate" and the acronym "SVMs" are brace-protected so that
% sentence-casing bibliography styles keep their capitalisation.
@inproceedings{DBLP:conf/semeval/JaggiUC14,
  author    = {Martin Jaggi and Fatih Uzdilli and Mark Cieliebak},
  editor    = {Preslav Nakov and Torsten Zesch},
  title     = {{Swiss-Chocolate}: Sentiment Detection using Sparse {SVMs} and Part-Of-Speech n-Grams},
  booktitle = {Proceedings of the 8th International Workshop on Semantic Evaluation, SemEval@COLING 2014, Dublin, Ireland, August 23-24, 2014},
  pages     = {601--604},
  publisher = {The Association for Computer Linguistics},
  year      = {2014},
  url       = {https://doi.org/10.3115/v1/s14-2105},
  doi       = {10.3115/V1/S14-2105},
  timestamp = {Fri, 06 Aug 2021 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/semeval/JaggiUC14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1409.1458. Same title and authors as the
% NIPS 2014 entry DBLP:conf/nips/JaggiSTTKHJ14.
@article{DBLP:journals/corr/JaggiSTTKHJ14,
  author     = {Martin Jaggi and Virginia Smith and Martin Tak{\'{a}}c and Jonathan Terhorst and Sanjay Krishnan and Thomas Hofmann and Michael I. Jordan},
  title      = {Communication-Efficient Distributed Dual Coordinate Ascent},
  journal    = {CoRR},
  volume     = {abs/1409.1458},
  year       = {2014},
  url        = {http://arxiv.org/abs/1409.1458},
  eprinttype = {arXiv},
  eprint     = {1409.1458},
  timestamp  = {Wed, 11 Jan 2023 00:00:00 +0100},
  biburl     = {https://dblp.org/rec/journals/corr/JaggiSTTKHJ14.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2013 conference paper (JMLR Workshop and Conference Proceedings,
% volume 28).
% "Frank-Wolfe" and the acronym "SVMs" are brace-protected so that
% sentence-casing bibliography styles keep their capitalisation.
@inproceedings{DBLP:conf/icml/Lacoste-JulienJSP13,
  author    = {Simon Lacoste{-}Julien and Martin Jaggi and Mark Schmidt and Patrick Pletscher},
  title     = {Block-Coordinate {Frank-Wolfe} Optimization for Structural {SVMs}},
  booktitle = {Proceedings of the 30th International Conference on Machine Learning, {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {28},
  pages     = {53--61},
  publisher = {JMLR.org},
  year      = {2013},
  url       = {http://proceedings.mlr.press/v28/lacoste-julien13.html},
  timestamp = {Thu, 23 Apr 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/Lacoste-JulienJSP13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2013 conference paper (JMLR Workshop and Conference Proceedings,
% volume 28).
% "Frank-Wolfe" is brace-protected so that sentence-casing bibliography
% styles keep the capitalisation of the proper names.
@inproceedings{DBLP:conf/icml/Jaggi13,
  author    = {Martin Jaggi},
  title     = {Revisiting {Frank-Wolfe}: Projection-Free Sparse Convex Optimization},
  booktitle = {Proceedings of the 30th International Conference on Machine Learning, {ICML} 2013, Atlanta, GA, USA, 16-21 June 2013},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {28},
  pages     = {427--435},
  publisher = {JMLR.org},
  year      = {2013},
  url       = {http://proceedings.mlr.press/v28/jaggi13.html},
  timestamp = {Wed, 29 May 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/Jaggi13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1303.1152.
@article{DBLP:journals/corr/abs-1303-1152,
  author     = {Martin Jaggi},
  title      = {An Equivalence between the Lasso and Support Vector Machines},
  journal    = {CoRR},
  volume     = {abs/1303.1152},
  year       = {2013},
  url        = {http://arxiv.org/abs/1303.1152},
  eprinttype = {arXiv},
  eprint     = {1303.1152},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1303-1152.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, J. Comput. Geom. 3(1), 2012. The CoRR entry
% DBLP:journals/corr/abs-0903-4817 carries the same title but a different
% author list.
@article{DBLP:journals/jocg/GartnerJM12,
  author    = {Bernd G{\"{a}}rtner and Martin Jaggi and Cl{\'{e}}ment Maria},
  title     = {An Exponential Lower Bound on the Complexity of Regularization Paths},
  journal   = {J. Comput. Geom.},
  volume    = {3},
  number    = {1},
  pages     = {168--195},
  year      = {2012},
  url       = {https://doi.org/10.20382/jocg.v3i1a9},
  doi       = {10.20382/JOCG.V3I1A9},
  timestamp = {Thu, 10 Sep 2020 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/jocg/GartnerJM12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article, ACM Trans. Algorithms 9(1), 2012. The ESA 2010 entry
% DBLP:conf/esa/GiesenJL10 has the same authors and the same title up to
% capitalisation.
@article{DBLP:journals/talg/GiesenJL12,
  author    = {Joachim Giesen and Martin Jaggi and S{\"{o}}ren Laue},
  title     = {Approximating parameterized convex optimization problems},
  journal   = {{ACM} Trans. Algorithms},
  volume    = {9},
  number    = {1},
  pages     = {10:1--10:17},
  year      = {2012},
  url       = {https://doi.org/10.1145/2390176.2390186},
  doi       = {10.1145/2390176.2390186},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/talg/GiesenJL12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ESA 2012 conference paper (Lecture Notes in Computer Science, volume 7501).
% The doi field holds the bare DOI: the underscore is not LaTeX-escaped,
% because DOI-aware styles typeset the field verbatim.
% NOTE(review): url still carries dblp's escaped underscore; unescape it as
% well if the target style treats url verbatim.
@inproceedings{DBLP:conf/esa/GiesenJL12,
  author    = {Joachim Giesen and Martin Jaggi and S{\"{o}}ren Laue},
  editor    = {Leah Epstein and Paolo Ferragina},
  title     = {Optimizing over the Growing Spectrahedron},
  booktitle = {Algorithms - {ESA} 2012 - 20th Annual European Symposium, Ljubljana, Slovenia, September 10-12, 2012. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {7501},
  pages     = {503--514},
  publisher = {Springer},
  year      = {2012},
  url       = {https://doi.org/10.1007/978-3-642-33090-2\_44},
  doi       = {10.1007/978-3-642-33090-2_44},
  timestamp = {Tue, 14 May 2019 10:00:54 +0200},
  biburl    = {https://dblp.org/rec/conf/esa/GiesenJL12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% AISTATS 2012 conference paper (JMLR Proceedings, volume 22). The dblp key
% sits under journals/jmlr although the entry type is inproceedings.
@inproceedings{DBLP:journals/jmlr/GiesenJL12,
  author    = {Joachim Giesen and Martin Jaggi and S{\"{o}}ren Laue},
  editor    = {Neil D. Lawrence and Mark A. Girolami},
  title     = {Regularization Paths with Guarantees for Convex Semidefinite Optimization},
  booktitle = {Proceedings of the Fifteenth International Conference on Artificial Intelligence and Statistics, {AISTATS} 2012, La Palma, Canary Islands, Spain, April 21-23, 2012},
  series    = {{JMLR} Proceedings},
  volume    = {22},
  pages     = {432--439},
  publisher = {JMLR.org},
  year      = {2012},
  url       = {http://proceedings.mlr.press/v22/giesen12.html},
  timestamp = {Wed, 29 May 2019 08:41:44 +0200},
  biburl    = {https://dblp.org/rec/journals/jmlr/GiesenJL12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1207.4747.
% "Frank-Wolfe" and the acronym "SVMs" are brace-protected so that
% sentence-casing bibliography styles keep their capitalisation.
@article{DBLP:journals/corr/abs-1207-4747,
  author     = {Simon Lacoste{-}Julien and Martin Jaggi and Mark Schmidt and Patrick Pletscher},
  title      = {Stochastic Block-Coordinate {Frank-Wolfe} Optimization for Structural {SVMs}},
  journal    = {CoRR},
  volume     = {abs/1207.4747},
  year       = {2012},
  url        = {http://arxiv.org/abs/1207.4747},
  eprinttype = {arXiv},
  eprint     = {1207.4747},
  timestamp  = {Thu, 23 Apr 2020 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1207-4747.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% PhD thesis, 2011.
@phdthesis{DBLP:phd/basesearch/Jaggi11,
  author    = {Martin Jaggi},
  title     = {Sparse Convex Optimization Methods for Machine Learning},
  school    = {{ETH} Zurich, Z{\"{u}}rich, Switzerland},
  year      = {2011},
  url       = {https://hdl.handle.net/20.500.11850/72811},
  doi       = {10.3929/ETHZ-A-007050453},
  timestamp = {Mon, 02 Jan 2023 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/phd/basesearch/Jaggi11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 1108.1170.
@article{DBLP:journals/corr/abs-1108-1170,
  author     = {Martin Jaggi},
  title      = {Convex Optimization without Projection Steps},
  journal    = {CoRR},
  volume     = {abs/1108.1170},
  year       = {2011},
  url        = {http://arxiv.org/abs/1108.1170},
  eprinttype = {arXiv},
  eprint     = {1108.1170},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-1108-1170.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% ESA 2010 conference paper (Lecture Notes in Computer Science, volume 6346).
% The doi field holds the bare DOI: the underscore is not LaTeX-escaped,
% because DOI-aware styles typeset the field verbatim.
% NOTE(review): url still carries dblp's escaped underscore; unescape it as
% well if the target style treats url verbatim.
@inproceedings{DBLP:conf/esa/GiesenJL10,
  author    = {Joachim Giesen and Martin Jaggi and S{\"{o}}ren Laue},
  editor    = {Mark de Berg and Ulrich Meyer},
  title     = {Approximating Parameterized Convex Optimization Problems},
  booktitle = {Algorithms - {ESA} 2010, 18th Annual European Symposium, Liverpool, UK, September 6-8, 2010. Proceedings, Part {I}},
  series    = {Lecture Notes in Computer Science},
  volume    = {6346},
  pages     = {524--535},
  publisher = {Springer},
  year      = {2010},
  url       = {https://doi.org/10.1007/978-3-642-15775-2\_45},
  doi       = {10.1007/978-3-642-15775-2_45},
  timestamp = {Tue, 14 May 2019 10:00:54 +0200},
  biburl    = {https://dblp.org/rec/conf/esa/GiesenJL10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2010 conference paper.
@inproceedings{DBLP:conf/icml/JaggiS10,
  author    = {Martin Jaggi and Marek Sulovsk{\'{y}}},
  editor    = {Johannes F{\"{u}}rnkranz and Thorsten Joachims},
  title     = {A Simple Algorithm for Nuclear Norm Regularized Problems},
  booktitle = {Proceedings of the 27th International Conference on Machine Learning (ICML-10), June 21-24, 2010, Haifa, Israel},
  pages     = {471--478},
  publisher = {Omnipress},
  year      = {2010},
  url       = {https://icml.cc/Conferences/2010/papers/196.pdf},
  timestamp = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icml/JaggiS10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper, 25th ACM Symposium on Computational Geometry, 2009.
@inproceedings{DBLP:conf/compgeom/GartnerJ09,
  author    = {Bernd G{\"{a}}rtner and Martin Jaggi},
  editor    = {John Hershberger and Efi Fogel},
  title     = {Coresets for polytope distance},
  booktitle = {Proceedings of the 25th {ACM} Symposium on Computational Geometry, Aarhus, Denmark, June 8-10, 2009},
  pages     = {33--42},
  publisher = {{ACM}},
  year      = {2009},
  url       = {https://doi.org/10.1145/1542362.1542370},
  doi       = {10.1145/1542362.1542370},
  timestamp = {Mon, 14 Jun 2021 16:24:56 +0200},
  biburl    = {https://dblp.org/rec/conf/compgeom/GartnerJ09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 0903.4817. The journal entry
% DBLP:journals/jocg/GartnerJM12 carries the same title but a different
% author list.
@article{DBLP:journals/corr/abs-0903-4817,
  author     = {Bernd G{\"{a}}rtner and Joachim Giesen and Martin Jaggi},
  title      = {An Exponential Lower Bound on the Complexity of Regularization Paths},
  journal    = {CoRR},
  volume     = {abs/0903.4817},
  year       = {2009},
  url        = {http://arxiv.org/abs/0903.4817},
  eprinttype = {arXiv},
  eprint     = {0903.4817},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-0903-4817.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
% CoRR (arXiv) record, eprint 0903.4856.
@article{DBLP:journals/corr/abs-0903-4856,
  author     = {Bernd G{\"{a}}rtner and Joachim Giesen and Martin Jaggi and Torsten Welsch},
  title      = {A Combinatorial Algorithm to Compute Regularization Paths},
  journal    = {CoRR},
  volume     = {abs/0903.4856},
  year       = {2009},
  url        = {http://arxiv.org/abs/0903.4856},
  eprinttype = {arXiv},
  eprint     = {0903.4856},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-0903-4856.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt in for them to become active. All settings here will be stored as cookies in your web browser. For more information, see our F.A.Q.