Please log in to take part in the discussion (add your own reviews or comments).
Cite this publication
More citation styles
- please select -
%0 Conference Paper
%1 conf/iclr/KomatsuzakiPLRM23
%A Komatsuzaki, Aran
%A Puigcerver, Joan
%A Lee-Thorp, James
%A Ruiz, Carlos Riquelme
%A Mustafa, Basil
%A Ainslie, Joshua
%A Tay, Yi
%A Dehghani, Mostafa
%A Houlsby, Neil
%B ICLR
%D 2023
%I OpenReview.net
%K dblp
%T Sparse Upcycling: Training Mixture-of-Experts from Dense Checkpoints
%U http://dblp.uni-trier.de/db/conf/iclr/iclr2023.html#KomatsuzakiPLRM23
% Conference paper (ICLR, 2023): Komatsuzaki et al., "Sparse Upcycling".
% The metadata fields (biburl, keywords, url) point at BibSonomy and dblp.
% Cleanup relative to the raw export:
%   - removed the trailing period from the title (styles add their own
%     punctuation, so the period produced ".." or ".," in output);
%   - spelled out the venue in booktitle and brace-protected the acronym;
%   - one field per line, aligned, with a trailing comma after the last field.
% NOTE(review): "Ruiz, Carlos Riquelme" may be a mis-split compound surname
%   ("Riquelme Ruiz, Carlos") -- confirm against the paper before changing.
% NOTE(review): crossref refers to a parent entry keyed conf/iclr/2023 that is
%   not visible here; classic BibTeX needs it to appear after this entry.
@inproceedings{conf/iclr/KomatsuzakiPLRM23,
  author    = {Komatsuzaki, Aran and Puigcerver, Joan and Lee-Thorp, James and Ruiz, Carlos Riquelme and Mustafa, Basil and Ainslie, Joshua and Tay, Yi and Dehghani, Mostafa and Houlsby, Neil},
  title     = {Sparse Upcycling: Training Mixture-of-Experts from Dense Checkpoints},
  booktitle = {International Conference on Learning Representations ({ICLR})},
  publisher = {OpenReview.net},
  year      = {2023},
  crossref  = {conf/iclr/2023},
  url       = {http://dblp.uni-trier.de/db/conf/iclr/iclr2023.html#KomatsuzakiPLRM23},
  ee        = {https://openreview.net/pdf?id=T5nUQDrM4u},
  keywords  = {dblp},
  biburl    = {https://www.bibsonomy.org/bibtex/2e1f1c29c59b19ec27d8acecd1e76071d/dblp},
  interhash = {d91a67d3bf1781437049b22332408e64},
  intrahash = {e1f1c29c59b19ec27d8acecd1e76071d},
  added-at  = {2023-06-30T00:00:00.000+0200},
  timestamp = {2024-04-10T01:21:52.000+0200},
}