% InternEvo preprint, arXiv 2401.09149 (CoRR). Record exported from DBLP via BibSonomy.
% The added-at, biburl, ee, interhash, intrahash, keywords and timestamp fields are
% exporter bookkeeping that standard styles ignore; doi and eprint carry the identifiers.
@article{journals/corr/abs-2401-09149,
  author     = {Chen, Qiaoling and Gu, Diandian and Wang, Guoteng and Chen, Xun and Xiong, YingTong and Huang, Ting and Hu, Qinghao and Jin, Xin and Wen, Yonggang and Zhang, Tianwei and Sun, Peng},
  title      = {{InternEvo}: Efficient Long-sequence Large Language Model Training via Hybrid Parallelism and Redundant Sharding},
  journal    = {CoRR},
  volume     = {abs/2401.09149},
  year       = {2024},
  doi        = {10.48550/arXiv.2401.09149},
  eprint     = {2401.09149},
  eprinttype = {arXiv},
  url        = {http://dblp.uni-trier.de/db/journals/corr/corr2401.html#abs-2401-09149},
  ee         = {https://doi.org/10.48550/arXiv.2401.09149},
  keywords   = {dblp},
  added-at   = {2024-04-04T00:00:00.000+0200},
  timestamp  = {2024-04-08T22:06:05.000+0200},
  biburl     = {https://www.bibsonomy.org/bibtex/2474e98e13e779c05fc4e67a1d848f545/dblp},
  interhash  = {9a05068ced6ba6087469867f0b26344c},
  intrahash  = {474e98e13e779c05fc4e67a1d848f545},
}