Bibtex
|
ACM
|
MLA
|
APA
|
Harvard
|
Vancouver
|
Chicago
% Megatron-LM arXiv preprint (Shoeybi et al., 2019).
% Only the case-sensitive name in the title is brace-protected, so styles can
% still apply their own casing to the rest. The arXiv identifier is given in
% eprint/archiveprefix in addition to the DOI.
@misc{Shoeybi2019Megatron,
  author        = {Shoeybi, Mohammad and Patwary, Mostofa and Puri, Raul and LeGresley, Patrick and Casper, Jared and Catanzaro, Bryan},
  title         = {{Megatron-LM}: Training Multi-Billion Parameter Language Models Using Model Parallelism},
  year          = {2019},
  publisher     = {arXiv},
  eprint        = {1909.08053},
  archiveprefix = {arXiv},
  doi           = {10.48550/arXiv.1909.08053},
}
Mohammad Shoeybi, Mostofa Patwary, Raul Puri, Patrick LeGresley, Jared Casper, and Bryan Catanzaro. 2019. Megatron-LM: Training Multi-Billion Parameter Language Models Using Model Parallelism. arXiv:1909.08053. DOI: https://doi.org/10.48550/arXiv.1909.08053
Shoeybi, Mohammad, Patwary, Mostofa, Puri, Raul, LeGresley, Patrick, Casper, Jared, and Catanzaro, Bryan. "Megatron-LM: Training Multi-Billion Parameter Language Models Using Model Parallelism". arXiv:1909.08053, 2019.
Shoeybi, M., Patwary, M., Puri, R., LeGresley, P., Casper, J., & Catanzaro, B. (2019). Megatron-LM: Training Multi-Billion Parameter Language Models Using Model Parallelism. arXiv:1909.08053.
Shoeybi, M., Patwary, M., Puri, R., LeGresley, P., Casper, J., Catanzaro, B., 2019. Megatron-LM: Training Multi-Billion Parameter Language Models Using Model Parallelism. arXiv:1909.08053.
Shoeybi M, Patwary M, Puri R, LeGresley P, Casper J, Catanzaro B. Megatron-LM: Training Multi-Billion Parameter Language Models Using Model Parallelism. arXiv:1909.08053. 2019.
Shoeybi, Mohammad, Patwary, Mostofa, Puri, Raul, LeGresley, Patrick, Casper, Jared, and Catanzaro, Bryan. "Megatron-LM: Training Multi-Billion Parameter Language Models Using Model Parallelism". arXiv:1909.08053, 2019.