% TMLR journal article; the url field points to its OpenReview forum page.
@article{fernandez2025efficient,
  author  = {Fernandez, Jared and Wehrstedt, Luca and Shamis, Leonid and Elhoushi, Mostafa and Saladi, Kalyan and Bisk, Yonatan and Strubell, Emma and Kahn, Jacob},
  title   = {Efficient Hardware Scaling and Diminishing Returns in Large-Scale Training of Language Models},
  journal = {Transactions on Machine Learning Research},
  year    = {2025},
  issn    = {2835-8856},
  url     = {https://openreview.net/forum?id=p7jQEf3wlh},
}