% arXiv preprint. The identifier is stored in eprint/archiveprefix (not as free
% text in howpublished) so styles can format and link it; url is the fallback
% for styles that ignore eprint fields. {A} is braced because sentence-casing
% styles would otherwise lowercase the first word after the question mark.
@misc{lin2024remove,
  author        = {Lin, Wu and Dangel, Felix and Eschenhagen, Runa and Bae, Juhan and Turner, Richard E. and Makhzani, Alireza},
  title         = {Can We Remove the Square-Root in Adaptive Gradient Methods? {A} Second-Order Perspective},
  year          = {2024},
  eprint        = {2402.03496},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2402.03496},
}