Noam Shazeer, Mitchell Stern
Adafactor: Adaptive Learning Rates with Sublinear Memory Cost
ICML, 2018.
% Conference paper in the ICML 2018 proceedings (PMLR volume 80).
% The non-standard `ee` field is retained for any tooling that reads it;
% `url` carries the same link so that standard styles can print it.
@inproceedings{ICML-2018-ShazeerS,
  author    = {Shazeer, Noam and Stern, Mitchell},
  title     = {{Adafactor}: Adaptive Learning Rates with Sublinear Memory Cost},
  booktitle = {Proceedings of the 35th International Conference on Machine Learning},
  series    = {Proceedings of Machine Learning Research},
  volume    = {80},
  pages     = {4603--4611},
  publisher = {PMLR},
  year      = {2018},
  url       = {http://proceedings.mlr.press/v80/shazeer18a.html},
  ee        = {http://proceedings.mlr.press/v80/shazeer18a.html},
}











