Noam Shazeer, Mitchell Stern
Adafactor: Adaptive Learning Rates with Sublinear Memory Cost
ICML, 2018.
@comment{Conference paper record. The ee field is the original electronic-edition link and is kept for tools that read it. The url field repeats the same address so that standard styles can print it. Only the proper noun in the title is brace-protected, so styles remain free to recase the rest.}
@inproceedings{ICML-2018-ShazeerS,
  author    = {Shazeer, Noam and Stern, Mitchell},
  title     = {{Adafactor}: Adaptive Learning Rates with Sublinear Memory Cost},
  booktitle = {Proceedings of the 35th International Conference on Machine Learning},
  pages     = {4603--4611},
  publisher = {PMLR},
  year      = {2018},
  url       = {http://proceedings.mlr.press/v80/shazeer18a.html},
  ee        = {http://proceedings.mlr.press/v80/shazeer18a.html},
}