Lower the default initial learning rate from 3e-4 to 2e-5, matching the value Jonathan Ho used in his original repo

This commit is contained in:
Phil Wang
2022-05-14 13:22:43 -07:00
parent d1f02e8f49
commit 591d37e266
3 changed files with 3 additions and 3 deletions

View File

@@ -7,7 +7,7 @@ def separate_weight_decayable_params(params):
def get_optimizer(
params,
- lr = 3e-4,
+ lr = 2e-5,
wd = 1e-2,
betas = (0.9, 0.999),
filter_by_requires_grad = False