Change eps defaults in adafactor_bv again after some checking

small_384_weights
Ross Wightman 2024-11-07 21:45:46 -08:00 committed by Ross Wightman
parent 9d8ccd2ba7
commit 1409ce2dbe
1 changed file with 2 additions and 2 deletions

View File

@@ -214,8 +214,8 @@ def _single_tensor_adafactor(
exp_avg = exp_avgs[i]
step_t = state_steps[i]
if eps is None:
-# use square of machine eps for grad dtype if not set
-eps = torch.finfo(grad.dtype).eps ** 2
+# default eps for avoiding div by zero, diff from float type eps
+eps = 1e-7 if grad.dtype == torch.float16 else 1e-30
# Update step
step_t += 1