diff --git a/GANDLF/optimizers/thirdparty/adopt.py b/GANDLF/optimizers/thirdparty/adopt.py index e7f32117d..115c61c00 100644 --- a/GANDLF/optimizers/thirdparty/adopt.py +++ b/GANDLF/optimizers/thirdparty/adopt.py @@ -49,7 +49,7 @@ def __init__( if isinstance(lr, Tensor): if foreach and not capturable: raise ValueError( - "lr as a Tensor is not supported for capturable=False and foreach=True" + "lr as a Tensor is not supported for `capturable=False` and `foreach=True`" ) if lr.numel() != 1: raise ValueError("Tensor lr must be 1-element") @@ -512,8 +512,8 @@ def adopt_wrapper(parameters: dict) -> torch.optim.Optimizer: return ADOPT( params=parameters["model_parameters"], lr=parameters.get("learning_rate", 1e-3), - betas=parameters.get("betas", (0.9, 0.999, 0.9999)), - eps=parameters.get("eps", 1e-8), + betas=parameters.get("betas", (0.9, 0.9999)), + eps=parameters.get("eps", 1e-6), weight_decay=parameters.get("weight_decay", 0.0), decoupled=parameters["optimizer"].get("decoupled", False), foreach=parameters.get("foreach", None),