@@ -59,7 +59,7 @@ model:
_target_: torch.optim.AdamW
_partial_: true
lr: 3e-4
- weight_decay: 0.1
+ weight_decay: 0.01
betas: [0.9, 0.95]
eps: 1e-5