flash-attention/training/configs/scheduler/plateau.yaml

10 lines
288 B
YAML
Raw Normal View History

2022-11-29 09:31:19 +08:00
# @package _global_
# Scheduler preset: lower the learning rate when a monitored metric plateaus.
# NOTE(review): keep the package directive above as the very first line (no
# `---` or other comment before it); Hydra's header parsing appears to stop at
# the first non-directive line -- confirm before reordering.
train:
  # Presumably how often the training loop steps the scheduler -- confirm
  # against the code that reads this key.
  scheduler_interval: epoch
  # `???` is OmegaConf's mandatory-value marker: the composing config (or a
  # command-line override) has to name the metric to monitor.
  scheduler_monitor: ???
  scheduler:
    # `mode` is not set here, so the target's own default applies; override it
    # if the monitored metric is one that should be maximized.
    _target_: torch.optim.lr_scheduler.ReduceLROnPlateau
    factor: 0.2  # Decay factor when ReduceLROnPlateau is used
    # Number of scheduler steps without improvement tolerated before the
    # learning rate is decayed.
    patience: 20
    min_lr: 0.0  # Minimum learning rate during annealing