Skip to content

Commit

Permalink
Merge pull request #42 from EleutherAI/main
Browse files Browse the repository at this point in the history
Fixed AnnealingLR Class and Cosine Decay Schedule (EleutherAI#1008)
  • Loading branch information
kshitijkg authored Aug 7, 2023
2 parents 6c1f7bc + 009018e commit 8125ea3
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 4 deletions.
2 changes: 1 addition & 1 deletion configs/neox_arguments.md
Original file line number Diff line number Diff line change
Expand Up @@ -111,7 +111,7 @@ Logging Arguments

- **git_hash**: str

- Default = e16af33
+ Default = d3e481c

current git hash of repository

Expand Down
6 changes: 3 additions & 3 deletions megatron/learning_rates.py
Original file line number Diff line number Diff line change
Expand Up @@ -64,7 +64,7 @@ def get_lr(self):
"""Learning rate decay functions from:
https://openreview.net/pdf?id=BJYwwY9ll pg. 4"""

- num_iters_ = min(self.num_iters, self.end_iter - self.warmup_iter)
+ num_iters_ = self.num_iters
# Warmup.
if self.warmup_iter > 0 and self.num_iters <= self.warmup_iter:
return float(self.start_lr) * num_iters_ / self.warmup_iter
Expand All @@ -73,8 +73,8 @@ def get_lr(self):
if self.decay_style == "linear":
lr = self.start_lr * (self.end_iter - num_iters_) / self.end_iter
elif self.decay_style == "cosine":
- lr = (
- self.start_lr
+ lr = self.min_lr + (
+ (self.start_lr-self.min_lr)
/ 2.0
* (math.cos(math.pi * num_iters_ / self.end_iter) + 1)
)
Expand Down

0 comments on commit 8125ea3

Please sign in to comment.