projects
/
mygptrnn.git
/ commitdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
| commitdiff |
tree
raw
|
patch
|
inline
| side by side (parent:
a09ee76
)
Update.
author
François Fleuret
<francois@fleuret.org>
Sat, 6 Jan 2024 13:38:09 +0000
(14:38 +0100)
committer
François Fleuret
<francois@fleuret.org>
Sat, 6 Jan 2024 13:38:09 +0000
(14:38 +0100)
main.py
patch
|
blob
|
history
diff --git
a/main.py
b/main.py
index
1a17e51
..
fabebdd
100755
(executable)
--- a/
main.py
+++ b/
main.py
@@
-70,11
+70,11
@@
parser.add_argument("--min_learning_rate", type=float, default=6e-5)
parser.add_argument("--legacy_lr_schedule", action="store_true", default=False)
parser.add_argument("--legacy_lr_schedule", action="store_true", default=False)
-parser.add_argument("--legacy_l
earning_rate
", type=float, default=1e-4)
+parser.add_argument("--legacy_l
arge_lr
", type=float, default=1e-4)
-parser.add_argument("--legacy_
min_learning_rate
", type=float, default=2e-5)
+parser.add_argument("--legacy_
small_lr
", type=float, default=2e-5)
-parser.add_argument("--
nb_large_lr_epochs
", type=float, default=10)
+parser.add_argument("--
legacy_nb_epoch_large_lr
", type=float, default=10)
########################################
########################################
@@
-477,11
+477,11
@@
def get_lr(n_epoch, it):
# warmup though
if it < args.nb_warmup_iter:
# warmup though
if it < args.nb_warmup_iter:
- return args.legacy_l
earning_rate
* it / args.nb_warmup_iter
- elif it < args.
nb_large_lr_epochs
:
- return args.legacy_l
earning_rate
+ return args.legacy_l
arge_lr
* it / args.nb_warmup_iter
+ elif it < args.
legacy_nb_epoch_large_lr
:
+ return args.legacy_l
arge_lr
else:
else:
- return args.legacy_
min_learning_rate
+ return args.legacy_
small_lr
# from nanoGPT
# from nanoGPT