Update chess-mamba-vs-xformer/train_bygame.py
Browse files
chess-mamba-vs-xformer/train_bygame.py
CHANGED
@@ -402,7 +402,7 @@ while True:
|
|
402 |
param_group['lr'] = lr
|
403 |
|
404 |
# Evaluate the loss on train/val sets and write checkpoints
|
405 |
-
if (iter_num % eval_interval == 0 and
|
406 |
torch.cuda.empty_cache()
|
407 |
losses = estimate_loss()
|
408 |
if init_from == 'anneal':
|
|
|
402 |
param_group['lr'] = lr
|
403 |
|
404 |
# Evaluate the loss on train/val sets and write checkpoints
|
405 |
+
if master_process and ((iter_num % eval_interval == 0 and local_iter_num > 0) or abs(games_seen - 12652800) <= 151 or abs(games_seen - 22275000) <= 151 or abs(games_seen - 11536000) <= 151 or abs(games_seen - 16250000) <= 151 or abs(games_seen - 18000000) <= 151 or abs(games_seen - 19690000) <= 151 or abs(games_seen - 22005050) <= 151 or abs(tokens_seen_padded - 7798839804) <= 46238):
|
406 |
torch.cuda.empty_cache()
|
407 |
losses = estimate_loss()
|
408 |
if init_from == 'anneal':
|