boris committed on
Commit: 36cb737
Parent: 3cd6d41

fix: comment

Files changed (1):
  dev/seq2seq/run_seq2seq_flax.py (+2 -1)
dev/seq2seq/run_seq2seq_flax.py CHANGED
@@ -753,6 +753,7 @@ def main():
         # restore optimizer state and step
         state = state.restore_state(artifact_dir)
         # TODO: number of remaining training epochs/steps and dataloader state need to be adjusted
+        # TODO: optimizer may use a different step for learning rate, we should serialize/restore entire state
 
     # label smoothed cross entropy
     def loss_fn(logits, labels):
@@ -937,7 +938,7 @@ def main():
     for epoch in epochs:
         # ======================== Training ================================
         step = unreplicate(state.step)
-        # wandb_log({"train/epoch": epoch}, step=step)
+        wandb_log({"train/epoch": epoch}, step=step)
 
         # Generate an epoch by shuffling sampling indices from the train dataset
         if data_args.streaming:
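The new TODO in the first hunk points at a real pitfall when resuming training: if the learning-rate schedule is driven by a step counter kept inside the optimizer state rather than by state.step, restoring only the parameters (or only the step) leaves the schedule out of sync. The sketch below is a minimal illustration of round-tripping the entire train state with flax.serialization; it assumes a standard flax.training.train_state.TrainState with an optax optimizer, and the helper names, toy model, and path are placeholders rather than this repository's code.

# Sketch only (not this repo's restore_state): serialize and restore the whole
# TrainState, including opt_state, so schedule counters survive a resume.
import jax.numpy as jnp
import optax
from flax import serialization
from flax.training import train_state


def save_full_state(state, path):
    # Serializes step, params *and* opt_state (apply_fn/tx are not data fields).
    with open(path, "wb") as f:
        f.write(serialization.to_bytes(state))


def restore_full_state(template, path):
    # `from_bytes` needs a template object with the same structure as what was saved.
    with open(path, "rb") as f:
        return serialization.from_bytes(template, f.read())


if __name__ == "__main__":
    # Toy params and a step-dependent learning-rate schedule (illustrative only).
    params = {"w": jnp.ones((4, 2)), "b": jnp.zeros((2,))}
    schedule = optax.linear_schedule(init_value=1e-3, end_value=0.0, transition_steps=1000)
    tx = optax.adamw(learning_rate=schedule)
    state = train_state.TrainState.create(
        apply_fn=lambda p, x: x @ p["w"] + p["b"], params=params, tx=tx
    )

    save_full_state(state, "/tmp/full_state.msgpack")
    restored = restore_full_state(state, "/tmp/full_state.msgpack")
    # The optimizer's internal counters come back along with params and step.
    assert int(restored.step) == int(state.step)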
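The second hunk re-enables epoch logging at the top of each epoch, keyed to the current (unreplicated) optimizer step. The script's wandb_log helper is not part of this diff; the sketch below is a hypothetical minimal version, assuming it wraps wandb.log with an explicit step and only logs from the first JAX process.

# Hypothetical minimal wandb_log wrapper (the script's actual helper may differ).
import jax
import wandb


def wandb_log(metrics, step=None, prefix=None):
    if jax.process_index() != 0:
        return  # avoid duplicate logging in multi-host training
    if prefix is not None:
        metrics = {f"{prefix}/{k}": v for k, v in metrics.items()}
    # W&B expects `step` to be non-decreasing across calls, which is why the
    # training loop passes the current training step explicitly.
    wandb.log(metrics, step=step)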