Spaces (status: Running)
Commit: "feat: update defaults" — Browse files
File: dev/seq2seq/run_seq2seq_flax.py (CHANGED)
@@ -253,7 +253,7 @@ class DataTrainingArguments:
         metadata={"help": "Overwrite the cached training and evaluation sets"},
     )
     save_model_steps: Optional[int] = field(
-        default=
+        default=5000,  # about once every 1.5h in our experiments
         metadata={
             "help": "For logging the model more frequently. Used only when `log_model` is set."
         },
@@ -290,9 +290,9 @@ class DataTrainingArguments:


 class TrainState(train_state.TrainState):
-    dropout_rng: jnp.ndarray
-    grad_accum: jnp.ndarray
-    optimizer_step: int
+    dropout_rng: jnp.ndarray = None
+    grad_accum: jnp.ndarray = None
+    optimizer_step: int = None

     def replicate(self):
         return jax_utils.replicate(self).replace(

(Note: the removed line at old line 256 reads only "default=" in the extracted page; the original removed value was truncated by extraction and is reproduced here as shown.)