Spaces:

flax-community
/

dalle-mini

Running

boris committed on Nov 28, 2021

Commit

80b41d1

1 Parent(s): 0a77f72

feat: avoid OOM

Files changed (1) hide show

dev/seq2seq/run_seq2seq_flax.py CHANGED Viewed

@@ -475,6 +475,8 @@ def main():
         # load model
         model = CustomFlaxBartForConditionalGeneration.from_pretrained(artifact_dir)
         # load tokenizer
         tokenizer = AutoTokenizer.from_pretrained(
@@ -529,7 +531,10 @@ def main():
                 config=config,
                 seed=training_args.seed_model,
                 dtype=getattr(jnp, model_args.dtype),
             )
         else:
             model = CustomFlaxBartForConditionalGeneration(
                 config,

         # load model
         model = CustomFlaxBartForConditionalGeneration.from_pretrained(artifact_dir)
+        # avoid OOM on TPU: see https://github.com/google/flax/issues/1658
+        print(model.params)
         # load tokenizer
         tokenizer = AutoTokenizer.from_pretrained(
                 config=config,
                 seed=training_args.seed_model,
                 dtype=getattr(jnp, model_args.dtype),
+                ignore_mismatched_sizes=True,
             )
+            # avoid OOM on TPU: see https://github.com/google/flax/issues/1658
+            print(model.params)
         else:
             model = CustomFlaxBartForConditionalGeneration(
                 config,