huggingface · elishowk · Sep 14, 2021 · Sep 10, 2021 · Sep 11, 2021 · Sep 14, 2021
diff --git a/src/transformers/trainer.py b/src/transformers/trainer.py
@@ -2544,7 +2544,6 @@ def push_to_hub(self, commit_message: Optional[str] = "add model", **kwargs) ->
                 model_name = Path(self.args.output_dir).name
             else:
                 model_name = self.args.hub_model_id.split("/")[-1]
-            self.create_model_card(model_name=model_name, **kwargs)
         # Needs to be executed on all processes for TPU training, but will only save on the processed determined by
         # self.args.should_save.
         self.save_model()
@@ -2553,7 +2552,16 @@ def push_to_hub(self, commit_message: Optional[str] = "add model", **kwargs) ->
         if not self.is_world_process_zero():
             return
 
-        return self.repo.push_to_hub(commit_message=commit_message)
+        git_head_commit_url = self.repo.push_to_hub(commit_message=commit_message)
+        # push the model card separately so that it is independent from the rest of the model
+        if self.args.should_save:
+            self.create_model_card(model_name=model_name, **kwargs)
+            try:
+                self.repo.push_to_hub(commit_message="update model card README.md")
+            except Exception as exc:
+                logger.error(f"Error pushing update to the model card. Please read logs and retry. ${exc}")
+
+        return git_head_commit_url
 
     #
     # Deprecated code