"docs/git@developer.sourcefind.cn:zhaoyu6/sglang.git" did not exist on "40022d075a0413a49e7802ec2bbc7563413a1cb5"
Unverified commit 41fa672d authored by Younes Belkada, committed by GitHub

Enable `requires_grad` on input embedding to train on top of frozen layers (#21598)

* v1

* make fixup

* add more methods
parent 8c502662
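
The mechanism is an ordinary PyTorch forward hook on the embedding module. As a minimal standalone sketch (plain PyTorch, not code from this commit; the toy modules are invented for illustration): once every parameter is frozen, the forward graph contains no tensor that requires grad, so backward() raises a RuntimeError; forcing requires_grad on the embedding output re-attaches autograd from that point on.

import torch
import torch.nn as nn

# Toy frozen model: an embedding feeding a linear layer.
embedding = nn.Embedding(10, 4)
linear = nn.Linear(4, 4)
for p in (*embedding.parameters(), *linear.parameters()):
    p.requires_grad = False

# Same hook body the commit adds: force grad tracking on the embedding output.
def make_inputs_require_grads(module, input, output):
    output.requires_grad_(True)

hook = embedding.register_forward_hook(make_inputs_require_grads)

out = linear(embedding(torch.tensor([1, 2, 3])))
out.sum().backward()  # succeeds; without the hook this raises a RuntimeError
hook.remove()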
@@ -1148,6 +1148,23 @@ class PreTrainedModel(nn.Module, ModuleUtilsMixin, GenerationMixin, PushToHubMixin):
             return False
         return True
 
+    def enable_input_require_grads(self):
+        """
+        Enables the gradients for the input embeddings. This is useful for fine-tuning adapter weights while keeping
+        the model weights fixed.
+        """
+
+        def make_inputs_require_grads(module, input, output):
+            output.requires_grad_(True)
+
+        self._require_grads_hook = self.get_input_embeddings().register_forward_hook(make_inputs_require_grads)
+
+    def disable_input_require_grads(self):
+        """
+        Removes the `_require_grads_hook`.
+        """
+        self._require_grads_hook.remove()
+
     def get_input_embeddings(self) -> nn.Module:
         """
         Returns the model's input embeddings.
...
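
Typical usage pairs these new methods with a fully frozen base model, e.g. for adapter-style fine-tuning. A hedged usage sketch (the gpt2 checkpoint and the dummy batch are placeholders, not part of this commit):

import torch
from transformers import AutoModelForCausalLM

model = AutoModelForCausalLM.from_pretrained("gpt2")  # placeholder checkpoint

# Freeze every base weight; only externally attached adapter weights would train.
for param in model.parameters():
    param.requires_grad = False

# Re-enable grad flow from the (frozen) input embeddings so that backward()
# reaches whatever trainable modules sit on top of them.
model.enable_input_require_grads()

input_ids = torch.tensor([[1, 2, 3]])
loss = model(input_ids, labels=input_ids).loss
loss.backward()  # gradients now flow despite the frozen embedding matrix

# Detach the forward hook once it is no longer needed.
model.disable_input_require_grads()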