Unverified commit b09adff7 authored by Yuanchen, committed by GitHub

[chat]fix sft training for bloom, gpt and opt (#3418)

Fix SFT training for BLOOM, GPT and OPT by adding a forward method that passes attention_mask and labels through to the wrapped model, so the language-modeling loss is computed during supervised fine-tuning.
parent 638a07a7
@@ -33,3 +33,6 @@ class BLOOMLM(LM):
         if checkpoint:
             model.gradient_checkpointing_enable()
         super().__init__(model, lora_rank, lora_train_bias)
+
+    def forward(self, input_ids, attention_mask=None, labels=None, **kwargs):
+        return self.model(input_ids, attention_mask=attention_mask, labels=labels, **kwargs)
@@ -33,3 +33,6 @@ class GPTLM(LM):
         if checkpoint:
             model.gradient_checkpointing_enable()
         super().__init__(model, lora_rank, lora_train_bias)
+
+    def forward(self, input_ids, attention_mask=None, labels=None, **kwargs):
+        return self.model(input_ids, attention_mask=attention_mask, labels=labels, **kwargs)
@@ -33,3 +33,6 @@ class OPTLM(LM):
         if checkpoint:
             model.gradient_checkpointing_enable()
         super().__init__(model, lora_rank, lora_train_bias)
+
+    def forward(self, input_ids, attention_mask=None, labels=None, **kwargs):
+        return self.model(input_ids, attention_mask=attention_mask, labels=labels, **kwargs)
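For context on why the added forward matters, here is a minimal standalone sketch, not part of the commit: the model name and inputs below are assumptions chosen for illustration. Hugging Face causal-LM models compute the cross-entropy loss internally only when labels is supplied, which is exactly what an SFT training loop relies on; without a forward that passes labels through, the wrapper drops them and no loss is returned.

# Minimal sketch (assumed example, not part of the commit): passing labels
# through, as the new forward does, makes the underlying model return a loss.
from transformers import AutoModelForCausalLM, AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("gpt2")  # assumed small stand-in model
model = AutoModelForCausalLM.from_pretrained("gpt2")

batch = tokenizer("Hello, world!", return_tensors="pt")
# For causal-LM SFT the labels are the input ids themselves; the model
# shifts them internally and computes the cross-entropy loss.
outputs = model(input_ids=batch["input_ids"],
                attention_mask=batch["attention_mask"],
                labels=batch["input_ids"])
outputs.loss.backward()  # an SFT optimizer step would follow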