"...git@developer.sourcefind.cn:chenpangpang/ComfyUI.git" did not exist on "ca2ae98470fdebd951cdb750998b82ecb532c901"
Unverified Commit 36b60ce9, authored by Patrick von Platen, committed by GitHub
Browse files

fix mt5 config (#8832)

parent 18c32eeb
...@@ -60,6 +60,8 @@ class MT5Config(PretrainedConfig): ...@@ -60,6 +60,8 @@ class MT5Config(PretrainedConfig):
testing). testing).
feed_forward_proj (:obj:`string`, `optional`, defaults to :obj:`"gated-gelu"`): feed_forward_proj (:obj:`string`, `optional`, defaults to :obj:`"gated-gelu"`):
Type of feed forward layer to be used. Should be one of :obj:`"relu"` or :obj:`"gated-gelu"`. Type of feed forward layer to be used. Should be one of :obj:`"relu"` or :obj:`"gated-gelu"`.
use_cache (:obj:`bool`, `optional`, defaults to :obj:`True`):
Whether or not the model should return the last key/values attentions (not used by all models).
""" """
model_type = "mt5" model_type = "mt5"
keys_to_ignore_at_inference = ["past_key_values"] keys_to_ignore_at_inference = ["past_key_values"]
...@@ -79,6 +81,7 @@ class MT5Config(PretrainedConfig): ...@@ -79,6 +81,7 @@ class MT5Config(PretrainedConfig):
initializer_factor=1.0, initializer_factor=1.0,
feed_forward_proj="gated-gelu", feed_forward_proj="gated-gelu",
is_encoder_decoder=True, is_encoder_decoder=True,
use_cache=True,
tokenizer_class="T5Tokenizer", tokenizer_class="T5Tokenizer",
tie_word_embeddings=False, tie_word_embeddings=False,
pad_token_id=0, pad_token_id=0,
...@@ -109,6 +112,7 @@ class MT5Config(PretrainedConfig): ...@@ -109,6 +112,7 @@ class MT5Config(PretrainedConfig):
self.layer_norm_epsilon = layer_norm_epsilon self.layer_norm_epsilon = layer_norm_epsilon
self.initializer_factor = initializer_factor self.initializer_factor = initializer_factor
self.feed_forward_proj = feed_forward_proj self.feed_forward_proj = feed_forward_proj
self.use_cache = use_cache
@property @property
def hidden_size(self): def hidden_size(self):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment