# Copied from transformers.models.clip.modeling_clip.CLIPTextTransformer with CLIPText->GroupViTText, CLIPEncoder->GroupViTTextEncoder, CLIP_TEXT->GROUPVIT_TEXT
class GroupViTTextTransformer(nn.Module):
    """Text transformer module for GroupViT.

    NOTE(review): the comment preceding this class marks it as copied from
    ``CLIPTextTransformer`` with CLIP names substituted; keep any change here
    in step with that source. The bodies below are elided (``...``) in this
    excerpt, so nothing about the layers or the forward pass is documented.
    """

    def __init__(self, config: GroupViTTextConfig):
        # Constructor body is elided in this excerpt.
        ...

    # Remaining class members are elided in this excerpt.
    # NOTE(review): the original indentation was lost; this placeholder is
    # assumed to sit at class level - confirm against the full file.
    ...
@@ -1105,12 +1123,9 @@ class GroupViTTextTransformer(nn.Module):