sd2_clip.py 1.4 KB
Newer Older
1
from comfy import sd1_clip
comfyanonymous's avatar
comfyanonymous committed
2
import torch
3
import os
comfyanonymous's avatar
comfyanonymous committed
4

5
6
7
8
class SD2ClipModel(sd1_clip.SD1ClipModel):
    def __init__(self, arch="ViT-H-14", device="cpu", max_length=77, freeze=True, layer="penultimate", layer_idx=None):
        textmodel_json_config = os.path.join(os.path.dirname(os.path.realpath(__file__)), "sd2_clip_config.json")
        super().__init__(device=device, freeze=freeze, textmodel_json_config=textmodel_json_config)
comfyanonymous's avatar
comfyanonymous committed
9
        self.empty_tokens = [[49406] + [49407] + [0] * 75]
10
        if layer == "last":
11
            pass
12
        elif layer == "penultimate":
13
14
            layer_idx = -1
            self.clip_layer(layer_idx)
comfyanonymous's avatar
comfyanonymous committed
15
16
17
        elif self.layer == "hidden":
            assert layer_idx is not None
            assert abs(layer_idx) < 24
18
            self.clip_layer(layer_idx)
comfyanonymous's avatar
comfyanonymous committed
19
20
        else:
            raise NotImplementedError()
21
22
23
24
25
26
27
28
29
30

    def clip_layer(self, layer_idx):
        if layer_idx < 0:
            layer_idx -= 1 #The real last layer of SD2.x clip is the penultimate one. The last one might contain garbage.
        if abs(layer_idx) >= 24:
            self.layer = "hidden"
            self.layer_idx = -2
        else:
            self.layer = "hidden"
            self.layer_idx = layer_idx
comfyanonymous's avatar
comfyanonymous committed
31
32

class SD2Tokenizer(sd1_clip.SD1Tokenizer):
33
34
    def __init__(self, tokenizer_path=None, embedding_directory=None):
        super().__init__(tokenizer_path, pad_with_end=False, embedding_directory=embedding_directory)