Commit e85be36b authored by comfyanonymous
Browse files

Add a penultimate_hidden_states entry to the CLIP vision output.

parent 10de64af
...@@ -49,12 +49,16 @@ class ClipVisionModel(): ...@@ -49,12 +49,16 @@ class ClipVisionModel():
precision_scope = lambda a, b: contextlib.nullcontext(a) precision_scope = lambda a, b: contextlib.nullcontext(a)
with precision_scope(comfy.model_management.get_autocast_device(self.load_device), torch.float32): with precision_scope(comfy.model_management.get_autocast_device(self.load_device), torch.float32):
outputs = self.model(pixel_values=pixel_values) outputs = self.model(pixel_values=pixel_values, output_hidden_states=True)
for k in outputs: for k in outputs:
t = outputs[k] t = outputs[k]
if t is not None: if t is not None:
if k == 'hidden_states':
outputs["penultimate_hidden_states"] = t[-2].cpu()
else:
outputs[k] = t.cpu() outputs[k] = t.cpu()
return outputs return outputs
def convert_to_transformers(sd, prefix): def convert_to_transformers(sd, prefix):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment