@@ -117,9 +117,6 @@ class Transformer2DModel(ModelMixin, ConfigMixin):
...
@@ -117,9 +117,6 @@ class Transformer2DModel(ModelMixin, ConfigMixin):
self.attention_head_dim=attention_head_dim
self.attention_head_dim=attention_head_dim
inner_dim=num_attention_heads*attention_head_dim
inner_dim=num_attention_heads*attention_head_dim
conv_cls=nn.Conv2d
linear_cls=nn.Linear
# 1. Transformer2DModel can process both standard continuous images of shape `(batch_size, num_channels, width, height)` as well as quantized image embeddings of shape `(batch_size, num_image_vectors)`
# 1. Transformer2DModel can process both standard continuous images of shape `(batch_size, num_channels, width, height)` as well as quantized image embeddings of shape `(batch_size, num_image_vectors)`
# Define whether input is continuous or discrete depending on configuration
# Define whether input is continuous or discrete depending on configuration