"examples/seq2seq/utils.py" did not exist on "eaabaaf750613e00fdece7245ef04ca3d1a775a9"
Commit e0b10e40 authored by wanglch's avatar wanglch
Browse files

Initial commit

parent ce623fe2
@@ -6,6 +6,8 @@ from transformers.activations import ACT2FN
 import math
 from torch.nn import LayerNorm
+
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
 def standard_attention(query_layer, key_layer, value_layer, scaling_attention_score=True):
     if scaling_attention_score:
         query_layer = query_layer / math.sqrt(query_layer.shape[-1])
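This hunk only shows the scaling step of standard_attention, plus the new module-level device handle that the .to(device) call in the next hunk relies on. For orientation, a minimal, self-contained sketch of how a scaled dot-product attention with this signature typically continues; the softmax and value matmul below are assumptions for illustration, not part of this commit:

import math
import torch

def standard_attention_sketch(query_layer, key_layer, value_layer, scaling_attention_score=True):
    # Scale queries by sqrt(head_dim) so the attention logits keep roughly unit variance.
    if scaling_attention_score:
        query_layer = query_layer / math.sqrt(query_layer.shape[-1])
    # (B, H, Lq, D) @ (B, H, D, Lk) -> (B, H, Lq, Lk)
    attention_scores = torch.matmul(query_layer, key_layer.transpose(-1, -2))
    attention_probs = torch.softmax(attention_scores, dim=-1)
    # (B, H, Lq, Lk) @ (B, H, Lk, D) -> (B, H, Lq, D)
    return torch.matmul(attention_probs, value_layer)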
@@ -39,7 +41,7 @@ class PatchEmbedding(nn.Module):
         self.position_embedding = nn.Embedding(config.num_positions, config.hidden_size)
 
     def forward(self, images: "tensor(B, C, H, W)") -> "tensor(B, L, D)":
-        x = self.proj(images)
+        x = self.proj(images).to(device)
         x = x.flatten(2).transpose(1, 2)
         cls_token = self.cls_embedding.expand(x.shape[0], -1, -1)
         x = torch.cat((cls_token, x), dim=1)
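The change above moves the patch-projection output onto the module-level device before the rest of the forward pass. For reference, a simplified, self-contained sketch of a ViT-style patch embedding with the same flow; the class name, hyperparameters, and position-embedding step are illustrative assumptions, not the repository's actual config:

import torch
from torch import nn

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

class PatchEmbeddingSketch(nn.Module):
    def __init__(self, in_channels=3, hidden_size=768, patch_size=16, num_positions=197):
        super().__init__()
        # Each patch_size x patch_size patch is projected to one hidden_size-dim token.
        self.proj = nn.Conv2d(in_channels, hidden_size, kernel_size=patch_size, stride=patch_size)
        self.cls_embedding = nn.Parameter(torch.zeros(1, 1, hidden_size))
        self.position_embedding = nn.Embedding(num_positions, hidden_size)

    def forward(self, images):
        x = self.proj(images).to(device)               # (B, D, H/p, W/p)
        x = x.flatten(2).transpose(1, 2)               # (B, L, D) patch tokens
        cls_token = self.cls_embedding.expand(x.shape[0], -1, -1)
        x = torch.cat((cls_token, x), dim=1)           # prepend the [CLS] token
        positions = torch.arange(x.shape[1], device=x.device)
        return x + self.position_embedding(positions)  # add learned position embeddings

# Usage: a 224x224 image yields 14*14 patches plus [CLS] = 197 tokens of width 768.
model = PatchEmbeddingSketch().to(device)
images = torch.randn(2, 3, 224, 224, device=device)
tokens = model(images)   # shape (2, 197, 768)

Note that the in-forward .to(device) is a no-op once the module and its inputs already live on that device, as in the usage above; moving the whole module with .to(device) is usually the simpler placement pattern.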
@@ -66,7 +68,7 @@ class Attention(nn.Module):
         out = attention_fn_default(
             q, k, v
         )
-        output = self.dense(out.transpose(1, 2).view(B, L, -1))
+        output = self.dense(out.transpose(1, 2).reshape(B, L, -1))
         output = self.output_dropout(output)
         return output
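The .view-to-.reshape switch matters because out.transpose(1, 2) returns a non-contiguous tensor: .view requires contiguous memory and raises a RuntimeError, while .reshape falls back to a copy when needed. A small illustration with assumed shapes:

import torch

B, H, L, D = 2, 8, 16, 64
out = torch.randn(B, H, L, D)      # (batch, heads, seq_len, head_dim)
t = out.transpose(1, 2)            # (B, L, H, D), strides no longer contiguous

try:
    t.view(B, L, -1)               # fails: view cannot merge dims with non-adjacent strides
except RuntimeError:
    pass                           # "view size is not compatible with input tensor's size and stride"

merged = t.reshape(B, L, -1)       # works: copies to contiguous memory when necessary
assert merged.shape == (B, L, H * D)
# Equivalent explicit form: out.transpose(1, 2).contiguous().view(B, L, -1)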