(self, x, mask=None)
| 123 | self.norm = nn.LayerNorm(embed_dim) |
| 124 | |
def forward(self, x, mask=None):
    """Pass ``x`` through every layer in ``self.layers``, then normalize.

    Each entry of ``self.layers`` is called as ``layer(current, mask)``,
    in iteration order, with the output of one call fed to the next.
    The same ``mask`` object is handed unchanged to every layer.

    Args:
        x: Input to the first layer.
            NOTE(review): presumably a tensor of embeddings -- confirm
            against the caller.
        mask: Optional second argument forwarded to each layer;
            defaults to ``None``.

    Returns:
        The result of ``self.norm`` applied to the last layer's output
        (or to ``x`` itself when ``self.layers`` is empty).
    """
    hidden = x
    for block in self.layers:
        # Every block receives the identical mask; only the activations
        # change from one step to the next.
        hidden = block(hidden, mask)
    normalized = self.norm(hidden)
    return normalized
| 129 | |
| 130 | class VisionTransformerBlock(nn.Module): |
| 131 | def __init__(self, img_size=224, patch_size=16, in_channels=3, embed_dim=768, |