Satwik Sunnam satwiksunnam19

🏠

Working from home

Deep Learning Engineer

lucidrains / ViT-3d.py

Last active May 5, 2023 17:49

	class ViT(nn.Module):
	def __init__(self, *, image_size, patch_size, num_classes, dim, depth, heads, mlp_dim, channels = 3, dropout = 0., emb_dropout = 0.):
	super().__init__()
	assert image_size % patch_size == 0, 'image dimensions must be divisible by the patch size'
	num_patches = (image_size // patch_size) ** 3
	patch_dim = channels * patch_size ** 3

	self.patch_size = patch_size

	self.pos_embedding = nn.Parameter(torch.randn(1, num_patches + 1, dim))