import torch.nn as nn import torchvision.models.video as models def build_swin_model(): print("Initializing Video Swin Transformer...") # Using torchvision's Swin3D-T (Tiny) # Weights=None for scratch model = models.swin3d_t(weights=None) # Modify Head for Binary Classification # Original head is model.head (Linear) num_features = model.head.in_features model.head = nn.Linear(num_features, 2) return model