TheKernel01's picture
Sync from GitHub via hub-sync
0788e19 verified
from .clip import clip
from PIL import Image
import torch.nn as nn
class CLIPModel(nn.Module):
def __init__(self, name="ViT-L/14", num_classes=1):
super(CLIPModel, self).__init__()
self.model, self.preprocess = clip.load(name, device="cpu") # self.preprecess will not be used during training, which is handled in Dataset class
self.fc = nn.Linear(768, num_classes )
def forward(self, x, return_feature=False):
features = self.model.encode_image(x)
if return_feature:
return features
return self.fc(features)