google/tipsv2-so400m14

@@ -50,7 +50,7 @@ transform = transforms.Compose([
     transforms.ToTensor(),
 ])
-url = "https://huggingface.co/spaces/google/tipsv2-gpu-explorer/resolve/main/examples/zeroseg/pascal_context_00049_image.png"
 image = Image.open(requests.get(url, stream=True).raw)
 pixel_values = transform(image).unsqueeze(0)
 out = model.encode_image(pixel_values)
@@ -85,7 +85,7 @@ import numpy as np
 from sklearn.decomposition import PCA
 spatial = out.patch_tokens.reshape(1, 32, 32, 1152)
-feat = spatial[0].detach().numpy().reshape(-1, 1152)
 rgb = PCA(n_components=3, whiten=True).fit_transform(feat).reshape(32, 32, 3)
 rgb = 1 / (1 + np.exp(-2.0 * rgb))  # sigmoid for [0, 1] range with good contrast
 print(rgb.shape)  # (32, 32, 3) — PCA of patch features as RGB

     transforms.ToTensor(),
 ])
+url = "https://huggingface.co/spaces/google/TIPSv2/resolve/main/examples/zeroseg/pascal_context_00049_image.png"
 image = Image.open(requests.get(url, stream=True).raw)
 pixel_values = transform(image).unsqueeze(0)
 out = model.encode_image(pixel_values)
 from sklearn.decomposition import PCA
 spatial = out.patch_tokens.reshape(1, 32, 32, 1152)
+feat = spatial[0].detach().cpu().numpy().reshape(-1, 1152)
 rgb = PCA(n_components=3, whiten=True).fit_transform(feat).reshape(32, 32, 3)
 rgb = 1 / (1 + np.exp(-2.0 * rgb))  # sigmoid for [0, 1] range with good contrast
 print(rgb.shape)  # (32, 32, 3) — PCA of patch features as RGB