Spaces:
Runtime error
Runtime error
chore: add utils
Browse files
utils.py
CHANGED
|
@@ -1,14 +1,17 @@
|
|
| 1 |
# import the necessary packages
|
| 2 |
import tensorflow as tf
|
|
|
|
| 3 |
from tensorflow.keras import layers
|
| 4 |
|
| 5 |
from PIL import Image
|
| 6 |
from io import BytesIO
|
| 7 |
import requests
|
| 8 |
import numpy as np
|
|
|
|
| 9 |
|
| 10 |
|
| 11 |
RESOLUTION = 224
|
|
|
|
| 12 |
|
| 13 |
crop_layer = layers.CenterCrop(RESOLUTION, RESOLUTION)
|
| 14 |
norm_layer = layers.Normalization(
|
|
@@ -50,4 +53,48 @@ def load_image_from_url(url, model_type):
|
|
| 50 |
response = requests.get(url)
|
| 51 |
image = Image.open(BytesIO(response.content))
|
| 52 |
preprocessed_image = preprocess_image(image, model_type)
|
| 53 |
-
return image, preprocessed_image
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
# import the necessary packages
|
| 2 |
import tensorflow as tf
|
| 3 |
+
from tensorflow import keras
|
| 4 |
from tensorflow.keras import layers
|
| 5 |
|
| 6 |
from PIL import Image
|
| 7 |
from io import BytesIO
|
| 8 |
import requests
|
| 9 |
import numpy as np
|
| 10 |
+
from matplotlib import pyplot as plt
|
| 11 |
|
| 12 |
|
| 13 |
RESOLUTION = 224
|
| 14 |
+
PATCH_SIZE = 16
|
| 15 |
|
| 16 |
crop_layer = layers.CenterCrop(RESOLUTION, RESOLUTION)
|
| 17 |
norm_layer = layers.Normalization(
|
|
|
|
| 53 |
response = requests.get(url)
|
| 54 |
image = Image.open(BytesIO(response.content))
|
| 55 |
preprocessed_image = preprocess_image(image, model_type)
|
| 56 |
+
return image, preprocessed_image
|
| 57 |
+
|
| 58 |
+
|
| 59 |
+
def attention_heatmap(attention_score_dict, image, model_type="dino", num_heads=12):
    """Build per-head attention heatmaps from the deepest transformer block.

    Args:
        attention_score_dict: Mapping from layer names to attention score
            tensors; the block index is assumed to be the second-to-last
            "_"-separated token of each name (used for depth sorting).
        image: Preprocessed image batch; spatial dims are read from axes
            1 (height) and 2 (width).
        model_type: If it contains "distilled", both the CLS and the
            distillation token are skipped; otherwise only CLS is skipped.
        num_heads: Number of attention heads in the model.

    Returns:
        A tensor of shape (h, w, num_heads): one pixel-resolution heatmap
        per attention head, resized via `tf.image.resize`.
    """
    # Distilled models carry an extra distillation token next to CLS.
    skip_tokens = 2 if "distilled" in model_type else 1

    # Pick the deepest block: order layer names by block index, descending.
    layer_names = sorted(
        attention_score_dict,
        key=lambda name: int(name.split("_")[-2]),
        reverse=True,
    )
    scores = attention_score_dict[layer_names[0]]

    # Patch-grid size implied by the patch embedding.
    grid_w = image.shape[2] // PATCH_SIZE
    grid_h = image.shape[1] // PATCH_SIZE

    # CLS-token attention over every patch token, one row per head.
    heatmaps = scores[0, :, 0, skip_tokens:].reshape(num_heads, -1)

    # Lay the flat scores back out on the patch grid, heads on the last axis.
    heatmaps = heatmaps.reshape(num_heads, grid_w, grid_h).transpose((1, 2, 0))

    # Upsample each head's grid back to pixel resolution
    # (e.g. 224 = 14 patches x 16 px).
    return tf.image.resize(
        heatmaps,
        size=(grid_h * PATCH_SIZE, grid_w * PATCH_SIZE),
    )
|
| 84 |
+
|
| 85 |
+
|
| 86 |
+
def plot(attentions, image):
    """Overlay each attention head's heatmap on the image and save the figure.

    Args:
        attentions: Array of shape (height, width, num_heads) as produced by
            `attention_heatmap` — one spatial heatmap per head on the last axis.
        image: Batched image array; `image[0]` is drawn under each heatmap.

    Side effects:
        Writes a 3x4 grid of overlays to "heat_map.png" in the working
        directory.
    """
    _, axes = plt.subplots(nrows=3, ncols=4, figsize=(13, 13))

    # BUG FIX: the head count lives on the LAST axis. The previous guard used
    # `len(attentions)`, which is the image height (e.g. 224) — it never
    # bounded the loop and would raise IndexError for models with < 12 heads.
    num_heads = attentions.shape[-1]

    for img_count, ax in enumerate(axes.flat):
        if img_count < num_heads:
            ax.imshow(image[0])
            ax.imshow(attentions[..., img_count], cmap="inferno", alpha=0.6)
            ax.title.set_text(f"Attention head: {img_count}")
        # Hide frames on every subplot, including any unused ones.
        ax.axis("off")

    plt.tight_layout()
    plt.savefig("heat_map.png")
|