- grounded_sam_demo.py +51 -159
- segment_anything/segment_anything.egg-info/PKG-INFO +15 -0
- segment_anything/segment_anything.egg-info/SOURCES.txt +26 -0
- segment_anything/segment_anything.egg-info/dependency_links.txt +1 -0
- segment_anything/segment_anything.egg-info/requires.txt +13 -0
- segment_anything/segment_anything.egg-info/top_level.txt +1 -0
- segment_anything/segment_anything/__pycache__/__init__.cpython-310.pyc +0 -0
- segment_anything/segment_anything/__pycache__/automatic_mask_generator.cpython-310.pyc +0 -0
- segment_anything/segment_anything/__pycache__/build_sam.cpython-310.pyc +0 -0
- segment_anything/segment_anything/__pycache__/build_sam_hq.cpython-310.pyc +0 -0
- segment_anything/segment_anything/__pycache__/predictor.cpython-310.pyc +0 -0
- segment_anything/segment_anything/modeling/__pycache__/__init__.cpython-310.pyc +0 -0
- segment_anything/segment_anything/modeling/__pycache__/common.cpython-310.pyc +0 -0
- segment_anything/segment_anything/modeling/__pycache__/image_encoder.cpython-310.pyc +0 -0
- segment_anything/segment_anything/modeling/__pycache__/mask_decoder.cpython-310.pyc +0 -0
- segment_anything/segment_anything/modeling/__pycache__/mask_decoder_hq.cpython-310.pyc +0 -0
- segment_anything/segment_anything/modeling/__pycache__/prompt_encoder.cpython-310.pyc +0 -0
- segment_anything/segment_anything/modeling/__pycache__/sam.cpython-310.pyc +0 -0
- segment_anything/segment_anything/modeling/__pycache__/transformer.cpython-310.pyc +0 -0
- segment_anything/segment_anything/utils/__pycache__/__init__.cpython-310.pyc +0 -0
- segment_anything/segment_anything/utils/__pycache__/amg.cpython-310.pyc +0 -0
- segment_anything/segment_anything/utils/__pycache__/transforms.cpython-310.pyc +0 -0
- test.py +16 -12
grounded_sam_demo.py
CHANGED
|
@@ -1,4 +1,5 @@
|
|
| 1 |
-
import
|
|
|
|
| 2 |
import os
|
| 3 |
import copy
|
| 4 |
|
|
@@ -16,8 +17,8 @@ from GroundingDINO.groundingdino.util.utils import clean_state_dict, get_phrases
|
|
| 16 |
|
| 17 |
# segment anything
|
| 18 |
from segment_anything import (
|
| 19 |
-
|
| 20 |
-
|
| 21 |
SamPredictor
|
| 22 |
)
|
| 23 |
import cv2
|
|
@@ -25,27 +26,13 @@ import numpy as np
|
|
| 25 |
import matplotlib.pyplot as plt
|
| 26 |
|
| 27 |
|
| 28 |
-
def load_image(image_path):
|
| 29 |
-
# load image
|
| 30 |
-
image_pil = Image.open(image_path).convert("RGB") # load image
|
| 31 |
-
|
| 32 |
-
transform = T.Compose(
|
| 33 |
-
[
|
| 34 |
-
T.RandomResize([800], max_size=1333),
|
| 35 |
-
T.ToTensor(),
|
| 36 |
-
T.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
|
| 37 |
-
]
|
| 38 |
-
)
|
| 39 |
-
image, _ = transform(image_pil, None) # 3, h, w
|
| 40 |
-
return image_pil, image
|
| 41 |
-
|
| 42 |
-
|
| 43 |
def load_model(model_config_path, model_checkpoint_path, device):
|
| 44 |
args = SLConfig.fromfile(model_config_path)
|
| 45 |
args.device = device
|
| 46 |
model = build_model(args)
|
| 47 |
checkpoint = torch.load(model_checkpoint_path, map_location="cpu")
|
| 48 |
-
load_res = model.load_state_dict(
|
|
|
|
| 49 |
print(load_res)
|
| 50 |
_ = model.eval()
|
| 51 |
return model
|
|
@@ -72,136 +59,38 @@ def get_grounding_output(model, image, caption, box_threshold, text_threshold, w
|
|
| 72 |
boxes_filt = boxes_filt[filt_mask] # num_filt, 4
|
| 73 |
logits_filt.shape[0]
|
| 74 |
|
| 75 |
-
|
| 76 |
-
tokenlizer = model.tokenizer
|
| 77 |
-
tokenized = tokenlizer(caption)
|
| 78 |
-
# build pred
|
| 79 |
-
pred_phrases = []
|
| 80 |
-
for logit, box in zip(logits_filt, boxes_filt):
|
| 81 |
-
pred_phrase = get_phrases_from_posmap(logit > text_threshold, tokenized, tokenlizer)
|
| 82 |
-
if with_logits:
|
| 83 |
-
pred_phrases.append(pred_phrase + f"({str(logit.max().item())[:4]})")
|
| 84 |
-
else:
|
| 85 |
-
pred_phrases.append(pred_phrase)
|
| 86 |
-
|
| 87 |
-
return boxes_filt, pred_phrases
|
| 88 |
-
|
| 89 |
-
def show_mask(mask, ax, random_color=False):
|
| 90 |
-
if random_color:
|
| 91 |
-
color = np.concatenate([np.random.random(3), np.array([0.6])], axis=0)
|
| 92 |
-
else:
|
| 93 |
-
color = np.array([30/255, 144/255, 255/255, 0.6])
|
| 94 |
-
h, w = mask.shape[-2:]
|
| 95 |
-
mask_image = mask.reshape(h, w, 1) * color.reshape(1, 1, -1)
|
| 96 |
-
ax.imshow(mask_image)
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
def show_box(box, ax, label):
|
| 100 |
-
x0, y0 = box[0], box[1]
|
| 101 |
-
w, h = box[2] - box[0], box[3] - box[1]
|
| 102 |
-
ax.add_patch(plt.Rectangle((x0, y0), w, h, edgecolor='green', facecolor=(0,0,0,0), lw=2))
|
| 103 |
-
ax.text(x0, y0, label)
|
| 104 |
-
|
| 105 |
-
|
| 106 |
-
def save_mask_data(output_dir, mask_list, box_list, label_list):
|
| 107 |
-
value = 0 # 0 for background
|
| 108 |
|
| 109 |
-
mask_img = torch.zeros(mask_list.shape[-2:])
|
| 110 |
-
for idx, mask in enumerate(mask_list):
|
| 111 |
-
mask_img[mask.cpu().numpy()[0] == True] = value + idx + 1
|
| 112 |
-
plt.figure(figsize=(10, 10))
|
| 113 |
-
plt.imshow(mask_img.numpy())
|
| 114 |
-
plt.axis('off')
|
| 115 |
-
plt.savefig(os.path.join(output_dir, 'mask.jpg'), bbox_inches="tight", dpi=300, pad_inches=0.0)
|
| 116 |
-
|
| 117 |
-
json_data = [{
|
| 118 |
-
'value': value,
|
| 119 |
-
'label': 'background'
|
| 120 |
-
}]
|
| 121 |
-
for label, box in zip(label_list, box_list):
|
| 122 |
-
value += 1
|
| 123 |
-
name, logit = label.split('(')
|
| 124 |
-
logit = logit[:-1] # the last is ')'
|
| 125 |
-
json_data.append({
|
| 126 |
-
'value': value,
|
| 127 |
-
'label': name,
|
| 128 |
-
'logit': float(logit),
|
| 129 |
-
'box': box.numpy().tolist(),
|
| 130 |
-
})
|
| 131 |
-
with open(os.path.join(output_dir, 'mask.json'), 'w') as f:
|
| 132 |
-
json.dump(json_data, f)
|
| 133 |
-
|
| 134 |
-
|
| 135 |
-
if __name__ == "__main__":
|
| 136 |
-
|
| 137 |
-
parser = argparse.ArgumentParser("Grounded-Segment-Anything Demo", add_help=True)
|
| 138 |
-
parser.add_argument("--config", type=str, required=True, help="path to config file")
|
| 139 |
-
parser.add_argument(
|
| 140 |
-
"--grounded_checkpoint", type=str, required=True, help="path to checkpoint file"
|
| 141 |
-
)
|
| 142 |
-
parser.add_argument(
|
| 143 |
-
"--sam_version", type=str, default="vit_h", required=False, help="SAM ViT version: vit_b / vit_l / vit_h"
|
| 144 |
-
)
|
| 145 |
-
parser.add_argument(
|
| 146 |
-
"--sam_checkpoint", type=str, required=False, help="path to sam checkpoint file"
|
| 147 |
-
)
|
| 148 |
-
parser.add_argument(
|
| 149 |
-
"--sam_hq_checkpoint", type=str, default=None, help="path to sam-hq checkpoint file"
|
| 150 |
-
)
|
| 151 |
-
parser.add_argument(
|
| 152 |
-
"--use_sam_hq", action="store_true", help="using sam-hq for prediction"
|
| 153 |
-
)
|
| 154 |
-
parser.add_argument("--input_image", type=str, required=True, help="path to image file")
|
| 155 |
-
parser.add_argument("--text_prompt", type=str, required=True, help="text prompt")
|
| 156 |
-
parser.add_argument(
|
| 157 |
-
"--output_dir", "-o", type=str, default="outputs", required=True, help="output directory"
|
| 158 |
-
)
|
| 159 |
|
| 160 |
-
|
| 161 |
-
|
| 162 |
-
|
| 163 |
-
parser.add_argument("--device", type=str, default="cpu", help="running on cpu only!, default=False")
|
| 164 |
-
args = parser.parse_args()
|
| 165 |
-
|
| 166 |
-
# cfg
|
| 167 |
-
config_file = args.config # change the path of the model config file
|
| 168 |
-
grounded_checkpoint = args.grounded_checkpoint # change the path of the model
|
| 169 |
-
sam_version = args.sam_version
|
| 170 |
-
sam_checkpoint = args.sam_checkpoint
|
| 171 |
-
sam_hq_checkpoint = args.sam_hq_checkpoint
|
| 172 |
-
use_sam_hq = args.use_sam_hq
|
| 173 |
-
image_path = args.input_image
|
| 174 |
-
text_prompt = args.text_prompt
|
| 175 |
-
output_dir = args.output_dir
|
| 176 |
-
box_threshold = args.box_threshold
|
| 177 |
-
text_threshold = args.text_threshold
|
| 178 |
-
device = args.device
|
| 179 |
-
|
| 180 |
-
# make dir
|
| 181 |
-
os.makedirs(output_dir, exist_ok=True)
|
| 182 |
-
# load image
|
| 183 |
-
image_pil, image = load_image(image_path)
|
| 184 |
-
# load model
|
| 185 |
-
model = load_model(config_file, grounded_checkpoint, device=device)
|
| 186 |
|
| 187 |
-
#
|
| 188 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 189 |
|
| 190 |
-
|
| 191 |
-
|
| 192 |
-
|
| 193 |
-
)
|
|
|
|
|
|
|
|
|
|
| 194 |
|
| 195 |
-
#
|
| 196 |
-
|
| 197 |
-
|
| 198 |
-
|
| 199 |
-
|
| 200 |
-
|
| 201 |
-
image = cv2.cvtColor(
|
| 202 |
predictor.set_image(image)
|
| 203 |
|
| 204 |
-
size =
|
| 205 |
H, W = size[1], size[0]
|
| 206 |
for i in range(boxes_filt.size(0)):
|
| 207 |
boxes_filt[i] = boxes_filt[i] * torch.Tensor([W, H, W, H])
|
|
@@ -209,27 +98,30 @@ if __name__ == "__main__":
|
|
| 209 |
boxes_filt[i][2:] += boxes_filt[i][:2]
|
| 210 |
|
| 211 |
boxes_filt = boxes_filt.cpu()
|
| 212 |
-
transformed_boxes = predictor.transform.apply_boxes_torch(
|
|
|
|
| 213 |
|
| 214 |
masks, _, _ = predictor.predict_torch(
|
| 215 |
-
point_coords
|
| 216 |
-
point_labels
|
| 217 |
-
boxes
|
| 218 |
-
multimask_output
|
| 219 |
)
|
| 220 |
|
| 221 |
-
#
|
| 222 |
-
|
| 223 |
-
|
| 224 |
-
for mask in masks:
|
| 225 |
-
|
| 226 |
-
for box, label in zip(boxes_filt, pred_phrases):
|
| 227 |
-
show_box(box.numpy(), plt.gca(), label)
|
| 228 |
|
|
|
|
|
|
|
| 229 |
plt.axis('off')
|
| 230 |
-
plt.savefig(
|
| 231 |
-
os.path.join(output_dir, "grounded_sam_output.jpg"),
|
| 232 |
-
bbox_inches="tight", dpi=300, pad_inches=0.0
|
| 233 |
-
)
|
| 234 |
|
| 235 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from GroundingDINO.groundingdino.datasets.transforms import Compose, RandomResize, ToTensor, Normalize
|
| 2 |
+
from io import BytesIO
|
| 3 |
import os
|
| 4 |
import copy
|
| 5 |
|
|
|
|
| 17 |
|
| 18 |
# segment anything
|
| 19 |
from segment_anything import (
|
| 20 |
+
build_sam,
|
| 21 |
+
build_sam_hq,
|
| 22 |
SamPredictor
|
| 23 |
)
|
| 24 |
import cv2
|
|
|
|
| 26 |
import matplotlib.pyplot as plt
|
| 27 |
|
| 28 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 29 |
def load_model(model_config_path, model_checkpoint_path, device):
|
| 30 |
args = SLConfig.fromfile(model_config_path)
|
| 31 |
args.device = device
|
| 32 |
model = build_model(args)
|
| 33 |
checkpoint = torch.load(model_checkpoint_path, map_location="cpu")
|
| 34 |
+
load_res = model.load_state_dict(
|
| 35 |
+
clean_state_dict(checkpoint["model"]), strict=False)
|
| 36 |
print(load_res)
|
| 37 |
_ = model.eval()
|
| 38 |
return model
|
|
|
|
| 59 |
boxes_filt = boxes_filt[filt_mask] # num_filt, 4
|
| 60 |
logits_filt.shape[0]
|
| 61 |
|
| 62 |
+
return boxes_filt
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 63 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
|
| 65 |
+
def grounded_sam_demo(input_pil, config_file, grounded_checkpoint, sam_checkpoint,
|
| 66 |
+
text_prompt, box_threshold=0.3, text_threshold=0.25,
|
| 67 |
+
device="cuda"):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 68 |
|
| 69 |
+
# Convert PIL image to tensor with normalization
|
| 70 |
+
transform = Compose([
|
| 71 |
+
RandomResize([800], max_size=1333),
|
| 72 |
+
ToTensor(),
|
| 73 |
+
Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),
|
| 74 |
+
])
|
| 75 |
|
| 76 |
+
if input_pil.mode != "RGB":
|
| 77 |
+
input_pil = input_pil.convert("RGB")
|
| 78 |
+
|
| 79 |
+
image, _ = transform(input_pil, None)
|
| 80 |
+
|
| 81 |
+
# Load model
|
| 82 |
+
model = load_model(config_file, grounded_checkpoint, device=device)
|
| 83 |
|
| 84 |
+
# Get grounding dino model output
|
| 85 |
+
boxes_filt = get_grounding_output(
|
| 86 |
+
model, image, text_prompt, box_threshold, text_threshold, device=device)
|
| 87 |
+
|
| 88 |
+
# Initialize SAM
|
| 89 |
+
predictor = SamPredictor(build_sam(checkpoint=sam_checkpoint).to(device))
|
| 90 |
+
image = cv2.cvtColor(np.array(input_pil), cv2.COLOR_RGB2BGR)
|
| 91 |
predictor.set_image(image)
|
| 92 |
|
| 93 |
+
size = input_pil.size
|
| 94 |
H, W = size[1], size[0]
|
| 95 |
for i in range(boxes_filt.size(0)):
|
| 96 |
boxes_filt[i] = boxes_filt[i] * torch.Tensor([W, H, W, H])
|
|
|
|
| 98 |
boxes_filt[i][2:] += boxes_filt[i][:2]
|
| 99 |
|
| 100 |
boxes_filt = boxes_filt.cpu()
|
| 101 |
+
transformed_boxes = predictor.transform.apply_boxes_torch(
|
| 102 |
+
boxes_filt, image.shape[:2]).to(device)
|
| 103 |
|
| 104 |
masks, _, _ = predictor.predict_torch(
|
| 105 |
+
point_coords=None,
|
| 106 |
+
point_labels=None,
|
| 107 |
+
boxes=transformed_boxes.to(device),
|
| 108 |
+
multimask_output=False,
|
| 109 |
)
|
| 110 |
|
| 111 |
+
# Create mask image
|
| 112 |
+
value = 0 # 0 for background
|
| 113 |
+
mask_img = torch.zeros(masks.shape[-2:])
|
| 114 |
+
for idx, mask in enumerate(masks):
|
| 115 |
+
mask_img[mask.cpu().numpy()[0] == True] = value + idx + 1
|
|
|
|
|
|
|
| 116 |
|
| 117 |
+
fig = plt.figure(figsize=(10, 10))
|
| 118 |
+
plt.imshow(mask_img.numpy())
|
| 119 |
plt.axis('off')
|
|
|
|
|
|
|
|
|
|
|
|
|
| 120 |
|
| 121 |
+
buf = BytesIO()
|
| 122 |
+
plt.savefig(buf, format='png', bbox_inches="tight",
|
| 123 |
+
dpi=300, pad_inches=0.0)
|
| 124 |
+
buf.seek(0)
|
| 125 |
+
out_pil = Image.open(buf)
|
| 126 |
+
|
| 127 |
+
return out_pil
|
segment_anything/segment_anything.egg-info/PKG-INFO
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
Metadata-Version: 2.1
|
| 2 |
+
Name: segment-anything
|
| 3 |
+
Version: 1.0
|
| 4 |
+
License-File: LICENSE
|
| 5 |
+
Provides-Extra: all
|
| 6 |
+
Requires-Dist: matplotlib; extra == "all"
|
| 7 |
+
Requires-Dist: pycocotools; extra == "all"
|
| 8 |
+
Requires-Dist: opencv-python; extra == "all"
|
| 9 |
+
Requires-Dist: onnx; extra == "all"
|
| 10 |
+
Requires-Dist: onnxruntime; extra == "all"
|
| 11 |
+
Provides-Extra: dev
|
| 12 |
+
Requires-Dist: flake8; extra == "dev"
|
| 13 |
+
Requires-Dist: isort; extra == "dev"
|
| 14 |
+
Requires-Dist: black; extra == "dev"
|
| 15 |
+
Requires-Dist: mypy; extra == "dev"
|
segment_anything/segment_anything.egg-info/SOURCES.txt
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
LICENSE
|
| 2 |
+
README.md
|
| 3 |
+
setup.cfg
|
| 4 |
+
setup.py
|
| 5 |
+
segment_anything/__init__.py
|
| 6 |
+
segment_anything/automatic_mask_generator.py
|
| 7 |
+
segment_anything/build_sam.py
|
| 8 |
+
segment_anything/build_sam_hq.py
|
| 9 |
+
segment_anything/predictor.py
|
| 10 |
+
segment_anything.egg-info/PKG-INFO
|
| 11 |
+
segment_anything.egg-info/SOURCES.txt
|
| 12 |
+
segment_anything.egg-info/dependency_links.txt
|
| 13 |
+
segment_anything.egg-info/requires.txt
|
| 14 |
+
segment_anything.egg-info/top_level.txt
|
| 15 |
+
segment_anything/modeling/__init__.py
|
| 16 |
+
segment_anything/modeling/common.py
|
| 17 |
+
segment_anything/modeling/image_encoder.py
|
| 18 |
+
segment_anything/modeling/mask_decoder.py
|
| 19 |
+
segment_anything/modeling/mask_decoder_hq.py
|
| 20 |
+
segment_anything/modeling/prompt_encoder.py
|
| 21 |
+
segment_anything/modeling/sam.py
|
| 22 |
+
segment_anything/modeling/transformer.py
|
| 23 |
+
segment_anything/utils/__init__.py
|
| 24 |
+
segment_anything/utils/amg.py
|
| 25 |
+
segment_anything/utils/onnx.py
|
| 26 |
+
segment_anything/utils/transforms.py
|
segment_anything/segment_anything.egg-info/dependency_links.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
|
segment_anything/segment_anything.egg-info/requires.txt
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
[all]
|
| 3 |
+
matplotlib
|
| 4 |
+
pycocotools
|
| 5 |
+
opencv-python
|
| 6 |
+
onnx
|
| 7 |
+
onnxruntime
|
| 8 |
+
|
| 9 |
+
[dev]
|
| 10 |
+
flake8
|
| 11 |
+
isort
|
| 12 |
+
black
|
| 13 |
+
mypy
|
segment_anything/segment_anything.egg-info/top_level.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
segment_anything
|
segment_anything/segment_anything/__pycache__/__init__.cpython-310.pyc
ADDED
|
Binary file (572 Bytes). View file
|
|
|
segment_anything/segment_anything/__pycache__/automatic_mask_generator.cpython-310.pyc
ADDED
|
Binary file (11.4 kB). View file
|
|
|
segment_anything/segment_anything/__pycache__/build_sam.cpython-310.pyc
ADDED
|
Binary file (2.16 kB). View file
|
|
|
segment_anything/segment_anything/__pycache__/build_sam_hq.cpython-310.pyc
ADDED
|
Binary file (2.41 kB). View file
|
|
|
segment_anything/segment_anything/__pycache__/predictor.cpython-310.pyc
ADDED
|
Binary file (10.1 kB). View file
|
|
|
segment_anything/segment_anything/modeling/__pycache__/__init__.cpython-310.pyc
ADDED
|
Binary file (458 Bytes). View file
|
|
|
segment_anything/segment_anything/modeling/__pycache__/common.cpython-310.pyc
ADDED
|
Binary file (1.76 kB). View file
|
|
|
segment_anything/segment_anything/modeling/__pycache__/image_encoder.cpython-310.pyc
ADDED
|
Binary file (12.7 kB). View file
|
|
|
segment_anything/segment_anything/modeling/__pycache__/mask_decoder.cpython-310.pyc
ADDED
|
Binary file (5.54 kB). View file
|
|
|
segment_anything/segment_anything/modeling/__pycache__/mask_decoder_hq.cpython-310.pyc
ADDED
|
Binary file (6.62 kB). View file
|
|
|
segment_anything/segment_anything/modeling/__pycache__/prompt_encoder.cpython-310.pyc
ADDED
|
Binary file (7.69 kB). View file
|
|
|
segment_anything/segment_anything/modeling/__pycache__/sam.cpython-310.pyc
ADDED
|
Binary file (6.67 kB). View file
|
|
|
segment_anything/segment_anything/modeling/__pycache__/transformer.cpython-310.pyc
ADDED
|
Binary file (6.61 kB). View file
|
|
|
segment_anything/segment_anything/utils/__pycache__/__init__.cpython-310.pyc
ADDED
|
Binary file (165 Bytes). View file
|
|
|
segment_anything/segment_anything/utils/__pycache__/amg.cpython-310.pyc
ADDED
|
Binary file (12.1 kB). View file
|
|
|
segment_anything/segment_anything/utils/__pycache__/transforms.cpython-310.pyc
ADDED
|
Binary file (3.94 kB). View file
|
|
|
test.py
CHANGED
|
@@ -4,33 +4,37 @@ import torch
|
|
| 4 |
import requests
|
| 5 |
from PIL import Image
|
| 6 |
from io import BytesIO
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7 |
|
| 8 |
-
is_production =
|
| 9 |
|
| 10 |
os.chdir("/repository" if is_production else ".")
|
| 11 |
os.environ['AM_I_DOCKER'] = 'False'
|
| 12 |
os.environ['BUILD_WITH_CUDA'] = 'True'
|
| 13 |
os.environ['CUDA_HOME'] = '/usr/local/cuda-11.7/' if is_production else '/usr/local/cuda-12.1/'
|
| 14 |
|
| 15 |
-
|
| 16 |
-
subprocess.run(["python", "-m", "pip", "install", "-e", "segment_anything"])
|
| 17 |
|
| 18 |
-
|
| 19 |
-
subprocess.run(["python", "-m", "pip", "install", "-e", "GroundingDINO"])
|
| 20 |
|
| 21 |
-
|
|
|
|
|
|
|
| 22 |
|
| 23 |
-
|
| 24 |
-
subprocess.run(["pip", "install", "--upgrade", "diffusers[torch]"])
|
| 25 |
|
| 26 |
-
# Install osx
|
| 27 |
subprocess.run(["git", "submodule", "update", "--init", "--recursive"])
|
| 28 |
subprocess.run(["bash", "grounded-sam-osx/install.sh"], cwd="grounded-sam-osx")
|
| 29 |
|
| 30 |
-
# Install RAM & Tag2Text
|
| 31 |
subprocess.run(["git", "clone", "https://github.com/xinyu1205/recognize-anything.git"])
|
| 32 |
-
|
| 33 |
-
|
|
|
|
|
|
|
| 34 |
|
| 35 |
from grounded_sam_demo import grounded_sam_demo
|
| 36 |
import numpy as np
|
|
|
|
| 4 |
import requests
|
| 5 |
from PIL import Image
|
| 6 |
from io import BytesIO
|
| 7 |
+
import subprocess
|
| 8 |
+
import sys
|
| 9 |
+
|
| 10 |
+
def pip_command(command):
|
| 11 |
+
subprocess.check_call([sys.executable, "-m", "pip"] + command.split())
|
| 12 |
|
| 13 |
+
is_production = False
|
| 14 |
|
| 15 |
os.chdir("/repository" if is_production else ".")
|
| 16 |
os.environ['AM_I_DOCKER'] = 'False'
|
| 17 |
os.environ['BUILD_WITH_CUDA'] = 'True'
|
| 18 |
os.environ['CUDA_HOME'] = '/usr/local/cuda-11.7/' if is_production else '/usr/local/cuda-12.1/'
|
| 19 |
|
| 20 |
+
pip_command("install -e segment_anything")
|
|
|
|
| 21 |
|
| 22 |
+
pip_command("install -e GroundingDINO")
|
|
|
|
| 23 |
|
| 24 |
+
response = requests.get("https://huggingface.co/Uminosachi/sam-hq/resolve/main/sam_hq_vit_h.pth")
|
| 25 |
+
with open('./sam_hq_vit_h.pth', 'wb') as file:
|
| 26 |
+
file.write(response.content)
|
| 27 |
|
| 28 |
+
pip_command("install --upgrade diffusers[torch]")
|
|
|
|
| 29 |
|
|
|
|
| 30 |
subprocess.run(["git", "submodule", "update", "--init", "--recursive"])
|
| 31 |
subprocess.run(["bash", "grounded-sam-osx/install.sh"], cwd="grounded-sam-osx")
|
| 32 |
|
|
|
|
| 33 |
subprocess.run(["git", "clone", "https://github.com/xinyu1205/recognize-anything.git"])
|
| 34 |
+
|
| 35 |
+
pip_command("install -r ./recognize-anything/requirements.txt")
|
| 36 |
+
|
| 37 |
+
pip_command("install -e ./recognize-anything/")
|
| 38 |
|
| 39 |
from grounded_sam_demo import grounded_sam_demo
|
| 40 |
import numpy as np
|