minmax performance on those tensor cores lol
Browse files- inference_gradio.py +2 -2
inference_gradio.py
CHANGED
```diff
@@ -123,7 +123,7 @@ model.eval()
 if torch.cuda.is_available():
     model.cuda()
     if torch.cuda.get_device_capability()[0] >= 7:  # tensor cores
-        model.
+        model.to(dtype=torch.float16, memory_format=torch.channels_last)

 with open("JTP_PILOT/tags.json", "r") as file:
     tags = json.load(file)  # type: dict

@@ -139,7 +139,7 @@ def create_tags(image, threshold):
 if torch.cuda.is_available():
     tensor.cuda()
     if torch.cuda.get_device_capability()[0] >= 7:
-        tensor.
+        tensor.to(dtype=torch.float16, memory_format=torch.channels_last)

 with torch.no_grad():
     logits = model(tensor)
```
(Note: the removed lines appear truncated in this capture — `model.` / `tensor.` — and are reproduced as shown; their full original text is not recoverable from this page.)