Final_Assignment_Template_V2

Sleeping

CindyDelage committed on May 4, 2025

Commit

c3af1cf

verified ·

1 Parent(s): 374b8f9

Update tools.py

Files changed (1) hide show

tools.py CHANGED Viewed

@@ -121,10 +121,11 @@ class image_interpreter(Tool):
     description = "Allows you to convert an image to text (the function will describe the image)."
     inputs = {
         'image': {"type": "image", "description": "The image of interest, png format or jpeg (must be the local path of the image)"},
     }
     output_type = "string"
-    def forward(self, image):
         device = "cuda" if torch.cuda.is_available() else "cpu"
         model = Qwen2VLForConditionalGeneration.from_pretrained(
         "Qwen/Qwen2-VL-7B-Instruct", torch_dtype="auto", device_map="auto"
@@ -136,7 +137,7 @@ class image_interpreter(Tool):
                 "role": "user",
                 "content": [
                     {"type": "image", "image": Image.open(image).convert("RGB")},
-                    {"type": "text", "text": "describe this image, with as much details as you can"},
                 ],
             }
         ]

     description = "Allows you to convert an image to text (the function will describe the image)."
     inputs = {
         'image': {"type": "image", "description": "The image of interest, png format or jpeg (must be the local path of the image)"},
+        'prompt': {"type": "string", "description": "The function returns a description of the image, but you can request specific details with this prompt to ensure they are included in the description."},
     }
     output_type = "string"
+    def forward(self, image, prompt):
         device = "cuda" if torch.cuda.is_available() else "cpu"
         model = Qwen2VLForConditionalGeneration.from_pretrained(
         "Qwen/Qwen2-VL-7B-Instruct", torch_dtype="auto", device_map="auto"
                 "role": "user",
                 "content": [
                     {"type": "image", "image": Image.open(image).convert("RGB")},
+                    {"type": "text", "text": "describe this image, with as much details as you can" + str(prompt)},
                 ],
             }
         ]