Spaces:

creativeforce
/

Copywriting

Paused

App Files Community

tunght committed on Mar 20, 2025

Commit

f9cb324

1 Parent(s): efc50bb

fix get image features

Browse files

Files changed (1) hide show

app.py +67 -43

app.py CHANGED Viewed

@@ -419,6 +419,9 @@ Return the product description only.
 </included_phrases>"""
 import base64
 import requests
 from PIL import Image
@@ -433,6 +436,7 @@ import io
 def encode_image(image_path, img_size=1024):
     with open(image_path, "rb") as image_file:
         # b64_img = base64.b64encode(image_file.read()).decode('utf-8')
         # b64_img = base64.b64decode(base64.b64encode(response.content))
@@ -475,49 +479,69 @@ def detect_features(image_paths, garment_type, language="English"):
         if garment_type == "" or garment_type == "all":
             garment_type = "garment"
-        headers = {
-        "Content-Type": "application/json",
-        "Authorization": f"Bearer {openai.api_key}"
-        }
-        payload = {
-        "model": "gpt-4o",
-        # "model": "gpt-4-turbo",
-        "messages": [
-            {
-            "role": "user",
-            "content": [
-                {
-                "type": "text",
-                "text": f"""Describe the features of the {garment_type} in the photos.
-                Return the result in in the following JSON format without any preceding or trailing text:
-                {{
-                    "features": [list of comma separated features],
-                    "intended_use": [list of comma separated intended uses],
-                    "alt_text": [list of alt text for image 1, alt text for image 2]
-                }}"""
-                },
-            ] + [{
-                "type": "image_url",
-                "detail": "low",
-                "image_url": {
-                    "url": f"data:image/jpeg;base64,{base64_image}"
-                }
-                } for base64_image in base64_images]
-            }
-        ],
-        "temperature": 0.0,
-        "max_tokens": 300
-        }
-        response = requests.post("https://api.openai.com/v1/chat/completions", headers=headers, json=payload)
-        print(response)
-        response = response.json()
-        print("image features", response["choices"][0]['message']['content'])
-        jresponse = get_json(response["choices"][0]['message']['content'])
         return jresponse, base64_images
     except Exception as e:
         print(e.__class__, e)

 </included_phrases>"""
+detect_feature_prompt = """Describe the features of the {garment_type} in the photo in less than 150 words.\nReturn the result in in the following JSON format without any preceding or trailing text:\n\n{{\n    \"features\": [list of comma separated features],\n    \"intended_use\": [list of comma separated intended uses],\n    \"alt_text\": alt text for the image,\n    \"category\": the category of the garment, for example 'dress', 'shirt', 'pants', 'shoes', etc\n}}"""
 import base64
 import requests
 from PIL import Image
 def encode_image(image_path, img_size=1024):
+    print("Encoding image", image_path)
     with open(image_path, "rb") as image_file:
         # b64_img = base64.b64encode(image_file.read()).decode('utf-8')
         # b64_img = base64.b64decode(base64.b64encode(response.content))
         if garment_type == "" or garment_type == "all":
             garment_type = "garment"
+        # headers = {
+        # "Content-Type": "application/json",
+        # "Authorization": f"Bearer {openai.api_key}"
+        # }
+        # payload = {
+        # "model": "gpt-4o",
+        # "messages": [
+        #     {
+        #     "role": "user",
+        #     "content": [
+        #         {
+        #         "type": "text",
+        #         "text": f"""Describe the features of the {garment_type} in the photos.
+        #         Return the result in in the following JSON format without any preceding or trailing text:
+        #         {{
+        #             "features": [list of comma separated features],
+        #             "intended_use": [list of comma separated intended uses],
+        #             "alt_text": [list of alt text for image 1, alt text for image 2]
+        #         }}"""
+        #         },
+        #     ] + [{
+        #         "type": "image_url",
+        #         "detail": "low",
+        #         "image_url": {
+        #             "url": f"data:image/jpeg;base64,{base64_image}"
+        #         }
+        #         } for base64_image in base64_images]
+        #     }
+        # ],
+        # "temperature": 0.0,
+        # "max_tokens": 300
+        # }
+        # response = requests.post("https://api.openai.com/v1/chat/completions", headers=headers, json=payload)
+        # print(response)
+        chat = get_model("gpt-4o", temperature=0.0)
+        messages = [[
+                    {
+                        "role": "user",
+                        "content": [
+                            {
+                                "type": "text",
+                                "text": detect_feature_prompt.format(garment_type=garment_type)
+                            },
+                            {
+                                "type": "image_url",
+                                "image_url": {
+                                    "url": f"data:image/jpeg;base64,{base64_image}"
+                                }
+                            }]
+                    }
+                ] for base64_image in base64_images]
+        response = chat.batch(messages)
+        print("image features", response)
+        # print("image features", response["choices"][0]['message']['content'])
+        jresponse = get_json(response[0].content)
         return jresponse, base64_images
     except Exception as e:
         print(e.__class__, e)