Spaces:

bcvilnrotter
/

id-code-identifier

Sleeping

bcvilnrotter committed on Feb 26, 2025

Commit

7cd0cdb

verified ·

1 Parent(s): e290c3b

Update utils/basic_functions.py

Files changed (1) hide show

utils/basic_functions.py CHANGED Viewed

@@ -76,8 +76,9 @@ def gemini_identify_id(url,system_prompt):
 # Huggingface repo usage
 def huggingface_detect_id_box(model_name,url):
     try:
-        image = get_image(url)
         system_prompt = f"""
         You are an AI document processing assistant. Analyze the provided image. Identify the ID number in the document.
         This is usually identified in a location outside of the main content on the document, and usually on the bottom
@@ -88,7 +89,20 @@ def huggingface_detect_id_box(model_name,url):
         """
         processor,model=load_model(model_name)
-        inputs = processor(images=[image],text=system_prompt,return_tensors="pt").to(model.device)
         with torch.no_grad():
             output = model.generate(**inputs)
@@ -99,6 +113,11 @@ def huggingface_detect_id_box(model_name,url):
         except Exception as e:
             print(f"Error parsing bounding box response: {str(e)}")
             return None
         draw = ImageDraw.Draw(image)
         draw.rectangle(bbox,outline="red",width=5)

 # Huggingface repo usage
 def huggingface_detect_id_box(model_name,url):
     try:
+        #image = get_image(url)
+        image = Image.open(requests.get(url,stream=True).raw)
         system_prompt = f"""
         You are an AI document processing assistant. Analyze the provided image. Identify the ID number in the document.
         This is usually identified in a location outside of the main content on the document, and usually on the bottom
         """
         processor,model=load_model(model_name)
+        conversation = [
+            {
+                "role":"user",
+                "content":[
+                    {"type":"text","text":system_prompt},
+                    {"type":"image"},
+                ],
+            },
+        ]
+        prompt = processor.apply_chat_template(conversation,add_generation_prompt=True)
+        inputs = processor(images=image,text=prompt,return_tensors="pt").to(model.device)
+        """
         with torch.no_grad():
             output = model.generate(**inputs)
         except Exception as e:
             print(f"Error parsing bounding box response: {str(e)}")
             return None
+        """
+        output = model.generate(**inputs,max_new_tokens=200,do_sample=False)
+        print(processor.decode(output[0][2:],skip_special_tokens=True))
         draw = ImageDraw.Draw(image)
         draw.rectangle(bbox,outline="red",width=5)