Spaces:

bcvilnrotter
/

id-code-identifier

Sleeping

App Files Files Community

bcvilnrotter committed on Feb 27, 2025

Commit

3c0f5c4

verified ·

1 Parent(s): d0d3110

Update utils/basic_functions.py

Browse files

Files changed (1) hide show

utils/basic_functions.py +14 -0

utils/basic_functions.py CHANGED Viewed

@@ -78,6 +78,7 @@ def huggingface_detect_id_box(model_name,url):
     try:
         #image = get_image(url)
         image = Image.open(requests.get(url,stream=True).raw)
         system_prompt = f"""
         You are an AI document processing assistant. Analyze the provided image. Identify the ID number in the document.
@@ -87,8 +88,10 @@ def huggingface_detect_id_box(model_name,url):
         as well but that looks to be rare. The output should only be a string in the format [x0,y0,x1,y1], and the
         values should fit into the image size which is {image.size}.
         """
         processor,model=load_model(model_name)
         conversation = [
             {
@@ -99,8 +102,13 @@ def huggingface_detect_id_box(model_name,url):
                 ],
             },
         ]
         prompt = processor.apply_chat_template(conversation,add_generation_prompt=True)
         inputs = processor(images=image,text=prompt,return_tensors="pt").to(model.device)
         """
         with torch.no_grad():
@@ -116,12 +124,18 @@ def huggingface_detect_id_box(model_name,url):
         """
         output = model.generate(**inputs,max_new_tokens=200,do_sample=False)
         bbox = processor.decode(output[0][2:],skip_special_tokens=True)
         print(bbox)
         draw = ImageDraw.Draw(image)
         draw.rectangle(bbox,outline="red",width=5)
         #image.save(f'{os.path.dirname(os.path.dirname(os.path.abspath(__file__)))}\\download\\{dt.datetime.now().strftime("%Y-%m-%d_%H-%M-%S")}.jpg')
         return image,bbox
     except Exception as e:

     try:
         #image = get_image(url)
         image = Image.open(requests.get(url,stream=True).raw)
+        print(image)
         system_prompt = f"""
         You are an AI document processing assistant. Analyze the provided image. Identify the ID number in the document.
         as well but that looks to be rare. The output should only be a string in the format [x0,y0,x1,y1], and the
         values should fit into the image size which is {image.size}.
         """
+        print(system_prompt)
         processor,model=load_model(model_name)
+        print(processor,model)
         conversation = [
             {
                 ],
             },
         ]
+        print(conversation)
         prompt = processor.apply_chat_template(conversation,add_generation_prompt=True)
+        print(prompt)
         inputs = processor(images=image,text=prompt,return_tensors="pt").to(model.device)
+        print(inputs)
         """
         with torch.no_grad():
         """
         output = model.generate(**inputs,max_new_tokens=200,do_sample=False)
+        print(output)
         bbox = processor.decode(output[0][2:],skip_special_tokens=True)
         print(bbox)
         draw = ImageDraw.Draw(image)
+        print(draw)
         draw.rectangle(bbox,outline="red",width=5)
+        print(image)
         #image.save(f'{os.path.dirname(os.path.dirname(os.path.abspath(__file__)))}\\download\\{dt.datetime.now().strftime("%Y-%m-%d_%H-%M-%S")}.jpg')
         return image,bbox
     except Exception as e: