mosesb committed on
Commit
f9ddb3b
·
verified ·
1 Parent(s): 49377ba

Upload folder using huggingface_hub

Browse files
Files changed (9) hide show
  1. .gitattributes +4 -0
  2. app.py +49 -0
  3. aura_farmer_1.jpg +3 -0
  4. aura_farmer_2.jpg +3 -0
  5. aura_farmer_3.jpg +3 -0
  6. aura_farmer_4.jpg +3 -0
  7. best.pt +3 -0
  8. last.pt +3 -0
  9. requirements.txt +3 -0
.gitattributes CHANGED
@@ -33,3 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ aura_farmer_1.jpg filter=lfs diff=lfs merge=lfs -text
37
+ aura_farmer_2.jpg filter=lfs diff=lfs merge=lfs -text
38
+ aura_farmer_3.jpg filter=lfs diff=lfs merge=lfs -text
39
+ aura_farmer_4.jpg filter=lfs diff=lfs merge=lfs -text
app.py ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ from ultralytics import YOLO
3
+ import torch
4
+
5
+ model_id = "mosesb/best-comic-panel-detection"
6
+ model = YOLO("best.pt")
7
+
8
+ def detect_panels(pil_image):
9
+ """
10
+ Takes a PIL image, runs YOLOv12 object detection to find comic panels,
11
+ and returns the annotated image with bounding boxes.
12
+ """
13
+ results = model.predict(pil_image, verbose=False)
14
+
15
+ # The .plot() method returns a BGR NumPy array with the detections plotted on the original image.
16
+ annotated_image = results[0].plot()
17
+
18
+ # Gradio's gr.Image component expects an RGB image. The .plot() method
19
+ # returns a BGR image (common in OpenCV), so we convert it.
20
+ annotated_image_rgb = annotated_image[..., ::-1]
21
+
22
+ return annotated_image_rgb
23
+
24
+
25
+ # --- Gradio Interface ---
26
+ title = "YOLOv12 Comic Panel Detection"
27
+ description = """
28
+ This demo showcases a **YOLOv12 object detection model** that has been fine-tuned to detect panels in comic book pages.
29
+ Upload an image of a comic page, and the model will draw bounding boxes around each detected panel.
30
+ This can be a useful first step for downstream tasks like Optical Character Recognition (OCR) or character analysis within comics.
31
+ """
32
+
33
+ article = f"""
34
+ <div style='text-align: center;'>
35
+ <p style='text-align: center'>Model loaded from <a href='https://huggingface.co/{model_id}' target='_blank'>{model_id}</a></p>
36
+ <p style='text-align: center'>For more details on the training process, check out the project repository: <a href='https://github.com/mosesab/YOLOV12-Comic-Panel-Detection/blob/main/comic-boundary-detection.ipynb' target='_blank'>Comic Boundary Detection</a></p>
37
+ </div>
38
+ """
39
+
40
+ gr.Interface(
41
+ fn=detect_panels,
42
+ inputs=gr.Image(type="pil", label="Upload Comic Page Image"),
43
+ outputs=gr.Image(type="pil", label="Detected Panels"),
44
+ title=title,
45
+ description=description,
46
+ article=article,
47
+ examples=[ "aura_farmer_1.jpg", "aura_farmer_2.jpg", "aura_farmer_3.jpg", "aura_farmer_4.jpg" ],
48
+ allow_flagging="auto"
49
+ ).launch()
aura_farmer_1.jpg ADDED

Git LFS Details

  • SHA256: 9db16de607e88c2a970c53b7b6266dc00091bb79934623d33def164ace3f32f5
  • Pointer size: 131 Bytes
  • Size of remote file: 269 kB
aura_farmer_2.jpg ADDED

Git LFS Details

  • SHA256: 7a911fa364a9a0cf6597eba453b616456d644a86b33eee3fbd7feebb75e1a7bf
  • Pointer size: 131 Bytes
  • Size of remote file: 292 kB
aura_farmer_3.jpg ADDED

Git LFS Details

  • SHA256: e5b6426410e879a4b3d69cd607131c7df60602fa0b60e445b79f175f854215c5
  • Pointer size: 131 Bytes
  • Size of remote file: 330 kB
aura_farmer_4.jpg ADDED

Git LFS Details

  • SHA256: 9f77fa0a73913f7db3c8cc249eca31db9f8d23bbcb892ab497aa5a0684ab3b77
  • Pointer size: 131 Bytes
  • Size of remote file: 325 kB
best.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:566e9ff59ec146afb695eb48a8aaae983b43bb72c3a57f63afafe12f3b349af4
3
+ size 119112954
last.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee64422e2d2cea6b37dbd211c7e24137c429030c2e11b85bcd8dbeaa2f7e9295
3
+ size 119112954
requirements.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ torch #2.7.1
2
+ ultralytics #8.3.160
3
+ gradio #5.35.0