Spaces:

GradTeam
/

Final_App

Sleeping

App Files Files Community

ek-5 committed on Mar 9

Commit

a212fdd

verified ·

1 Parent(s): 01f4fe7

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -27

app.py CHANGED Viewed

@@ -9,84 +9,82 @@ from PIL import Image
 import uvicorn
 # --- 1. إعداد التطبيق والموديلات ---
-app = FastAPI(title="YOLO + GIT Captioning")
-# تحديد الجهاز (GPU إذا توفر، وإلا CPU)
 device = "cuda" if torch.cuda.is_available() else "cpu"
-# تحميل الموديلات مرة واحدة عند تشغيل السيرفر
-# تأكدي أن ملف best.pt موجود في نفس المجلد
 MY_MODEL_PATH = 'best.pt'
-print("🔄 جاري تحميل الموديلات... قد يستغرق ذلك دقائق")
-# تحميل موديل YOLO (الخاص بكِ)
-if os.path.exists(MY_MODEL_PATH):
     detection_model = YOLO(MY_MODEL_PATH)
-    print("✅ تم تحميل موديل YOLO بنجاح")
-else:
-    # في حال لم يجد ملفك، سيستخدم موديل أساسي مؤقتاً لكي لا يتعطل السيرفر
-    detection_model = YOLO("yolov8s.pt")
-    print("⚠️ تحذير: لم يتم العثور على best.pt، تم استخدام الموديل الافتراضي.")
-# تحميل موديل GIT-base (أخف وأسرع للمساحات المجانية)
 processor = AutoProcessor.from_pretrained("microsoft/git-base")
 caption_model = AutoModelForCausalLM.from_pretrained("microsoft/git-base").to(device)
 @app.get("/")
 def home():
-    return {"status": "Running", "message": "Go to /docs to test the API"}
-# --- 2. وظيفة المعالجة (نفس منطق كود كولاب الخاص بكِ) ---
 @app.post("/analyze")
 async def analyze_image(file: UploadFile = File(...)):
     data = await file.read()
     original_image = Image.open(io.BytesIO(data)).convert("RGB")
-    # استخدام نفس الإعدادات التي نجحت معكِ في كولاب
     results = detection_model(original_image, conf=0.20)
     integrated_results = []
     for r in results:
         for i, box in enumerate(r.boxes):
             label = r.names[int(box.cls)]
             conf_score = float(box.conf[0])
-            coords = box.xyxy[0].tolist()
-            # عملية القص (Cropping)
             cropped_img = original_image.crop((coords[0], coords[1], coords[2], coords[3]))
-            # وصف الجزء المقصوص
             inputs = processor(images=cropped_img, return_tensors="pt").to(device)
             generated_ids = caption_model.generate(pixel_values=inputs.pixel_values, max_length=40)
             detailed_desc = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
             integrated_results.append({
                 "object_id": i + 1,
-                "yolo_label": label,
                 "confidence": f"{conf_score:.2f}",
-                "detailed_description": detailed_desc
             })
-    # وصف عام إذا لم يتم اكتشاف أجسام
     if not integrated_results:
         inputs = processor(images=original_image, return_tensors="pt").to(device)
         generated_ids = caption_model.generate(pixel_values=inputs.pixel_values, max_length=40)
         general_desc = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
         return {
-            "message": "YOLO لم يكتشف أجساماً، إليك وصفاً عاماً.",
             "general_description": general_desc
         }
     return {
         "detected_count": len(integrated_results),
-        "details": integrated_results
     }
-# --- 3. تشغيل السيرفر (إعدادات Hugging Face) ---
 if __name__ == "__main__":
-    # المنفذ 7860 هو الافتراضي والمطلوب في Hugging Face
     uvicorn.run(app, host="0.0.0.0", port=7860)

 import uvicorn
 # --- 1. إعداد التطبيق والموديلات ---
+app = FastAPI(title="YOLO + GIT Captioning API")
+# تحديد الجهاز (استخدام CPU للمساحات المجانية لضمان الاستقرار)
 device = "cuda" if torch.cuda.is_available() else "cpu"
+# مسار الموديل الذي رفعتِيه يدوياً في القائمة
 MY_MODEL_PATH = 'best.pt'
+print("🔄 جاري تحميل الموديلات... يرجى الانتظار")
+# تحميل موديل YOLO الخاص بكِ
+try:
     detection_model = YOLO(MY_MODEL_PATH)
+    print("✅ تم تحميل موديل YOLO الخاص بك بنجاح")
+except Exception as e:
+    print(f"⚠️ فشل تحميل best.pt، سيتم استخدام الموديل الافتراضي: {e}")
+    detection_model = YOLO("yolov8n.pt")
+# تحميل موديل GIT-base (أخف وأسرع للمساحة المجانية)
 processor = AutoProcessor.from_pretrained("microsoft/git-base")
 caption_model = AutoModelForCausalLM.from_pretrained("microsoft/git-base").to(device)
 @app.get("/")
 def home():
+    return {"status": "Online", "instruction": "Add /docs to the URL to test the model"}
+# --- 2. وظيفة المعالجة (نفس المنطق الذي نجح معكِ في كولاب) ---
 @app.post("/analyze")
 async def analyze_image(file: UploadFile = File(...)):
+    # قراءة الصورة المرفوعة
     data = await file.read()
     original_image = Image.open(io.BytesIO(data)).convert("RGB")
+    # 1. الكشف باستخدام YOLO
     results = detection_model(original_image, conf=0.20)
     integrated_results = []
     for r in results:
         for i, box in enumerate(r.boxes):
             label = r.names[int(box.cls)]
             conf_score = float(box.conf[0])
+            coords = box.xyxy[0].tolist() # [xmin, ymin, xmax, ymax]
+            # 2. عملية القص (Cropping) للجزء المكتشف
             cropped_img = original_image.crop((coords[0], coords[1], coords[2], coords[3]))
+            # 3. وصف الجزء المقصوص عبر موديل GIT
             inputs = processor(images=cropped_img, return_tensors="pt").to(device)
             generated_ids = caption_model.generate(pixel_values=inputs.pixel_values, max_length=40)
             detailed_desc = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
             integrated_results.append({
                 "object_id": i + 1,
+                "label": label,
                 "confidence": f"{conf_score:.2f}",
+                "description": detailed_desc
             })
+    # إذا لم يجد YOLO شيئاً، نصف الصورة كاملة
     if not integrated_results:
         inputs = processor(images=original_image, return_tensors="pt").to(device)
         generated_ids = caption_model.generate(pixel_values=inputs.pixel_values, max_length=40)
         general_desc = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
         return {
+            "message": "No specific objects detected by YOLO. Here is a general description.",
             "general_description": general_desc
         }
     return {
         "detected_count": len(integrated_results),
+        "results": integrated_results
     }
+# --- 3. تشغيل السيرفر ---
 if __name__ == "__main__":
+    # المنفذ 7860 هو المطلوب في Hugging Face
     uvicorn.run(app, host="0.0.0.0", port=7860)