Spaces:

DKethan
/

IPL_Score_Stream

Sleeping

DKethan committed on Mar 29, 2025

Commit

aaa1814

verified ·

1 Parent(s): 0970329

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -32,31 +32,37 @@ def get_match_links_from_main_page():
         soup = BeautifulSoup(response.text, "html.parser")
-        links = []
         all_a_tags = soup.find_all("a", href=True)
-        print(f"🔍 [CRAWL] Total <a> tags found: {len(all_a_tags)}\n")
-        for i, tag in enumerate(all_a_tags):
-            href = tag['href']
-            text = tag.get_text().strip()
-            # Print every link text + href
-            print(f"[A TAG {i+1}] TEXT: '{text}'")
-            print(f"            HREF: {href}\n")
-            # Only keep match score links
-            if "match-full-scores" in href:
                 full_url = BASE_URL + href
-                print(f"✅ [MATCH LINK DETECTED] {text} -> {full_url}")
-                links.append((text, full_url))
-        print(f"\n✅ [DONE] Valid match links extracted: {len(links)}")
         return links
     except Exception as e:
         print(f"❌ [CRAWL ERROR] Failed to fetch match links: {e}")
         return []
 # --- Crawl each link and extract score ---
 def get_scores_from_links(team_name=None):
     print("🟡 [STEP 1] Start crawling for scores...")

         soup = BeautifulSoup(response.text, "html.parser")
         all_a_tags = soup.find_all("a", href=True)
+        print(f"🔍 [CRAWL] Total <a> tags found: {len(all_a_tags)}")
+        links = []
+        for i in range(len(all_a_tags) - 1):
+            tag = all_a_tags[i]
+            next_tag = all_a_tags[i + 1]
+            text = tag.get_text().strip()
+            href = tag['href']
+            # Looking for IPL match result + scorecard links
+            if "cricket-scores" in href and any(team.lower() in text.lower() for team in IPL_TEAMS):
+                title = text
+                result = next_tag.get_text().strip()
                 full_url = BASE_URL + href
+                print(f"\n🎯 [MATCH FOUND]")
+                print(f"🏷️ Title: {title}")
+                print(f"📊 Result: {result}")
+                print(f"🔗 Link: {full_url}")
+                links.append((f"{title} – {result}", full_url))
+        print(f"\n✅ [DONE] Total match results extracted: {len(links)}")
         return links
     except Exception as e:
         print(f"❌ [CRAWL ERROR] Failed to fetch match links: {e}")
         return []
 # --- Crawl each link and extract score ---
 def get_scores_from_links(team_name=None):
     print("🟡 [STEP 1] Start crawling for scores...")