Spaces:

sarim
/

pix

Running

sarim committed on Nov 20, 2025

Commit

550eeeb

1 Parent(s): 72d9d95

get upcoming dividend

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,40 +8,38 @@ app = FastAPI(
     description="Scrape data from PSX website"
 )
-@app.get("/hello")
-def greet_json():
-    return {"Hello": "World!"}
-@app.get("/dividend_history")
-def get_dividend():
-    url = "https://www.psx.com.pk/psx/announcement/financial-announcements"
-    r = requests.get(url)
-    soup = BeautifulSoup(r.text, "html.parser")
     table = soup.find("table")
     if table is None:
-        return {"error": "No table found on PSX page"}
-    rows = table.find_all("tr")
     data = []
     current_date = None
-    for row in rows:
-        # Skip non-tag elements to avoid "NavigableString" errors
         if not isinstance(row, Tag):
-            continue
-        # Date section header
         header = row.find("h4")
         if header:
             current_date = header.get_text(strip=True)
             continue
-        # Regular rows
         cols = row.find_all("td")
         if len(cols) < 4:
-            continue
         company = cols[0].get_text(strip=True)
         dividend_amount = cols[3].get_text(strip=True)
@@ -53,3 +51,19 @@ def get_dividend():
         })
     return data

     description="Scrape data from PSX website"
 )
+def scrape_psx_dividends(url: str):
+    """
+    Scrape company name, dividend date, and dividend amount
+    from PSX financial announcement table.
+    """
+    response = requests.get(url)
+    response.raise_for_status()
+    soup = BeautifulSoup(response.text, "html.parser")
     table = soup.find("table")
     if table is None:
+        raise ValueError("No <table> found on the page!")
     data = []
     current_date = None
+    # Loop through table rows
+    for row in table.find_all("tr"):
         if not isinstance(row, Tag):
+            continue  # Skip non-tag nodes
+        # Detect date header section
         header = row.find("h4")
         if header:
             current_date = header.get_text(strip=True)
             continue
+        # Extract columns from normal rows
         cols = row.find_all("td")
         if len(cols) < 4:
+            continue  # Skip incomplete rows
         company = cols[0].get_text(strip=True)
         dividend_amount = cols[3].get_text(strip=True)
         })
     return data
+@app.get("/hello")
+def greet_json():
+    return {"Hello": "World!"}
+@app.get("/dividend_history")
+def get_dividend():
+    return scrape_psx_dividends(url='https://scstrade.com/MarketStatistics/MS_xDates.aspx')