Spaces:

Engineer786
/

Hackathon

Build error

App Files Files Community

Engineer786 committed on Jan 5, 2025

Commit

a6f7192

verified ·

1 Parent(s): 85e160f

Update tariff_scraper.py

Browse files

Files changed (1) hide show

tariff_scraper.py +7 -36

tariff_scraper.py CHANGED Viewed

@@ -1,8 +1,7 @@
-import streamlit as st
 import requests
 from bs4 import BeautifulSoup
-# Dictionary of companies and their URLs
 TARIFF_URLS = {
     "IESCO": "https://iesco.com.pk/index.php/customer-services/tariff-guide",
     "FESCO": "https://fesco.com.pk/tariff",
@@ -14,16 +13,17 @@ TARIFF_URLS = {
     "TESCO": "https://tesco.gov.pk/index.php/electricity-tariff"
 }
-# Function to scrape tariff data from a given URL
 def scrape_tariff_data(url):
     try:
         response = requests.get(url, headers={"User-Agent": "Mozilla/5.0"})
         response.raise_for_status()  # Raise an error for bad responses
         soup = BeautifulSoup(response.text, 'html.parser')
         # Extract specific elements based on the webpage structure
-        # Assume tariff data is in <table> tags
-        tariff_sections = soup.find_all('table')
         data = []
         for section in tariff_sections:
@@ -35,35 +35,6 @@ def scrape_tariff_data(url):
                 if row_text:  # Add the row text only if it contains data
                     data.append(row_text)
-        return data  # Returns a list of row strings
     except Exception as e:
-        return f"An error occurred: {e}"
-# Streamlit app main function
-def main():
-    st.title("Electricity Tariff Scraper")
-    st.write("Select the company to fetch tariff rates:")
-    # Dropdown menu for company selection
-    company = st.selectbox("Select Company", list(TARIFF_URLS.keys()))
-    if st.button("Scrape"):
-        if company:
-            url = TARIFF_URLS[company]  # Get the URL for the selected company
-            st.write(f"Scraping data for: **{company}**")
-            with st.spinner("Scraping data..."):
-                data = scrape_tariff_data(url)
-                if isinstance(data, list) and data:
-                    st.success("Data scraped successfully!")
-                    st.write("Here is a preview of the data:")
-                    for row in data[:10]:  # Show only the first 10 rows for readability
-                        st.write(row)
-                elif isinstance(data, list) and not data:
-                    st.warning("No data found on the page.")
-                else:
-                    st.error(data)
-        else:
-            st.error("Please select a valid company.")
-if __name__ == "__main__":
-    main()

 import requests
 from bs4 import BeautifulSoup
+# Dictionary mapping companies to their URLs
 TARIFF_URLS = {
     "IESCO": "https://iesco.com.pk/index.php/customer-services/tariff-guide",
     "FESCO": "https://fesco.com.pk/tariff",
     "TESCO": "https://tesco.gov.pk/index.php/electricity-tariff"
 }
 def scrape_tariff_data(url):
+    """
+    Scrape tariff data from the given URL.
+    """
     try:
         response = requests.get(url, headers={"User-Agent": "Mozilla/5.0"})
         response.raise_for_status()  # Raise an error for bad responses
         soup = BeautifulSoup(response.text, 'html.parser')
         # Extract specific elements based on the webpage structure
+        tariff_sections = soup.find_all('table')  # Assume tariff data is in <table> tags
         data = []
         for section in tariff_sections:
                 if row_text:  # Add the row text only if it contains data
                     data.append(row_text)
+        return data if data else ["No data found on the webpage."]
     except Exception as e:
+        return [f"An error occurred: {e}"]