Spaces:

Anuj-Panthri
/

Price-Drop-Detective

Sleeping

App Files Community

shivam-kala committed on Mar 30, 2024

Commit

d5ccf1f

1 Parent(s): c2ccfc1

trying

Browse files

Files changed (5) hide show

email_utils.py +14 -13
index.html +0 -0
old_files/DockerFile +0 -6
scraper/old_scraper.py +16 -3
scraper/scraper.py +41 -29

email_utils.py CHANGED Viewed

@@ -39,23 +39,23 @@ def get_template_price_drop_email(name,product_name,product_url,previous_price,n
     prod_name_len = 20
     subject = f""" Price Drop Alert!  | {product_name[:prod_name_len]+("..." if len(product_name)>prod_name_len else "")}"""
-    body = f"""
-    Hello, {name}
-    We are excited to inform you that the price of the product you have been monitoring has dropped!
-    Product Name: {product_name}
-    Previous Price: {previous_price}
-    New Price: {new_price}
-    Buy Product: {product_url}
-    Product Detail: {product_detail_url}
-    Hurry up and grab this opportunity before the price changes again!
-    Thank you for using Price Drop Detective!
-    Best regards,
-    Your Price Drop Detective Team
  """
     return {
@@ -68,6 +68,7 @@ def get_template_price_drop_email(name,product_name,product_url,previous_price,n
 if __name__=="__main__":
     receiver_email = os.environ["TEST_RECEIVER_EMAIL"]  # Enter receiver address
     message = """
     This message is sent from Python.
     """

     prod_name_len = 20
     subject = f""" Price Drop Alert!  | {product_name[:prod_name_len]+("..." if len(product_name)>prod_name_len else "")}"""
+    body = f"""
+Hello, {name}
+We are excited to inform you that the price of the product you have been monitoring has dropped!
+Product Name: {product_name}
+Previous Price: {previous_price}
+New Price: {new_price}
+Buy Product: {product_url}
+Product Detail: https://shivam-kala-price-drop-detective.hf.space{product_detail_url}
+Hurry up and grab this opportunity before the price changes again!
+Thank you for using Price Drop Detective!
+Best regards,
+Your Price Drop Detective Team
  """
     return {
 if __name__=="__main__":
     receiver_email = os.environ["TEST_RECEIVER_EMAIL"]  # Enter receiver address
+    # receiver_email = os.environ["ADMIN_EMAIL"]  # Enter receiver address
     message = """
     This message is sent from Python.
     """

index.html CHANGED Viewed

The diff for this file is too large to render. See raw diff

old_files/DockerFile DELETED Viewed

@@ -1,6 +0,0 @@
-# !pip install selenium                                 # Install selenium
-# !apt-get update                                       # To update ubuntu to correctly run apt install
-# !apt install chromium-chromedriver -y                 # Install chrome driver
-# !cp /usr/lib/chromium-browser/chromedriver /usr/bin   # Adding the driver path

scraper/old_scraper.py CHANGED Viewed

@@ -30,8 +30,16 @@ data = {
 app = Flask(__name__)
-def getData(url,headers={}):
-  html = requests.post("https://anuj-panthri-puppeteer-api.hf.space/html/",data={"url":url,"headers":headers}).json()["html"]
   return html
@@ -50,4 +58,9 @@ def home():
 # img = soup.find_all("img")
 # print(html)
-app.run(debug=True)

 app = Flask(__name__)
+apis = [
+  # "https://anuj-panthri-puppeteer-api.hf.space/html/",
+  "https://anuj-panthri-puppeteer-api-1.hf.space/html/",
+  "https://anuj-panthri-puppeteer-api-2.hf.space/html/",
+  "https://shivam-kala-puppeteer-api-3.hf.space/html/",
+  "https://shivam-kala-puppeteer-api-4.hf.space/html/",
+  ]
+def getData(api,url,headers={}):
+  html = requests.post(api,data={"url":url,"headers":headers}).json()["html"]
   return html
 # img = soup.find_all("img")
 # print(html)
+# app.run(debug=True)
+for api in apis:
+  html=getData(api,"https://api.ipify.org/?format=json")
+  soup = BeautifulSoup(html, 'html.parser')
+  print(api,":\t",soup.find("pre").text)

scraper/scraper.py CHANGED Viewed

@@ -5,7 +5,7 @@ from fake_useragent import UserAgent
 from pathlib import Path
 import os
 from datetime import datetime
-import requests, tempfile, shutil ,uuid
@@ -41,7 +41,19 @@ def getDriver():
     # if driver:  driver.close()
     return driver
 def getHTMLFROMAPI(url):
     headers = {
         "Accept-language": "en-GB,en;q=0.9",
         "Accept-Encoding": "gzip, deflate, br",
@@ -54,8 +66,8 @@ def getHTMLFROMAPI(url):
         "url":url,
         "headers":headers,
     }
-    res = requests.post("https://anuj-panthri-puppeteer-api.hf.space/html",data=data,headers={"Connection": "keep-alive"}).json()
     return (res["html"]).encode("UTF-8")
 class BaseScrapper(ABC):
@@ -224,37 +236,37 @@ if __name__ == "__main__":
     # print(getHTMLFROMAPI(url))
-    scrapper = AmazonScrapper(driver,AmazonScrapper.getShortUrl(url))
-    print(scrapper.url)
-    data=scrapper.getData()
-    print(data)
-    # input("stop")
-    driver.close()
-    exit()
-    url = "https://www.amazon.com/dp/B07PVCK9KX/"
-    scrapper.updateUrl(AmazonScrapper.getShortUrl(url))
-    print(scrapper.url)
-    print(scrapper.getData())
-    url = "https://www.amazon.com/dp/B07CNPBS7T/"
-    scrapper.updateUrl(AmazonScrapper.getShortUrl(url))
-    print(scrapper.url)
-    print(scrapper.getData())
-    # url = "https://www.amazon.com/Hope-Rainbow-Hoda-Kotb/dp/0593624122/?_encoding=UTF8&_encoding=UTF8&ref_=dlx_gate_sd_dcl_tlt_fa13649f_dt_pd_gw_unk&pd_rd_w=FPLOl&content-id=amzn1.sym.81a68cec-8afc-4296-99f7-78cf5ddc15b5&pf_rd_p=81a68cec-8afc-4296-99f7-78cf5ddc15b5&pf_rd_r=KAD1QPN234SH5MXYBNW6&pd_rd_wg=A7ZKi&pd_rd_r=fa39bbc3-93b1-41a2-b592-77d89dfc6566"
-    # url = "https://www.amazon.in/Lux-Cozi-Melange-Regular-Sleeves/dp/B0CH9QMFF4/ref=sl_ob_desktop_dp_0_2_v2?_encoding=UTF8&pd_rd_w=1Bm0J&content-id=amzn1.sym.cdbcd11c-3329-43cb-9547-fb297b2c655b&pf_rd_p=cdbcd11c-3329-43cb-9547-fb297b2c655b&pf_rd_r=PTKWAM93FTVZKNGQFPVM&pd_rd_wg=iE7ky&pd_rd_r=ccfc3bd0-e267-435c-85d3-f63c78a1db0a"
-    url = "https://www.amazon.in/dp/B0CHM745CT/ref=syn_sd_onsite_desktop_0?ie=UTF8&pd_rd_plhdr=t&aref=94rDEQyVIg&th=1"
-    scrapper.updateUrl(AmazonScrapper.getShortUrl(url))
-    print(scrapper.url)
-    print(scrapper.getData())
-    # url = 'https://www.flipkart.com/apple-iphone-15-blue-128-gb/p/itmbf14ef54f645d?pid=MOBGTAGPAQNVFZZY&lid=LSTMOBGTAGPAQNVFZZYO7HQ2L&marketplace=FLIPKART&store=tyy%2F4io&spotlightTagId=BestsellerId_tyy%2F4io&srno=b_1_1&otracker=browse&fm=organic&iid=fedd7fea-5ff7-4bd7-a5f0-a9008f1702c3.MOBGTAGPAQNVFZZY.SEARCH&ppt=browse&ppn=browse&ssid=7un6hxsq6o0000001710258321538'
-    # scrapper = FlipkartScrapper(driver,FlipkartScrapper.getShortUrl(url))
-    # open("index.html","wb").write(scrapper.getHTML())
     # print(scrapper.url)
     # print(scrapper.getData())
     # url = "https://www.flipkart.com/sti-printed-men-round-neck-white-black-t-shirt/p/itm3b20cdb30cb02"
     # scrapper.updateUrl(FlipkartScrapper.getShortUrl(url))

 from pathlib import Path
 import os
 from datetime import datetime
+import requests, shutil ,uuid, random
     # if driver:  driver.close()
     return driver
+apis = [
+  # "https://anuj-panthri-puppeteer-api.hf.space/html/",
+  "https://anuj-panthri-puppeteer-api-1.hf.space/html/",
+  "https://anuj-panthri-puppeteer-api-2.hf.space/html/",
+  "https://shivam-kala-puppeteer-api-3.hf.space/html/",
+  "https://shivam-kala-puppeteer-api-4.hf.space/html/",
+  ]
 def getHTMLFROMAPI(url):
+    api = apis[random.randint(0,len(apis)-1)]
     headers = {
         "Accept-language": "en-GB,en;q=0.9",
         "Accept-Encoding": "gzip, deflate, br",
         "url":url,
         "headers":headers,
     }
+    print("using_api:",api)
+    res = requests.post(api,data=data).json()
     return (res["html"]).encode("UTF-8")
 class BaseScrapper(ABC):
     # print(getHTMLFROMAPI(url))
+    # scrapper = AmazonScrapper(driver,AmazonScrapper.getShortUrl(url))
+    # print(scrapper.url)
+    # data=scrapper.getData()
+    # print(data)
+    # # input("stop")
+    # driver.close()
+    # exit()
+    # url = "https://www.amazon.com/dp/B07PVCK9KX/"
+    # scrapper.updateUrl(AmazonScrapper.getShortUrl(url))
+    # print(scrapper.url)
+    # print(scrapper.getData())
+    # url = "https://www.amazon.com/dp/B07CNPBS7T/"
+    # scrapper.updateUrl(AmazonScrapper.getShortUrl(url))
+    # print(scrapper.url)
+    # print(scrapper.getData())
+    # # url = "https://www.amazon.com/Hope-Rainbow-Hoda-Kotb/dp/0593624122/?_encoding=UTF8&_encoding=UTF8&ref_=dlx_gate_sd_dcl_tlt_fa13649f_dt_pd_gw_unk&pd_rd_w=FPLOl&content-id=amzn1.sym.81a68cec-8afc-4296-99f7-78cf5ddc15b5&pf_rd_p=81a68cec-8afc-4296-99f7-78cf5ddc15b5&pf_rd_r=KAD1QPN234SH5MXYBNW6&pd_rd_wg=A7ZKi&pd_rd_r=fa39bbc3-93b1-41a2-b592-77d89dfc6566"
+    # # url = "https://www.amazon.in/Lux-Cozi-Melange-Regular-Sleeves/dp/B0CH9QMFF4/ref=sl_ob_desktop_dp_0_2_v2?_encoding=UTF8&pd_rd_w=1Bm0J&content-id=amzn1.sym.cdbcd11c-3329-43cb-9547-fb297b2c655b&pf_rd_p=cdbcd11c-3329-43cb-9547-fb297b2c655b&pf_rd_r=PTKWAM93FTVZKNGQFPVM&pd_rd_wg=iE7ky&pd_rd_r=ccfc3bd0-e267-435c-85d3-f63c78a1db0a"
+    # url = "https://www.amazon.in/dp/B0CHM745CT/ref=syn_sd_onsite_desktop_0?ie=UTF8&pd_rd_plhdr=t&aref=94rDEQyVIg&th=1"
+    # scrapper.updateUrl(AmazonScrapper.getShortUrl(url))
     # print(scrapper.url)
     # print(scrapper.getData())
+    url = 'https://www.flipkart.com/apple-iphone-15-blue-128-gb/p/itmbf14ef54f645d?pid=MOBGTAGPAQNVFZZY&lid=LSTMOBGTAGPAQNVFZZYO7HQ2L&marketplace=FLIPKART&store=tyy%2F4io&spotlightTagId=BestsellerId_tyy%2F4io&srno=b_1_1&otracker=browse&fm=organic&iid=fedd7fea-5ff7-4bd7-a5f0-a9008f1702c3.MOBGTAGPAQNVFZZY.SEARCH&ppt=browse&ppn=browse&ssid=7un6hxsq6o0000001710258321538'
+    scrapper = FlipkartScrapper(driver,FlipkartScrapper.getShortUrl(url))
+    open("index.html","wb").write(scrapper.getHTML())
+    print(scrapper.url)
+    print(scrapper.getData())
     # url = "https://www.flipkart.com/sti-printed-men-round-neck-white-black-t-shirt/p/itm3b20cdb30cb02"
     # scrapper.updateUrl(FlipkartScrapper.getShortUrl(url))