File size: 762 Bytes
8d6fb2b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
import gradio as gr
import requests
from bs4 import BeautifulSoup
import pandas as pd


def scrape_site(url):
    """Download *url* and return the text of every ``<h2>`` element.

    Args:
        url: Address of the page to fetch.

    Returns:
        A list with the whitespace-stripped text of each ``<h2>`` tag, in the
        order the tags appear in the document.

    Raises:
        requests.RequestException: If the request cannot be made, times out,
            or the server answers with a 4xx/5xx status.
    """
    # requests never times out by default; bound the wait so an unresponsive
    # host cannot block the caller forever.
    response = requests.get(url, timeout=10)
    # Surface HTTP errors instead of scraping the body of an error page.
    response.raise_for_status()
    soup = BeautifulSoup(response.text, "html.parser")
    return [heading.text.strip() for heading in soup.find_all("h2")]


def clean_data(data):
    """Normalise scraped titles and drop repeats.

    Each title is lower-cased and stripped of surrounding whitespace; only
    the first occurrence of every normalised title is kept, so the original
    ordering is preserved.

    Args:
        data: Title strings to clean.

    Returns:
        A list of the unique, normalised titles.
    """
    frame = pd.DataFrame(data, columns=["title"])
    normalised = frame["title"].str.lower().str.strip()
    unique_titles = normalised.drop_duplicates()
    return unique_titles.tolist()


def chatbot(message, history):
    """Reply to a chat message; ``scrape <URL>`` lists titles from a page.

    Args:
        message: Text entered by the user.
        history: Earlier conversation turns passed in by the chat UI; unused.

    Returns:
        Up to ten cleaned titles joined by newlines, a short notice when the
        page has no titles or cannot be fetched, or the usage hint for any
        message that is not a well-formed ``scrape <URL>`` command.
    """
    usage = "Tape: scrape URL"

    # Split once on whitespace so the command has to be exactly "scrape"
    # (not e.g. "scraper") and a missing URL is caught before any request.
    parts = message.split(maxsplit=1)
    if len(parts) != 2 or parts[0] != "scrape":
        return usage

    url = parts[1].strip()
    try:
        data = scrape_site(url)
    except requests.RequestException as exc:
        # Report invalid URLs and network/HTTP failures in the chat rather
        # than letting the exception escape the callback.
        return f"Error: {exc}"

    clean = clean_data(data)
    if not clean:
        # An empty reply would show up as a blank chat message.
        return "No titles found."
    return "\n".join(clean[:10])


# Build a Gradio chat interface that routes each user message to chatbot().
demo = gr.ChatInterface(fn=chatbot)
# Start the Gradio app; this runs whenever the module is executed or imported.
demo.launch()