Spaces:
Paused
Paused
File size: 8,166 Bytes
280f977 7c8ba90 357f2cf 7c8ba90 357f2cf 7c8ba90 357f2cf 7c8ba90 357f2cf 7c8ba90 357f2cf 7c8ba90 357f2cf 7c8ba90 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 | import streamlit as st
import requests
from bs4 import BeautifulSoup
import pandas as pd
import plotly.express as px
import plotly.graph_objects as go
from datetime import datetime
import time
st.set_page_config(page_title="Market Price Monitor", layout="wide")
# ==================== WEB SCRAPING FUNCTIONS ====================
def scrape_coinmarketcap():
"""Scrape cryptocurrency prices từ CoinMarketCap"""
url = "https://coinmarketcap.com/"
headers = {"User-Agent": "Mozilla/5.0"}
try:
response = requests.get(url, headers=headers, timeout=10)
if response.status_code != 200:
return pd.DataFrame(), "Error fetching data"
soup = BeautifulSoup(response.content, "html.parser")
rows = soup.select("tbody tr")[:15]
data = []
for row in rows:
cols = row.find_all("td")
if len(cols) >= 7:
name = cols[2].find("p", class_=True).text.strip() if cols[2].find("p") else "N/A"
symbol = cols[2].find("p", class_="coin-item-symbol").text.strip() if cols[2].find("p", class_="coin-item-symbol") else "N/A"
price = cols[3].text.strip() if len(cols) > 3 else "N/A"
change_24h = cols[4].text.strip() if len(cols) > 4 else "N/A"
market_cap = cols[6].text.strip() if len(cols) > 6 else "N/A"
data.append({
"Name": name,
"Symbol": symbol,
"Price": price,
"24h Change": change_24h,
"Market Cap": market_cap
})
df = pd.DataFrame(data)
return df, None
except Exception as e:
return pd.DataFrame(), str(e)
def scrape_product_prices(product_urls):
"""Scrape giá sản phẩm từ nhiều website (tùy chỉnh)"""
data = []
for url in product_urls:
try:
headers = {"User-Agent": "Mozilla/5.0"}
response = requests.get(url, headers=headers, timeout=10)
soup = BeautifulSoup(response.content, "html.parser")
# Tùy chỉnh selector theo website (ví dụ: Amazon, Shopee)
title = soup.find("span", class_="a-size-medium") or soup.find("h1")
price = soup.find("span", class_="a-price-whole") or soup.find("div", class_="price")
data.append({
"URL": url,
"Product": title.text.strip() if title else "Unknown",
"Price": price.text.strip() if price else "N/A",
"Scraped At": datetime.now().strftime("%Y-%m-%d %H:%M")
})
except Exception as e:
data.append({
"URL": url,
"Product": "Error",
"Price": f"Error: {str(e)}",
"Scraped At": datetime.now().strftime("%Y-%m-%d %H:%M")
})
return pd.DataFrame(data)
# ==================== STREAMLIT DASHBOARD ====================
st.title("📊 Market Price Monitor Dashboard")
st.markdown("Theo dõi giá thị trường thời gian thực - Web Scraping tự động")
# Sidebar
st.sidebar.header("⚙️ Cài đặt")
# Chọn loại thị trường
market_type = st.sidebar.radio(
"Chọn thị trường:",
["Cryptocurrency", "Sản phẩm E-commerce", "Cả hai"]
)
auto_refresh = st.sidebar.checkbox("Tự động làm mới (30s)", value=False)
refresh_interval = st.sidebar.slider("Tần suất (giây)", 10, 120, 30)
# ==================== CRYPTOCURRENCY SECTION ====================
if market_type in ["Cryptocurrency", "Cả hai"]:
st.header("🪙 Cryptocurrency Prices")
col1, col2, col3 = st.columns(3)
if market_type == "Cryptocurrency":
df_crypto, error = scrape_coinmarketcap()
if error:
st.error(f"❌ Lỗi: {error}")
else:
# Metrics
with col1:
st.metric("Total Cryptos", len(df_crypto))
with col2:
avg_price = df_crypto["Price"].astype(str).str.replace(r"[^\d.]", "", regex=True).mean()
st.metric("Avg Price", f"${avg_price:.2f}" if avg_price else "N/A")
with col3:
top_gainer = df_crypto.loc[df_crypto["24h Change"].str.contains("+", na=False)].head(1)
if not top_gainer.empty:
st.metric("Top Gainer", f"{top_gainer['Name'].values[0]} ({top_gainer['24h Change'].values[0]})")
else:
st.metric("Top Gainer", "N/A")
# Data table
st.subheader("📋 Dữ liệu chi tiết")
st.dataframe(
df_crypto,
use_container_width=True,
hide_index=True
)
# Charts
col1, col2 = st.columns(2)
with col1:
st.subheader("📈 Top 10 by Price")
df_crypto_clean = df_crypto.copy()
df_crypto_clean["Price"].replace({r"[^\d.]": ""}, regex=True, inplace=True)
df_crypto_clean["Price"] = pd.to_numeric(df_crypto_clean["Price"], errors="coerce")
df_top10 = df_crypto_clean.nlargest(10, "Price")
fig_bar = px.bar(df_top10, x="Symbol", y="Price", color="Name",
title="Top 10 Crypto Prices",
labels={"Price": "Price (USD)"})
st.plotly_chart(fig_bar, use_container_width=True)
with col2:
st.subheader("🥧 Market Cap Distribution")
fig_pie = px.pie(df_crypto.head(10), names="Name", values="Market Cap",
title="Top 10 Market Cap")
st.plotly_chart(fig_pie, use_container_width=True)
# 24h Change chart
st.subheader("📊 24h Change (%)")
df_crypto_clean["24h Change"].replace({r"[^\d.-]": ""}, regex=True, inplace=True)
df_crypto_clean["24h Change"] = pd.to_numeric(df_crypto_clean["24h Change"], errors="coerce")
fig_change = px.bar(df_crypto_clean.head(15), x="Name", y="24h Change",
color="24h Change",
color_continuous_scale="RdYlGn",
title="24h Price Change (%)")
st.plotly_chart(fig_change, use_container_width=True)
# ==================== E-COMMERCE SECTION ====================
if market_type in ["Sản phẩm E-commerce", "Cả hai"]:
st.header("🛒 E-commerce Product Prices")
# Input URLs
st.subheader("🔗 Thêm URL sản phẩm")
url_input = st.text_area(
"Nhập URLs (mỗi dòng 1 URL):",
placeholder="https://amazon.com/product1\nhttps://shopee.vn/product2",
height=150
)
if st.button("🔍 Scrape Prices", type="primary"):
if url_input.strip():
urls = [url.strip() for url in url_input.split("\n") if url.strip()]
with st.spinner("Đang scrape dữ liệu..."):
df_products = scrape_product_prices(urls)
st.subheader("📋 Kết quả")
st.dataframe(df_products, use_container_width=True, hide_index=True)
# Download CSV
csv = df_products.to_csv(index=False).encode("utf-8")
st.download_button(
"📥 Download CSV",
csv,
"market_prices.csv",
"text/csv"
)
else:
st.warning("⚠️ Vui lòng nhập ít nhất 1 URL")
# ==================== FOOTER ====================
st.markdown("---")
st.markdown(
f"""
<div style='text-align: center; color: gray;'>
🔄 Cập nhật: {datetime.now().strftime("%Y-%m-%d %H:%M:%S")} |
Data scraped từ CoinMarketCap & E-commerce sites
</div>
""",
unsafe_allow_html=True
)
# Auto-refresh
if auto_refresh:
time.sleep(refresh_interval)
st.rerun() |