Update app.py
Browse files
app.py
CHANGED
|
@@ -9,6 +9,7 @@ from sklearn.metrics import classification_report, accuracy_score
|
|
| 9 |
import joblib
|
| 10 |
import matplotlib.pyplot as plt
|
| 11 |
import seaborn as sns
|
|
|
|
| 12 |
|
| 13 |
# Streamlit ํ์ด์ง ์ค์
|
| 14 |
st.set_page_config(page_title="์ ์น์ ์ฑํฅ ๋ถ์ ๋ฐ ๋ฐ๋ ๊ด์ ์์ฑ", page_icon="๐ฐ", layout="wide")
|
|
@@ -34,9 +35,9 @@ def fetch_naver_news(query, display=15):
|
|
| 34 |
}
|
| 35 |
params = {
|
| 36 |
"query": query,
|
| 37 |
-
"display": display,
|
| 38 |
"start": 1,
|
| 39 |
-
"sort": "date",
|
| 40 |
}
|
| 41 |
|
| 42 |
response = requests.get(url, headers=headers, params=params)
|
|
@@ -75,7 +76,6 @@ def incremental_training(texts, labels, model, vectorizer):
|
|
| 75 |
joblib.dump(vectorizer, "tfidf_vectorizer.pkl")
|
| 76 |
return model, vectorizer
|
| 77 |
|
| 78 |
-
|
| 79 |
# GPT-4๋ฅผ ์ด์ฉํด ๋ฐ๋ ๊ด์ ๊ธฐ์ฌ ์์ฑ
|
| 80 |
def generate_article_gpt4(prompt):
|
| 81 |
try:
|
|
@@ -100,12 +100,12 @@ st.markdown("๋ค์ด๋ฒ ๋ด์ค์ ํ๊น
ํ์ด์ค ๋ฐ์ดํฐ๋ฅผ ํ์ฉํ์ฌ ๋ด
|
|
| 100 |
huggingface_data = load_huggingface_data()
|
| 101 |
query = st.text_input("๋ค์ด๋ฒ ๋ด์ค์์ ๊ฒ์ํ ํค์๋๋ฅผ ์
๋ ฅํ์ธ์", value="์ ์น")
|
| 102 |
|
|
|
|
| 103 |
if st.button("๋ฐ์ดํฐ ๊ฒฐํฉ ๋ฐ ํ์ต"):
|
| 104 |
texts, labels = combine_datasets(huggingface_data, fetch_naver_news(query))
|
| 105 |
model, vectorizer = initialize_model()
|
| 106 |
model, vectorizer = incremental_training(texts, labels, model, vectorizer)
|
| 107 |
-
|
| 108 |
-
|
| 109 |
# ์ฑ๋ฅ ํ๊ฐ
|
| 110 |
X_test = vectorizer.transform(texts)
|
| 111 |
y_test = [0 if label == "Democrat" else 1 if label == "Republican" else 2 for label in labels]
|
|
@@ -114,11 +114,11 @@ if st.button("๋ฐ์ดํฐ ๊ฒฐํฉ ๋ฐ ํ์ต"):
|
|
| 114 |
st.write(f"๋ชจ๋ธ ์ ํ๋: {accuracy:.2f}")
|
| 115 |
st.text("๋ถ๋ฅ ๋ฆฌํฌํธ:")
|
| 116 |
st.text(classification_report(y_test, y_pred, target_names=["Democrat", "Republican", "NEUTRAL"]))
|
|
|
|
| 117 |
|
| 118 |
# ๋ด์ค ๋ฐ์ดํฐ ๋ถ์ ๋ฐ ๋ฐ๋ ๊ด์ ๊ธฐ์ฌ ์์ฑ
|
| 119 |
if st.button("๋ด์ค ์ฑํฅ ๋ถ์"):
|
| 120 |
-
|
| 121 |
-
model, vectorizer = load_model_from_huggingface(directory="huggingface_model")
|
| 122 |
news_items = fetch_naver_news(query, display=15) # ๋ด์ค 15๊ฐ ๊ฐ์ ธ์ค๊ธฐ
|
| 123 |
|
| 124 |
if news_items:
|
|
@@ -144,4 +144,4 @@ if st.button("๋ด์ค ์ฑํฅ ๋ถ์"):
|
|
| 144 |
st.write(f"**์ฑํฅ:** {sentiment}")
|
| 145 |
st.write(f"**๋ฐ๋ ๊ด์ ๊ธฐ์ฌ:** {opposite_article}")
|
| 146 |
st.write(f"**๋งํฌ:** [๊ธฐ์ฌ ๋งํฌ]({link})")
|
| 147 |
-
st.markdown("---")
|
|
|
|
| 9 |
import joblib
|
| 10 |
import matplotlib.pyplot as plt
|
| 11 |
import seaborn as sns
|
| 12 |
+
from pathlib import Path
|
| 13 |
|
| 14 |
# Streamlit ํ์ด์ง ์ค์
|
| 15 |
st.set_page_config(page_title="์ ์น์ ์ฑํฅ ๋ถ์ ๋ฐ ๋ฐ๋ ๊ด์ ์์ฑ", page_icon="๐ฐ", layout="wide")
|
|
|
|
| 35 |
}
|
| 36 |
params = {
|
| 37 |
"query": query,
|
| 38 |
+
"display": display, # ๋ด์ค 15๊ฐ ๊ฐ์ ธ์ค๊ธฐ
|
| 39 |
"start": 1,
|
| 40 |
+
"sort": "date", # ์ต์ ์์ผ๋ก ์ ๋ ฌ
|
| 41 |
}
|
| 42 |
|
| 43 |
response = requests.get(url, headers=headers, params=params)
|
|
|
|
| 76 |
joblib.dump(vectorizer, "tfidf_vectorizer.pkl")
|
| 77 |
return model, vectorizer
|
| 78 |
|
|
|
|
| 79 |
# GPT-4๋ฅผ ์ด์ฉํด ๋ฐ๋ ๊ด์ ๊ธฐ์ฌ ์์ฑ
|
| 80 |
def generate_article_gpt4(prompt):
|
| 81 |
try:
|
|
|
|
| 100 |
huggingface_data = load_huggingface_data()
|
| 101 |
query = st.text_input("๋ค์ด๋ฒ ๋ด์ค์์ ๊ฒ์ํ ํค์๋๋ฅผ ์
๋ ฅํ์ธ์", value="์ ์น")
|
| 102 |
|
| 103 |
+
# ๋ฐ์ดํฐ ๊ฒฐํฉ ๋ฐ ํ์ต
|
| 104 |
if st.button("๋ฐ์ดํฐ ๊ฒฐํฉ ๋ฐ ํ์ต"):
|
| 105 |
texts, labels = combine_datasets(huggingface_data, fetch_naver_news(query))
|
| 106 |
model, vectorizer = initialize_model()
|
| 107 |
model, vectorizer = incremental_training(texts, labels, model, vectorizer)
|
| 108 |
+
|
|
|
|
| 109 |
# ์ฑ๋ฅ ํ๊ฐ
|
| 110 |
X_test = vectorizer.transform(texts)
|
| 111 |
y_test = [0 if label == "Democrat" else 1 if label == "Republican" else 2 for label in labels]
|
|
|
|
| 114 |
st.write(f"๋ชจ๋ธ ์ ํ๋: {accuracy:.2f}")
|
| 115 |
st.text("๋ถ๋ฅ ๋ฆฌํฌํธ:")
|
| 116 |
st.text(classification_report(y_test, y_pred, target_names=["Democrat", "Republican", "NEUTRAL"]))
|
| 117 |
+
st.success("๋ชจ๋ธ์ด ์๋ก์ด ๋ฐ์ดํฐ๋ก ์ถ๊ฐ ํ์ต๋์์ต๋๋ค.")
|
| 118 |
|
| 119 |
# ๋ด์ค ๋ฐ์ดํฐ ๋ถ์ ๋ฐ ๋ฐ๋ ๊ด์ ๊ธฐ์ฌ ์์ฑ
|
| 120 |
if st.button("๋ด์ค ์ฑํฅ ๋ถ์"):
|
| 121 |
+
model, vectorizer = initialize_model()
|
|
|
|
| 122 |
news_items = fetch_naver_news(query, display=15) # ๋ด์ค 15๊ฐ ๊ฐ์ ธ์ค๊ธฐ
|
| 123 |
|
| 124 |
if news_items:
|
|
|
|
| 144 |
st.write(f"**์ฑํฅ:** {sentiment}")
|
| 145 |
st.write(f"**๋ฐ๋ ๊ด์ ๊ธฐ์ฌ:** {opposite_article}")
|
| 146 |
st.write(f"**๋งํฌ:** [๊ธฐ์ฌ ๋งํฌ]({link})")
|
| 147 |
+
st.markdown("---")
|