Spaces:
Sleeping
Sleeping
rdsarjito commited on
Commit Β·
7e019c7
1
Parent(s): f7834ca
six
Browse files
app.py
CHANGED
|
@@ -2,9 +2,8 @@ import streamlit as st
|
|
| 2 |
import pandas as pd
|
| 3 |
import pickle
|
| 4 |
import numpy as np
|
| 5 |
-
from sklearn.feature_extraction.text import TfidfVectorizer
|
| 6 |
-
from sklearn.multioutput import MultiOutputClassifier
|
| 7 |
import os
|
|
|
|
| 8 |
|
| 9 |
# Konfigurasi halaman
|
| 10 |
st.set_page_config(
|
|
@@ -13,23 +12,27 @@ st.set_page_config(
|
|
| 13 |
layout="wide"
|
| 14 |
)
|
| 15 |
|
| 16 |
-
#
|
| 17 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 18 |
def load_models():
|
| 19 |
-
"""Memuat semua model dan
|
| 20 |
models = {}
|
| 21 |
model_files = {
|
| 22 |
-
|
| 23 |
-
|
| 24 |
-
|
| 25 |
}
|
| 26 |
|
| 27 |
-
# Load TF-IDF
|
| 28 |
try:
|
| 29 |
-
with open('
|
| 30 |
tfidf_vectorizer = pickle.load(f)
|
| 31 |
except FileNotFoundError:
|
| 32 |
-
st.error("β TF-IDF
|
| 33 |
return None, None
|
| 34 |
|
| 35 |
# Load models
|
|
@@ -44,188 +47,176 @@ def load_models():
|
|
| 44 |
|
| 45 |
# Fungsi prediksi
|
| 46 |
def predict_allergens(text, model, vectorizer):
|
| 47 |
-
"""Melakukan prediksi alergen
|
| 48 |
-
# Transform text menggunakan TF-IDF
|
| 49 |
-
|
| 50 |
|
| 51 |
# Prediksi
|
| 52 |
-
prediction = model.predict(
|
| 53 |
-
prediction_proba = model.predict_proba(
|
| 54 |
|
| 55 |
return prediction[0], prediction_proba
|
| 56 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 57 |
# Label alergen
|
| 58 |
-
|
| 59 |
-
|
| 60 |
|
| 61 |
-
|
| 62 |
-
|
| 63 |
-
|
| 64 |
-
|
| 65 |
-
|
| 66 |
-
|
| 67 |
-
|
| 68 |
-
|
| 69 |
-
|
| 70 |
-
|
| 71 |
-
|
| 72 |
-
st.sidebar.header("βοΈ Konfigurasi")
|
| 73 |
-
|
| 74 |
-
# Pilihan model
|
| 75 |
-
available_models = list(models.keys())
|
| 76 |
-
if available_models:
|
| 77 |
-
selected_model = st.sidebar.selectbox(
|
| 78 |
-
"Pilih Model:",
|
| 79 |
-
available_models,
|
| 80 |
-
help="Pilih model machine learning untuk prediksi"
|
| 81 |
-
)
|
| 82 |
-
else:
|
| 83 |
-
st.error("β Tidak ada model yang tersedia!")
|
| 84 |
-
st.stop()
|
| 85 |
-
|
| 86 |
-
# Threshold untuk prediksi
|
| 87 |
-
threshold = st.sidebar.slider(
|
| 88 |
-
"Threshold Prediksi:",
|
| 89 |
-
min_value=0.1,
|
| 90 |
-
max_value=0.9,
|
| 91 |
-
value=0.5,
|
| 92 |
-
step=0.1,
|
| 93 |
-
help="Nilai ambang batas untuk menentukan prediksi positif"
|
| 94 |
)
|
| 95 |
|
| 96 |
-
#
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
|
| 100 |
-
|
| 101 |
-
|
| 102 |
-
|
| 103 |
-
|
| 104 |
-
|
| 105 |
-
|
| 106 |
-
|
| 107 |
-
|
| 108 |
-
)
|
| 109 |
-
|
| 110 |
-
|
| 111 |
-
|
| 112 |
-
|
| 113 |
-
|
| 114 |
-
|
| 115 |
-
|
| 116 |
-
|
| 117 |
-
"roti gandum dengan selai kacang",
|
| 118 |
-
"sup seafood dengan udang dan cumi",
|
| 119 |
-
"kue coklat dengan susu dan mentega",
|
| 120 |
-
"salad buah dengan yogurt"
|
| 121 |
-
]
|
| 122 |
-
|
| 123 |
-
for i, example in enumerate(examples):
|
| 124 |
-
if st.button(f"π {example}", key=f"example_{i}"):
|
| 125 |
-
st.session_state.food_text = example
|
| 126 |
-
st.rerun()
|
| 127 |
-
|
| 128 |
-
# Update text area jika ada contoh yang dipilih
|
| 129 |
-
if 'food_text' in st.session_state:
|
| 130 |
-
food_text = st.session_state.food_text
|
| 131 |
-
|
| 132 |
-
with col2:
|
| 133 |
-
st.header("βΉοΈ Informasi Model")
|
| 134 |
-
|
| 135 |
-
if selected_model in models:
|
| 136 |
-
st.success(f"β
Model aktif: **{selected_model}**")
|
| 137 |
-
|
| 138 |
-
# Informasi tentang alergen
|
| 139 |
-
st.subheader("π·οΈ Alergen yang Diprediksi:")
|
| 140 |
-
for emoji, label in zip(ALLERGEN_EMOJIS, ALLERGEN_LABELS):
|
| 141 |
-
st.write(f"{emoji} {label}")
|
| 142 |
-
|
| 143 |
-
# Hasil prediksi
|
| 144 |
-
if predict_button and food_text.strip():
|
| 145 |
-
st.markdown("---")
|
| 146 |
-
st.header("π Hasil Prediksi")
|
| 147 |
|
| 148 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 149 |
try:
|
| 150 |
-
#
|
| 151 |
-
|
| 152 |
-
|
| 153 |
models[selected_model],
|
| 154 |
tfidf_vectorizer
|
| 155 |
)
|
| 156 |
|
| 157 |
-
|
| 158 |
-
|
| 159 |
|
| 160 |
-
|
|
|
|
| 161 |
|
| 162 |
-
|
| 163 |
-
|
| 164 |
-
|
| 165 |
-
|
| 166 |
-
|
| 167 |
-
|
| 168 |
-
|
| 169 |
-
|
| 170 |
-
else:
|
| 171 |
-
proba = predictions[i]
|
| 172 |
-
|
| 173 |
-
# Tentukan status berdasarkan threshold
|
| 174 |
-
is_detected = predictions[i] == 1 or proba >= threshold
|
| 175 |
-
|
| 176 |
-
if is_detected:
|
| 177 |
-
st.error(f"{emoji} **{label}**\n\nβ οΈ TERDETEKSI\n\n({proba:.2%})")
|
| 178 |
detected_allergens.append(label)
|
| 179 |
else:
|
| 180 |
-
st.
|
| 181 |
-
|
| 182 |
-
# Ringkasan hasil
|
| 183 |
-
st.subheader("π Ringkasan Hasil")
|
| 184 |
|
|
|
|
|
|
|
| 185 |
if detected_allergens:
|
| 186 |
-
st.warning(f"β οΈ **
|
| 187 |
-
|
| 188 |
-
st.write(f"β’ {allergen}")
|
| 189 |
-
|
| 190 |
-
st.info("π‘ **Saran:** Hindari makanan ini jika Anda memiliki alergi terhadap bahan-bahan yang terdeteksi.")
|
| 191 |
else:
|
| 192 |
-
st.success("β
**
|
| 193 |
-
st.
|
| 194 |
|
| 195 |
-
#
|
| 196 |
-
|
| 197 |
-
st.
|
| 198 |
-
|
| 199 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 200 |
|
| 201 |
-
#
|
| 202 |
-
|
| 203 |
-
'Alergen'
|
| 204 |
-
|
| 205 |
-
|
| 206 |
-
|
| 207 |
-
|
| 208 |
-
|
| 209 |
-
st.
|
|
|
|
|
|
|
|
|
|
|
|
|
| 210 |
|
| 211 |
except Exception as e:
|
| 212 |
st.error(f"β Terjadi kesalahan saat prediksi: {str(e)}")
|
| 213 |
-
st.write("Pastikan model
|
| 214 |
-
|
| 215 |
-
|
| 216 |
-
|
| 217 |
-
|
| 218 |
-
|
| 219 |
-
|
| 220 |
-
|
| 221 |
-
|
| 222 |
-
|
| 223 |
-
|
| 224 |
-
|
| 225 |
-
|
| 226 |
-
|
| 227 |
-
|
| 228 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 229 |
|
| 230 |
-
|
| 231 |
-
|
|
|
|
| 2 |
import pandas as pd
|
| 3 |
import pickle
|
| 4 |
import numpy as np
|
|
|
|
|
|
|
| 5 |
import os
|
| 6 |
+
from datetime import datetime
|
| 7 |
|
| 8 |
# Konfigurasi halaman
|
| 9 |
st.set_page_config(
|
|
|
|
| 12 |
layout="wide"
|
| 13 |
)
|
| 14 |
|
| 15 |
+
# Judul aplikasi
|
| 16 |
+
st.title("π½οΈ Sistem Prediksi Alergen Makanan")
|
| 17 |
+
st.markdown("---")
|
| 18 |
+
|
| 19 |
+
# Cache untuk memuat model
|
| 20 |
+
@st.cache_data
|
| 21 |
def load_models():
|
| 22 |
+
"""Memuat semua model dan vectorizer yang tersimpan"""
|
| 23 |
models = {}
|
| 24 |
model_files = {
|
| 25 |
+
"XGBoost": "models/XGBoost_model.pkl",
|
| 26 |
+
"KNN": "models/KNN_model.pkl",
|
| 27 |
+
"Random Forest": "models/Random Forest_model.pkl"
|
| 28 |
}
|
| 29 |
|
| 30 |
+
# Load TF-IDF vectorizer
|
| 31 |
try:
|
| 32 |
+
with open('models/tfidf_vectorizer.pkl', 'rb') as f:
|
| 33 |
tfidf_vectorizer = pickle.load(f)
|
| 34 |
except FileNotFoundError:
|
| 35 |
+
st.error("β TF-IDF vectorizer tidak ditemukan! Pastikan file 'models/tfidf_vectorizer.pkl' ada.")
|
| 36 |
return None, None
|
| 37 |
|
| 38 |
# Load models
|
|
|
|
| 47 |
|
| 48 |
# Fungsi prediksi
|
| 49 |
def predict_allergens(text, model, vectorizer):
|
| 50 |
+
"""Melakukan prediksi alergen dari teks input"""
|
| 51 |
+
# Transform text menggunakan TF-IDF vectorizer
|
| 52 |
+
text_vector = vectorizer.transform([text])
|
| 53 |
|
| 54 |
# Prediksi
|
| 55 |
+
prediction = model.predict(text_vector)
|
| 56 |
+
prediction_proba = model.predict_proba(text_vector)
|
| 57 |
|
| 58 |
return prediction[0], prediction_proba
|
| 59 |
|
| 60 |
+
# Load models
|
| 61 |
+
models, tfidf_vectorizer = load_models()
|
| 62 |
+
|
| 63 |
+
if models is None or tfidf_vectorizer is None:
|
| 64 |
+
st.stop()
|
| 65 |
+
|
| 66 |
+
# Sidebar untuk pemilihan model
|
| 67 |
+
st.sidebar.header("βοΈ Pengaturan")
|
| 68 |
+
selected_model = st.sidebar.selectbox(
|
| 69 |
+
"Pilih Model:",
|
| 70 |
+
list(models.keys()),
|
| 71 |
+
help="Pilih model machine learning untuk prediksi"
|
| 72 |
+
)
|
| 73 |
+
|
| 74 |
# Label alergen
|
| 75 |
+
allergen_labels = ['Susu', 'Kacang', 'Telur', 'Makanan Laut', 'Gandum']
|
| 76 |
+
allergen_emojis = ['π₯', 'π₯', 'π₯', 'π¦', 'πΎ']
|
| 77 |
|
| 78 |
+
# Main interface
|
| 79 |
+
col1, col2 = st.columns([2, 1])
|
| 80 |
+
|
| 81 |
+
with col1:
|
| 82 |
+
st.header("π Input Teks Makanan")
|
| 83 |
+
|
| 84 |
+
# Text input
|
| 85 |
+
user_input = st.text_area(
|
| 86 |
+
"Masukkan deskripsi makanan atau ingredients:",
|
| 87 |
+
placeholder="Contoh: nasi goreng dengan telur, udang, dan kacang tanah",
|
| 88 |
+
height=100
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 89 |
)
|
| 90 |
|
| 91 |
+
# Contoh input
|
| 92 |
+
st.subheader("π‘ Contoh Input:")
|
| 93 |
+
examples = [
|
| 94 |
+
"pizza dengan keju mozzarella dan seafood",
|
| 95 |
+
"roti gandum dengan selai kacang",
|
| 96 |
+
"cake coklat dengan butter dan telur",
|
| 97 |
+
"sup tom yum dengan udang dan cumi",
|
| 98 |
+
"mie instan rasa ayam"
|
| 99 |
+
]
|
| 100 |
+
|
| 101 |
+
example_cols = st.columns(len(examples))
|
| 102 |
+
for i, example in enumerate(examples):
|
| 103 |
+
if example_cols[i].button(f"Contoh {i+1}", help=example):
|
| 104 |
+
user_input = example
|
| 105 |
+
st.rerun()
|
| 106 |
+
|
| 107 |
+
with col2:
|
| 108 |
+
st.header("βΉοΈ Informasi Model")
|
| 109 |
+
if selected_model in models:
|
| 110 |
+
st.success(f"β
Model {selected_model} siap digunakan")
|
| 111 |
+
st.info(f"π Jumlah label: {len(allergen_labels)}")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 112 |
|
| 113 |
+
# Model info
|
| 114 |
+
model_info = {
|
| 115 |
+
"XGBoost": "Gradient Boosting yang efisien",
|
| 116 |
+
"KNN": "K-Nearest Neighbors",
|
| 117 |
+
"Random Forest": "Ensemble dari decision trees"
|
| 118 |
+
}
|
| 119 |
+
st.write(f"**Deskripsi:** {model_info.get(selected_model, 'Model machine learning')}")
|
| 120 |
+
|
| 121 |
+
# Prediksi
|
| 122 |
+
if st.button("π Prediksi Alergen", type="primary", use_container_width=True):
|
| 123 |
+
if user_input.strip():
|
| 124 |
+
with st.spinner("Sedang melakukan prediksi..."):
|
| 125 |
try:
|
| 126 |
+
# Prediksi
|
| 127 |
+
prediction, prediction_proba = predict_allergens(
|
| 128 |
+
user_input,
|
| 129 |
models[selected_model],
|
| 130 |
tfidf_vectorizer
|
| 131 |
)
|
| 132 |
|
| 133 |
+
st.markdown("---")
|
| 134 |
+
st.header("π Hasil Prediksi")
|
| 135 |
|
| 136 |
+
# Hasil prediksi dalam bentuk metrics
|
| 137 |
+
st.subheader("π― Deteksi Alergen")
|
| 138 |
|
| 139 |
+
# Buat columns untuk menampilkan hasil
|
| 140 |
+
cols = st.columns(len(allergen_labels))
|
| 141 |
+
|
| 142 |
+
detected_allergens = []
|
| 143 |
+
for i, (label, emoji) in enumerate(zip(allergen_labels, allergen_emojis)):
|
| 144 |
+
with cols[i]:
|
| 145 |
+
if prediction[i] == 1:
|
| 146 |
+
st.success(f"{emoji} **{label}**\n\nβ
**TERDETEKSI**")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 147 |
detected_allergens.append(label)
|
| 148 |
else:
|
| 149 |
+
st.info(f"{emoji} **{label}**\n\nβ Tidak terdeteksi")
|
|
|
|
|
|
|
|
|
|
| 150 |
|
| 151 |
+
# Ringkasan
|
| 152 |
+
st.subheader("π Ringkasan")
|
| 153 |
if detected_allergens:
|
| 154 |
+
st.warning(f"β οΈ **Alergen terdeteksi:** {', '.join(detected_allergens)}")
|
| 155 |
+
st.write("**Rekomendasi:** Harap berhati-hati jika Anda memiliki alergi terhadap bahan-bahan tersebut.")
|
|
|
|
|
|
|
|
|
|
| 156 |
else:
|
| 157 |
+
st.success("β
**Tidak ada alergen utama yang terdeteksi**")
|
| 158 |
+
st.write("**Catatan:** Selalu periksa label produk untuk memastikan keamanan.")
|
| 159 |
|
| 160 |
+
# Probability scores (jika tersedia)
|
| 161 |
+
try:
|
| 162 |
+
st.subheader("π Tingkat Kepercayaan")
|
| 163 |
+
prob_data = []
|
| 164 |
+
|
| 165 |
+
for i, (label, emoji) in enumerate(zip(allergen_labels, allergen_emojis)):
|
| 166 |
+
# Ambil probabilitas untuk kelas positif (indeks 1)
|
| 167 |
+
if hasattr(prediction_proba[i], 'shape') and len(prediction_proba[i][0]) > 1:
|
| 168 |
+
prob = prediction_proba[i][0][1] # Probabilitas kelas 1 (positif)
|
| 169 |
+
else:
|
| 170 |
+
prob = 0.5 # Default jika tidak ada probabilitas
|
| 171 |
+
|
| 172 |
+
prob_data.append({
|
| 173 |
+
'Alergen': f"{emoji} {label}",
|
| 174 |
+
'Probabilitas': prob,
|
| 175 |
+
'Persentase': f"{prob*100:.1f}%"
|
| 176 |
+
})
|
| 177 |
+
|
| 178 |
+
prob_df = pd.DataFrame(prob_data)
|
| 179 |
|
| 180 |
+
# Progress bars
|
| 181 |
+
for _, row in prob_df.iterrows():
|
| 182 |
+
st.write(f"**{row['Alergen']}**")
|
| 183 |
+
st.progress(row['Probabilitas'])
|
| 184 |
+
st.write(f"Kepercayaan: {row['Persentase']}")
|
| 185 |
+
st.write("")
|
| 186 |
+
|
| 187 |
+
except Exception as e:
|
| 188 |
+
st.info("π‘ Tingkat kepercayaan tidak tersedia untuk model ini")
|
| 189 |
+
|
| 190 |
+
# Timestamp
|
| 191 |
+
st.markdown("---")
|
| 192 |
+
st.caption(f"Prediksi dilakukan pada: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}")
|
| 193 |
|
| 194 |
except Exception as e:
|
| 195 |
st.error(f"β Terjadi kesalahan saat prediksi: {str(e)}")
|
| 196 |
+
st.write("Pastikan semua file model sudah tersedia dan format input benar.")
|
| 197 |
+
else:
|
| 198 |
+
st.warning("β οΈ Silakan masukkan teks untuk prediksi!")
|
| 199 |
+
|
| 200 |
+
# Footer
|
| 201 |
+
st.markdown("---")
|
| 202 |
+
st.markdown("""
|
| 203 |
+
### π Catatan Penting:
|
| 204 |
+
- Sistem ini adalah alat bantu dan tidak menggantikan konsultasi medis profesional
|
| 205 |
+
- Selalu periksa label produk dan konsultasikan dengan dokter untuk alergi yang serius
|
| 206 |
+
- Akurasi prediksi tergantung pada kualitas data training dan input yang diberikan
|
| 207 |
+
""")
|
| 208 |
+
|
| 209 |
+
# Informasi tambahan di sidebar
|
| 210 |
+
st.sidebar.markdown("---")
|
| 211 |
+
st.sidebar.header("π Informasi Alergen")
|
| 212 |
+
st.sidebar.markdown("""
|
| 213 |
+
**Alergen yang dideteksi:**
|
| 214 |
+
- π₯ **Susu**: Produk dairy, keju, yogurt
|
| 215 |
+
- π₯ **Kacang**: Kacang tanah, almond, dll
|
| 216 |
+
- π₯ **Telur**: Telur ayam dan produk turunannya
|
| 217 |
+
- π¦ **Makanan Laut**: Udang, ikan, kerang
|
| 218 |
+
- πΎ **Gandum**: Tepung terigu, roti, pasta
|
| 219 |
+
""")
|
| 220 |
|
| 221 |
+
st.sidebar.markdown("---")
|
| 222 |
+
st.sidebar.info("π‘ **Tips:** Semakin detail deskripsi makanan yang Anda berikan, semakin akurat hasil prediksinya.")
|
{saved_models β models}/KNN_model.pkl
RENAMED
|
File without changes
|
{saved_models β models}/Random Forest_model.pkl
RENAMED
|
File without changes
|
{saved_models β models}/XGBoost_model.pkl
RENAMED
|
File without changes
|
{saved_models β models}/tfidf_vectorizer.pkl
RENAMED
|
File without changes
|
requirements.txt
CHANGED
|
@@ -3,4 +3,4 @@ pandas
|
|
| 3 |
scikit-learn
|
| 4 |
xgboost
|
| 5 |
numpy
|
| 6 |
-
pickle
|
|
|
|
| 3 |
scikit-learn
|
| 4 |
xgboost
|
| 5 |
numpy
|
| 6 |
+
pickle
|