Spaces:

namngo
/

GradOnTrack

Sleeping

App Files Files Community

namngo committed on May 8, 2025

Commit

182504e

verified ·

1 Parent(s): 3d6329e

Update app.py

Browse files

Files changed (1) hide show

app.py +227 -138

app.py CHANGED Viewed

@@ -71,41 +71,30 @@ def save_to_gsheet(name, student_id, major, prediction, semester_data, sheet_nam
     # Get all values from the sheet to check if the first row is empty (i.e., headers not created yet)
     all_values = sheet.get_all_values()
-    # Define headers based on the model type for clarity in the sheet
-    base_headers = ["Họ và tên", "MSV", "Khoa", "Dự báo", "Thời gian"]
-    if sheet_name == "Trang tính1": # Full model headers
-        semester_headers = []
-        for i in range(6):
-            semester_headers += [
-                f"Số môn không thi - HK{i+1}",
-                f"Số tín chỉ không thi - HK{i+1}",
-                f"Số tín chỉ nợ - HK{i+1}",
-                f"Số môn không đạt - HK{i+1}",
-                f"Tổng tín chỉ học kỳ - HK{i+1}",
-                f"Số môn học kỳ - HK{i+1}",
-                f"Số môn đạt - HK{i+1}",
-                f"GPA - HK{i+1}",
-                f"Xếp loại - HK{i+1}"
-            ]
-        # Add nganh header
-        headers = base_headers + semester_headers + ["Ngành (0: CNTT, 1: Kinh tế)"]
-    elif sheet_name == "Trang tính2": # Important features model headers
-        semester_headers = []
-        for i in range(6):
-            semester_headers += [
-                f"Số tín chỉ đạt - HK{i+1}",
-                f"Số tín chỉ nợ - HK{i+1}",
-                f"Điểm trung bình - HK{i+1}"
-            ]
-        headers = base_headers + semester_headers
-    # If the sheet is empty or if headers are missing or mismatched, insert headers
-    if not all_values or len(all_values[0]) != len(headers):
-        sheet.clear() # Clear existing content if headers are wrong or missing
-        sheet.append_row(headers)  # Create headers
     # Append data to the sheet
     sheet.append_row(data_row)
@@ -114,7 +103,7 @@ def save_to_gsheet(name, student_id, major, prediction, semester_data, sheet_nam
 # def list_sheet_names(sheet_id):
 #     client = get_gsheet_client()
 #     sheet = client.open_by_key(sheet_id)
-#
 #     # List all sheet names
 #     sheet_names = [worksheet.title for worksheet in sheet.worksheets()]
 #     return sheet_names
@@ -140,12 +129,12 @@ sample_cntt_example_full = {
     "student_id": "10117367",
     "major": "Công nghệ thông tin",
     "semester_data": [
-        0, 0, 0, 0, 17, 7, 7, 8.73, 0, # HK1
-        0, 0, 0, 0, 17, 7, 7, 8.19, 0, # HK2
-        0, 0, 0, 0, 17, 7, 7, 7.90, 0, # HK3
-        0, 0, 0, 0, 17, 7, 7, 8.19, 0, # HK4
-        0, 0, 0, 0, 19, 7, 6, 8.18, 0, # HK5
-        0, 0, 5, 2, 19, 7, 5, 7.10, 1 # HK6
     ]
 }
@@ -166,6 +155,7 @@ sample_kinhte_example_simple = {
 }
 # ===== Ví dụ cho mô hình "Dùng mô hình đơn giản" cho CNTT =====
 sample_cntt_example_simple = {
     "name": "Nguyễn Văn B",
@@ -187,123 +177,222 @@ sample_kinhte_example_full = {
     "student_id": "11418093",
     "major": "Kinh tế",
     "semester_data": [
-        0, 0, 0, 0, 16, 6, 6, 7.00, 1, # HK1
-        0, 0, 0, 0, 18, 7, 7, 8.20, 1, # HK2
-        0, 0, 0, 0, 17, 7, 7, 7.80, 1, # HK3
-        0, 0, 0, 0, 17, 7, 6, 7.90, 1, # HK4
-        0, 0, 0, 0, 19, 8, 5, 8.10, 0, # HK5
-        0, 0, 8, 2, 19, 7, 6, 7.30, 1 # HK6
     ]
 }
 # ===== Thông tin cá nhân =====
-# Determine which example data to use based on model type and selected option
-if model_type == "Dùng toàn bộ đặc trưng":
-    if sample_option == "Dùng ví dụ mẫu ngành Công nghệ thông tin":
-        selected_example_data = sample_cntt_example_full
-        default_major_index = 0
-    elif sample_option == "Dùng ví dụ mẫu ngành Kinh tế":
-        selected_example_data = sample_kinhte_example_full
-        default_major_index = 1
-    else:
-        selected_example_data = None
-        default_major_index = 0 # Default to CNTT
-else: # Dùng đặc trưng quan trọng
-    if sample_option == "Dùng ví dụ mẫu ngành Công nghệ thông tin":
-        selected_example_data = sample_cntt_example_simple
-        default_major_index = 0
-    elif sample_option == "Dùng ví dụ mẫu ngành Kinh tế":
-        selected_example_data = sample_kinhte_example_simple
-        default_major_index = 1
-    else:
-        selected_example_data = None
-        default_major_index = 0 # Default to CNTT
-name_value = selected_example_data["name"] if selected_example_data else ""
-student_id_value = selected_example_data["student_id"] if selected_example_data else ""
-name = st.text_input("👤 Họ và tên", value=name_value)
-student_id = st.text_input("🎓 Mã sinh viên", value=student_id_value)
-major = st.selectbox("📚 Ngành học", ["Công nghệ thông tin", "Kinh tế"], index=default_major_index)
 st.write("---")
 # ===== Nhập thông tin học kỳ =====
-def input_semester_full(semester_label, default_values=None):
     with st.expander(f"📖 {semester_label}", expanded=True):
         col1, col2 = st.columns(2)
         with col1:
-            somon0thi = st.number_input("Số môn không thi", 0, value=default_values[0] if default_values and len(default_values) > 0 else 0, key=f"sm0_{semester_label}")
-            sotc0thi = st.number_input("Số tín chỉ không thi", 0, value=default_values[1] if default_values and len(default_values) > 1 else 0, key=f"tc0_{semester_label}")
-            sotcno = st.number_input("Số tín chỉ nợ", 0, value=default_values[2] if default_values and len(default_values) > 2 else 0, key=f"tcno_{semester_label}")
-            mhno = st.number_input("Số môn không đạt", 0, value=default_values[3] if default_values and len(default_values) > 3 else 0, key=f"mhno_{semester_label}")
-            # Calculate default_tc_qua if possible, otherwise default to 0
-            default_tc_qua = 0
-            if default_values and len(default_values) > 4 and len(default_values) > 2:
-                default_tc_qua = default_values[4] - default_values[2]
-            sotc_qua = st.number_input("Số tín chỉ qua môn", 0, value=default_tc_qua, key=f"tcqua_{semester_label}")
         with col2:
-            TCHK = st.number_input("Tổng tín chỉ học kỳ", 0, value=default_values[4] if default_values and len(default_values) > 4 else 0, key=f"tchk_{semester_label}")
-            smhk = st.number_input("Số môn học kỳ", 0, value=default_values[5] if default_values and len(default_values) > 5 else 0, key=f"smhk_{semester_label}")
-            mhpass = st.number_input("Số môn đạt", 0, value=default_values[6] if default_values and len(default_values) > 6 else 0, key=f"mhpass_{semester_label}")
-            TBCHK = st.number_input("GPA", 0.0, 10.0, value=default_values[7] if default_values and len(default_values) > 7 else 0.0, step=0.01, key=f"gpa_{semester_label}")
-            xep_loai_selected = st.selectbox("Xếp loại", list(range(7)), index=default_values[8] if default_values and len(default_values) > 8 else 0, key=f"xeploai_{semester_label}")
-    return [somon0thi, sotc0thi, sotcno, mhno, TCHK, smhk, mhpass, TBCHK, xep_loai_selected] # Removed sotc_qua as it's calculated
 # ===== Giao diện theo mô hình =====
 data = []
 semesters = ["HỌC KỲ I", "HỌC KỲ II", "HỌC KỲ III", "HỌC KỲ IV", "HỌC KỲ V", "HỌC KỲ VI"]
-# Mô hình 1: "Dùng toàn bộ đặc trưng"
 if model_type == "Dùng toàn bộ đặc trưng":
-    st.subheader("🔢 Nhập thông tin học kỳ chi tiết")
-    for idx, sem in enumerate(semesters):
         example_data = sample_cntt_example_full if sample_option == "Dùng ví dụ mẫu ngành Công nghệ thông tin" else sample_kinhte_example_full if sample_option == "Dùng ví dụ mẫu ngành Kinh tế" else None
-        default_values = example_data["semester_data"][idx*9:(idx+1)*9] if example_data else None
-        data += input_semester_full(sem, default_values)
-    nganh = 0 if major == "Công nghệ thông tin" else 1
-    final_features = np.array(data + [nganh]).reshape(1, -1)
-# Mô hình 2: "Dùng đặc trưng quan trọng" (Simplified layout as per image)
-else:
     st.subheader("✨ Nhập thông tin rút gọn")
-    example_data = sample_cntt_example_simple if sample_option == "Dùng ví dụ mẫu ngành Công nghệ thông tin" else sample_kinhte_example_simple if sample_option == "Dùng ví dụ mẫu ngành Kinh tế" else None
-    semester_data_example = example_data["semester_data"] if example_data else [0, 0, 0] * 6 # Default to zeros if no example
-    # Row 1: HK I, HK II, HK III
-    cols1 = st.columns(3)
-    for idx, sem in enumerate(semesters[:3]):
-        with cols1[idx]:
-            with st.expander(f"📘 {sem}", expanded=True):
-                default_values = semester_data_example[idx*3:(idx+1)*3]
-                sotc_qua = st.number_input("Số tín chỉ đạt", 0, value=default_values[0] if len(default_values) > 0 else 0, key=f"tcqua_imp_{sem}")
-                sotcno = st.number_input("Số tín chỉ nợ", 0, value=default_values[1] if len(default_values) > 1 else 0, key=f"tcno_imp_{sem}")
-                TBCHK = st.number_input("Điểm trung bình", 0.0, 10.0, value=default_values[2] if len(default_values) > 2 else 0.0, step=0.01, key=f"gpa_imp_{sem}")
-                data.extend([sotc_qua, sotcno, TBCHK]) # Collect data
-    # Row 2: HK IV, HK V, HK VI (assuming VI is included based on semesters list)
-    cols2 = st.columns(3)
-    for idx, sem in enumerate(semesters[3:]):
-        with cols2[idx]:
-            with st.expander(f"📘 {sem}", expanded=True):
-                # Adjust index for example data: idx here is 0, 1, 2 for HK IV, V, VI
-                example_idx = idx + 3 # Adjust to get correct data from the 6 semesters
-                default_values = semester_data_example[example_idx*3:(example_idx+1)*3]
-                sotc_qua = st.number_input("Số tín chỉ đạt", 0, value=default_values[0] if len(default_values) > 0 else 0, key=f"tcqua_imp_{sem}")
-                sotcno = st.number_input("Số tín chỉ nợ", 0, value=default_values[1] if len(default_values) > 1 else 0, key=f"tcno_imp_{sem}")
-                TBCHK = st.number_input("Điểm trung bình", 0.0, 10.0, value=default_values[2] if len(default_values) > 2 else 0.0, step=0.01, key=f"gpa_imp_{sem}")
-                data.extend([sotc_qua, sotcno, TBCHK]) # Collect data
-    final_features = np.array(data).reshape(1, -1)
 # ===== Predict =====
 if st.button("🎯 DỰ BÁO"):
@@ -311,9 +400,9 @@ if st.button("🎯 DỰ BÁO"):
         prediction = model_full.predict(final_features)
         sheet_name = "Trang tính1"  # For full data model, save to Trang tính1
-    else:
         prediction = model_important.predict(final_features)
-        sheet_name = "Trang tính2"  # For full data model, save to Trang tính1
     if prediction[0] == 1:

     # Get all values from the sheet to check if the first row is empty (i.e., headers not created yet)
     all_values = sheet.get_all_values()
+    # Define headers based on the model type for accurate sheet saving
+    if sheet_name == "Trang tính1": # Full features model
+        headers = ["Họ và tên", "MSV", "Khoa", "Dự báo", "Thời gian"] + [
+            f"Số môn không thi - HK{i+1}" for i in range(6)] + [
+            f"Số tín chỉ không thi - HK{i+1}" for i in range(6)] + [
+            f"Số tín chỉ nợ - HK{i+1}" for i in range(6)] + [
+            f"Số môn không đạt - HK{i+1}" for i in range(6)] + [
+            f"Số tín chỉ qua môn - HK{i+1}" for i in range(6)] + [
+            f"Tổng tín chỉ học kỳ - HK{i+1}" for i in range(6)] + [
+            f"Số môn học kỳ - HK{i+1}" for i in range(6)] + [
+            f"Số môn đạt - HK{i+1}" for i in range(6)] + [
+            f"GPA - HK{i+1}" for i in range(6)] + [
+            f"Xếp loại - HK{i+1}" for i in range(6)]
+    elif sheet_name == "Trang tính2": # Important features model
+         headers = ["Họ và tên", "MSV", "Khoa", "Dự báo", "Thời gian"] + [
+            f"Số tín chỉ đạt - HK{i+1}" for i in range(6)] + [
+            f"Số tín chỉ nợ - HK{i+1}" for i in range(6)] + [
+            f"Điểm trung bình - HK{i+1}" for i in range(6)]
+    # If the sheet is empty or if headers are missing, insert headers
+    if not all_values or len(all_values[0]) != len(headers):  # Ensure number of columns matches expected headers
+        sheet.append_row(headers)  # Create headers if missing
     # Append data to the sheet
     sheet.append_row(data_row)
 # def list_sheet_names(sheet_id):
 #     client = get_gsheet_client()
 #     sheet = client.open_by_key(sheet_id)
 #     # List all sheet names
 #     sheet_names = [worksheet.title for worksheet in sheet.worksheets()]
 #     return sheet_names
     "student_id": "10117367",
     "major": "Công nghệ thông tin",
     "semester_data": [
+        0, 0, 0, 0, 17, 7, 7, 8.73, 0,
+        0, 0, 0, 0, 17, 7, 7, 8.19, 0,
+        0, 0, 0, 0, 17, 7, 7, 7.90, 0,
+        0, 0, 0, 0, 17, 7, 7, 8.19, 0,
+        0, 0, 0, 0, 19, 7, 6, 8.18, 0,
+        0, 0, 5, 2, 19, 7, 5, 7.10, 1
     ]
 }
 }
+# ===== Ví dụ cho mô hình "Dùng mô hình đơn giản" cho CNTT =====
 # ===== Ví dụ cho mô hình "Dùng mô hình đơn giản" cho CNTT =====
 sample_cntt_example_simple = {
     "name": "Nguyễn Văn B",
     "student_id": "11418093",
     "major": "Kinh tế",
     "semester_data": [
+        0, 0, 0, 0, 16, 6, 6, 7.00, 1,
+        0, 0, 0, 0, 18, 7, 7, 8.20, 1,
+        0, 0, 0, 0, 17, 7, 7, 7.80, 1,
+        0, 0, 0, 0, 17, 7, 6, 7.90, 1,
+        0, 0, 0, 0, 19, 8, 5, 8.10, 0,
+        0, 0, 8, 2, 19, 7, 6, 7.30, 1
     ]
 }
 # ===== Thông tin cá nhân =====
+if sample_option == "Dùng ví dụ mẫu ngành Công nghệ thông tin":
+    # Check model type to load appropriate example data
+    if model_type == "Dùng toàn bộ đặc trưng":
+        sample_data_personal = sample_cntt_example_full
+    else: # Dùng đặc trưng quan trọng
+        sample_data_personal = sample_cntt_example_simple
+    name = st.text_input("👤 Họ và tên", value=sample_data_personal["name"])
+    student_id = st.text_input("🎓 Mã sinh viên", value=sample_data_personal["student_id"])
+    major = st.selectbox("📚 Ngành học", ["Công nghệ thông tin", "Kinh tế"], index=0)
+elif sample_option == "Dùng ví dụ mẫu ngành Kinh tế":
+    # Check model type to load appropriate example data
+    if model_type == "Dùng toàn bộ đặc trưng":
+        sample_data_personal = sample_kinhte_example_full
+    else: # Dùng đặc trưng quan trọng
+        sample_data_personal = sample_kinhte_example_simple
+    name = st.text_input("👤 Họ và tên", value=sample_data_personal["name"])
+    student_id = st.text_input("🎓 Mã sinh viên", value=sample_data_personal["student_id"])
+    major = st.selectbox("📚 Ngành học", ["Công nghệ thông tin", "Kinh tế"], index=1)
+else:
+    name = st.text_input("👤 Họ và tên")
+    student_id = st.text_input("🎓 Mã sinh viên")
+    major = st.selectbox("📚 Ngành học", ["Công nghệ thông tin", "Kinh tế"])
 st.write("---")
 # ===== Nhập thông tin học kỳ =====
+def input_semester(semester_label, default_values=None):
     with st.expander(f"📖 {semester_label}", expanded=True):
         col1, col2 = st.columns(2)
         with col1:
+            somon0thi = st.number_input("Số môn không thi", 0, value=default_values[0] if default_values else 0, key=f"sm0_{semester_label}")
+            sotc0thi = st.number_input("Số tín chỉ không thi", 0, value=default_values[1] if default_values else 0, key=f"tc0_{semester_label}")
+            sotcno = st.number_input("Số tín chỉ nợ", 0, value=default_values[2] if default_values else 0, key=f"tcno_{semester_label}")
+            mhno = st.number_input("Số môn không đạt", 0, value=default_values[3] if default_values else 0, key=f"mhno_{semester_label}")
+            try:
+                default_tc_qua = default_values[4] - default_values[2] if default_values and len(default_values) >= 5 else 0 # This calculation seems incorrect for "Số tín chỉ qua môn" if default_values[4] is Total Credit
+            except:
+                default_tc_qua = 0
+            # Correcting default value logic for "Số tín chỉ qua môn" based on sample data structure
+            # If default_values has 9 elements (full model data), default_tc_qua is at index 4
+            if default_values and len(default_values) == 9:
+                 default_tc_qua_input = default_values[4]
+            else:
+                 default_tc_qua_input = 0 # Or some default
+            sotc_qua = st.number_input("Số tín chỉ qua môn", 0, value=default_tc_qua_input, key=f"tcqua_{semester_label}")
         with col2:
+            TCHK = st.number_input("Tổng tín chỉ học kỳ", 0, value=default_values[4] if default_values else 0, key=f"tchk_{semester_label}")
+            smhk = st.number_input("Số môn học kỳ", 0, value=default_values[5] if default_values else 0, key=f"smhk_{semester_label}")
+            mhpass = st.number_input("Số môn đạt", 0, value=default_values[6] if default_values else 0, key=f"mhpass_{semester_label}")
+            TBCHK = st.number_input("GPA", 0.0, 10.0, value=default_values[7] if default_values else 0.0, step=0.01, key=f"gpa_{semester_label}")
+            xep_loai_selected = st.selectbox("Xếp loại", list(range(7)), index=default_values[8] if default_values else 0, key=f"xeploai_{semester_label}")
+    return [somon0thi, sotc0thi, sotcno, mhno, TCHK, smhk, mhpass, TBCHK, xep_loai_selected, sotc_qua]
+def input_important_features(semester_label, default_values=None):
+    with st.expander(f"📘 {semester_label}", expanded=True):
+        col1, col2, col3 = st.columns(3) # Use 3 columns for important features layout
+        with col1:
+            # Use consistent keys for input fields
+            sotc_qua = st.number_input("Số tín chỉ đạt", 0, value=default_values[0] if default_values and len(default_values) > 0 else 0, key=f"tcqua_imp_{semester_label}")
+        with col2:
+            sotcno = st.number_input("Số tín chỉ nợ", 0, value=default_values[1] if default_values and len(default_values) > 1 else 0, key=f"tcno_imp_{semester_label}")
+        with col3:
+            TBCHK = st.number_input("Điểm trung bình", 0.0, 10.0, value=default_values[2] if default_values and len(default_values) > 2 else 0.0, step=0.01, key=f"gpa_imp_{semester_label}")
+    return [sotc_qua, sotcno, TBCHK]
 # ===== Giao diện theo mô hình =====
 data = []
 semesters = ["HỌC KỲ I", "HỌC KỲ II", "HỌC KỲ III", "HỌC KỲ IV", "HỌC KỲ V", "HỌC KỲ VI"]
+# Mô hình 1: "Dùng toàn bộ đặc trưng"
 if model_type == "Dùng toàn bộ đặc trưng":
+    st.subheader("🔢 Nhập thông tin học kỳ chi tiết")
+    for idx, sem in enumerate(semesters):
+        example_data = sample_cntt_example_full if sample_option == "Dùng ví dụ mẫu ngành Công nghệ thông tin" else sample_kinhte_example_full if sample_option == "Dùng ví dụ mẫu ngành Kinh tế" else None
+        # Full model data has 9 features per semester + 1 extra (sotc_qua, which was calculated) = 10 features.
+        # Update: based on the data structure, there are 9 features per semester in the full model example.
+        # The input_semester function returns 10 values. Let's check the save_to_gsheet function's headers for full model.
+        # Headers for full model have 9 semester specific columns per semester.
+        # Let's correct input_semester to return 9 values matching the headers/example data.
+        # The example data has 9 values per semester for the full model.
+        # Let's fix the input_semester function to match the example data and headers (9 features).
+        # The example data has [0, 0, 0, 0, 17, 7, 7, 8.73, 0] -> 9 values.
+        # The input_semester returns [somon0thi, sotc0thi, sotcno, mhno, TCHK, smhk, mhpass, TBCHK, xep_loai_selected, sotc_qua] -> 10 values.
+        # The save_to_gsheet headers for full model list 9 columns per semester.
+        # Let's align input_semester to return the 9 values that correspond to the headers.
+        # Headers: Số môn không thi, Số tín chỉ không thi, Số tín chỉ nợ, Số môn không đạt, Số tín chỉ qua môn, Tổng tín chỉ học kỳ, Số môn học kỳ, Số môn đạt, GPA, Xếp loại
+        # This is 10 headers per semester. The example data has 9. Let's fix the example data structure to match headers or vice versa.
+        # Assuming headers are correct: Số môn không thi, Số tín chỉ không thi, Số tín chỉ nợ, Số môn không đạt, Số tín chỉ qua môn, Tổng tín chỉ học kỳ, Số môn học kỳ, Số môn đạt, GPA, Xếp loại (10 features)
+        # Let's update the example data for the full model to include all 10 features if possible or remove headers that don't match the example data.
+        # Given the original code's save_to_gsheet headers for the full model list 10 items per semester type, and the example data for full model has 9 items per semester type, there's a mismatch.
+        # Let's assume the `input_semester` function's return values are correct based on the intended model features, and the `sample_cntt_example_full` and `sample_kinhte_example_full` are slightly off or need adjustment to match the 10 inputs.
+        # The `input_semester` returns: somon0thi, sotc0thi, sotcno, mhno, TCHK, smhk, mhpass, TBCHK, xep_loai_selected, sotc_qua. This is 10 values.
+        # The `save_to_gsheet` headers for 'Trang tính1' list 10 headers per semester type. This matches.
+        # The `sample_cntt_example_full` and `sample_kinhte_example_full` have 9 values per semester. This is where the discrepancy is.
+        # To make the examples work correctly with the full model inputs, the example data structure should match the 10 features collected by `input_semester`.
+        # The missing feature in the example data seems to be `sotc_qua`.
+        # Let's adjust the example data to include a value for `sotc_qua` for each semester, or adjust the `input_semester` default value logic.
+        # A simpler fix for now is to adjust the `input_semester` default value logic to handle the case where example data might be shorter.
+        # The `default_tc_qua_input` line within `input_semester` was calculating it, let's remove that and rely solely on the example data if available.
+        # And if example data for `sotc_qua` is missing, default to 0.
+        # Corrected input_semester default value handling:
+        def input_semester_corrected(semester_label, default_values=None):
+            with st.expander(f"📖 {semester_label}", expanded=True):
+                col1, col2 = st.columns(2)
+                with col1:
+                    somon0thi = st.number_input("Số môn không thi", 0, value=default_values[0] if default_values and len(default_values) > 0 else 0, key=f"sm0_{semester_label}")
+                    sotc0thi = st.number_input("Số tín chỉ không thi", 0, value=default_values[1] if default_values and len(default_values) > 1 else 0, key=f"tc0_{semester_label}")
+                    sotcno = st.number_input("Số tín chỉ nợ", 0, value=default_values[2] if default_values and len(default_values) > 2 else 0, key=f"tcno_{semester_label}")
+                    mhno = st.number_input("Số môn không đạt", 0, value=default_values[3] if default_values and len(default_values) > 3 else 0, key=f"mhno_{semester_label}")
+                    # Assuming sotc_qua is the 5th value in the example data if 9 values exist
+                    sotc_qua_default = default_values[4] if default_values and len(default_values) > 4 else 0
+                    sotc_qua = st.number_input("Số tín chỉ qua môn", 0, value=sotc_qua_default, key=f"tcqua_{semester_label}")
+                with col2:
+                    TCHK = st.number_input("Tổng tín chỉ học kỳ", 0, value=default_values[5] if default_values and len(default_values) > 5 else 0, key=f"tchk_{semester_label}")
+                    smhk = st.number_input("Số môn học kỳ", 0, value=default_values[6] if default_values and len(default_values) > 6 else 0, key=f"smhk_{semester_label}")
+                    mhpass = st.number_input("Số môn đạt", 0, value=default_values[7] if default_values and len(default_values) > 7 else 0, key=f"mhpass_{semester_label}")
+                    TBCHK = st.number_input("GPA", 0.0, 10.0, value=default_values[8] if default_values and len(default_values) > 8 else 0.0, step=0.01, key=f"gpa_{semester_label}")
+                    xep_loai_selected = st.selectbox("Xếp loại", list(range(7)), index=default_values[9] if default_values and len(default_values) > 9 else 0, key=f"xeploai_{semester_label}") # Assuming Xếp loại is the 10th value
+            return [somon0thi, sotc0thi, sotcno, mhno, sotc_qua, TCHK, smhk, mhpass, TBCHK, xep_loai_selected] # Return 10 values
+        # Let's update the example data structure to have 10 values per semester for consistency
+        # Based on the headers, the order should be: Số môn không thi, Số tín chỉ không thi, Số tín chỉ nợ, Số môn không đạt, Số tín chỉ qua môn, Tổng tín chỉ học kỳ, Số môn học kỳ, Số môn đạt, GPA, Xếp loại
+        # The original example data was [somon0thi, sotc0thi, sotcno, mhno, TCHK, smhk, mhpass, TBCHK, xep_loai_selected] -> 9 values
+        # It seems "Số tín chỉ qua môn" was missing or intended to be calculated.
+        # Let's assume "Số tín chỉ qua môn" is implicitly TCHK - sotcno.
+        # However, the headers list "Số tín chỉ qua môn" as a separate column.
+        # Let's assume the headers are correct and the example data needs to match the headers.
+        # Let's restructure example data to have 10 values, adding a plausible value for "Số tín chỉ qua môn" (TCHK - sotcno).
+        sample_cntt_example_full = {
+            "name": "Nguyễn Văn A",
+            "student_id": "10117367",
+            "major": "Công nghệ thông tin",
+            "semester_data": [
+                # HK1: sm0, tc0, tcno, mhno, tc_qua (calculated: TCHK-tcno), TCHK, smhk, mhpass, GPA, xeploai
+                0, 0, 0, 0, 17-0, 17, 7, 7, 8.73, 0,
+                # HK2:
+                0, 0, 0, 0, 17-0, 17, 7, 7, 8.19, 0,
+                # HK3:
+                0, 0, 0, 0, 17-0, 17, 7, 7, 7.90, 0,
+                # HK4:
+                0, 0, 0, 0, 17-0, 17, 7, 7, 8.19, 0,
+                # HK5:
+                0, 0, 0, 0, 19-0, 19, 7, 6, 8.18, 0,
+                # HK6: tcno=5, mhno=2, TCHK=19, mhpass=6, xeploai=1. Assuming tc_qua = TCHK - tcno = 19-5 = 14
+                0, 0, 5, 2, 19-5, 19, 7, 6, 7.10, 1
+            ]
+        }
+        sample_kinhte_example_full = {
+            "name": "Trần Thị C",
+            "student_id": "11418093",
+            "major": "Kinh tế",
+            "semester_data": [
+                 # HK1:
+                0, 0, 0, 0, 16-0, 16, 6, 6, 7.00, 1,
+                 # HK2:
+                0, 0, 0, 0, 18-0, 18, 7, 7, 8.20, 1,
+                 # HK3:
+                0, 0, 0, 0, 17-0, 17, 7, 7, 7.80, 1,
+                 # HK4:
+                0, 0, 0, 0, 17-0, 17, 7, 6, 7.90, 1,
+                 # HK5:
+                0, 0, 0, 0, 19-0, 19, 8, 5, 8.10, 0,
+                 # HK6: tcno=8, mhno=2, TCHK=19, mhpass=6, xeploai=1. Assuming tc_qua = TCHK - tcno = 19-8 = 11
+                0, 0, 8, 2, 19-8, 19, 7, 6, 7.30, 1
+            ]
+        }
+        # Now the example data for the full model should match the 10 inputs per semester.
         example_data = sample_cntt_example_full if sample_option == "Dùng ví dụ mẫu ngành Công nghệ thông tin" else sample_kinhte_example_full if sample_option == "Dùng ví dụ mẫu ngành Kinh tế" else None
+        default_values = example_data["semester_data"][idx*10:(idx+1)*10] if example_data else None # Slice 10 values
+        data += input_semester_corrected(sem, default_values) # Use the corrected function
+    nganh = 0 if major == "Công nghệ thông tin" else 1
+    final_features = np.array(data + [nganh]).reshape(1, -1)
+# Mô hình 2: "Dùng đặc trưng quan trọng"
+else: # model_type == "Dùng đặc trưng quan trọng"
     st.subheader("✨ Nhập thông tin rút gọn")
+    # Allow selecting an example
+    for idx, sem in enumerate(semesters):
+        example_data = sample_cntt_example_simple if sample_option == "Dùng ví dụ mẫu ngành Công nghệ thông tin" else sample_kinhte_example_simple if sample_option == "Dùng ví dụ mẫu ngành Kinh tế" else None
+        # Slice 3 values per semester for the simple model example data
+        default_values = example_data["semester_data"][idx*3:(idx+1)*3] if example_data else None
+        # Use expander to group each semester's fields
+        with st.expander(f"📘 {sem}", expanded=True):
+            # Use 3 columns to align with the image layout for all semesters
+            col1, col2, col3 = st.columns(3)
+            with col1:
+                # Use consistent keys for input fields
+                sotc_qua = st.number_input("Số tín chỉ đạt", 0, value=default_values[0] if default_values and len(default_values) > 0 else 0, key=f"tcqua_imp_{sem}")
+            with col2:
+                sotcno = st.number_input("Số tín chỉ nợ", 0, value=default_values[1] if default_values and len(default_values) > 1 else 0, key=f"tcno_imp_{sem}")
+            with col3:
+                # Adjusted label to match the image: "Điểm trung bình hệ 10"
+                TBCHK = st.number_input("Điểm trung bình hệ 10", 0.0, 10.0, value=default_values[2] if default_values and len(default_values) > 2 else 0.0, step=0.01, key=f"gpa_imp_{sem}")
+        # Collect semester data (3 values per semester)
+        data += [sotc_qua, sotcno, TBCHK]
+    final_features = np.array(data).reshape(1, -1) # Should be 6 semesters * 3 features = 18 features
 # ===== Predict =====
 if st.button("🎯 DỰ BÁO"):
         prediction = model_full.predict(final_features)
         sheet_name = "Trang tính1"  # For full data model, save to Trang tính1
+    else: # model_type == "Dùng đặc trưng quan trọng"
         prediction = model_important.predict(final_features)
+        sheet_name = "Trang tính2"  # For important data model, save to Trang tính2
     if prediction[0] == 1: