Spaces:

NghiTran1009
/

annotator-tool

Sleeping

App Files Community

NghiTran1009 committed on Mar 12, 2025

Commit

da4e37a

verified ·

1 Parent(s): 03ea370

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -7

app.py CHANGED Viewed

@@ -35,6 +35,9 @@ y_pred = crf.predict(X_test)[0]
 sentence["Predicted_Chunk"] = y_pred
 sentence["Is_Correct"] = sentence["Chunk"] == sentence["Predicted_Chunk"]  # Kiểm tra dự đoán
 # Highlight lỗi: Màu đỏ nếu `Predicted_Chunk` sai
 def highlight_errors(row):
     return ["background-color: #FF9999" if not row["Is_Correct"] else "" for _ in row]
@@ -45,14 +48,13 @@ num_wrong = len(sentence) - num_correct
 st.write(f"✅ **Số token đúng**: {num_correct} / {len(sentence)}")
 st.write(f"❌ **Số token sai**: {num_wrong}")
-# **🔹 Hiển thị bảng đầy đủ (bao gồm `Chunk` nhưng không hiển thị trong Annotator)**
-sentence_display = sentence.copy()
 st.write("🔹 **Câu gốc (Highlight lỗi màu đỏ)**")
 st.dataframe(sentence_display.style.apply(highlight_errors, axis=1))
-# **🔹 Annotator chỉnh sửa `Predicted_Chunk`**
 edited_df = st.data_editor(
-    sentence_display.drop(columns=["Chunk"]),  # Ẩn cột `Chunk`
     num_rows="dynamic",  # Cho phép thêm hàng ở bất kỳ đâu
     key=f"edit_table_{sentence_id}"
 )
@@ -62,8 +64,8 @@ if os.path.exists("corrected_data.csv"):
     with open("corrected_data.csv", "rb") as file:
         st.download_button("📥 Tải xuống corrected_data.csv", file, "corrected_data.csv")
-# Lưu lại dữ liệu chỉnh sửa (bao gồm `Chunk`, nhưng không hiển thị)
 if st.button("Lưu chỉnh sửa"):
-    sentence_display.update(edited_df)  # Cập nhật lại dữ liệu chỉnh sửa
-    sentence_display.to_csv("corrected_data.csv", index=False, encoding="utf-8")
     st.success("✅ Dữ liệu đã được lưu thành corrected_data.csv!")

 sentence["Predicted_Chunk"] = y_pred
 sentence["Is_Correct"] = sentence["Chunk"] == sentence["Predicted_Chunk"]  # Kiểm tra dự đoán
+# **Ẩn cột `Chunk` trong tất cả các bảng**
+sentence_display = sentence.drop(columns=["Chunk"])  # Bỏ hiển thị cột `Chunk`
 # Highlight lỗi: Màu đỏ nếu `Predicted_Chunk` sai
 def highlight_errors(row):
     return ["background-color: #FF9999" if not row["Is_Correct"] else "" for _ in row]
 st.write(f"✅ **Số token đúng**: {num_correct} / {len(sentence)}")
 st.write(f"❌ **Số token sai**: {num_wrong}")
+# **🔹 Hiển thị bảng với highlight lỗi (ẨN `Chunk`)**
 st.write("🔹 **Câu gốc (Highlight lỗi màu đỏ)**")
 st.dataframe(sentence_display.style.apply(highlight_errors, axis=1))
+# **🔹 Annotator chỉnh sửa `Predicted_Chunk` (ẨN `Chunk`)**
 edited_df = st.data_editor(
+    sentence_display[["Token", "POS", "Predicted_Chunk"]],  # Chỉ hiển thị các cột cần thiết
     num_rows="dynamic",  # Cho phép thêm hàng ở bất kỳ đâu
     key=f"edit_table_{sentence_id}"
 )
     with open("corrected_data.csv", "rb") as file:
         st.download_button("📥 Tải xuống corrected_data.csv", file, "corrected_data.csv")
+# Lưu lại dữ liệu chỉnh sửa
 if st.button("Lưu chỉnh sửa"):
+    sentence.update(edited_df)  # Cập nhật lại dữ liệu chỉnh sửa vào dataframe gốc
+    sentence.to_csv("corrected_data.csv", index=False, encoding="utf-8", columns=["Token", "POS", "Predicted_Chunk"])  # Chỉ lưu các cột cần thiết
     st.success("✅ Dữ liệu đã được lưu thành corrected_data.csv!")