Spaces:

thrinadhn
/

text2textwithDockerfile

Build error

App Files Files Community

thrinadhn commited on Feb 11, 2025

Commit

1c67c92

verified ·

1 Parent(s): b1b866f

Create evaluationwithexistingdata.py

Browse files

Files changed (1) hide show

evaluationwithexistingdata.py +64 -0

evaluationwithexistingdata.py ADDED Viewed

	@@ -0,0 +1,64 @@

+import streamlit as st
+from dotenv import load_dotenv
+import phoenix_helpers
+import helpers
+import plotly.express as px
+load_dotenv()
+models = helpers.fetch_models()
+if models:
+    st.subheader("Select a Model")
+    if "selected_model" not in st.session_state:
+        st.session_state.selected_model = models[0]
+    st.selectbox(
+        "Choose a model to use:",
+        models, key = 'selected_model',
+        index=models.index(st.session_state.selected_model) if st.session_state.selected_model in models else 0
+    )
+    datasetName = st.text_input("Dataset name")
+    if datasetName:
+        dataset = phoenix_helpers.get_dataset(name=datasetName)
+        df = dataset = dataset.as_dataframe()
+        eval_res = phoenix_helpers.dataEvalResults(st.session_state.selected_model,df)
+        eval_res["hallucination_eval"] = eval_res["hallucination_eval"].apply(
+            lambda x: x if x in ["hallucinated", "factual"] else "other"
+        )
+        eval_res["qa_eval"] = eval_res["qa_eval"].apply(
+            lambda x: x if x in ["correct", "incorrect"] else "other"
+        )
+        response_counts = eval_res["hallucination_eval"].value_counts().reset_index()
+        response_counts.columns = ["hallucination_eval", "count"]
+        response_counts_qa = eval_res["qa_eval"].value_counts().reset_index()
+        response_counts_qa.columns = ["qa_eval", "count"]
+        st.dataframe(eval_res)
+        fig = px.pie(
+            response_counts,
+            values="count",
+            names="hallucination_eval",
+            title=f"{st.session_state.selected_model} Model Hallucination",
+            hole=0.4
+        )
+        st.plotly_chart(fig)
+        fig = px.pie(
+            response_counts_qa,
+            values="count",
+            names="qa_eval",
+            title=f"{st.session_state.selected_model} Model QA",
+            hole=0.4
+        )
+        st.plotly_chart(fig)