thrinadhn committed on
Commit
a93c639
·
verified ·
1 Parent(s): d66c474

Update LLMasjudge.py

Browse files
Files changed (1) hide show
  1. LLMasjudge.py +36 -0
LLMasjudge.py CHANGED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
"""Streamlit page: pick a model and run an evaluation for it.

The list of models comes from ``helpers.fetch_models()`` and the evaluation
itself is delegated to ``phoenix_helpers.evaluate_model()``; the result is
kept in ``st.session_state.evaluation_result`` and rendered as a dataframe.
"""
import streamlit as st
from dotenv import load_dotenv

import phoenix_helpers
import helpers

# Load environment configuration (python-dotenv) before the helpers are used.
load_dotenv()

# Seed the click flag so it exists before the button is pressed for the
# first time.
if "eval_btn_clicked" not in st.session_state:
    st.session_state.eval_btn_clicked = False


def callback2():
    """Record in session state that the "Evaluate" button was clicked."""
    st.session_state.eval_btn_clicked = True


models = helpers.fetch_models()
if models:
    st.subheader("Evaluate LLM")

    if "evaluation_result" not in st.session_state:
        st.session_state.evaluation_result = None

    # The selectbox is bound to session state through ``key``, so its value
    # is seeded/repaired here instead of being passed through ``index=``:
    # Streamlit discourages setting a widget's value both via Session State
    # and via its default-value parameter. A stored selection that is no
    # longer among the offered models is reset to the first model.
    if (
        "eval_model" not in st.session_state
        or st.session_state.eval_model not in models
    ):
        st.session_state.eval_model = models[0]

    st.selectbox(
        "Choose a model to use for evaluation:",
        models,
        key="eval_model",
    )

    if st.button("Evaluate", on_click=callback2):
        if st.session_state.eval_model:
            try:
                st.session_state.evaluation_result = phoenix_helpers.evaluate_model(
                    st.session_state.eval_model
                )
                st.dataframe(st.session_state.evaluation_result)
            except Exception as e:
                # Page-level boundary: surface the failure in the UI rather
                # than aborting the script run.
                st.write(e)