layton-test / src /streamlit_app.py
cmenasse's picture
Update src/streamlit_app.py
f3dad8e verified
import os

import pandas as pd
import streamlit as st

# Redirect every Hugging Face cache to /data/huggingface.
# This MUST happen before `datasets` is imported: the Hugging Face libraries
# read these variables when they are first imported, so assigning them
# afterwards leaves the default cache locations in effect.
os.environ["HF_HOME"] = "/data/huggingface"
os.environ["HF_DATASETS_CACHE"] = "/data/huggingface/datasets"
os.environ["HUGGINGFACE_HUB_CACHE"] = "/data/huggingface/hub"
os.environ["TRANSFORMERS_CACHE"] = "/data/huggingface/transformers"
os.makedirs("/data/huggingface", exist_ok=True)

# Imported late on purpose (see the note above), hence the E402 waiver.
from datasets import load_dataset  # noqa: E402
# Top-level layout: one tab per page of the app, in display order.
tab_labels = ["Benchmark", "Data viz", "Data explorer"]
tab1, tab2, tab3 = st.tabs(tab_labels)
with tab1:
    # Benchmark tab: four leaderboard tables, each introduced by a caption.
    st.title("Professor Layton LLM Benchmark")

    # Columns that are identical in every table.
    providers = ["Open AI", "Open AI", "Open AI", "Mistral"]
    releases = ["2025-04-16"] * 4
    scores = [0.85, 0.90, 0.88, 0.56]

    # The first table lists "Medium 3" as the Mistral entry; the other three
    # list "Pixtral Large".
    medium_lineup = ["o3", "o4-mini", "GPT-4o", "Medium 3"]
    pixtral_lineup = ["o3", "o4-mini", "GPT-4o", "Pixtral Large"]

    # Value columns for the plain tables.
    metric_columns = {
        "accuracy": scores,
        "pika": [30000, 34000, 23000, 45000],
        "cost": [0.10, 0.15, 0.08, 0.3],
        "speed": [120, 100, 150, 455],
    }
    # Value columns for the "with hints" tables; every column holds the same
    # scores.
    hint_columns = dict.fromkeys(
        [
            "0-hint accuracy",
            "2-hint accuracy",
            "3-hint accuracy",
            "4-hint accuracy",
        ],
        scores,
    )

    # (caption, model column, value columns) in display order.
    sections = [
        ("Only text questions", medium_lineup, metric_columns),
        ("Only text questions with hints", pixtral_lineup, hint_columns),
        ("Text and image questions", pixtral_lineup, metric_columns),
        ("Text and image questions with hints", pixtral_lineup, hint_columns),
    ]

    for caption, models, value_columns in sections:
        # The title comes first, then caption / table pairs; each table
        # follows its own caption.
        st.caption(caption)
        data = {
            "provider": providers,
            "models": models,
            "release": releases,
            **value_columns,
        }
        df = pd.DataFrame(data)
        st.dataframe(df)
with tab2:
    # Data viz tab: display the raw Layton dataset as a table.
    #
    # load_dataset() called without `split=` returns a DatasetDict (a mapping
    # of split name -> Dataset). A DatasetDict has no to_pandas() method, so
    # each split is converted on its own and the frames are stacked.
    dataset = load_dataset("cmenasse/layton")
    split_frames = [split.to_pandas() for split in dataset.values()]
    df = pd.concat(split_frames, ignore_index=True)
    # Show the table
    st.dataframe(df)
with tab3:
    # Data explorer tab: currently renders only a fixed line of markdown.
    placeholder_text = "This is an example of a third tab."
    st.markdown(placeholder_text)