# Hugging Face Space: cmenasse/layton-test (status: Sleeping)
# File size: 2,807 Bytes

import os
import pandas as pd
import streamlit as st

# Point every Hugging Face cache at the /data volume.
#
# This MUST run before `datasets` is imported: `datasets` (and the
# `huggingface_hub` package it pulls in) read these variables once, at import
# time, to compute their cache paths. Setting them afterwards has no effect
# and the libraries silently fall back to the default ~/.cache location.
HF_CACHE_ROOT = "/data/huggingface"
os.environ["HF_HOME"] = HF_CACHE_ROOT
os.environ["HF_DATASETS_CACHE"] = f"{HF_CACHE_ROOT}/datasets"
os.environ["HUGGINGFACE_HUB_CACHE"] = f"{HF_CACHE_ROOT}/hub"
os.environ["TRANSFORMERS_CACHE"] = f"{HF_CACHE_ROOT}/transformers"

os.makedirs(HF_CACHE_ROOT, exist_ok=True)

# Deliberately imported after the environment is configured (see above).
from datasets import load_dataset  # noqa: E402



# Top-level navigation: one Streamlit tab per page of the app, in display order.
tab_labels = ["Benchmark", "Data viz", "Data explorer"]
tab1, tab2, tab3 = st.tabs(tab_labels)

with tab1:
    # Benchmark page: a title followed by four captioned leaderboard tables.
    st.title("Professor Layton LLM Benchmark")

    # Columns that are identical in every table below.
    # NOTE(review): the figures are the same across all four tables and look
    # like placeholder data — confirm before publishing.
    providers = ["Open AI", "Open AI", "Open AI", "Mistral"]
    release_dates = ["2025-04-16"] * 4
    accuracies = [0.85, 0.90, 0.88, 0.56]

    # NOTE(review): the first table lists "Medium 3" for Mistral while the
    # other three list "Pixtral Large" — confirm this is intended.
    text_models = ["o3", "o4-mini", "GPT-4o", "Medium 3"]
    vision_models = ["o3", "o4-mini", "GPT-4o", "Pixtral Large"]

    def metrics_table(model_names):
        """Build the accuracy / pika / cost / speed table for the given models."""
        return pd.DataFrame(
            {
                "provider": providers,
                "models": model_names,
                "release": release_dates,
                "accuracy": accuracies,
                "pika": [30000, 34000, 23000, 45000],
                "cost": [0.10, 0.15, 0.08, 0.3],
                "speed": [120, 100, 150, 455],
            }
        )

    def hints_table(model_names):
        """Build the per-hint-count accuracy table for the given models."""
        columns = {
            "provider": providers,
            "models": model_names,
            "release": release_dates,
        }
        # NOTE(review): hint counts go 0, 2, 3, 4 (no 1-hint column) — confirm.
        for hint_count in (0, 2, 3, 4):
            columns[f"{hint_count}-hint accuracy"] = accuracies
        return pd.DataFrame(columns)

    # (caption, table) pairs, rendered top to bottom in this order.
    sections = [
        ("Only text questions", metrics_table(text_models)),
        ("Only text questions with hints", hints_table(vision_models)),
        ("Text and image questions", metrics_table(vision_models)),
        ("Text and image questions with hints", hints_table(vision_models)),
    ]
    for caption, table in sections:
        st.caption(caption)
        st.dataframe(table)


@st.cache_data
def _load_layton_frame():
    """Download the cmenasse/layton dataset and return it as one DataFrame.

    Called without ``split=``, ``load_dataset`` returns a ``DatasetDict``
    (a dict mapping split name -> ``Dataset``), which has no ``to_pandas()``
    method. Each split is therefore converted on its own and the results are
    concatenated. The result is cached by Streamlit so the dataset is not
    reloaded on every script rerun.
    """
    loaded = load_dataset("cmenasse/layton")
    if isinstance(loaded, dict):
        split_frames = [split.to_pandas() for split in loaded.values()]
        return pd.concat(split_frames, ignore_index=True)
    # A single Dataset (e.g. if a split is ever requested) converts directly.
    return loaded.to_pandas()


with tab2:

    df = _load_layton_frame()

    # Show the table
    st.dataframe(df)
       

with tab3:
    # Placeholder content until this tab gets real content.
    placeholder_text = "This is an example of a third tab."
    st.markdown(placeholder_text)