File size: 8,063 Bytes
1000923
 
 
e0c9a91
1000923
d66e028
1000923
 
 
d66e028
 
 
 
 
27e1337
d66e028
27e1337
e0c9a91
27e1337
0cfe4b3
27e1337
0cfe4b3
27e1337
 
0cfe4b3
 
 
27e1337
 
e0c9a91
0cfe4b3
 
 
 
e0c9a91
 
 
 
 
 
 
 
 
27e1337
e0c9a91
0cfe4b3
 
 
 
 
 
 
d66e028
e0c9a91
 
 
 
 
 
 
 
 
 
 
 
 
 
0cfe4b3
 
 
e0c9a91
 
5de6b2f
27e1337
 
0cfe4b3
d66e028
 
623209b
e0c9a91
 
 
 
 
 
 
 
 
 
 
a2de6c3
d66e028
0cfe4b3
 
 
 
 
 
e0c9a91
 
0cfe4b3
 
 
e0c9a91
 
 
 
 
 
 
 
 
 
0cfe4b3
e0c9a91
 
 
 
 
 
 
 
 
 
d66e028
 
0cfe4b3
 
 
 
 
 
594f731
1000923
e0c9a91
b5d7438
 
e0c9a91
0cfe4b3
e0c9a91
0cfe4b3
b5d7438
 
e0c9a91
 
 
79360be
 
 
 
 
 
 
e0c9a91
 
79360be
 
 
e0c9a91
79360be
 
 
 
 
 
 
e0c9a91
79360be
 
e0c9a91
79360be
e0c9a91
 
 
79360be
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
import gradio as gr
import pandas as pd
from huggingface_hub import hf_hub_download
import re

# --- Constants ---
# Upstream Hugging Face Space that publishes the raw UGI leaderboard CSV.
REPO_ID = "DontPlanToEnd/UGI-Leaderboard"
FILENAME = "ugi-leaderboard-data.csv"

def make_clickable_model(model_name, link):
    """Return *model_name* wrapped in a styled HTML anchor, or unchanged when no usable link exists."""
    # Treat NaN, empty strings, and the literal text "nan" (a stringified NaN
    # from the CSV) all as "no link available".
    link_missing = pd.isna(link) or not link or str(link).lower() == "nan"
    if link_missing:
        return model_name
    style = "color: #007bff; text-decoration: underline; font-weight: bold;"
    return f'<a target="_blank" href="{link}" style="{style}">{model_name}</a>'

def get_data():
    """
    Download the UGI leaderboard CSV, derive score/display columns, and
    return ``(dataframe, status_message)``.

    On any failure an empty DataFrame plus an error string is returned, so
    callers can show the message without catching exceptions themselves.
    """
    print("πŸ”„ Starting download...")
    try:
        # 1. Download file
        file_path = hf_hub_download(repo_id=REPO_ID, filename=FILENAME, repo_type="space")
        
        # 2. Load CSV
        # utf-8-sig handles the BOM character if present
        df = pd.read_csv(file_path, encoding='utf-8-sig')
        df.columns = df.columns.str.strip()
        
        # 3. Exact & Fuzzy Column Matching
        def get_col(keyword):
            # First column whose name contains the keyword (case-insensitive).
            matches = [c for c in df.columns if keyword.lower() in c.lower()]
            return matches[0] if matches else None

        # Prioritize exact names from the CSV, fallback to fuzzy matching
        model_col = "author/model_name" if "author/model_name" in df.columns else (get_col("author") or get_col("model"))
        link_col = "Model Link" if "Model Link" in df.columns else get_col("link")
        ugi_col = "UGI πŸ†" if "UGI πŸ†" in df.columns else get_col("ugi")
        natint_col = "NatInt πŸ’‘" if "NatInt πŸ’‘" in df.columns else get_col("natint")
        w10_col = "W/10 πŸ‘" if "W/10 πŸ‘" in df.columns else get_col("w/10")
        
        # We need TOTAL parameters to accurately estimate the GGUF file size
        param_col = "Total Parameters" if "Total Parameters" in df.columns else (get_col("param") or get_col("size"))

        # 4. Bail out with a descriptive message if any required column is missing.
        required = {"Model": model_col, "UGI": ugi_col, "NatInt": natint_col, "W/10": w10_col}
        missing = [label for label, col in required.items() if not col]
        if missing:
            return pd.DataFrame(), f"❌ Error: Could not find columns: {', '.join(missing)}. Found: {list(df.columns)}"

        # 5. Extract Parameter Size & Calculate Q4_K_M size
        if param_col:
            df['Params (B)'] = pd.to_numeric(df[param_col], errors='coerce').fillna(0)
        else:
            # Fallback: parse from the model name (e.g., "Llama-3-70B" -> 70).
            # expand=False makes str.extract return a Series instead of a
            # one-column DataFrame, so the column assignment is unambiguous.
            df['Params (B)'] = (
                df[model_col].astype(str)
                .str.extract(r'(?i)(\d+\.?\d*)[bB]', expand=False)
                .astype(float)
                .fillna(0)
            )
        
        # Q4_K_M size formula: Parameter count * 0.6 GB (e.g., 24B * 0.6 = 14.4 GB)
        df['Q4_K_M Size (GB)'] = (df['Params (B)'] * 0.6).round(1)
        
        # Friendly string representation for the UI; 0 params means API/unknown.
        df['Q4_K_M Size'] = df['Q4_K_M Size (GB)'].apply(lambda x: f"{x} GB" if x > 0 else "API / Unknown")

        # 6. Coerce score columns to numeric; unparseable cells become 0.
        for col in [ugi_col, natint_col, w10_col]:
            df[col] = pd.to_numeric(df[col], errors='coerce').fillna(0)

        # 7. Calculate UGI Index (UPDATED LOGIC)
        # Formula: (UGI + NatInt) * (W/10 ^ 2) — squaring W/10 heavily weights willingness.
        df['UGI Index'] = ((df[ugi_col] + df[natint_col]) * (df[w10_col] ** 2)).round(2)

        # 8. Sort and Rank
        df = df.sort_values(by='UGI Index', ascending=False)
        df.insert(0, 'Rank', range(1, len(df) + 1))

        # 9. Normalize display columns (HTML links when a link column exists).
        if link_col:
            df['Model'] = df.apply(lambda x: make_clickable_model(x[model_col], x[link_col]), axis=1)
        else:
            df['Model'] = df[model_col]
            
        df['UGI'] = df[ugi_col]
        df['NatInt'] = df[natint_col]
        df['W/10'] = df[w10_col]

        return df, f"βœ… Successfully loaded {len(df)} models."

    except Exception as e:
        # Boundary handler: surface the error in the UI status box instead of crashing.
        print(f"Error: {e}")
        return pd.DataFrame(), f"❌ Error: {str(e)}"

# Module-level cache populated by app_load(); search() filters it so the UI
# doesn't re-download the CSV on every keystroke or slider move.
CACHED_DF = pd.DataFrame()

def search(query, max_size):
    """
    Filter the cached leaderboard by model-name substring and max Q4_K_M size.

    Returns only the display columns. If nothing has been cached yet, returns
    the empty cached DataFrame unchanged.
    """
    if CACHED_DF.empty:
        return CACHED_DF
    
    df = CACHED_DF.copy()
    
    # Text Filter
    if query:
        # regex=False: treat the query as a literal substring so characters
        # like '(', '[' or '+' typed by the user don't raise re.error.
        df = df[df['Model'].astype(str).str.contains(query, case=False, na=False, regex=False)]
        
    # Size Filter (128 is the arbitrary "Show All" max value)
    if max_size < 128:
        # Hide API models (Size == 0) and models that exceed the selected size
        df = df[(df['Q4_K_M Size (GB)'] <= max_size) & (df['Q4_K_M Size (GB)'] > 0)]
    
    display_cols = ['Rank', 'Model', 'Q4_K_M Size', 'UGI Index', 'UGI', 'NatInt', 'W/10']
    return df[display_cols]

def app_load(query, max_size):
    """Fetch fresh leaderboard data, cache it globally, and return the filtered table plus a status string."""
    global CACHED_DF
    fresh_df, status_msg = get_data()
    CACHED_DF = fresh_df
    # Re-apply the current search/slider state to the fresh data.
    return search(query, max_size), status_msg

# --- UI ---
# Widen the app container and hide the default Gradio footer.
custom_css = """
.gradio-container {max-width: 95% !important}
footer {visibility: hidden}
"""

with gr.Blocks(css=custom_css, title="UGI Index Leaderboard") as demo:
    gr.Markdown("# πŸ† UGI Index")
    
    # Explainer text + the scoring formula shown to users. (Typos fixed.)
    gr.Markdown("""
    ### ℹ️ How is the Score Calculated?
    The **UGI Index** ranks LLMs based on data from [DontPlanToEnd/UGI-Leaderboard](https://huggingface.co/spaces/DontPlanToEnd/UGI-Leaderboard) with a simple holistic mathematical equation that ensures top ranked models possess a high amount of Uncensored Information, are Naturally very Intelligent, and most importantly they are OBEDIENT to the user. This is just my personal "rule of thumb" method for choosing the best uncensored model for LOCAL use on any given hardware I have laying around. Adjust the slider to the amount of RAM on your device to see the best uncensored model for your hardware. It uses Q4_K_M as a reference point for GGUF size, however there are tons of options so it can be flexible. If you're brand new and just want to try an uncensored local LLM for the first time do this: Grab a **mradermacher** quant in **i1-IQ4_XS** and run with **LMstudio.ai**
    
    $$ \\text{UGI Index} = (\\text{UGI} + \\text{NatInt}) \\times \\text{W/10}^2 $$
    
    *   **UGI:** Uncensored General Intelligence
    *   **NatInt:** Natural Intelligence
    *   **W/10:** Willingness (Squared)
    
    *πŸ’‘ **Note on Model Size:** GGUF size is calculated at standard **Q4_K_M** quantization (`Total Parameters Γ— 0.6 GB`). Lowering the slider automatically hides closed-source API models.*
    """)

    with gr.Row():
        status_box = gr.Textbox(label="Status", value="Initializing...", interactive=False, scale=4)
        refresh_btn = gr.Button("Refresh Data", scale=1)
    
    with gr.Row():
        search_box = gr.Textbox(label="Search Models", placeholder="Type model name...", interactive=True, scale=1)
        size_slider = gr.Slider(minimum=1, maximum=128, value=128, step=1, label="πŸ’» Running Local? Max Q4_K_M Size (GB) - Set to 128 to include API models", interactive=True, scale=1)

    # Initialize with an empty dataframe; datatype="markdown" renders the
    # HTML model links produced by make_clickable_model().
    data_table = gr.Dataframe(
        headers=['Rank', 'Model', 'Q4_K_M Size', 'UGI Index', 'UGI', 'NatInt', 'W/10'],
        datatype="markdown",
        interactive=False,
        wrap=True
    )

    # Wire up events
    # 1. On Load: Fetch data, update table and status
    demo.load(fn=app_load, inputs=[search_box, size_slider], outputs=[data_table, status_box])
    
    # 2. On Refresh: Fetch data again
    refresh_btn.click(fn=app_load, inputs=[search_box, size_slider], outputs=[data_table, status_box])
    
    # 3. On Search or Slider Change: Filter existing cached data (no re-download)
    search_box.change(fn=search, inputs=[search_box, size_slider], outputs=data_table)
    size_slider.change(fn=search, inputs=[search_box, size_slider], outputs=data_table)

if __name__ == "__main__":
    demo.launch()