Spaces:

CoreyMorris
/

MMLU-by-task

Runtime error

App Files Files Community

Corey Morris committed on Jul 18, 2023

Commit

88c2b27

1 Parent(s): d701f12

Using data from repository to create leaderboard

Browse files

Files changed (1) hide show

app.py +24 -26

app.py CHANGED Viewed

@@ -1,52 +1,50 @@
 import gradio as gr
 import requests
 import pandas as pd
 class MultiURLData:
     def __init__(self, file_path):
         self.file_path = file_path
     def fetch_data(self):
-        # Read URLs from a file, one per line
-        with open(self.file_path, 'r') as f:
-            file_urls = [line.strip() for line in f.readlines()]
         dataframes = []
-        for url in file_urls:
-            # Derive column names from the URLs
-            column_name = url.split('/')[-1].split('_')[0]
-            # Load data from URL
-            response = requests.get(url)
-            data = response.json()
-            # Convert data into a DataFrame
-            df = pd.DataFrame(data['results']).T
-            # Rename 'acc' column to respective file names
-            df = df.rename(columns={'acc': column_name})
-            # Remove 'hendrycksTest-' from the index
-            df.index = df.index.str.replace('hendrycksTest-', '')
-            print(f"dype df {type(df)}")
-            dataframes.append(df[[column_name]])  # keep only the column of interest
-        # Merge the dataframes
         # Merge the dataframes on index
         data = pd.concat(dataframes, axis=1)
-        print(f"dype data {type(data)}")
         # Transpose the dataframe to swap rows and columns
         data = data.transpose()
-        # Select only columns 'moral_scenarios' and 'moral_disputes'
-        data = data[['moral_scenarios', 'moral_disputes']]
-        ## add a column with the index of the dataframe
         data['Model Name'] = data.index
-        # move the column to the front of the dataframe
         cols = data.columns.tolist()
         cols = cols[-1:] + cols[:-1]
         data = data[cols]

 import gradio as gr
 import requests
 import pandas as pd
+import os
+import fnmatch
+import json
 class MultiURLData:
     def __init__(self, file_path):
         self.file_path = file_path
     def fetch_data(self):
         dataframes = []
+        def find_files(directory, pattern):
+            for root, dirs, files in os.walk(directory):
+                for basename in files:
+                    if fnmatch.fnmatch(basename, pattern):
+                        filename = os.path.join(root, basename)
+                        yield filename
+        for filename in find_files('results', 'results*.json'):
+            model_name = filename.split('/')[2]
+            with open(filename) as f:
+                data = json.load(f)
+                df = pd.DataFrame(data['results']).T
+                # Rename 'acc' column to respective file names
+                df = df.rename(columns={'acc': model_name})
+                # Remove 'hendrycksTest-' from the index
+                df.index = df.index.str.replace('hendrycksTest-', '')
+                # Remove 'harness|' from the index
+                df.index = df.index.str.replace('harness|', '')
+                dataframes.append(df[[model_name]])  # keep only the column of interest
         # Merge the dataframes on index
         data = pd.concat(dataframes, axis=1)
         # Transpose the dataframe to swap rows and columns
         data = data.transpose()
         data['Model Name'] = data.index
         cols = data.columns.tolist()
         cols = cols[-1:] + cols[:-1]
         data = data[cols]