Spaces:

AIEnergyScore
/

BulkCalcSpace

Paused

App Files Files Community

meg HF Staff committed on Jan 14, 2025

Commit

92305c2

verified ·

1 Parent(s): ef08818

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -1

app.py CHANGED Viewed

@@ -1,6 +1,7 @@
 import os
 from fastapi import FastAPI
 from huggingface_hub import HfApi
 TOKEN = os.environ.get("BULK_ENERGY_TOKEN")
 API = HfApi(token=TOKEN)
@@ -8,6 +9,28 @@ API = HfApi(token=TOKEN)
 REPO_ID = "AIEnergyScore/BulkCalcSpace"
 app = FastAPI()
 @app.get("/")
 def start_train():
     model_file = open("models.txt", "r+").readlines()
@@ -25,7 +48,10 @@ def start_train():
             model = model.strip()
             for task in task_file:
                 task = task.strip()
-                os.system(f"./entrypoint.sh {REPO_ID} {model} {task} {hardware}")
     #space_variables = API.get_space_variables(repo_id=REPO_ID)
     #if 'STATUS' not in space_variables or space_variables['STATUS'] != 'COMPUTING':
     #    print("Beginning processing.")

 import os
 from fastapi import FastAPI
 from huggingface_hub import HfApi
+import time
 TOKEN = os.environ.get("BULK_ENERGY_TOKEN")
 API = HfApi(token=TOKEN)
 REPO_ID = "AIEnergyScore/BulkCalcSpace"
 app = FastAPI()
def check_for_traceback(run_dir):
    """Return the Python traceback recorded in a run's ``error.log``.

    The log at ``{run_dir}/error.log`` is scanned line by line. Everything
    from the first line containing ``Traceback (most recent call last):``
    through the end of the file is returned verbatim.

    Args:
        run_dir: Directory that is expected to hold ``error.log``.
            NOTE(review): presumably shaped like
            ``./runs/<experiment_name>/<backend_model>/<timestamp>`` --
            confirm against the script that writes the log.

    Returns:
        The traceback text (including any lines that follow it), or an
        empty string when the log is missing or contains no traceback.
    """
    traceback_marker = "Traceback (most recent call last):"
    # Lines are collected and joined once at the end rather than growing a
    # string with ``+=`` on every iteration.
    captured = []
    try:
        with open(f"{run_dir}/error.log", "r") as log_file:
            for line in log_file:
                # Once the marker has been seen, every later line belongs to
                # the error report. A non-empty log without the marker is
                # deliberately ignored: it may hold only warnings.
                if captured or traceback_marker in line:
                    captured.append(line)
    except FileNotFoundError:
        # No log file in this directory; report it and treat the run as
        # having no traceback instead of raising.
        print(f"Could not find {run_dir}/error.log")
    return "".join(captured)
 @app.get("/")
 def start_train():
     model_file = open("models.txt", "r+").readlines()
             model = model.strip()
             for task in task_file:
                 task = task.strip()
+                # Create the name of the directory for output.
+                now = time.time()
+                run_dir = f"/runs/${task}/${model}/${now}"
+                os.system(f"./entrypoint.sh {REPO_ID} {model} {task} {hardware} {run_dir}")
     #space_variables = API.get_space_variables(repo_id=REPO_ID)
     #if 'STATUS' not in space_variables or space_variables['STATUS'] != 'COMPUTING':
     #    print("Beginning processing.")