Applicant-Task-Submission-Test

Running

App Files Files Community

GreenStar24 committed on Apr 28

Commit

67eefaa

1 Parent(s): 51e1a5a

small

Browse files

Files changed (1) hide show

app.py +28 -8

app.py CHANGED Viewed

@@ -66,6 +66,31 @@ SHEET_COLUMNS = [
 ]
 SHEET_HEADERS = [label for _, label in SHEET_COLUMNS]
 def get_model_name():
     return os.environ.get("OPENAI_MODEL_NAME", DEFAULT_MODEL_NAME)
@@ -1812,12 +1837,7 @@ def build_practice_scoring_note(submission_result):
     total_cases = submission_result["total_cases"]
     return (
         f"This practice score is based on {total_cases} hidden calibration cases. "
-        "Each case is run 3 times to check prompt consistency. In each run, "
-        "LLM 1 can earn up to 1 point for correct routing and target-firm "
-        "normalization, and LLM 3 can earn up to 1 point for a correct final "
-        "JSON answer with supported citations. Step 2 is not scored directly, "
-        "but it affects the LLM 3 score because LLM 3 relies on the snippet-level "
-        "analysis. The final submission uses a separate hidden holdout set."
     )
@@ -2023,7 +2043,7 @@ def handle_submission(submission_type, email, name, s1, s2, s3):
 def build_interface():
-    with gr.Blocks() as demo:
         gr.Markdown(
             """
         # Applicant Task: Target Company & Law Firm Identification
@@ -2170,7 +2190,7 @@ def build_interface():
         gr.Markdown(
             """
-        <div style="background-color:#fff7e6; padding:16px; border-radius:8px; border:1px solid #ffe5b4; margin-bottom:1em;">
         <b>Please note:</b><br>
         Each run may take a couple of minutes.<br>
         After you click a button, wait for the result and do not click it again.

 ]
 SHEET_HEADERS = [label for _, label in SHEET_COLUMNS]
+APP_CSS = """
+.submission-note {
+    background: var(--submission-note-bg, #fff7e6);
+    border: 1px solid var(--submission-note-border, #ffe5b4);
+    border-radius: 8px;
+    color: var(--submission-note-text, #3d2b00);
+    margin-bottom: 1em;
+    padding: 16px;
+}
+@media (prefers-color-scheme: dark) {
+    .submission-note {
+        --submission-note-bg: #2b2111;
+        --submission-note-border: #6b4b18;
+        --submission-note-text: #f7e8c5;
+    }
+}
+.dark .submission-note {
+    --submission-note-bg: #2b2111;
+    --submission-note-border: #6b4b18;
+    --submission-note-text: #f7e8c5;
+}
+"""
 def get_model_name():
     return os.environ.get("OPENAI_MODEL_NAME", DEFAULT_MODEL_NAME)
     total_cases = submission_result["total_cases"]
     return (
         f"This practice score is based on {total_cases} hidden calibration cases. "
+        "Each case is run 3 times to check prompt consistency."
     )
 def build_interface():
+    with gr.Blocks(css=APP_CSS) as demo:
         gr.Markdown(
             """
         # Applicant Task: Target Company & Law Firm Identification
         gr.Markdown(
             """
+        <div class="submission-note">
         <b>Please note:</b><br>
         Each run may take a couple of minutes.<br>
         After you click a button, wait for the result and do not click it again.