CatsCanWrite committed on
Commit
e2fdcf9
·
1 Parent(s): c799558

reorg page text a little

Browse files
Files changed (2) hide show
  1. about.py +10 -8
  2. app.py +3 -1
about.py CHANGED
@@ -4,7 +4,9 @@ INTRODUCTION_TEXT = """
4
  #### I run model evaluations via API on request.
5
 
6
  To request a model evaluation, click **Request Evaluation** tab and enter the model ID.
 
7
 
 
8
  ## What is this anyway?
9
 
10
  I test the lyrical capabilities of LLMs by telling them to write songs entirely as meowing.
@@ -17,14 +19,6 @@ By forcing the model to generate nonsensical content, it condenses the test down
17
 
18
  Also, it's funny.
19
 
20
- ## About the Metrics
21
-
22
- - **Meter** - How closely the model sticks to the meter of the lines.
23
- - **Verse** - How closely the model aligns the lines to the verse and chorus breakup.
24
- - **Focus** - How much of the response is extraneous commentary instead of the song. Focus in particular has a very minor contribution to the final score
25
- """
26
-
27
- CITATION_BUTTON_TEXT = """
28
  ## Citation
29
 
30
  If you use this benchmark, please cite:
@@ -41,3 +35,11 @@ If you use this benchmark, please cite:
41
 
42
  For questions or issues, please open a discussion on the Hugging Face community tab.
43
  """
 
 
 
 
 
 
 
 
 
4
  #### I run model evaluations via API on request.
5
 
6
  To request a model evaluation, click **Request Evaluation** tab and enter the model ID.
7
+ """
8
 
9
+ CITATION_BUTTON_TEXT = """
10
  ## What is this anyway?
11
 
12
  I test the lyrical capabilities of LLMs by telling them to write songs entirely as meowing.
 
19
 
20
  Also, it's funny.
21
 
 
 
 
 
 
 
 
 
22
  ## Citation
23
 
24
  If you use this benchmark, please cite:
 
35
 
36
  For questions or issues, please open a discussion on the Hugging Face community tab.
37
  """
38
+
39
+ METRIC_INFO_TEXT = """
40
+ ## About the Metrics
41
+
42
+ - **Meter** - How closely the model sticks to the meter of the lines.
43
+ - **Verse** - How closely the model aligns the lines to the verse and chorus breakup.
44
+ - **Focus** - How much of the response is extraneous commentary instead of the song. Focus in particular has a very minor contribution to the final score
45
+ """
app.py CHANGED
@@ -1,5 +1,5 @@
1
  import gradio as gr
2
- from about import TITLE, INTRODUCTION_TEXT, CITATION_BUTTON_TEXT
3
  from utils import empty_leaderboard, load_leaderboard, request_model
4
 
5
 
@@ -45,6 +45,8 @@ with gr.Blocks() as demo:
45
  with gr.Tab("About"):
46
  gr.Markdown(CITATION_BUTTON_TEXT)
47
 
 
 
48
  demo.load(fn=load_leaderboard, outputs=leaderboard_df)
49
 
50
  demo.queue().launch()
 
1
  import gradio as gr
2
+ from about import METRIC_INFO_TEXT, TITLE, INTRODUCTION_TEXT, CITATION_BUTTON_TEXT
3
  from utils import empty_leaderboard, load_leaderboard, request_model
4
 
5
 
 
45
  with gr.Tab("About"):
46
  gr.Markdown(CITATION_BUTTON_TEXT)
47
 
48
+ gr.Markdown(METRIC_INFO_TEXT)
49
+
50
  demo.load(fn=load_leaderboard, outputs=leaderboard_df)
51
 
52
  demo.queue().launch()