Danny Liu committed on
Commit
4da9687
·
1 Parent(s): 5f4879e

keep debugging

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -46,8 +46,8 @@ with demo:
46
  gr.Markdown("### Model evaluation on VerilogEval-Human V1 benchmark (156 problems, 10 rollouts each)")
47
  leaderboard = init_leaderboard(LEADERBOARD_DF)
48
 
49
- gr.Markdown("### Evaluation Results")
50
- gr.Markdown(CONCLUSION_TEXT, elem_classes="markdown-text")
51
 
52
  gr.Markdown("### Transition Matrices")
53
  gr.Markdown("The transition matrices below show how errors evolve during the SFT and RL phases, revealing the surface convergence gap where optimization reduces syntax errors but increases functional testbench failures.")
 
46
  gr.Markdown("### Model evaluation on VerilogEval-Human V1 benchmark (156 problems, 10 rollouts each)")
47
  leaderboard = init_leaderboard(LEADERBOARD_DF)
48
 
49
+ #gr.Markdown("### Evaluation Results")
50
+ #gr.Markdown(CONCLUSION_TEXT, elem_classes="markdown-text")
51
 
52
  gr.Markdown("### Transition Matrices")
53
  gr.Markdown("The transition matrices below show how errors evolve during the SFT and RL phases, revealing the surface convergence gap where optimization reduces syntax errors but increases functional testbench failures.")