Danny Liu committed on
Commit
3a69eb0
·
1 Parent(s): e37c78d

keep debugging v3

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -45,8 +45,8 @@ with demo:
45
  gr.Markdown("## Benchmark")
46
  gr.Markdown("### Model evaluation on VerilogEval-Human V1 benchmark (156 problems, 10 rollouts each)")
47
  leaderboard = init_leaderboard(LEADERBOARD_DF)
48
- gr.Markdown("### Evaluation Results")
49
- #gr.Markdown(CONCLUSION_TEXT, elem_classes="markdown-text")
50
 
51
  gr.Markdown("### Transition Matrices")
52
  gr.Markdown("The transition matrices below show how errors evolve during the SFT and RL phases, revealing the surface convergence gap where optimization reduces syntax errors but increases functional testbench failures.")
 
45
  gr.Markdown("## Benchmark")
46
  gr.Markdown("### Model evaluation on VerilogEval-Human V1 benchmark (156 problems, 10 rollouts each)")
47
  leaderboard = init_leaderboard(LEADERBOARD_DF)
48
+ #gr.Markdown("### Evaluation Results")
49
+ gr.Markdown(CONCLUSION_TEXT, elem_classes="markdown-text")
50
 
51
  gr.Markdown("### Transition Matrices")
52
  gr.Markdown("The transition matrices below show how errors evolve during the SFT and RL phases, revealing the surface convergence gap where optimization reduces syntax errors but increases functional testbench failures.")