lainwired committed on
Commit
c3be2d3
·
verified ·
1 Parent(s): 3910891

Fix OBL + BC weight_file paths; update the "Flawed" partner description; flag Prolific as LBF-only

Browse files
benchmark_ui/backend/envs/hanabi.py CHANGED
@@ -175,7 +175,7 @@ class HanabiRenderer(EnvRenderer):
175
  key="flawed",
176
  display_name="Flawed",
177
  difficulty="easy",
178
- description="IGGI but plays at 40% confidence (more reckless). Walton-Rivers low-competence partner.",
179
  load_fn=lambda: self._make_partner("flawed", play_threshold=0.4),
180
  tags=["heuristic", "walton-rivers"],
181
  ),
@@ -441,10 +441,13 @@ class HanabiRenderer(EnvRenderer):
441
  elif actor_type == "smartbot":
442
  policy = HanabiSmartBotPolicyWrapper(**common)
443
  elif actor_type == "obl_r2d2":
444
- policy = HanabiOBLPolicyWrapper(using_log_wrapper=False)
 
 
 
445
  elif actor_type == "bc_lstm":
446
  policy = HanabiBCLSTMPolicyWrapper(
447
- weight_file="agents/hanabi/bc_lstm_weights/bc_2p.safetensors",
448
  using_log_wrapper=False,
449
  )
450
  else:
 
175
  key="flawed",
176
  display_name="Flawed",
177
  difficulty="easy",
178
+ description="IGGI but with a lower play threshold (0.4 vs Piers' 0.6); plays cards it isn't sure about. Walton-Rivers low-competence partner.",
179
  load_fn=lambda: self._make_partner("flawed", play_threshold=0.4),
180
  tags=["heuristic", "walton-rivers"],
181
  ),
 
441
  elif actor_type == "smartbot":
442
  policy = HanabiSmartBotPolicyWrapper(**common)
443
  elif actor_type == "obl_r2d2":
444
+ policy = HanabiOBLPolicyWrapper(
445
+ weight_file="agents/hanabi/obl-r2d2-flax/icml_OBL1/OFF_BELIEF1_SHUFFLE_COLOR0_BZA0_BELIEF_a.safetensors",
446
+ using_log_wrapper=False,
447
+ )
448
  elif actor_type == "bc_lstm":
449
  policy = HanabiBCLSTMPolicyWrapper(
450
+ weight_file="agents/bc_weights/hanabi_ah2ac2_bc.safetensors",
451
  using_log_wrapper=False,
452
  )
453
  else:
benchmark_ui/frontend/src/pages/Home.tsx CHANGED
@@ -82,7 +82,7 @@ export function Home() {
82
  </li>
83
  <li>
84
  <span className="text-ink-200 font-medium">Run a Prolific study</span>
85
- {" "}across multiple games and get a completion code.
86
  </li>
87
  </ul>
88
  </section>
 
82
  </li>
83
  <li>
84
  <span className="text-ink-200 font-medium">Run a Prolific study</span>
85
+ {" "}across multiple games (LBF only for now).
86
  </li>
87
  </ul>
88
  </section>