funnel-4: 1 token, chunk size 8
mode="mul",
num_actions_chunk=8,
num_actions_per_token=8,
action_head_name="fel",
num_blocks=4,
model_type="llama3.2",
funnel-4: 1 token, chunk size 8
mode="mul",
num_actions_chunk=8,
num_actions_per_token=8,
action_head_name="fel",
num_blocks=4,
model_type="llama3.2",