Reward Trace · Episode

step={trace.length}/10 cum={cumReward.toFixed(2)}

{Array.from({ length: 10 }).map((_, i) => { const v = trace[i] const has = typeof v === 'number' const upFrac = has && v > 0 ? Math.min(1, v / Math.max(hi, 0.01)) : 0 const downFrac = has && v < 0 ? Math.min(1, -v / Math.max(-lo, 0.01)) : 0 const upPct = `${(upFrac * 100 * (1 - zeroFrac)).toFixed(0)}%` const downPct = `${(downFrac * 100 * zeroFrac).toFixed(0)}%` return (

= 0 ? 'pos' : 'neg') : 'empty'}`} title={has ? `R${i + 1}: reward ${v >= 0 ? '+' : ''}${v.toFixed(3)}` : `R${i + 1}: pending`} >

{i + 1}

) })}

last_step {lastReward === null ? '—' : `${lastReward >= 0 ? '+' : ''}${Number(lastReward).toFixed(3)}`}

) }