<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>Code Debug Environment</title>
<style>
/* ---- Reset and page shell ---- */
* { box-sizing: border-box; margin: 0; padding: 0; }
body { font-family: system-ui, sans-serif; background: #0f1117; color: #e0e0e0; min-height: 100vh; padding: 2rem 1rem; }
.container { max-width: 860px; margin: 0 auto; }

/* ---- Page header: badge, title, live-status indicator ---- */
.header { text-align: center; margin-bottom: 2.5rem; padding-bottom: 2rem; border-bottom: 1px solid #2a2a3a; }
.badge { display: inline-block; background: #1e3a5f; color: #60a5fa; font-size: 12px; padding: 4px 12px; border-radius: 20px; margin-bottom: 1rem; }
h1 { font-size: 2rem; font-weight: 600; color: #ffffff; margin-bottom: 0.5rem; }
.subtitle { color: #9ca3af; font-size: 1rem; }
.status-bar { display: flex; align-items: center; justify-content: center; gap: 8px; margin-top: 1rem; }
.dot { width: 8px; height: 8px; border-radius: 50%; background: #22c55e; animation: pulse 2s infinite; }
@keyframes pulse { 0%, 100% { opacity: 1; } 50% { opacity: 0.4; } }
/* Respect the user's OS-level "reduce motion" setting: stop the endless pulse. */
@media (prefers-reduced-motion: reduce) { .dot { animation: none; } }
.status-text { font-size: 13px; color: #22c55e; }

/* ---- Summary statistics grid ---- */
.stats { display: grid; grid-template-columns: repeat(3, 1fr); gap: 12px; margin-bottom: 2rem; }
.stat { background: #1a1a2e; border: 1px solid #2a2a3a; border-radius: 10px; padding: 1.2rem; text-align: center; }
.stat-value { font-size: 1.8rem; font-weight: 700; color: #60a5fa; }
.stat-label { font-size: 12px; color: #6b7280; margin-top: 4px; }
.section-title { font-size: 13px; font-weight: 600; color: #6b7280; text-transform: uppercase; letter-spacing: 0.05em; margin-bottom: 1rem; }

/* ---- Live tester panel: controls ---- */
.tester { background: #1a1a2e; border: 1px solid #2a2a3a; border-radius: 12px; padding: 1.5rem; margin-bottom: 2rem; }
.tester-title { font-size: 15px; font-weight: 600; color: #fff; margin-bottom: 1.2rem; }
.select-row { display: flex; gap: 10px; margin-bottom: 1rem; align-items: center; }
select { background: #0f1117; color: #e0e0e0; border: 1px solid #3a3a5a; border-radius: 8px; padding: 8px 14px; font-size: 14px; cursor: pointer; flex: 1; outline: none; }
select:hover { border-color: #60a5fa; }
/* The rule above removes the native outline, so give keyboard users a visible focus ring instead. */
select:focus-visible { border-color: #60a5fa; box-shadow: 0 0 0 2px rgba(96, 165, 250, 0.45); }
.btn { padding: 9px 20px; border-radius: 8px; font-size: 14px; font-weight: 500; cursor: pointer; border: none; transition: all 0.2s; }
.btn-blue { background: #1e3a5f; color: #60a5fa; border: 1px solid #2a4a7f; }
.btn-blue:hover { background: #2a4a7f; }
.btn-green { background: #0d3321; color: #22c55e; border: 1px solid #1a5a3a; }
.btn-green:hover { background: #1a5a3a; }

/* ---- Live tester panel: task display (hidden until the .visible class is added) ---- */
.task-box { background: #0f1117; border: 1px solid #2a2a3a; border-radius: 8px; padding: 1rem; margin-bottom: 1rem; display: none; }
.task-box.visible { display: block; }
.task-meta { display: flex; gap: 10px; margin-bottom: 10px; flex-wrap: wrap; }
.tag { font-size: 11px; padding: 3px 10px; border-radius: 20px; font-weight: 600; }
.tag-easy { background: #0d3321; color: #22c55e; }
.tag-medium { background: #3a2500; color: #f59e0b; }
.tag-hard { background: #3a0d0d; color: #ef4444; }
.tag-id { background: #1a1a2e; color: #9ca3af; border: 1px solid #2a2a3a; }
.task-instructions { font-size: 13px; color: #9ca3af; margin-bottom: 10px; line-height: 1.5; }
.code-label { font-size: 11px; color: #6b7280; margin-bottom: 6px; text-transform: uppercase; letter-spacing: 0.05em; }
pre { background: #0a0a14; border: 1px solid #2a2a3a; border-radius: 6px; padding: 12px; font-size: 13px; color: #e0e0e0; overflow-x: auto; white-space: pre-wrap; font-family: monospace; }
textarea { width: 100%; background: #0a0a14; border: 1px solid #2a2a3a; border-radius: 6px; padding: 12px; font-size: 13px; color: #e0e0e0; font-family: monospace; resize: vertical; min-height: 120px; outline: none; margin-top: 6px; }
textarea:focus { border-color: #60a5fa; }

/* ---- Live tester panel: grading result and loading messages ---- */
.reward-box { display: none; background: #0f1117; border-radius: 8px; padding: 1rem; margin-top: 1rem; border: 1px solid #2a2a3a; }
.reward-box.visible { display: block; }
.reward-value { font-size: 2rem; font-weight: 700; text-align: center; margin-bottom: 6px; }
.reward-1 { color: #22c55e; }
.reward-mid { color: #f59e0b; }
.reward-0 { color: #ef4444; }
.feedback-text { font-size: 12px; color: #9ca3af; white-space: pre-wrap; line-height: 1.6; margin-top: 8px; border-top: 1px solid #2a2a3a; padding-top: 8px; }
.loading { color: #6b7280; font-size: 13px; text-align: center; padding: 1rem; display: none; }
.loading.visible { display: block; }

/* ---- API endpoint list ---- */
.endpoints { display: flex; flex-direction: column; gap: 10px; margin-bottom: 2rem; }
.endpoint { background: #1a1a2e; border: 1px solid #2a2a3a; border-radius: 10px; padding: 1rem 1.25rem; display: flex; align-items: center; gap: 12px; text-decoration: none; transition: border-color 0.2s; }
.endpoint:hover { border-color: #3b82f6; }
.method { font-size: 11px; font-weight: 700; padding: 3px 8px; border-radius: 5px; min-width: 42px; text-align: center; }
.get { background: #0d3321; color: #22c55e; }
.post { background: #1e3a5f; color: #60a5fa; }
.endpoint-info { flex: 1; }
.endpoint-path { font-size: 14px; font-weight: 500; color: #e0e0e0; font-family: monospace; }
.endpoint-desc { font-size: 12px; color: #6b7280; margin-top: 2px; }
.arrow { color: #4b5563; font-size: 14px; }

/* ---- Difficulty cards ---- */
.difficulties { display: grid; grid-template-columns: repeat(3, 1fr); gap: 10px; margin-bottom: 2rem; }
.diff { background: #1a1a2e; border: 1px solid #2a2a3a; border-radius: 10px; padding: 1rem; text-align: center; }
.diff-name { font-size: 14px; font-weight: 600; margin-bottom: 4px; }
.diff-name.easy { color: #22c55e; }
.diff-name.medium { color: #f59e0b; }
.diff-name.hard { color: #ef4444; }
.diff-detail { font-size: 12px; color: #6b7280; line-height: 1.5; }

/* ---- Footer ---- */
.footer { text-align: center; padding-top: 1.5rem; border-top: 1px solid #2a2a3a; }
.docs-btn { display: inline-block; background: #1e3a5f; color: #60a5fa; padding: 10px 24px; border-radius: 8px; text-decoration: none; font-size: 14px; font-weight: 500; }
.docs-btn:hover { background: #2a4a7f; }
</style>
</head>
<body>
<div class="container">
<!-- Page banner: compatibility badge, title, tagline and live-status indicator.
     Uses a <header> landmark; the "header" class is kept so the existing styles still apply. -->
<header class="header">
  <div class="badge">OpenEnv Compatible</div>
  <h1>Code Debug Environment</h1>
  <p class="subtitle">An RL environment where LLM agents diagnose and fix buggy Python code</p>
  <!-- The dot is purely decorative; the adjacent text carries the status. -->
  <div class="status-bar"><div class="dot" aria-hidden="true"></div><span class="status-text">Live and Running</span></div>
</header>
<!-- Headline figures shown as a three-column grid: value on top, caption below. -->
<div class="stats">
  <div class="stat">
    <div class="stat-value">45</div>
    <div class="stat-label">Total Tasks</div>
  </div>
  <div class="stat">
    <div class="stat-value">3</div>
    <div class="stat-label">Difficulty Levels</div>
  </div>
  <div class="stat">
    <div class="stat-value">0 to 1.0</div>
    <div class="stat-label">Reward Range</div>
  </div>
</div>
<!-- Interactive tester. Element ids in this section are looked up by the inline script
     (doReset / doStep), so they must not be renamed. -->
<h2 class="section-title">Live Tester</h2>
<div class="tester">
  <div class="tester-title">Try the environment interactively</div>
  <div class="select-row">
    <!-- No visible label exists for this control, so it gets an accessible name via aria-label. -->
    <select id="difficulty-select" aria-label="Task difficulty">
      <option value="">Random difficulty</option>
      <option value="easy">Easy — 1 bug</option>
      <option value="medium">Medium — 2 bugs</option>
      <option value="hard">Hard — algorithmic bug + explanation</option>
    </select>
    <button class="btn btn-blue" type="button" onclick="doReset()">Get Task</button>
  </div>
  <div class="loading" id="loading-reset">Loading task...</div>
  <!-- Hidden until the script adds the "visible" class after a task has been loaded. -->
  <div class="task-box" id="task-box">
    <div class="task-meta">
      <span class="tag tag-id" id="tag-id"></span>
      <span class="tag" id="tag-diff"></span>
    </div>
    <div class="task-instructions" id="task-instructions"></div>
    <div class="code-label" id="buggy-code-label">Buggy code</div>
    <pre id="buggy-code" aria-labelledby="buggy-code-label"></pre>
    <!-- The visible captions double as accessible names through aria-labelledby;
         placeholders alone are not a label. -->
    <div class="code-label" id="fixed-code-label" style="margin-top:1rem;">Your fix</div>
    <textarea id="fixed-code" aria-labelledby="fixed-code-label" placeholder="Paste your fixed code here..."></textarea>
    <!-- The script toggles this section's inline display: shown only for hard tasks. -->
    <div id="explanation-section" style="display:none;">
      <div class="code-label" id="explanation-label" style="margin-top:1rem;">Explanation (required for hard tasks)</div>
      <textarea id="explanation" aria-labelledby="explanation-label" placeholder="Explain what was wrong and why your fix is correct..." style="min-height:80px;"></textarea>
    </div>
    <div style="margin-top:1rem;">
      <button class="btn btn-green" type="button" onclick="doStep()">Submit Fix</button>
    </div>
  </div>
  <div class="loading" id="loading-step">Grading your fix...</div>
  <!-- Hidden until the script adds the "visible" class after grading. -->
  <div class="reward-box" id="reward-box">
    <div class="reward-value" id="reward-value"></div>
    <div style="text-align:center; font-size:13px; color:#6b7280;" id="tests-info"></div>
    <div class="feedback-text" id="feedback-text"></div>
  </div>
</div>
<!-- API endpoint directory. GET routes link straight to the endpoint; POST routes link to
     /docs because a plain link cannot issue a POST request. -->
<h2 class="section-title">API Endpoints</h2>
<div class="endpoints">
  <a class="endpoint" href="/health">
    <span class="method get">GET</span>
    <div class="endpoint-info"><div class="endpoint-path">/health</div><div class="endpoint-desc">Health check</div></div>
    <span class="arrow" aria-hidden="true">→</span>
  </a>
  <a class="endpoint" href="/docs">
    <span class="method post">POST</span>
    <div class="endpoint-info"><div class="endpoint-path">/reset</div><div class="endpoint-desc">Start a new episode — pass difficulty: easy | medium | hard</div></div>
    <span class="arrow" aria-hidden="true">→</span>
  </a>
  <a class="endpoint" href="/docs">
    <span class="method post">POST</span>
    <div class="endpoint-info"><div class="endpoint-path">/step</div><div class="endpoint-desc">Submit fixed code — returns reward (0.0 to 1.0) and feedback</div></div>
    <span class="arrow" aria-hidden="true">→</span>
  </a>
  <a class="endpoint" href="/state">
    <span class="method get">GET</span>
    <div class="endpoint-info"><div class="endpoint-path">/state</div><div class="endpoint-desc">Current episode state</div></div>
    <span class="arrow" aria-hidden="true">→</span>
  </a>
  <a class="endpoint" href="/tasks">
    <span class="method get">GET</span>
    <div class="endpoint-info"><div class="endpoint-path">/tasks</div><div class="endpoint-desc">List all 45 task IDs</div></div>
    <span class="arrow" aria-hidden="true">→</span>
  </a>
</div>
<!-- One card per difficulty level: task count, bug profile and reward formula. -->
<h2 class="section-title">Difficulty Levels</h2>
<div class="difficulties">
  <div class="diff">
    <div class="diff-name easy">Easy</div>
    <div class="diff-detail">15 tasks<br>1 bug per task<br>reward = tests passed / 3</div>
  </div>
  <div class="diff">
    <div class="diff-name medium">Medium</div>
    <div class="diff-detail">15 tasks<br>2 bugs per task<br>reward = tests passed / 3</div>
  </div>
  <div class="diff">
    <div class="diff-name hard">Hard</div>
    <div class="diff-detail">15 tasks<br>algorithmic bug<br>reward = 0.7 x code + 0.3 x explanation</div>
  </div>
</div>
<!-- Page footer with a link to the interactive API documentation. -->
<footer class="footer"><a class="docs-btn" href="/docs">Open Interactive API Docs</a></footer>
</div>
<script>
/**
 * Requests a new task via POST /reset and renders it in the tester panel.
 *
 * Reads the selected difficulty (an empty value sends an empty body), hides any
 * previous task and grading result, then fills in the task id, difficulty tag,
 * instructions and buggy code. The "Your fix" textarea is pre-filled with the buggy
 * code, and the explanation section is shown only when the task difficulty is "hard".
 *
 * Failures (network error, non-2xx status, response without an observation) are
 * reported through alert(); the loading indicator is always cleared.
 */
async function doReset() {
  const sel = document.getElementById('difficulty-select').value;
  const taskBox = document.getElementById('task-box');
  const loadingEl = document.getElementById('loading-reset');

  loadingEl.classList.add('visible');
  taskBox.classList.remove('visible');
  document.getElementById('reward-box').classList.remove('visible');
  document.getElementById('loading-step').classList.remove('visible');

  try {
    const body = sel ? { difficulty: sel } : {};
    const res = await fetch('/reset', {
      method: 'POST',
      headers: { 'Content-Type': 'application/json' },
      body: JSON.stringify(body)
    });
    // fetch() only rejects on network failure; HTTP error statuses must be checked explicitly.
    if (!res.ok) throw new Error('Request to /reset failed with HTTP ' + res.status);

    const data = await res.json();
    const obs = data && data.observation;
    // Without this guard a malformed response surfaces as an opaque TypeError.
    if (!obs) throw new Error('Response from /reset did not include an observation');

    const difficulty = String(obs.difficulty || '');
    document.getElementById('tag-id').textContent = obs.task_id;
    const diffTag = document.getElementById('tag-diff');
    diffTag.textContent = difficulty.toUpperCase();
    diffTag.className = 'tag tag-' + difficulty;
    document.getElementById('task-instructions').textContent = obs.instructions;
    document.getElementById('buggy-code').textContent = obs.buggy_code;
    document.getElementById('fixed-code').value = obs.buggy_code;
    // Clear any explanation typed for a previous task so it cannot be submitted with this one.
    document.getElementById('explanation').value = '';
    document.getElementById('explanation-section').style.display = difficulty === 'hard' ? 'block' : 'none';
    taskBox.classList.add('visible');
  } catch (e) {
    alert('Error: ' + e.message);
  } finally {
    loadingEl.classList.remove('visible');
  }
}
/**
 * Submits the user's fix via POST /step and renders the grading result.
 *
 * Sends { fixed_code, explanation? }. The explanation is included only when the
 * explanation section is currently displayed and the field is non-empty. On success
 * it shows the reward (colour-coded: 1.0, between 0 and 1, or 0), the passed/total
 * test counts, an "Episode complete" note when the response sets `done`, and the
 * feedback text.
 *
 * Failures (network error, non-2xx status, missing or non-numeric reward) are
 * reported through alert(); the loading indicator is always cleared.
 */
async function doStep() {
  const rawCode = document.getElementById('fixed-code').value;
  if (!rawCode.trim()) { alert('Please enter your fixed code!'); return; }

  const loadingEl = document.getElementById('loading-step');
  const rewardBox = document.getElementById('reward-box');
  loadingEl.classList.add('visible');
  rewardBox.classList.remove('visible');

  try {
    // Strip trailing whitespace only: leading indentation is significant in Python source,
    // so a full trim() could change the meaning of the first line.
    const payload = { fixed_code: rawCode.replace(/\s+$/, '') };

    // The explanation section is hidden (inline display "none") for non-hard tasks;
    // do not send text left over in a field the user cannot currently see.
    const explanationShown = document.getElementById('explanation-section').style.display !== 'none';
    const explanation = explanationShown ? document.getElementById('explanation').value.trim() : '';
    if (explanation) payload.explanation = explanation;

    const res = await fetch('/step', {
      method: 'POST',
      headers: { 'Content-Type': 'application/json' },
      body: JSON.stringify(payload)
    });
    // fetch() only rejects on network failure; HTTP error statuses must be checked explicitly.
    if (!res.ok) throw new Error('Request to /step failed with HTTP ' + res.status);

    const data = await res.json();
    const obs = (data && data.observation) || {};
    const reward = data ? data.reward : undefined;
    // reward.toFixed() below would throw a confusing TypeError on a missing or non-numeric value.
    if (typeof reward !== 'number' || !Number.isFinite(reward)) {
      throw new Error('Response from /step did not include a numeric reward');
    }

    const rewardEl = document.getElementById('reward-value');
    rewardEl.textContent = 'Reward: ' + reward.toFixed(2);
    rewardEl.className = 'reward-value ' + (reward === 1.0 ? 'reward-1' : reward > 0 ? 'reward-mid' : 'reward-0');
    document.getElementById('tests-info').textContent = obs.passed_tests + ' / ' + obs.total_tests + ' tests passed' + (data.done ? ' — Episode complete' : '');
    document.getElementById('feedback-text').textContent = obs.feedback || '';
    rewardBox.classList.add('visible');
  } catch (e) {
    alert('Error: ' + e.message);
  } finally {
    loadingEl.classList.remove('visible');
  }
}
</script>
</body>
</html>