Spaces:
Sleeping
Sleeping
File size: 7,386 Bytes
90fc756 b83c8ad 90fc756 b83c8ad 90fc756 b83c8ad 90fc756 b83c8ad 90fc756 b83c8ad 90fc756 b83c8ad 90fc756 b83c8ad 90fc756 b83c8ad 90fc756 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 | [
{
"task_id": "easy_001",
"difficulty": "easy",
"query": "SELCT * FORM users WEHRE id = 1;",
"schema": {
"users": {
"id": "INT PRIMARY KEY",
"name": "VARCHAR(255)",
"email": "VARCHAR(255)"
}
},
"context": "Fetch a user profile by id for the account page.",
"ground_truth_issues": [
{
"id": "easy_001_select",
"category": "syntax",
"description": "SELCT should be SELECT.",
"severity": 0.35,
"fix": "SELECT * FROM users WHERE id = 1;",
"keywords": [
"selct", "select", "misspelled", "keyword", "syntax", "typo",
"spelling", "incorrect keyword", "wrong keyword", "misspelling",
"invalid keyword", "selct typo"
]
},
{
"id": "easy_001_from",
"category": "syntax",
"description": "FORM should be FROM.",
"severity": 0.35,
"fix": "SELECT * FROM users WHERE id = 1;",
"keywords": [
"form", "from", "misspelled", "keyword", "syntax", "typo",
"spelling", "table reference", "from clause", "misspelling"
]
},
{
"id": "easy_001_where",
"category": "syntax",
"description": "WEHRE should be WHERE.",
"severity": 0.25,
"fix": "SELECT * FROM users WHERE id = 1;",
"keywords": [
"wehre", "where", "misspelled", "keyword", "syntax", "typo",
"filter", "condition", "where clause", "misspelling"
]
},
{
"id": "easy_001_projection",
"category": "performance",
"description": "SELECT * fetches unnecessary columns for a profile lookup.",
"severity": 0.15,
"fix": "SELECT id, name, email FROM users WHERE id = 1;",
"keywords": [
"select *", "star", "unnecessary columns", "projection", "performance",
"all columns", "wildcard", "specific columns", "column selection",
"over-fetching", "fetch all", "select star"
]
}
],
"max_steps": 5
},
{
"task_id": "easy_002",
"difficulty": "easy",
"query": "SELECT id, email users WHERE active = 1;",
"schema": {
"users": {
"id": "INT PRIMARY KEY",
"email": "VARCHAR(255)",
"active": "BOOLEAN"
}
},
"context": "List active user emails for a notification job.",
"ground_truth_issues": [
{
"id": "easy_002_missing_from",
"category": "syntax",
"description": "The query is missing the FROM clause before users.",
"severity": 0.6,
"fix": "SELECT id, email FROM users WHERE active = 1;",
"keywords": [
"missing from", "from clause", "syntax", "users", "no from",
"omitted from", "table reference", "absent from", "from keyword",
"missing keyword"
]
}
],
"max_steps": 4
},
{
"task_id": "easy_003",
"difficulty": "easy",
"query": "SELECT order_id, total FROM orders WHERE shipped_at = NULL;",
"schema": {
"orders": {
"order_id": "INT PRIMARY KEY",
"total": "DECIMAL(10,2)",
"shipped_at": "TIMESTAMP NULL"
}
},
"context": "Find orders that still need to ship.",
"ground_truth_issues": [
{
"id": "easy_003_null_check",
"category": "logic",
"description": "NULL must be compared with IS NULL instead of = NULL.",
"severity": 0.7,
"fix": "SELECT order_id, total FROM orders WHERE shipped_at IS NULL;",
"keywords": [
"is null", "= null", "null comparison", "logic", "null check",
"equals null", "compare null", "null equality", "null predicate",
"three-valued logic", "null handling"
]
}
],
"max_steps": 4
},
{
"task_id": "easy_004",
"difficulty": "easy",
"query": "SELECT name FROM customers WHERE city = 'Boston;",
"schema": {
"customers": {
"id": "INT PRIMARY KEY",
"name": "VARCHAR(255)",
"city": "VARCHAR(128)"
}
},
"context": "Filter customers who live in Boston.",
"ground_truth_issues": [
{
"id": "easy_004_unclosed_quote",
"category": "syntax",
"description": "The string literal is not terminated with a closing quote.",
"severity": 0.75,
"fix": "SELECT name FROM customers WHERE city = 'Boston';",
"keywords": [
"unclosed quote", "unterminated string", "syntax", "quote",
"missing quote", "string literal", "closing quote", "open quote",
"single quote", "unmatched quote", "parse error"
]
}
],
"max_steps": 4
},
{
"task_id": "easy_005",
"difficulty": "easy",
"query": "SELECT id, statuz FROM orders WHERE status = 'paid';",
"schema": {
"orders": {
"id": "INT PRIMARY KEY",
"status": "VARCHAR(32)",
"total": "DECIMAL(10,2)",
"created_at": "TIMESTAMP"
}
},
"context": "List paid orders for revenue accounting.",
"ground_truth_issues": [
{
"id": "easy_005_bad_column",
"category": "logic",
"description": "Column statuz does not exist; the intended column is status.",
"severity": 0.65,
"fix": "SELECT id, status FROM orders WHERE status = 'paid';",
"keywords": [
"unknown column", "statuz", "status", "column name", "typo",
"misspelled column", "invalid column", "column not found",
"does not exist", "wrong column", "nonexistent column"
]
}
],
"max_steps": 4
},
{
"task_id": "easy_006",
"difficulty": "easy",
"query": "DELETE FROM orders;",
"schema": {
"orders": {
"id": "INT PRIMARY KEY",
"user_id": "INT",
"total": "DECIMAL(10,2)",
"status": "VARCHAR(32)"
}
},
"context": "Remove cancelled orders from the database.",
"ground_truth_issues": [
{
"id": "easy_006_no_where",
"category": "logic",
"description": "DELETE without WHERE clause will remove ALL rows from the table.",
"severity": 1.0,
"fix": "DELETE FROM orders WHERE status = 'cancelled';",
"keywords": [
"delete", "no where", "missing where", "all rows", "dangerous",
"destructive", "entire table", "unfiltered delete", "data loss",
"without condition", "unconditional"
]
}
],
"max_steps": 4
},
{
"task_id": "easy_007",
"difficulty": "easy",
"query": "SELECT id FROM users WHERE email = email;",
"schema": {
"users": {
"id": "INT PRIMARY KEY",
"email": "VARCHAR(255)"
}
},
"context": "Find user by email for login lookup.",
"ground_truth_issues": [
{
"id": "easy_007_self_compare",
"category": "logic",
"description": "Comparing column to itself (email = email) is always true. Should compare to a string literal.",
"severity": 0.8,
"fix": "SELECT id FROM users WHERE email = 'user@example.com';",
"keywords": [
"self comparison", "column compared to itself", "always true",
"tautology", "email = email", "missing literal", "missing value",
"string literal", "parameter", "no filter"
]
}
],
"max_steps": 4
}
]
|