File size: 11,348 Bytes
715a633
 
 
 
 
 
 
bf68f4e
715a633
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
758564e
715a633
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
# src/gaia_agent/tools/safe_code_run.py
from __future__ import annotations
import io, os, sys, uuid, base64, traceback, contextlib, tempfile, shutil
import multiprocessing as mp
from typing import Optional, Dict, Any, List
from pydantic import ValidationError
from langchain_core.tools import tool
from src.utils.code_run import (
    CodeRunRequest, CodeRunResult, EnvInfo,
    PlotArtifact, DataFrameArtifact,
)

# ====================== HELPERS ======================

def _b64_png(fig, dpi: int) -> str:
    import matplotlib.pyplot as plt
    buf = io.BytesIO()
    fig.savefig(buf, format="png", dpi=dpi, bbox_inches="tight")
    buf.seek(0)
    data = base64.b64encode(buf.read()).decode("utf-8")
    buf.close()
    return data

def _clip_df(df, max_rows: int, max_cols: int):
    sub = df.iloc[:max_rows, :max_cols]
    head = sub.to_dict(orient="records")
    dtypes = {str(k): str(v) for k, v in sub.dtypes.to_dict().items()}
    return head, list(df.shape), dtypes

def _env_info() -> EnvInfo:
    try:
        import numpy as _np; nv = _np.__version__
    except Exception:
        nv = None
    try:
        import pandas as _pd; pv = _pd.__version__
    except Exception:
        pv = None
    return EnvInfo(numpy=nv, pandas=pv)

# ====================== CHILD PROCESS ======================

def _child_exec(payload: Dict[str, Any], queue: mp.Queue):
    """
    Изолированное выполнение user-кода:
      - урезанные builtins
      - безопасный open (read-only в sandbox)
      - белый список импортов
      - запрет сети
      - temp cwd + очистка
      - RLIMIT CPU/AS (Unix)
      - захват stdout/stderr
      - сбор matplotlib и pandas.DataFrame (по флагам)
    """
    import builtins, importlib

    code: str = payload["code"]
    limits: Dict[str, Any] = payload["limits"]
    allowed: List[str] = payload["allowed"]
    return_plots: bool = payload["return_plots"]
    return_dfs: bool = payload["return_dfs"]

    # ---------- OS limits (Unix) ----------
    try:
        import resource
        cpu = max(1, int(limits["timeout_seconds"]))
        resource.setrlimit(resource.RLIMIT_CPU, (cpu, cpu + 1))
        # мягкий лимит RAM ~1.5GB (подстрой при необходимости)
        one_gb = 1024 * 1024 * 1024
        resource.setrlimit(resource.RLIMIT_AS, (int(1.5 * one_gb), int(1.5 * one_gb)))
        # ограничим размеры файлов
        resource.setrlimit(resource.RLIMIT_FSIZE, (50 * 1024 * 1024, 50 * 1024 * 1024))
    except Exception:
        pass

    # ---------- Sandbox FS ----------
    workdir = tempfile.mkdtemp(prefix="ci_")
    os.chdir(workdir)

    # ---------- Network ban ----------
    try:
        import socket
        class _NoNet(socket.socket):
            def __init__(self, *a, **kw):
                raise OSError("Network disabled in sandbox")
        socket.socket = _NoNet  # type: ignore
    except Exception:
        pass

    # ---------- Builtins ----------
    safe_names = [
        "abs","all","any","bool","dict","float","int","len","list","max","min",
        "range","str","sum","print","enumerate","zip","map","filter","sorted",
        "reversed","complex","pow","divmod", "round", "next", "set", "tuple", "type", "isinstance", "issubclass",
    ]
    safe_builtins = {n: getattr(builtins, n) for n in safe_names}

    # сохранём реальный open, потом подменим на безопасный
    real_open = open

    def _safe_open(path, mode="r", *a, **kw):
        # Разрешаем ТОЛЬКО чтение, ТОЛЬКО внутри workdir
        if any(m in mode for m in ("w", "a", "+", "x")):
            raise PermissionError("Write access forbidden in sandbox")
        abspath = os.path.abspath(path)
        # запрещаем выход из песочницы и следование symlink наружу
        if not abspath.startswith(workdir + os.sep) and abspath != workdir:
            raise PermissionError("Access outside sandbox forbidden")
        # запретим двоичный write по flags
        return real_open(abspath, mode, *a, **kw)

    # удалим опасные builtins и поставим наш open
    for banned in ["exec","eval","__import__","compile","input","globals","locals","vars","dir","help","__build_class__"]:
        safe_builtins.pop(banned, None)
    safe_builtins["open"] = _safe_open

    # ---------- Import whitelist ----------
    real_import = builtins.__import__
    ALLOWED = set(allowed)
    def _safe_import(name, globals=None, locals=None, fromlist=(), level=0):
        base = name.split(".")[0]
        if (name not in ALLOWED) and (base not in ALLOWED):
            raise ImportError(f"Module '{name}' is not allowed")
        return real_import(name, globals, locals, fromlist, level)

    glb: Dict[str, Any] = {"__builtins__": safe_builtins}
    lcl: Dict[str, Any] = {}

    # ---------- Matplotlib headless ----------
    plt = None
    if return_plots:
        try:
            import matplotlib
            matplotlib.use("Agg")
            import matplotlib.pyplot as _plt
            plt = _plt
        except Exception:
            plt = None

    # ---------- Preload whitelisted mods ----------
    preloads = [
        "math","random","statistics","datetime","re","json","fractions","decimal",
        "numpy","pandas","cmath",
        "matplotlib","matplotlib.pyplot"
    ]
    for mod in preloads:
        try:
            if (mod in ALLOWED) or (mod.split(".")[0] in ALLOWED):
                glb[mod.split(".")[-1]] = importlib.import_module(mod)
        except Exception:
            pass

    # включаем безопасный импорт
    safe_builtins["__import__"] = _safe_import

    # ---------- Execute ----------
    out_buf, err_buf = io.StringIO(), io.StringIO()
    status = "error"
    result_repr: Optional[str] = None
    plots: List[Dict[str, Any]] = []
    dataframes: List[Dict[str, Any]] = []

    try:
        with contextlib.redirect_stdout(out_buf), contextlib.redirect_stderr(err_buf):
            exec(code, glb, lcl)
            status = "success"

            # вернём repr результата, если есть _ или result
            if "_" in lcl:
                result_repr = repr(lcl["_"])
            elif "result" in lcl:
                result_repr = repr(lcl["result"])

            # графики
            if plt is not None and return_plots:
                fig_nums = plt.get_fignums()[: int(limits["max_plots"])]
                for num in fig_nums:
                    fig = plt.figure(num)
                    b64 = _b64_png(fig, dpi=int(limits["plot_dpi"]))
                    plots.append({"data_base64": b64, "format": "png"})
                plt.close("all")

            # DataFrame’ы
            if return_dfs:
                try:
                    import pandas as _pd
                    for name, val in list(lcl.items()):
                        if isinstance(val, _pd.DataFrame):
                            if len(dataframes) >= int(limits["max_dataframes"]):
                                break
                            head, shape, dtypes = _clip_df(
                                val,
                                max_rows=int(limits["max_df_rows"]),
                                max_cols=int(limits["max_df_cols"]),
                            )
                            dataframes.append({
                                "name": str(name),
                                "head": head,
                                "shape": shape,
                                "dtypes": dtypes,
                            })
                except Exception:
                    pass

    except Exception:
        status = "error"
        print(traceback.format_exc(), file=err_buf)
    finally:
        try:
            shutil.rmtree(workdir, ignore_errors=True)
        except Exception:
            pass

    queue.put({
        "status": status,
        "stdout": out_buf.getvalue(),
        "stderr": err_buf.getvalue(),
        "result_repr": result_repr,
        "plots": plots,
        "dataframes": dataframes,
    })

# ====================== HOST PROCESS ======================

def run_python_in_subprocess(req: CodeRunRequest) -> CodeRunResult:
    exec_id = str(uuid.uuid4())
    ctx = mp.get_context("spawn")
    q: mp.Queue = ctx.Queue()

    payload = {
        "code": req.code,
        "limits": req.limits.model_dump(),
        "allowed": list(req.allowed_modules),
        "return_plots": bool(req.return_plots),
        "return_dfs": bool(req.return_dataframes),
    }

    p = ctx.Process(target=_child_exec, args=(payload, q), daemon=True)
    p.start()
    p.join(req.limits.timeout_seconds)

    status = "timeout"
    stdout = ""
    stderr = "Timed out."
    result_repr = None
    plots: List[PlotArtifact] = []
    dataframes: List[DataFrameArtifact] = []

    if p.is_alive():
        p.terminate()
        p.join(1)
    else:
        try:
            msg = q.get_nowait()
            status = msg.get("status", "error")
            stdout = (msg.get("stdout") or "")[: req.limits.max_stdout_chars]
            stderr = (msg.get("stderr") or "")[: req.limits.max_stderr_chars]
            result_repr = msg.get("result_repr")
            plots = [PlotArtifact(**p_) for p_ in msg.get("plots", [])]
            dataframes = [DataFrameArtifact(**d_) for d_ in msg.get("dataframes", [])]
        except Exception as e:
            status = "error"
            stderr = f"Worker crashed: {e}"

    return CodeRunResult(
        execution_id=exec_id,
        status=status,
        stdout=stdout,
        stderr=stderr,
        result_repr=result_repr,
        plots=plots,
        dataframes=dataframes,
        env=_env_info(),
    )

# ====================== LangChain TOOL ======================

@tool
def safe_code_run(code:str) -> str:
    """
    Safely execute Python code in an isolated subprocess with security restrictions.
    
    IMPORTANT - To see output, you MUST:
    - Use print() statements for output
    - Assign final result to variable 'result' or '_' 
    - Save data to variables for DataFrame/plot capture
    
    Examples:
    ✅ Good:
    result = 2 + 2
    print(f"Answer: {result}")
    
    ✅ Good:
    import numpy as np
    arr = np.array([1, 2, 3])
    print(arr.mean())
    
    ✅ Good:
    import pandas as pd
    df = pd.DataFrame({'x': [1, 2], 'y': [3, 4]})
    print(df)
    result = df.sum()
    
    ❌ Bad (no output):
    2 + 2  # This won't show anything
    
    Security features:
    - Whitelisted imports only (numpy, pandas, matplotlib, etc.)
    - Read-only file access within sandbox
    - Network disabled
    - Memory/CPU limits
    - Timeout protection
    
    Returns JSON with: status, stdout, stderr, result_repr, plots, dataframes, env info
    """

    # упаковываем запрос в JSON
    req = CodeRunRequest(
        code=code,
        # для первого запуска дайте запас
        limits=dict(timeout_seconds=35)  # или 45
    ).model_dump_json()

    res = run_python_in_subprocess(CodeRunRequest.model_validate_json(req))
    return res.model_dump_json()