File size: 1,590 Bytes
c78c2fe
 
29473f6
c78c2fe
 
 
29473f6
 
 
 
 
 
 
 
 
 
 
 
 
c78c2fe
 
29473f6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
import os
import sys
import pytest

# Put the parent of this file's directory at the front of sys.path.
# NOTE(review): presumably so the `server` and `models` imports below resolve
# when the tests are run without installing the project — confirm.
sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))

from server.data_wrangler_environment import DataWranglerEnvironment
from models import DataWranglerAction

def test_environment_reset():
    """Check the observation returned by ``reset()`` on a fresh environment.

    The initial observation must list the three raw column names, report
    three rows, and must not be flagged as done.
    """
    expected_columns = ["User Name", "Unnamed: 0", "Age"]

    wrangler = DataWranglerEnvironment()
    first_obs = wrangler.reset()

    assert first_obs.columns == expected_columns
    assert first_obs.row_count == 3
    assert not first_obs.is_done

def test_drop_action_scoring():
    """Dropping a column that the target frame contains is applied but flagged.

    After the step, the column must be gone from the observation and the
    feedback text must contain either "Warning" or "Error".
    """
    wrangler = DataWranglerEnvironment()
    wrangler.reset()
    # Enforce the column on the target post-reset as well, so the drop below
    # is guaranteed to hit a column that exists in target_df.
    wrangler.target_df["User Name"] = [1, 2, 3]

    # It should penalize dropping a column that exists in target_df.
    drop_user_name = DataWranglerAction(
        action_type="drop_column",
        target_column="User Name",
    )
    result = wrangler.step(drop_user_name)

    assert "User Name" not in result.columns
    assert any(
        marker in result.last_action_feedback for marker in ("Warning", "Error")
    )
    
def test_successful_grading():
    """Run a full cleanup sequence with TASK_LEVEL=1 and check the final score.

    The sequence drops "Unnamed: 0", renames the two remaining columns to
    snake_case, and submits. The submit observation must be done and carry
    a reward above 0.8.

    ``TASK_LEVEL`` is set only for the duration of this test and restored
    afterwards, so the setting does not leak into tests that run later in
    the same process.
    """
    # Remember the caller's value (None if unset) so it can be put back.
    previous_level = os.environ.get("TASK_LEVEL")
    # NOTE(review): presumably read by DataWranglerEnvironment to pick the
    # task — the reader is not visible in this file.
    os.environ["TASK_LEVEL"] = "1"
    try:
        env = DataWranglerEnvironment()
        env.reset()

        # 1. Drop Unnamed: 0
        env.step(DataWranglerAction(action_type="drop_column", target_column="Unnamed: 0"))

        # 2. Rename User Name
        env.step(DataWranglerAction(action_type="rename_column", target_column="User Name", new_name="user_name"))

        # 3. Rename Age
        env.step(DataWranglerAction(action_type="rename_column", target_column="Age", new_name="age"))

        # 4. Submit
        obs = env.step(DataWranglerAction(action_type="submit"))
        assert obs.is_done
        assert obs.reward > 0.8  # partial credit + efficiency
    finally:
        # Restore the environment exactly as it was, even if an assert failed.
        if previous_level is None:
            os.environ.pop("TASK_LEVEL", None)
        else:
            os.environ["TASK_LEVEL"] = previous_level