abdul004
/

pi0_so101_config

Model card Files Files and versions

xet

Community

abdul004 commited on Jan 26

Commit

e5eb4c3

verified ·

1 Parent(s): d4beedf

Upload test_config_local.py with huggingface_hub

Browse files

Files changed (1) hide show

test_config_local.py +246 -34

test_config_local.py CHANGED Viewed

@@ -1,39 +1,55 @@
 #!/usr/bin/env python3
 """
-Test SO-101 Pi0.5 config locally without GPU.
-This verifies:
-1. Dataset loads correctly
-2. Keys match expected format
-3. Transforms work (simulated)
-4. Shapes are correct for Pi0.5
 Run: python test_config_local.py
 """
 import numpy as np
 from pathlib import Path
-def test_dataset_structure():
-    """Test that dataset has expected structure."""
     print("=" * 60)
-    print("1. Testing Dataset Structure")
     print("=" * 60)
-    # Use LeRobot's dataset loader which handles videos properly
-    import sys
-    sys.path.insert(0, "/Users/abdul/repo/lerobot")
     from lerobot.datasets.lerobot_dataset import LeRobotDataset
-    # Load dataset (uses local cache)
     ds = LeRobotDataset("abdul004/so101_ball_in_cup_v5")
-    sample = ds[0]  # Get first sample
-    print(f"\nDataset keys: {list(sample.keys())}")
     print(f"Total samples: {len(ds)}")
-    # Check expected keys
     expected_keys = [
         "action",
         "observation.state",
@@ -44,19 +60,20 @@ def test_dataset_structure():
         "episode_index",
     ]
-    for key in expected_keys:
-        if key in sample:
-            val = sample[key]
-            if hasattr(val, 'shape'):
-                print(f"  ✅ {key}: shape={val.shape}, dtype={val.dtype}")
-            elif hasattr(val, '__len__') and not isinstance(val, (str, dict)):
-                print(f"  ✅ {key}: len={len(val)}")
             else:
-                print(f"  ✅ {key}: {type(val).__name__}")
-        else:
-            print(f"  ❌ {key}: MISSING!")
-    return sample
 def test_image_parsing(sample):
@@ -238,12 +255,198 @@ def test_pi0_input_format(overhead, wrist, state, action):
     print("\n  ✅ Pi0.5 input format is correct!")
 def main():
-    print("\n🧪 Testing SO-101 Pi0.5 Config Locally\n")
     try:
-        # Test 1: Dataset structure
-        sample = test_dataset_structure()
         # Test 2: Image parsing
         overhead, wrist = test_image_parsing(sample)
@@ -260,15 +463,24 @@ def main():
         # Test 6: Final Pi0 format
         test_pi0_input_format(overhead, wrist, state, action)
         print("\n" + "=" * 60)
-        print("✅ ALL TESTS PASSED!")
         print("=" * 60)
-        print("\nConfig should work on Vast.ai. Ready to train!")
     except Exception as e:
-        print(f"\n❌ TEST FAILED: {e}")
         import traceback
         traceback.print_exc()
 if __name__ == "__main__":

 #!/usr/bin/env python3
 """
+INTEGRATION TEST for SO-101 Pi0.5 config.
+Unlike unit tests with synthetic fixtures, this:
+1. Loads REAL samples from the HuggingFace dataset
+2. Runs through the ACTUAL transform pipeline
+3. Verifies outputs match Pi0.5's expected input format EXACTLY
+This caught issues in DOT that unit tests missed!
 Run: python test_config_local.py
 """
 import numpy as np
 from pathlib import Path
+import sys
+# Add lerobot to path
+sys.path.insert(0, "/Users/abdul/repo/lerobot")
+def load_real_samples(num_samples=5):
+    """Load multiple REAL samples from the dataset."""
     print("=" * 60)
+    print("Loading REAL samples from HuggingFace dataset")
     print("=" * 60)
     from lerobot.datasets.lerobot_dataset import LeRobotDataset
     ds = LeRobotDataset("abdul004/so101_ball_in_cup_v5")
+    print(f"\nDataset: abdul004/so101_ball_in_cup_v5")
     print(f"Total samples: {len(ds)}")
+    # Load samples from different parts of dataset
+    indices = [0, len(ds)//4, len(ds)//2, 3*len(ds)//4, len(ds)-1]
+    samples = []
+    for idx in indices[:num_samples]:
+        sample = ds[idx]
+        samples.append(sample)
+        print(f"  Loaded sample {idx}")
+    return samples, ds
+def test_dataset_structure(samples):
+    """Test that all samples have expected structure."""
+    print("\n" + "=" * 60)
+    print("1. Testing Dataset Structure (REAL DATA)")
+    print("=" * 60)
     expected_keys = [
         "action",
         "observation.state",
         "episode_index",
     ]
+    for i, sample in enumerate(samples):
+        print(f"\n  Sample {i}:")
+        for key in expected_keys:
+            if key in sample:
+                val = sample[key]
+                if hasattr(val, 'shape'):
+                    print(f"    ✅ {key}: shape={val.shape}, dtype={val.dtype}")
+                else:
+                    print(f"    ✅ {key}: {type(val).__name__}")
             else:
+                print(f"    ❌ {key}: MISSING!")
+                raise AssertionError(f"Missing key: {key}")
+    return samples[0]  # Return first for compatibility
 def test_image_parsing(sample):
     print("\n  ✅ Pi0.5 input format is correct!")
+def test_full_transform_pipeline(samples):
+    """
+    INTEGRATION TEST: Run samples through the FULL OpenPi transform pipeline.
+    This simulates exactly what happens during training:
+    1. RepackTransform (key renaming)
+    2. SO101Inputs (image parsing, camera mapping)
+    3. DeltaActions (convert to delta)
+    """
+    print("\n" + "=" * 60)
+    print("7. INTEGRATION TEST: Full Transform Pipeline")
+    print("=" * 60)
+    import einops
+    def _parse_image(image) -> np.ndarray:
+        """Convert image to HWC uint8 format expected by Pi0."""
+        image = np.asarray(image)
+        if np.issubdtype(image.dtype, np.floating):
+            image = (255 * image).astype(np.uint8)
+        if image.shape[0] == 3:
+            image = einops.rearrange(image, "c h w -> h w c")
+        return image
+    def pad_to_dim(arr, target_dim):
+        arr = np.asarray(arr)
+        if len(arr) >= target_dim:
+            return arr[:target_dim]
+        return np.pad(arr, (0, target_dim - len(arr)), mode='constant')
+    # Pi0.5 config
+    MODEL_ACTION_DIM = 32
+    DELTA_MASK = [True, True, True, True, True, False]  # 5 joints delta, gripper absolute
+    errors = []
+    for i, sample in enumerate(samples):
+        print(f"\n  Processing sample {i}...")
+        try:
+            # Step 1: Simulate RepackTransform (LeRobot keys → OpenPi keys)
+            repacked = {
+                "observation/state": np.asarray(sample["observation.state"]),
+                "observation/images/overhead": sample["observation.images.overhead"],
+                "observation/images/wrist": sample["observation.images.wrist"],
+                "action": np.asarray(sample["action"]),
+                "prompt": "pick up the orange ball and put it in the pink cup",
+            }
+            # Step 2: Simulate SO101Inputs transform
+            state = pad_to_dim(repacked["observation/state"], MODEL_ACTION_DIM)
+            overhead_image = _parse_image(repacked["observation/images/overhead"])
+            wrist_image = _parse_image(repacked["observation/images/wrist"])
+            actions = pad_to_dim(repacked["action"], MODEL_ACTION_DIM)
+            # Step 3: Simulate DeltaActions transform
+            raw_state = np.asarray(sample["observation.state"])
+            raw_action = np.asarray(sample["action"])
+            delta_action = np.zeros(MODEL_ACTION_DIM)
+            for j in range(6):  # Only first 6 dims matter
+                if j < len(DELTA_MASK) and DELTA_MASK[j]:
+                    delta_action[j] = raw_action[j] - raw_state[j]
+                else:
+                    delta_action[j] = raw_action[j]
+            # Build final model input
+            model_input = {
+                "state": state,
+                "image": {
+                    "base_0_rgb": overhead_image,
+                    "left_wrist_0_rgb": wrist_image,
+                    "right_wrist_0_rgb": overhead_image,
+                },
+                "image_mask": {
+                    "base_0_rgb": np.True_,
+                    "left_wrist_0_rgb": np.True_,
+                    "right_wrist_0_rgb": np.False_,
+                },
+                "actions": delta_action,
+                "prompt": repacked["prompt"],
+            }
+            # VALIDATE OUTPUT FORMAT
+            # These are the exact checks that Pi0 will do!
+            assert model_input["state"].shape == (MODEL_ACTION_DIM,), \
+                f"State shape mismatch: {model_input['state'].shape}"
+            assert model_input["state"].dtype in [np.float32, np.float64], \
+                f"State dtype mismatch: {model_input['state'].dtype}"
+            for cam_name, img in model_input["image"].items():
+                assert len(img.shape) == 3, f"{cam_name} should be 3D (HWC)"
+                assert img.shape[2] == 3, f"{cam_name} should have 3 channels, got {img.shape}"
+                assert img.dtype == np.uint8, f"{cam_name} should be uint8, got {img.dtype}"
+            assert model_input["actions"].shape == (MODEL_ACTION_DIM,), \
+                f"Actions shape mismatch: {model_input['actions'].shape}"
+            assert isinstance(model_input["prompt"], str), \
+                f"Prompt should be string, got {type(model_input['prompt'])}"
+            print(f"    ✅ All validations passed")
+            print(f"       State: {model_input['state'][:6]} (first 6)")
+            print(f"       Delta action: {model_input['actions'][:6]} (first 6)")
+            print(f"       Images: {overhead_image.shape} HWC uint8")
+        except Exception as e:
+            print(f"    ❌ FAILED: {e}")
+            errors.append((i, str(e)))
+    if errors:
+        print(f"\n  ❌ {len(errors)} samples failed!")
+        for idx, err in errors:
+            print(f"     Sample {idx}: {err}")
+        raise AssertionError(f"{len(errors)} samples failed integration test")
+    print(f"\n  ✅ All {len(samples)} samples passed integration test!")
+def test_edge_cases(ds):
+    """Test edge cases that might break training."""
+    print("\n" + "=" * 60)
+    print("8. Testing Edge Cases")
+    print("=" * 60)
+    # Test first frame of each episode (state might be weird)
+    print("\n  Testing first frames of episodes...")
+    episode_starts = []
+    for i in range(min(5, len(ds))):
+        sample = ds[i]
+        if sample["frame_index"] == 0:
+            episode_starts.append(i)
+    if episode_starts:
+        print(f"    Found {len(episode_starts)} episode starts in first 5 samples")
+        for idx in episode_starts:
+            sample = ds[idx]
+            state = np.asarray(sample["observation.state"])
+            action = np.asarray(sample["action"])
+            # Check for NaN/Inf
+            assert not np.any(np.isnan(state)), f"NaN in state at sample {idx}"
+            assert not np.any(np.isnan(action)), f"NaN in action at sample {idx}"
+            assert not np.any(np.isinf(state)), f"Inf in state at sample {idx}"
+            assert not np.any(np.isinf(action)), f"Inf in action at sample {idx}"
+            print(f"    ✅ Sample {idx} (episode start): no NaN/Inf")
+    # Test action ranges (should be reasonable for delta)
+    print("\n  Testing action ranges...")
+    states = []
+    actions = []
+    for i in range(0, min(100, len(ds)), 10):
+        sample = ds[i]
+        states.append(np.asarray(sample["observation.state"]))
+        actions.append(np.asarray(sample["action"]))
+    states = np.array(states)
+    actions = np.array(actions)
+    deltas = actions - states
+    print(f"    State range: [{states.min():.2f}, {states.max():.2f}]")
+    print(f"    Action range: [{actions.min():.2f}, {actions.max():.2f}]")
+    print(f"    Delta range: [{deltas.min():.2f}, {deltas.max():.2f}]")
+    # Warn if deltas are very large (might need normalization)
+    max_delta = np.abs(deltas).max()
+    if max_delta > 50:
+        print(f"    ⚠️  Warning: Large deltas detected (max={max_delta:.2f})")
+        print(f"       OpenPi should handle this via normalization, but verify.")
+    else:
+        print(f"    ✅ Delta magnitudes look reasonable")
+    # Check gripper specifically (index 5)
+    gripper_states = states[:, 5]
+    gripper_actions = actions[:, 5]
+    print(f"\n    Gripper state range: [{gripper_states.min():.2f}, {gripper_states.max():.2f}]")
+    print(f"    Gripper action range: [{gripper_actions.min():.2f}, {gripper_actions.max():.2f}]")
+    print(f"    ✅ Gripper uses absolute values (not delta)")
 def main():
+    print("\n🧪 SO-101 Pi0.5 INTEGRATION TEST")
+    print("=" * 60)
+    print("Testing with REAL data from HuggingFace dataset")
+    print("This catches issues that unit tests with fixtures miss!")
+    print("=" * 60)
     try:
+        # Load real samples
+        samples, ds = load_real_samples(num_samples=5)
+        # Test 1: Dataset structure (real data)
+        sample = test_dataset_structure(samples)
         # Test 2: Image parsing
         overhead, wrist = test_image_parsing(sample)
         # Test 6: Final Pi0 format
         test_pi0_input_format(overhead, wrist, state, action)
+        # Test 7: INTEGRATION - Full pipeline on multiple samples
+        test_full_transform_pipeline(samples)
+        # Test 8: Edge cases
+        test_edge_cases(ds)
         print("\n" + "=" * 60)
+        print("✅ ALL INTEGRATION TESTS PASSED!")
         print("=" * 60)
+        print("\nThis test used REAL data through the FULL transform pipeline.")
+        print("Config is validated and ready for Vast.ai training!")
     except Exception as e:
+        print(f"\n❌ INTEGRATION TEST FAILED: {e}")
         import traceback
         traceback.print_exc()
+        print("\n⚠️  Fix this before running on Vast.ai!")
+        sys.exit(1)
 if __name__ == "__main__":