| |
|
|
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| """Tests for Diffusion policy processor.""" |
|
|
| import tempfile |
|
|
| import pytest |
| import torch |
|
|
| from lerobot.configs.types import FeatureType, NormalizationMode, PolicyFeature |
| from lerobot.policies.diffusion.configuration_diffusion import DiffusionConfig |
| from lerobot.policies.diffusion.processor_diffusion import make_diffusion_pre_post_processors |
| from lerobot.processor import ( |
| AddBatchDimensionProcessorStep, |
| DataProcessorPipeline, |
| DeviceProcessorStep, |
| NormalizerProcessorStep, |
| RenameObservationsProcessorStep, |
| TransitionKey, |
| UnnormalizerProcessorStep, |
| ) |
| from lerobot.processor.converters import create_transition, transition_to_batch |
| from lerobot.utils.constants import ACTION, OBS_IMAGE, OBS_STATE |
|
|
|
|
| def create_default_config(): |
| """Create a default Diffusion configuration for testing.""" |
| config = DiffusionConfig() |
| config.input_features = { |
| OBS_STATE: PolicyFeature(type=FeatureType.STATE, shape=(7,)), |
| OBS_IMAGE: PolicyFeature(type=FeatureType.VISUAL, shape=(3, 224, 224)), |
| } |
| config.output_features = { |
| ACTION: PolicyFeature(type=FeatureType.ACTION, shape=(6,)), |
| } |
| config.normalization_mapping = { |
| FeatureType.STATE: NormalizationMode.MEAN_STD, |
| FeatureType.VISUAL: NormalizationMode.IDENTITY, |
| FeatureType.ACTION: NormalizationMode.MIN_MAX, |
| } |
| config.device = "cpu" |
| return config |
|
|
|
|
| def create_default_stats(): |
| """Create default dataset statistics for testing.""" |
| return { |
| OBS_STATE: {"mean": torch.zeros(7), "std": torch.ones(7)}, |
| OBS_IMAGE: {}, |
| ACTION: {"min": torch.full((6,), -1.0), "max": torch.ones(6)}, |
| } |
|
|
|
|
| def test_make_diffusion_processor_basic(): |
| """Test basic creation of Diffusion processor.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_diffusion_pre_post_processors(config, stats) |
|
|
| |
| assert preprocessor.name == "policy_preprocessor" |
| assert postprocessor.name == "policy_postprocessor" |
|
|
| |
| assert len(preprocessor.steps) == 4 |
| assert isinstance(preprocessor.steps[0], RenameObservationsProcessorStep) |
| assert isinstance(preprocessor.steps[1], AddBatchDimensionProcessorStep) |
| assert isinstance(preprocessor.steps[2], DeviceProcessorStep) |
| assert isinstance(preprocessor.steps[3], NormalizerProcessorStep) |
|
|
| |
| assert len(postprocessor.steps) == 2 |
| assert isinstance(postprocessor.steps[0], UnnormalizerProcessorStep) |
| assert isinstance(postprocessor.steps[1], DeviceProcessorStep) |
|
|
|
|
| def test_diffusion_processor_with_images(): |
| """Test Diffusion processor with image observations.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_diffusion_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| observation = { |
| OBS_STATE: torch.randn(7), |
| OBS_IMAGE: torch.randn(3, 224, 224), |
| } |
| action = torch.randn(6) |
| transition = create_transition(observation, action) |
|
|
| batch = transition_to_batch(transition) |
|
|
| |
|
|
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].shape == (1, 7) |
| assert processed[OBS_IMAGE].shape == (1, 3, 224, 224) |
| assert processed[TransitionKey.ACTION.value].shape == (1, 6) |
|
|
|
|
| @pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available") |
| def test_diffusion_processor_cuda(): |
| """Test Diffusion processor with CUDA device.""" |
| config = create_default_config() |
| config.device = "cuda" |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_diffusion_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| observation = { |
| OBS_STATE: torch.randn(7), |
| OBS_IMAGE: torch.randn(3, 224, 224), |
| } |
| action = torch.randn(6) |
| transition = create_transition(observation, action) |
|
|
| batch = transition_to_batch(transition) |
|
|
| |
|
|
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].device.type == "cuda" |
| assert processed[OBS_IMAGE].device.type == "cuda" |
| assert processed[TransitionKey.ACTION.value].device.type == "cuda" |
|
|
| |
| postprocessed = postprocessor(processed[TransitionKey.ACTION.value]) |
|
|
| |
| assert postprocessed.device.type == "cpu" |
|
|
|
|
| @pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available") |
| def test_diffusion_processor_accelerate_scenario(): |
| """Test Diffusion processor in simulated Accelerate scenario.""" |
| config = create_default_config() |
| config.device = "cuda:0" |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_diffusion_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| device = torch.device("cuda:0") |
| observation = { |
| OBS_STATE: torch.randn(1, 7).to(device), |
| OBS_IMAGE: torch.randn(1, 3, 224, 224).to(device), |
| } |
| action = torch.randn(1, 6).to(device) |
| transition = create_transition(observation, action) |
|
|
| batch = transition_to_batch(transition) |
|
|
| |
|
|
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].device == device |
| assert processed[OBS_IMAGE].device == device |
| assert processed[TransitionKey.ACTION.value].device == device |
|
|
|
|
| @pytest.mark.skipif(torch.cuda.device_count() < 2, reason="Requires at least 2 GPUs") |
| def test_diffusion_processor_multi_gpu(): |
| """Test Diffusion processor with multi-GPU setup.""" |
| config = create_default_config() |
| config.device = "cuda:0" |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_diffusion_pre_post_processors(config, stats) |
|
|
| |
| device = torch.device("cuda:1") |
| observation = { |
| OBS_STATE: torch.randn(1, 7).to(device), |
| OBS_IMAGE: torch.randn(1, 3, 224, 224).to(device), |
| } |
| action = torch.randn(1, 6).to(device) |
| transition = create_transition(observation, action) |
|
|
| batch = transition_to_batch(transition) |
|
|
| |
|
|
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].device == device |
| assert processed[OBS_IMAGE].device == device |
| assert processed[TransitionKey.ACTION.value].device == device |
|
|
|
|
| def test_diffusion_processor_without_stats(): |
| """Test Diffusion processor creation without dataset statistics.""" |
| config = create_default_config() |
|
|
| preprocessor, postprocessor = make_diffusion_pre_post_processors( |
| config, |
| dataset_stats=None, |
| ) |
|
|
| |
| assert preprocessor is not None |
| assert postprocessor is not None |
|
|
| |
| observation = { |
| OBS_STATE: torch.randn(7), |
| OBS_IMAGE: torch.randn(3, 224, 224), |
| } |
| action = torch.randn(6) |
| transition = create_transition(observation, action) |
|
|
| batch = transition_to_batch(transition) |
|
|
| processed = preprocessor(batch) |
| assert processed is not None |
|
|
|
|
| def test_diffusion_processor_save_and_load(): |
| """Test saving and loading Diffusion processor.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_diffusion_pre_post_processors(config, stats) |
|
|
| with tempfile.TemporaryDirectory() as tmpdir: |
| |
| preprocessor.save_pretrained(tmpdir) |
|
|
| |
| loaded_preprocessor = DataProcessorPipeline.from_pretrained( |
| tmpdir, config_filename="policy_preprocessor.json" |
| ) |
|
|
| |
| observation = { |
| OBS_STATE: torch.randn(7), |
| OBS_IMAGE: torch.randn(3, 224, 224), |
| } |
| action = torch.randn(6) |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| processed = loaded_preprocessor(batch) |
| assert processed[OBS_STATE].shape == (1, 7) |
| assert processed[OBS_IMAGE].shape == (1, 3, 224, 224) |
| assert processed[TransitionKey.ACTION.value].shape == (1, 6) |
|
|
|
|
| def test_diffusion_processor_identity_normalization(): |
| """Test that images with IDENTITY normalization are not normalized.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_diffusion_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| image_value = torch.rand(3, 224, 224) * 255 |
| observation = { |
| OBS_STATE: torch.randn(7), |
| OBS_IMAGE: image_value.clone(), |
| } |
| action = torch.randn(6) |
| transition = create_transition(observation, action) |
|
|
| batch = transition_to_batch(transition) |
|
|
| |
|
|
| processed = preprocessor(batch) |
|
|
| |
| |
| assert torch.allclose(processed[OBS_IMAGE][0], image_value, rtol=1e-5) |
|
|
|
|
| def test_diffusion_processor_batch_consistency(): |
| """Test Diffusion processor with different batch sizes.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_diffusion_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| for batch_size in [1, 8, 32]: |
| observation = { |
| OBS_STATE: torch.randn(batch_size, 7) if batch_size > 1 else torch.randn(7), |
| OBS_IMAGE: torch.randn(batch_size, 3, 224, 224) if batch_size > 1 else torch.randn(3, 224, 224), |
| } |
| action = torch.randn(batch_size, 6) if batch_size > 1 else torch.randn(6) |
| transition = create_transition(observation, action) |
|
|
| batch = transition_to_batch(transition) |
|
|
| processed = preprocessor(batch) |
|
|
| |
| expected_batch = batch_size if batch_size > 1 else 1 |
| assert processed[OBS_STATE].shape[0] == expected_batch |
| assert processed[OBS_IMAGE].shape[0] == expected_batch |
| assert processed[TransitionKey.ACTION.value].shape[0] == expected_batch |
|
|
|
|
| @pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available") |
| def test_diffusion_processor_bfloat16_device_float32_normalizer(): |
| """Test: DeviceProcessor(bfloat16) + NormalizerProcessor(float32) → output bfloat16 via automatic adaptation""" |
| config = create_default_config() |
| config.device = "cuda" |
| stats = create_default_stats() |
|
|
| preprocessor, _ = make_diffusion_pre_post_processors(config, stats) |
|
|
| |
| modified_steps = [] |
| for step in preprocessor.steps: |
| if isinstance(step, DeviceProcessorStep): |
| |
| modified_steps.append(DeviceProcessorStep(device=config.device, float_dtype="bfloat16")) |
| elif isinstance(step, NormalizerProcessorStep): |
| |
| norm_step = step |
| modified_steps.append( |
| NormalizerProcessorStep( |
| features=norm_step.features, |
| norm_map=norm_step.norm_map, |
| stats=norm_step.stats, |
| device=config.device, |
| dtype=torch.float32, |
| ) |
| ) |
| else: |
| modified_steps.append(step) |
| preprocessor.steps = modified_steps |
|
|
| |
| normalizer_step = preprocessor.steps[3] |
| assert normalizer_step.dtype == torch.float32 |
|
|
| |
| observation = { |
| OBS_STATE: torch.randn(7, dtype=torch.float32), |
| OBS_IMAGE: torch.randn(3, 224, 224, dtype=torch.float32), |
| } |
| action = torch.randn(6, dtype=torch.float32) |
| transition = create_transition(observation, action) |
|
|
| batch = transition_to_batch(transition) |
|
|
| |
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].dtype == torch.bfloat16 |
| assert processed[OBS_IMAGE].dtype == torch.bfloat16 |
| assert processed[TransitionKey.ACTION.value].dtype == torch.bfloat16 |
|
|
| |
| assert normalizer_step.dtype == torch.bfloat16 |
| |
| for stat_tensor in normalizer_step._tensor_stats[OBS_STATE].values(): |
| assert stat_tensor.dtype == torch.bfloat16 |
| |
|
|