| |
|
|
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| """Tests for SAC policy processor.""" |
|
|
| import tempfile |
|
|
| import pytest |
| import torch |
|
|
| from lerobot.configs.types import FeatureType, NormalizationMode, PolicyFeature |
| from lerobot.policies.sac.configuration_sac import SACConfig |
| from lerobot.policies.sac.processor_sac import make_sac_pre_post_processors |
| from lerobot.processor import ( |
| AddBatchDimensionProcessorStep, |
| DataProcessorPipeline, |
| DeviceProcessorStep, |
| NormalizerProcessorStep, |
| RenameObservationsProcessorStep, |
| TransitionKey, |
| UnnormalizerProcessorStep, |
| ) |
| from lerobot.processor.converters import create_transition, transition_to_batch |
| from lerobot.utils.constants import ACTION, OBS_STATE |
|
|
|
|
| def create_default_config(): |
| """Create a default SAC configuration for testing.""" |
| config = SACConfig() |
| config.input_features = { |
| OBS_STATE: PolicyFeature(type=FeatureType.STATE, shape=(10,)), |
| } |
| config.output_features = { |
| ACTION: PolicyFeature(type=FeatureType.ACTION, shape=(5,)), |
| } |
| config.normalization_mapping = { |
| FeatureType.STATE: NormalizationMode.MEAN_STD, |
| FeatureType.ACTION: NormalizationMode.MIN_MAX, |
| } |
| config.device = "cpu" |
| return config |
|
|
|
|
| def create_default_stats(): |
| """Create default dataset statistics for testing.""" |
| return { |
| OBS_STATE: {"mean": torch.zeros(10), "std": torch.ones(10)}, |
| ACTION: {"min": torch.full((5,), -1.0), "max": torch.ones(5)}, |
| } |
|
|
|
|
| def test_make_sac_processor_basic(): |
| """Test basic creation of SAC processor.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| assert preprocessor.name == "policy_preprocessor" |
| assert postprocessor.name == "policy_postprocessor" |
|
|
| |
| assert len(preprocessor.steps) == 4 |
| assert isinstance(preprocessor.steps[0], RenameObservationsProcessorStep) |
| assert isinstance(preprocessor.steps[1], AddBatchDimensionProcessorStep) |
| assert isinstance(preprocessor.steps[2], DeviceProcessorStep) |
| assert isinstance(preprocessor.steps[3], NormalizerProcessorStep) |
|
|
| |
| assert len(postprocessor.steps) == 2 |
| assert isinstance(postprocessor.steps[0], UnnormalizerProcessorStep) |
| assert isinstance(postprocessor.steps[1], DeviceProcessorStep) |
|
|
|
|
| def test_sac_processor_normalization_modes(): |
| """Test that SAC processor correctly handles different normalization modes.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| observation = {OBS_STATE: torch.randn(10) * 2} |
| action = torch.rand(5) * 2 - 1 |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| |
| processed = preprocessor(batch) |
|
|
| |
| |
| |
| assert processed[OBS_STATE].shape == (1, 10) |
| assert processed[TransitionKey.ACTION.value].shape == (1, 5) |
|
|
| |
| postprocessed = postprocessor(processed[TransitionKey.ACTION.value]) |
|
|
| |
| assert postprocessed.shape == (1, 5) |
|
|
|
|
| @pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available") |
| def test_sac_processor_cuda(): |
| """Test SAC processor with CUDA device.""" |
| config = create_default_config() |
| config.device = "cuda" |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| observation = {OBS_STATE: torch.randn(10)} |
| action = torch.randn(5) |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| |
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].device.type == "cuda" |
| assert processed[TransitionKey.ACTION.value].device.type == "cuda" |
|
|
| |
| postprocessed = postprocessor(processed[TransitionKey.ACTION.value]) |
|
|
| |
| assert postprocessed.device.type == "cpu" |
|
|
|
|
| @pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available") |
| def test_sac_processor_accelerate_scenario(): |
| """Test SAC processor in simulated Accelerate scenario.""" |
| config = create_default_config() |
| config.device = "cuda:0" |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| device = torch.device("cuda:0") |
| observation = {OBS_STATE: torch.randn(10).to(device)} |
| action = torch.randn(5).to(device) |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| |
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].device == device |
| assert processed[TransitionKey.ACTION.value].device == device |
|
|
|
|
| @pytest.mark.skipif(torch.cuda.device_count() < 2, reason="Requires at least 2 GPUs") |
| def test_sac_processor_multi_gpu(): |
| """Test SAC processor with multi-GPU setup.""" |
| config = create_default_config() |
| config.device = "cuda:0" |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| device = torch.device("cuda:1") |
| observation = {OBS_STATE: torch.randn(10).to(device)} |
| action = torch.randn(5).to(device) |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| |
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].device == device |
| assert processed[TransitionKey.ACTION.value].device == device |
|
|
|
|
| def test_sac_processor_without_stats(): |
| """Test SAC processor creation without dataset statistics.""" |
| config = create_default_config() |
|
|
| preprocessor, postprocessor = make_sac_pre_post_processors(config, dataset_stats=None) |
|
|
| |
| assert preprocessor is not None |
| assert postprocessor is not None |
|
|
| |
| observation = {OBS_STATE: torch.randn(10)} |
| action = torch.randn(5) |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| processed = preprocessor(batch) |
| assert processed is not None |
|
|
|
|
| def test_sac_processor_save_and_load(): |
| """Test saving and loading SAC processor.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| with tempfile.TemporaryDirectory() as tmpdir: |
| |
| preprocessor.save_pretrained(tmpdir) |
|
|
| |
| loaded_preprocessor = DataProcessorPipeline.from_pretrained( |
| tmpdir, config_filename="policy_preprocessor.json" |
| ) |
|
|
| |
| observation = {OBS_STATE: torch.randn(10)} |
| action = torch.randn(5) |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| processed = loaded_preprocessor(batch) |
| assert processed[OBS_STATE].shape == (1, 10) |
| assert processed[TransitionKey.ACTION.value].shape == (1, 5) |
|
|
|
|
| @pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available") |
| def test_sac_processor_mixed_precision(): |
| """Test SAC processor with mixed precision.""" |
| config = create_default_config() |
| config.device = "cuda" |
| stats = create_default_stats() |
|
|
| |
| preprocessor, postprocessor = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| modified_steps = [] |
| for step in preprocessor.steps: |
| if isinstance(step, DeviceProcessorStep): |
| modified_steps.append(DeviceProcessorStep(device=config.device, float_dtype="float16")) |
| elif isinstance(step, NormalizerProcessorStep): |
| |
| norm_step = step |
| modified_steps.append( |
| NormalizerProcessorStep( |
| features=norm_step.features, |
| norm_map=norm_step.norm_map, |
| stats=norm_step.stats, |
| device=config.device, |
| dtype=torch.float16, |
| ) |
| ) |
| else: |
| modified_steps.append(step) |
| preprocessor.steps = modified_steps |
|
|
| |
| observation = {OBS_STATE: torch.randn(10, dtype=torch.float32)} |
| action = torch.randn(5, dtype=torch.float32) |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| |
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].dtype == torch.float16 |
| assert processed[TransitionKey.ACTION.value].dtype == torch.float16 |
|
|
|
|
| def test_sac_processor_batch_data(): |
| """Test SAC processor with batched data.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| batch_size = 32 |
| observation = {OBS_STATE: torch.randn(batch_size, 10)} |
| action = torch.randn(batch_size, 5) |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| |
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].shape == (batch_size, 10) |
| assert processed[TransitionKey.ACTION.value].shape == (batch_size, 5) |
|
|
|
|
| def test_sac_processor_edge_cases(): |
| """Test SAC processor with edge cases.""" |
| config = create_default_config() |
| stats = create_default_stats() |
|
|
| preprocessor, postprocessor = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| observation = {"observation.dummy": torch.randn(1)} |
| action = torch.randn(5) |
| batch = {TransitionKey.ACTION.value: action, **observation} |
| processed = preprocessor(batch) |
| |
| assert OBS_STATE not in processed |
| assert processed[TransitionKey.ACTION.value].shape == (1, 5) |
|
|
| |
| transition = create_transition(observation={OBS_STATE: torch.randn(10)}, action=torch.zeros(5)) |
| batch = transition_to_batch(transition) |
| processed = preprocessor(batch) |
| assert processed[OBS_STATE].shape == (1, 10) |
| |
| assert processed[TransitionKey.ACTION.value].shape == (1, 5) |
|
|
|
|
| @pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available") |
| def test_sac_processor_bfloat16_device_float32_normalizer(): |
| """Test: DeviceProcessor(bfloat16) + NormalizerProcessor(float32) → output bfloat16 via automatic adaptation""" |
| config = create_default_config() |
| config.device = "cuda" |
| stats = create_default_stats() |
|
|
| preprocessor, _ = make_sac_pre_post_processors( |
| config, |
| stats, |
| ) |
|
|
| |
| modified_steps = [] |
| for step in preprocessor.steps: |
| if isinstance(step, DeviceProcessorStep): |
| |
| modified_steps.append(DeviceProcessorStep(device=config.device, float_dtype="bfloat16")) |
| elif isinstance(step, NormalizerProcessorStep): |
| |
| norm_step = step |
| modified_steps.append( |
| NormalizerProcessorStep( |
| features=norm_step.features, |
| norm_map=norm_step.norm_map, |
| stats=norm_step.stats, |
| device=config.device, |
| dtype=torch.float32, |
| ) |
| ) |
| else: |
| modified_steps.append(step) |
| preprocessor.steps = modified_steps |
|
|
| |
| normalizer_step = preprocessor.steps[3] |
| assert normalizer_step.dtype == torch.float32 |
|
|
| |
| observation = {OBS_STATE: torch.randn(10, dtype=torch.float32)} |
| action = torch.randn(5, dtype=torch.float32) |
| transition = create_transition(observation, action) |
| batch = transition_to_batch(transition) |
|
|
| |
| processed = preprocessor(batch) |
|
|
| |
| assert processed[OBS_STATE].dtype == torch.bfloat16 |
| assert processed[TransitionKey.ACTION.value].dtype == torch.bfloat16 |
|
|
| |
| assert normalizer_step.dtype == torch.bfloat16 |
| for stat_tensor in normalizer_step._tensor_stats[OBS_STATE].values(): |
| assert stat_tensor.dtype == torch.bfloat16 |
|
|