| |
|
|
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| """Tests for VQBeT policy processor.""" |
|
|
| import tempfile |
|
|
| import pytest |
| import torch |
|
|
| from lerobot.configs.types import FeatureType, NormalizationMode, PolicyFeature |
| from lerobot.policies.vqbet.configuration_vqbet import VQBeTConfig |
| from lerobot.policies.vqbet.processor_vqbet import make_vqbet_pre_post_processors |
| from lerobot.processor import ( |
| AddBatchDimensionProcessorStep, |
| DataProcessorPipeline, |
| DeviceProcessorStep, |
| NormalizerProcessorStep, |
| RenameObservationsProcessorStep, |
| TransitionKey, |
| UnnormalizerProcessorStep, |
| ) |
| from lerobot.processor.converters import create_transition, transition_to_batch |
| from lerobot.utils.constants import ACTION, OBS_IMAGE, OBS_STATE |
|
|
|
|
def create_default_config():
    """Build the VQBeT configuration shared by the tests in this module.

    Returns:
        A ``VQBeTConfig`` on the ``"cpu"`` device with an 8-element state input,
        a 3x224x224 image input and a 7-element action output. State uses
        mean/std normalization, images are left as-is (identity) and actions
        use min/max normalization.
    """
    cfg = VQBeTConfig()

    # Inputs: one proprioceptive state vector and one RGB image.
    state_feature = PolicyFeature(type=FeatureType.STATE, shape=(8,))
    image_feature = PolicyFeature(type=FeatureType.VISUAL, shape=(3, 224, 224))
    cfg.input_features = {OBS_STATE: state_feature, OBS_IMAGE: image_feature}

    # Output: a single action vector.
    action_feature = PolicyFeature(type=FeatureType.ACTION, shape=(7,))
    cfg.output_features = {ACTION: action_feature}

    # One normalization mode per feature type.
    cfg.normalization_mapping = {
        FeatureType.STATE: NormalizationMode.MEAN_STD,
        FeatureType.VISUAL: NormalizationMode.IDENTITY,
        FeatureType.ACTION: NormalizationMode.MIN_MAX,
    }

    cfg.device = "cpu"
    return cfg
|
|
|
|
def create_default_stats():
    """Build the dataset statistics used together with the default test config.

    Returns:
        A dict keyed by feature name: zero mean / unit std for the 8-element
        state, an empty dict for the image, and a [-1, 1] min/max range for the
        7-element action.
    """
    state_stats = {"mean": torch.zeros(8), "std": torch.ones(8)}
    action_stats = {"min": torch.full((7,), -1.0), "max": torch.ones(7)}

    stats = {}
    stats[OBS_STATE] = state_stats
    # The image entry is present but carries no statistics.
    stats[OBS_IMAGE] = {}
    stats[ACTION] = action_stats
    return stats
|
|
|
|
def test_make_vqbet_processor_basic():
    """Check the names and the step layout of freshly built VQBeT processors."""
    preprocessor, postprocessor = make_vqbet_pre_post_processors(
        create_default_config(),
        create_default_stats(),
    )

    # Both pipelines carry fixed, well-known names.
    assert preprocessor.name == "policy_preprocessor"
    assert postprocessor.name == "policy_postprocessor"

    # Preprocessor: rename -> add batch dim -> move to device -> normalize.
    expected_pre_steps = (
        RenameObservationsProcessorStep,
        AddBatchDimensionProcessorStep,
        DeviceProcessorStep,
        NormalizerProcessorStep,
    )
    assert len(preprocessor.steps) == 4
    for position, step_type in enumerate(expected_pre_steps):
        assert isinstance(preprocessor.steps[position], step_type)

    # Postprocessor: unnormalize -> move to device.
    expected_post_steps = (UnnormalizerProcessorStep, DeviceProcessorStep)
    assert len(postprocessor.steps) == 2
    for position, step_type in enumerate(expected_post_steps):
        assert isinstance(postprocessor.steps[position], step_type)
|
|
|
|
def test_vqbet_processor_with_images():
    """Run an unbatched state + image + action sample through the preprocessor.

    Every tensor is expected to come back with a leading batch dimension of 1.
    """
    config = create_default_config()
    stats = create_default_stats()

    # Only the preprocessor is exercised here, so the postprocessor is discarded.
    preprocessor, _ = make_vqbet_pre_post_processors(config, stats)

    # A single, unbatched sample.
    observation = {
        OBS_STATE: torch.randn(8),
        OBS_IMAGE: torch.randn(3, 224, 224),
    }
    action = torch.randn(7)
    batch = transition_to_batch(create_transition(observation, action))

    processed = preprocessor(batch)

    # A batch dimension of size 1 has been prepended to every entry.
    assert processed[OBS_STATE].shape == (1, 8)
    assert processed[OBS_IMAGE].shape == (1, 3, 224, 224)
    assert processed[TransitionKey.ACTION.value].shape == (1, 7)
|
|
|
|
@pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available")
def test_vqbet_processor_cuda():
    """Check device placement when the config targets CUDA.

    CPU inputs are expected on a CUDA device after preprocessing, and the
    postprocessed action is expected back on the CPU.
    """
    cfg = create_default_config()
    cfg.device = "cuda"
    pre, post = make_vqbet_pre_post_processors(cfg, create_default_stats())

    # Inputs start out on the CPU.
    obs = {
        OBS_STATE: torch.randn(8),
        OBS_IMAGE: torch.randn(3, 224, 224),
    }
    act = torch.randn(7)
    batch = transition_to_batch(create_transition(obs, act))

    processed = pre(batch)

    # Everything the preprocessor returns lives on a CUDA device.
    action_key = TransitionKey.ACTION.value
    for key in (OBS_STATE, OBS_IMAGE, action_key):
        assert processed[key].device.type == "cuda"

    # The postprocessor is fed the preprocessed action tensor directly.
    postprocessed = post(processed[action_key])
    assert postprocessed.device.type == "cpu"
|
|
|
|
@pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available")
def test_vqbet_processor_accelerate_scenario():
    """Feed the preprocessor data that is already batched and already on the GPU.

    This mimics a setup where tensors arrive on ``cuda:0`` before the pipeline
    runs; the outputs are expected to stay on that same device.
    """
    config = create_default_config()
    config.device = "cuda:0"
    stats = create_default_stats()

    # Only the preprocessor is exercised here, so the postprocessor is discarded.
    preprocessor, _ = make_vqbet_pre_post_processors(config, stats)

    # Inputs are created with a batch dimension and moved to the GPU up front.
    device = torch.device("cuda:0")
    observation = {
        OBS_STATE: torch.randn(1, 8).to(device),
        OBS_IMAGE: torch.randn(1, 3, 224, 224).to(device),
    }
    action = torch.randn(1, 7).to(device)
    batch = transition_to_batch(create_transition(observation, action))

    processed = preprocessor(batch)

    # Nothing was moved off the device the data arrived on.
    assert processed[OBS_STATE].device == device
    assert processed[OBS_IMAGE].device == device
    assert processed[TransitionKey.ACTION.value].device == device
|
|
|
|
@pytest.mark.skipif(torch.cuda.device_count() < 2, reason="Requires at least 2 GPUs")
def test_vqbet_processor_multi_gpu():
    """Check that data already on a second GPU is not pulled onto the configured one.

    The config targets ``cuda:0`` while the inputs live on ``cuda:1``; the
    assertions require the processed tensors to remain on ``cuda:1``.
    """
    config = create_default_config()
    config.device = "cuda:0"
    stats = create_default_stats()

    # Only the preprocessor is exercised here, so the postprocessor is discarded.
    preprocessor, _ = make_vqbet_pre_post_processors(config, stats)

    # Deliberately place the inputs on a different GPU than the configured one.
    device = torch.device("cuda:1")
    observation = {
        OBS_STATE: torch.randn(1, 8).to(device),
        OBS_IMAGE: torch.randn(1, 3, 224, 224).to(device),
    }
    action = torch.randn(1, 7).to(device)
    batch = transition_to_batch(create_transition(observation, action))

    processed = preprocessor(batch)

    # The tensors are still on cuda:1, not on the configured cuda:0.
    assert processed[OBS_STATE].device == device
    assert processed[OBS_IMAGE].device == device
    assert processed[TransitionKey.ACTION.value].device == device
|
|
|
|
def test_vqbet_processor_without_stats():
    """Build the processors with ``dataset_stats=None`` and run one sample through."""
    cfg = create_default_config()
    pre, post = make_vqbet_pre_post_processors(cfg, dataset_stats=None)

    # Construction succeeds even though no statistics were supplied.
    assert pre is not None
    assert post is not None

    # The preprocessor can still be called on an unbatched sample.
    obs = {
        OBS_STATE: torch.randn(8),
        OBS_IMAGE: torch.randn(3, 224, 224),
    }
    act = torch.randn(7)
    sample = transition_to_batch(create_transition(obs, act))

    output = pre(sample)
    assert output is not None
|
|
|
|
def test_vqbet_processor_save_and_load():
    """Round-trip the preprocessor through ``save_pretrained`` / ``from_pretrained``.

    The reloaded pipeline is run on an unbatched sample and must yield the same
    batched shapes that a freshly built preprocessor is expected to produce.
    """
    config = create_default_config()
    stats = create_default_stats()

    # Only the preprocessor is saved and reloaded, so the postprocessor is discarded.
    preprocessor, _ = make_vqbet_pre_post_processors(config, stats)

    with tempfile.TemporaryDirectory() as tmpdir:
        preprocessor.save_pretrained(tmpdir)

        loaded_preprocessor = DataProcessorPipeline.from_pretrained(
            tmpdir, config_filename="policy_preprocessor.json"
        )

        # The reloaded pipeline is used while the temporary directory still exists.
        observation = {
            OBS_STATE: torch.randn(8),
            OBS_IMAGE: torch.randn(3, 224, 224),
        }
        action = torch.randn(7)
        batch = transition_to_batch(create_transition(observation, action))

        processed = loaded_preprocessor(batch)
        assert processed[OBS_STATE].shape == (1, 8)
        assert processed[OBS_IMAGE].shape == (1, 3, 224, 224)
        assert processed[TransitionKey.ACTION.value].shape == (1, 7)
|
|
|
|
@pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available")
def test_vqbet_processor_mixed_precision():
    """Run the preprocessor with float16 device and normalizer steps.

    The device and normalizer steps of the default pipeline are swapped for
    float16 variants; float32 inputs are then expected to come out as float16.
    """
    config = create_default_config()
    config.device = "cuda"
    stats = create_default_stats()

    # Only the preprocessor is exercised here, so the postprocessor is discarded.
    preprocessor, _ = make_vqbet_pre_post_processors(config, stats)

    def _as_float16(step):
        """Return a float16 replacement for device/normalizer steps, else the step itself."""
        if isinstance(step, DeviceProcessorStep):
            return DeviceProcessorStep(device=config.device, float_dtype="float16")
        if isinstance(step, NormalizerProcessorStep):
            # Rebuild the normalizer from the existing step's own settings.
            return NormalizerProcessorStep(
                features=step.features,
                norm_map=step.norm_map,
                stats=step.stats,
                device=config.device,
                dtype=torch.float16,
            )
        return step

    preprocessor.steps = [_as_float16(step) for step in preprocessor.steps]

    # Inputs are explicitly float32 so the dtype change is observable.
    observation = {
        OBS_STATE: torch.randn(8, dtype=torch.float32),
        OBS_IMAGE: torch.randn(3, 224, 224, dtype=torch.float32),
    }
    action = torch.randn(7, dtype=torch.float32)
    batch = transition_to_batch(create_transition(observation, action))

    processed = preprocessor(batch)

    assert processed[OBS_STATE].dtype == torch.float16
    assert processed[OBS_IMAGE].dtype == torch.float16
    assert processed[TransitionKey.ACTION.value].dtype == torch.float16
|
|
|
|
def test_vqbet_processor_large_batch():
    """Run an already-batched input of 128 samples through the preprocessor.

    The output shapes are expected to equal the input shapes, i.e. no extra
    batch dimension is added to data that already has one.
    """
    config = create_default_config()
    stats = create_default_stats()

    # Only the preprocessor is exercised here, so the postprocessor is discarded.
    preprocessor, _ = make_vqbet_pre_post_processors(config, stats)

    batch_size = 128
    observation = {
        OBS_STATE: torch.randn(batch_size, 8),
        OBS_IMAGE: torch.randn(batch_size, 3, 224, 224),
    }
    action = torch.randn(batch_size, 7)
    batch = transition_to_batch(create_transition(observation, action))

    processed = preprocessor(batch)

    # The leading dimension is still the original batch size.
    assert processed[OBS_STATE].shape == (batch_size, 8)
    assert processed[OBS_IMAGE].shape == (batch_size, 3, 224, 224)
    assert processed[TransitionKey.ACTION.value].shape == (batch_size, 7)
|
|
|
|
def test_vqbet_processor_sequential_processing():
    """Call the same preprocessor five times in a row on fresh unbatched samples.

    Each call's output is collected and checked afterwards, so a later call
    cannot hide a problem in an earlier result.
    """
    config = create_default_config()
    stats = create_default_stats()

    # Only the preprocessor is exercised here, so the postprocessor is discarded.
    preprocessor, _ = make_vqbet_pre_post_processors(config, stats)

    results = []
    for _step in range(5):
        observation = {
            OBS_STATE: torch.randn(8),
            OBS_IMAGE: torch.randn(3, 224, 224),
        }
        action = torch.randn(7)
        batch = transition_to_batch(create_transition(observation, action))
        results.append(preprocessor(batch))

    # Every one of the five outputs has a batch dimension of 1.
    for result in results:
        assert result[OBS_STATE].shape == (1, 8)
        assert result[OBS_IMAGE].shape == (1, 3, 224, 224)
        assert result[TransitionKey.ACTION.value].shape == (1, 7)
|
|
|
|
@pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available")
def test_vqbet_processor_bfloat16_device_float32_normalizer():
    """Combine a bfloat16 device step with a normalizer configured as float32.

    The outputs are expected to be bfloat16, and after the call the normalizer
    itself (its ``dtype`` and its state statistics tensors) is expected to have
    switched from float32 to bfloat16.
    """
    cfg = create_default_config()
    cfg.device = "cuda"
    pre, _ = make_vqbet_pre_post_processors(cfg, create_default_stats())

    def _swap(step):
        """Replace device/normalizer steps with the dtype-mismatched variants."""
        if isinstance(step, DeviceProcessorStep):
            # The device step converts floats to bfloat16.
            return DeviceProcessorStep(device=cfg.device, float_dtype="bfloat16")
        if isinstance(step, NormalizerProcessorStep):
            # The normalizer is deliberately configured with a different dtype.
            return NormalizerProcessorStep(
                features=step.features,
                norm_map=step.norm_map,
                stats=step.stats,
                device=cfg.device,
                dtype=torch.float32,
            )
        return step

    pre.steps = [_swap(step) for step in pre.steps]

    # Before any data flows through, the normalizer still reports float32.
    normalizer_step = pre.steps[3]
    assert normalizer_step.dtype == torch.float32

    obs = {
        OBS_STATE: torch.randn(8, dtype=torch.float32),
        OBS_IMAGE: torch.randn(3, 224, 224, dtype=torch.float32),
    }
    act = torch.randn(7, dtype=torch.float32)
    processed = pre(transition_to_batch(create_transition(obs, act)))

    # All outputs come out as bfloat16.
    for key in (OBS_STATE, OBS_IMAGE, TransitionKey.ACTION.value):
        assert processed[key].dtype == torch.bfloat16

    # The normalizer has adopted the incoming dtype, including its state statistics.
    assert normalizer_step.dtype == torch.bfloat16
    for stat_tensor in normalizer_step._tensor_stats[OBS_STATE].values():
        assert stat_tensor.dtype == torch.bfloat16
| |
|
|