pi05-so100-diverse / lerobot /tests /processor /test_diffusion_processor.py

bot

Update lerobot to latest with SO100 rename_map fix

a8eb6e5 about 2 months ago

13.9 kB

	#!/usr/bin/env python

	# Copyright 2025 The HuggingFace Inc. team. All rights reserved.
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.
	"""Tests for Diffusion policy processor."""

	import tempfile

	import pytest
	import torch

	from lerobot.configs.types import FeatureType, NormalizationMode, PolicyFeature
	from lerobot.policies.diffusion.configuration_diffusion import DiffusionConfig
	from lerobot.policies.diffusion.processor_diffusion import make_diffusion_pre_post_processors
	from lerobot.processor import (
	AddBatchDimensionProcessorStep,
	DataProcessorPipeline,
	DeviceProcessorStep,
	NormalizerProcessorStep,
	RenameObservationsProcessorStep,
	TransitionKey,
	UnnormalizerProcessorStep,
	)
	from lerobot.processor.converters import create_transition, transition_to_batch
	from lerobot.utils.constants import ACTION, OBS_IMAGE, OBS_STATE


	def create_default_config():
	"""Create a default Diffusion configuration for testing."""
	config = DiffusionConfig()
	config.input_features = {
	OBS_STATE: PolicyFeature(type=FeatureType.STATE, shape=(7,)),
	OBS_IMAGE: PolicyFeature(type=FeatureType.VISUAL, shape=(3, 224, 224)),
	}
	config.output_features = {
	ACTION: PolicyFeature(type=FeatureType.ACTION, shape=(6,)),
	}
	config.normalization_mapping = {
	FeatureType.STATE: NormalizationMode.MEAN_STD,
	FeatureType.VISUAL: NormalizationMode.IDENTITY,
	FeatureType.ACTION: NormalizationMode.MIN_MAX,
	}
	config.device = "cpu"
	return config


	def create_default_stats():
	"""Create default dataset statistics for testing."""
	return {
	OBS_STATE: {"mean": torch.zeros(7), "std": torch.ones(7)},
	OBS_IMAGE: {}, # No normalization for images
	ACTION: {"min": torch.full((6,), -1.0), "max": torch.ones(6)},
	}


	def test_make_diffusion_processor_basic():
	"""Test basic creation of Diffusion processor."""
	config = create_default_config()
	stats = create_default_stats()

	preprocessor, postprocessor = make_diffusion_pre_post_processors(config, stats)

	# Check processor names
	assert preprocessor.name == "policy_preprocessor"
	assert postprocessor.name == "policy_postprocessor"

	# Check steps in preprocessor
	assert len(preprocessor.steps) == 4
	assert isinstance(preprocessor.steps[0], RenameObservationsProcessorStep)
	assert isinstance(preprocessor.steps[1], AddBatchDimensionProcessorStep)
	assert isinstance(preprocessor.steps[2], DeviceProcessorStep)
	assert isinstance(preprocessor.steps[3], NormalizerProcessorStep)

	# Check steps in postprocessor
	assert len(postprocessor.steps) == 2
	assert isinstance(postprocessor.steps[0], UnnormalizerProcessorStep)
	assert isinstance(postprocessor.steps[1], DeviceProcessorStep)


	def test_diffusion_processor_with_images():
	"""Test Diffusion processor with image observations."""
	config = create_default_config()
	stats = create_default_stats()

	preprocessor, postprocessor = make_diffusion_pre_post_processors(
	config,
	stats,
	)

	# Create test data with images
	observation = {
	OBS_STATE: torch.randn(7),
	OBS_IMAGE: torch.randn(3, 224, 224),
	}
	action = torch.randn(6)
	transition = create_transition(observation, action)

	batch = transition_to_batch(transition)

	# Process through preprocessor

	processed = preprocessor(batch)

	# Check that data is batched
	assert processed[OBS_STATE].shape == (1, 7)
	assert processed[OBS_IMAGE].shape == (1, 3, 224, 224)
	assert processed[TransitionKey.ACTION.value].shape == (1, 6)


	@pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available")
	def test_diffusion_processor_cuda():
	"""Test Diffusion processor with CUDA device."""
	config = create_default_config()
	config.device = "cuda"
	stats = create_default_stats()

	preprocessor, postprocessor = make_diffusion_pre_post_processors(
	config,
	stats,
	)

	# Create CPU data
	observation = {
	OBS_STATE: torch.randn(7),
	OBS_IMAGE: torch.randn(3, 224, 224),
	}
	action = torch.randn(6)
	transition = create_transition(observation, action)

	batch = transition_to_batch(transition)

	# Process through preprocessor

	processed = preprocessor(batch)

	# Check that data is on CUDA
	assert processed[OBS_STATE].device.type == "cuda"
	assert processed[OBS_IMAGE].device.type == "cuda"
	assert processed[TransitionKey.ACTION.value].device.type == "cuda"

	# Process through postprocessor
	postprocessed = postprocessor(processed[TransitionKey.ACTION.value])

	# Check that action is back on CPU
	assert postprocessed.device.type == "cpu"


	@pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available")
	def test_diffusion_processor_accelerate_scenario():
	"""Test Diffusion processor in simulated Accelerate scenario."""
	config = create_default_config()
	config.device = "cuda:0"
	stats = create_default_stats()

	preprocessor, postprocessor = make_diffusion_pre_post_processors(
	config,
	stats,
	)

	# Simulate Accelerate: data already on GPU
	device = torch.device("cuda:0")
	observation = {
	OBS_STATE: torch.randn(1, 7).to(device),
	OBS_IMAGE: torch.randn(1, 3, 224, 224).to(device),
	}
	action = torch.randn(1, 6).to(device)
	transition = create_transition(observation, action)

	batch = transition_to_batch(transition)

	# Process through preprocessor

	processed = preprocessor(batch)

	# Check that data stays on same GPU
	assert processed[OBS_STATE].device == device
	assert processed[OBS_IMAGE].device == device
	assert processed[TransitionKey.ACTION.value].device == device


	@pytest.mark.skipif(torch.cuda.device_count() < 2, reason="Requires at least 2 GPUs")
	def test_diffusion_processor_multi_gpu():
	"""Test Diffusion processor with multi-GPU setup."""
	config = create_default_config()
	config.device = "cuda:0"
	stats = create_default_stats()

	preprocessor, postprocessor = make_diffusion_pre_post_processors(config, stats)

	# Simulate data on different GPU
	device = torch.device("cuda:1")
	observation = {
	OBS_STATE: torch.randn(1, 7).to(device),
	OBS_IMAGE: torch.randn(1, 3, 224, 224).to(device),
	}
	action = torch.randn(1, 6).to(device)
	transition = create_transition(observation, action)

	batch = transition_to_batch(transition)

	# Process through preprocessor

	processed = preprocessor(batch)

	# Check that data stays on cuda:1
	assert processed[OBS_STATE].device == device
	assert processed[OBS_IMAGE].device == device
	assert processed[TransitionKey.ACTION.value].device == device


	def test_diffusion_processor_without_stats():
	"""Test Diffusion processor creation without dataset statistics."""
	config = create_default_config()

	preprocessor, postprocessor = make_diffusion_pre_post_processors(
	config,
	dataset_stats=None,
	)

	# Should still create processors
	assert preprocessor is not None
	assert postprocessor is not None

	# Process should still work
	observation = {
	OBS_STATE: torch.randn(7),
	OBS_IMAGE: torch.randn(3, 224, 224),
	}
	action = torch.randn(6)
	transition = create_transition(observation, action)

	batch = transition_to_batch(transition)

	processed = preprocessor(batch)
	assert processed is not None


	def test_diffusion_processor_save_and_load():
	"""Test saving and loading Diffusion processor."""
	config = create_default_config()
	stats = create_default_stats()

	preprocessor, postprocessor = make_diffusion_pre_post_processors(config, stats)

	with tempfile.TemporaryDirectory() as tmpdir:
	# Save preprocessor
	preprocessor.save_pretrained(tmpdir)

	# Load preprocessor
	loaded_preprocessor = DataProcessorPipeline.from_pretrained(
	tmpdir, config_filename="policy_preprocessor.json"
	)

	# Test that loaded processor works
	observation = {
	OBS_STATE: torch.randn(7),
	OBS_IMAGE: torch.randn(3, 224, 224),
	}
	action = torch.randn(6)
	transition = create_transition(observation, action)
	batch = transition_to_batch(transition)

	processed = loaded_preprocessor(batch)
	assert processed[OBS_STATE].shape == (1, 7)
	assert processed[OBS_IMAGE].shape == (1, 3, 224, 224)
	assert processed[TransitionKey.ACTION.value].shape == (1, 6)


	def test_diffusion_processor_identity_normalization():
	"""Test that images with IDENTITY normalization are not normalized."""
	config = create_default_config()
	stats = create_default_stats()

	preprocessor, postprocessor = make_diffusion_pre_post_processors(
	config,
	stats,
	)

	# Create test data
	image_value = torch.rand(3, 224, 224) * 255 # Large values
	observation = {
	OBS_STATE: torch.randn(7),
	OBS_IMAGE: image_value.clone(),
	}
	action = torch.randn(6)
	transition = create_transition(observation, action)

	batch = transition_to_batch(transition)

	# Process through preprocessor

	processed = preprocessor(batch)

	# Image should not be normalized (IDENTITY mode)
	# Just batched
	assert torch.allclose(processed[OBS_IMAGE][0], image_value, rtol=1e-5)


	def test_diffusion_processor_batch_consistency():
	"""Test Diffusion processor with different batch sizes."""
	config = create_default_config()
	stats = create_default_stats()

	preprocessor, postprocessor = make_diffusion_pre_post_processors(
	config,
	stats,
	)

	# Test with different batch sizes
	for batch_size in [1, 8, 32]:
	observation = {
	OBS_STATE: torch.randn(batch_size, 7) if batch_size > 1 else torch.randn(7),
	OBS_IMAGE: torch.randn(batch_size, 3, 224, 224) if batch_size > 1 else torch.randn(3, 224, 224),
	}
	action = torch.randn(batch_size, 6) if batch_size > 1 else torch.randn(6)
	transition = create_transition(observation, action)

	batch = transition_to_batch(transition)

	processed = preprocessor(batch)

	# Check correct batch size
	expected_batch = batch_size if batch_size > 1 else 1
	assert processed[OBS_STATE].shape[0] == expected_batch
	assert processed[OBS_IMAGE].shape[0] == expected_batch
	assert processed[TransitionKey.ACTION.value].shape[0] == expected_batch


	@pytest.mark.skipif(not torch.cuda.is_available(), reason="CUDA not available")
	def test_diffusion_processor_bfloat16_device_float32_normalizer():
	"""Test: DeviceProcessor(bfloat16) + NormalizerProcessor(float32) → output bfloat16 via automatic adaptation"""
	config = create_default_config()
	config.device = "cuda"
	stats = create_default_stats()

	preprocessor, _ = make_diffusion_pre_post_processors(config, stats)

	# Modify the pipeline to use bfloat16 device processor with float32 normalizer
	modified_steps = []
	for step in preprocessor.steps:
	if isinstance(step, DeviceProcessorStep):
	# Device processor converts to bfloat16
	modified_steps.append(DeviceProcessorStep(device=config.device, float_dtype="bfloat16"))
	elif isinstance(step, NormalizerProcessorStep):
	# Normalizer stays configured as float32 (will auto-adapt to bfloat16)
	norm_step = step # Now type checker knows this is NormalizerProcessorStep
	modified_steps.append(
	NormalizerProcessorStep(
	features=norm_step.features,
	norm_map=norm_step.norm_map,
	stats=norm_step.stats,
	device=config.device,
	dtype=torch.float32, # Deliberately configured as float32
	)
	)
	else:
	modified_steps.append(step)
	preprocessor.steps = modified_steps

	# Verify initial normalizer configuration
	normalizer_step = preprocessor.steps[3] # NormalizerProcessorStep
	assert normalizer_step.dtype == torch.float32

	# Create test data with both state and visual observations
	observation = {
	OBS_STATE: torch.randn(7, dtype=torch.float32),
	OBS_IMAGE: torch.randn(3, 224, 224, dtype=torch.float32),
	}
	action = torch.randn(6, dtype=torch.float32)
	transition = create_transition(observation, action)

	batch = transition_to_batch(transition)

	# Process through full pipeline
	processed = preprocessor(batch)

	# Verify: DeviceProcessor → bfloat16, NormalizerProcessor adapts → final output is bfloat16
	assert processed[OBS_STATE].dtype == torch.bfloat16
	assert processed[OBS_IMAGE].dtype == torch.bfloat16 # IDENTITY normalization still gets dtype conversion
	assert processed[TransitionKey.ACTION.value].dtype == torch.bfloat16

	# Verify normalizer automatically adapted its internal state
	assert normalizer_step.dtype == torch.bfloat16
	# Check state stats (has normalization)
	for stat_tensor in normalizer_step._tensor_stats[OBS_STATE].values():
	assert stat_tensor.dtype == torch.bfloat16
	# OBS_IMAGE uses IDENTITY normalization, so no stats to check