refactor(pipeline): enforce ProcessorStep inheritance for pipeline steps (#1862)

- Updated the DataProcessorPipeline to require that all steps inherit from ProcessorStep, enhancing type safety and clarity. - Adjusted tests to utilize a MockTokenizerProcessorStep that adheres to the ProcessorStep interface, ensuring consistent behavior across tests. - Refactored various mock step classes in tests to inherit from ProcessorStep for improved consistency and maintainability.
2026-05-15 16:49:55 +00:00 · 2025-09-04 16:22:03 +02:00
parent fc43246942
commit 332ca4ccc5
4 changed files with 85 additions and 38 deletions
@@ -30,13 +30,31 @@ from lerobot.policies.smolvla.processor_smolvla import (
 from lerobot.processor import (
    AddBatchDimensionProcessorStep,
    DeviceProcessorStep,
+    EnvTransition,
    NormalizerProcessorStep,
+    ProcessorStep,
    RenameProcessorStep,
    TransitionKey,
    UnnormalizerProcessorStep,
 )


+class MockTokenizerProcessorStep(ProcessorStep):
+    """Mock tokenizer processor step for testing."""
+
+    def __init__(self, *args, **kwargs):
+        # Accept any arguments to mimic the real TokenizerProcessorStep interface
+        pass
+
+    def __call__(self, transition: EnvTransition) -> EnvTransition:
+        # Pass through transition unchanged
+        return transition
+
+    def transform_features(self, features):
+        # Pass through features unchanged
+        return features
+
+
 def create_transition(observation=None, action=None, **kwargs):
    """Helper function to create a transition dictionary."""
    transition = {}
@@ -88,7 +106,9 @@ def test_make_smolvla_processor_basic():
    config = create_default_config()
    stats = create_default_stats()

-    with patch("lerobot.policies.smolvla.processor_smolvla.TokenizerProcessorStep"):
+    with patch(
+        "lerobot.policies.smolvla.processor_smolvla.TokenizerProcessorStep", MockTokenizerProcessorStep
+    ):
        preprocessor, postprocessor = make_smolvla_pre_post_processors(
            config,
            stats,
@@ -170,7 +190,7 @@ def test_smolvla_processor_cuda():
    stats = create_default_stats()

    # Mock the tokenizer processor to act as pass-through
-    class MockTokenizerProcessorStep:
+    class MockTokenizerProcessorStep(ProcessorStep):
        def __init__(self, *args, **kwargs):
            pass

@@ -227,7 +247,7 @@ def test_smolvla_processor_accelerate_scenario():
    stats = create_default_stats()

    # Mock the tokenizer processor to act as pass-through
-    class MockTokenizerProcessorStep:
+    class MockTokenizerProcessorStep(ProcessorStep):
        def __init__(self, *args, **kwargs):
            pass

@@ -285,7 +305,7 @@ def test_smolvla_processor_multi_gpu():
    stats = create_default_stats()

    # Mock the tokenizer processor to act as pass-through
-    class MockTokenizerProcessorStep:
+    class MockTokenizerProcessorStep(ProcessorStep):
        def __init__(self, *args, **kwargs):
            pass

@@ -340,7 +360,9 @@ def test_smolvla_processor_without_stats():
    config = create_default_config()

    # Mock the tokenizer processor
-    with patch("lerobot.policies.smolvla.processor_smolvla.TokenizerProcessorStep"):
+    with patch(
+        "lerobot.policies.smolvla.processor_smolvla.TokenizerProcessorStep", MockTokenizerProcessorStep
+    ):
        preprocessor, postprocessor = make_smolvla_pre_post_processors(
            config,
            dataset_stats=None,