Compare commits


2 Commits

Author      SHA1        Message                                                                                 Date
Sayak Paul  d500bb94e7  Merge branch 'main' into alert-autofix-2150                                             2026-03-09 15:57:20 +05:30
Dhruv Nair  ee0d4ed02d  Potential fix for code scanning alert no. 2150: Workflow does not contain permissions   2026-03-09 10:08:14 +05:30
                        Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com>
3 changed files with 73 additions and 58 deletions

View File

@@ -16,9 +16,6 @@ on:
     branches:
       - ci-*
 
-permissions:
-  contents: read
-
 concurrency:
   group: ${{ github.workflow }}-${{ github.head_ref || github.run_id }}
   cancel-in-progress: true

View File

@@ -1,5 +1,8 @@
 name: Fast GPU Tests on PR
 
+permissions:
+  contents: read
+
 on:
   pull_request:
     branches: main

View File

@@ -14,15 +14,16 @@
 import contextlib
 import gc
 import logging
+import unittest
 
-import pytest
 import torch
+from parameterized import parameterized
 
 from diffusers import AutoencoderKL
 from diffusers.hooks import HookRegistry, ModelHook
 from diffusers.models import ModelMixin
 from diffusers.pipelines.pipeline_utils import DiffusionPipeline
 from diffusers.utils import get_logger
 from diffusers.utils.import_utils import compare_versions
 
 from ..testing_utils import (
@@ -218,18 +219,20 @@ class NestedContainer(torch.nn.Module):
 @require_torch_accelerator
-class TestGroupOffload:
+class GroupOffloadTests(unittest.TestCase):
     in_features = 64
     hidden_features = 256
     out_features = 64
     num_layers = 4
 
-    def setup_method(self):
+    def setUp(self):
         with torch.no_grad():
             self.model = self.get_model()
             self.input = torch.randn((4, self.in_features)).to(torch_device)
 
-    def teardown_method(self):
+    def tearDown(self):
+        super().tearDown()
         del self.model
         del self.input
         gc.collect()
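The hunk above swaps pytest's per-test hooks (setup_method / teardown_method on a plain class) for unittest's setUp / tearDown on a TestCase subclass, and adds a super().tearDown() call. As a minimal sketch of the two conventions, using a hypothetical toy class rather than the diffusers model under test:

import unittest


class ToyGroupOffloadTests(unittest.TestCase):
    # unittest calls setUp before and tearDown after every test method.
    def setUp(self):
        self.model = [0.0] * 4  # hypothetical stand-in for self.get_model()

    def tearDown(self):
        super().tearDown()  # mirrors the super().tearDown() call added in the diff
        del self.model

    def test_model_exists(self):
        self.assertEqual(len(self.model), 4)


if __name__ == "__main__":
    unittest.main()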
@@ -245,20 +248,18 @@ class TestGroupOffload:
             num_layers=self.num_layers,
         )
 
-    @pytest.mark.skipif(
-        torch.device(torch_device).type not in ["cuda", "xpu"],
-        reason="Test requires a CUDA or XPU device.",
-    )
     def test_offloading_forward_pass(self):
         @torch.no_grad()
         def run_forward(model):
             gc.collect()
             backend_empty_cache(torch_device)
             backend_reset_peak_memory_stats(torch_device)
-            assert all(
-                module._diffusers_hook.get_hook("group_offloading") is not None
-                for module in model.modules()
-                if hasattr(module, "_diffusers_hook")
+            self.assertTrue(
+                all(
+                    module._diffusers_hook.get_hook("group_offloading") is not None
+                    for module in model.modules()
+                    if hasattr(module, "_diffusers_hook")
+                )
             )
             model.eval()
             output = model(self.input)[0].cpu()
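The bare assert over the hook generator becomes self.assertTrue(all(...)). One practical difference: plain assert statements are stripped when Python runs with -O, while TestCase assertions always execute and report through the test runner. A small sketch of the equivalence, with toy data standing in for the diffusers hook registry:

import unittest


class AssertStyleTests(unittest.TestCase):
    def test_all_modules_hooked(self):
        # Hypothetical stand-in for "every module with _diffusers_hook carries the group_offloading hook".
        hooks = {"block_1": "group_offloading", "block_2": "group_offloading"}

        # pytest style (dropped by `python -O`, message-less on failure):
        assert all(v is not None for v in hooks.values())

        # unittest style, as used after this change:
        self.assertTrue(all(v is not None for v in hooks.values()))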
@@ -290,37 +291,41 @@ class TestGroupOffload:
         output_with_group_offloading5, mem5 = run_forward(model)
 
         # Precision assertions - offloading should not impact the output
-        assert torch.allclose(output_without_group_offloading, output_with_group_offloading1, atol=1e-5)
-        assert torch.allclose(output_without_group_offloading, output_with_group_offloading2, atol=1e-5)
-        assert torch.allclose(output_without_group_offloading, output_with_group_offloading3, atol=1e-5)
-        assert torch.allclose(output_without_group_offloading, output_with_group_offloading4, atol=1e-5)
-        assert torch.allclose(output_without_group_offloading, output_with_group_offloading5, atol=1e-5)
+        self.assertTrue(torch.allclose(output_without_group_offloading, output_with_group_offloading1, atol=1e-5))
+        self.assertTrue(torch.allclose(output_without_group_offloading, output_with_group_offloading2, atol=1e-5))
+        self.assertTrue(torch.allclose(output_without_group_offloading, output_with_group_offloading3, atol=1e-5))
+        self.assertTrue(torch.allclose(output_without_group_offloading, output_with_group_offloading4, atol=1e-5))
+        self.assertTrue(torch.allclose(output_without_group_offloading, output_with_group_offloading5, atol=1e-5))
 
         # Memory assertions - offloading should reduce memory usage
-        assert mem4 <= mem5 < mem2 <= mem3 < mem1 < mem_baseline
+        self.assertTrue(mem4 <= mem5 < mem2 <= mem3 < mem1 < mem_baseline)
 
-    def test_warning_logged_if_group_offloaded_module_moved_to_accelerator(self, caplog):
+    def test_warning_logged_if_group_offloaded_module_moved_to_accelerator(self):
         if torch.device(torch_device).type not in ["cuda", "xpu"]:
             return
 
         self.model.enable_group_offload(torch_device, offload_type="block_level", num_blocks_per_group=3)
-        with caplog.at_level(logging.WARNING, logger="diffusers.models.modeling_utils"):
+        logger = get_logger("diffusers.models.modeling_utils")
+        logger.setLevel("INFO")
+        with self.assertLogs(logger, level="WARNING") as cm:
             self.model.to(torch_device)
-        assert f"The module '{self.model.__class__.__name__}' is group offloaded" in caplog.text
+        self.assertIn(f"The module '{self.model.__class__.__name__}' is group offloaded", cm.output[0])
 
-    def test_warning_logged_if_group_offloaded_pipe_moved_to_accelerator(self, caplog):
+    def test_warning_logged_if_group_offloaded_pipe_moved_to_accelerator(self):
         if torch.device(torch_device).type not in ["cuda", "xpu"]:
             return
 
         pipe = DummyPipeline(self.model)
         self.model.enable_group_offload(torch_device, offload_type="block_level", num_blocks_per_group=3)
-        with caplog.at_level(logging.WARNING, logger="diffusers.pipelines.pipeline_utils"):
+        logger = get_logger("diffusers.pipelines.pipeline_utils")
+        logger.setLevel("INFO")
+        with self.assertLogs(logger, level="WARNING") as cm:
             pipe.to(torch_device)
-        assert f"The module '{self.model.__class__.__name__}' is group offloaded" in caplog.text
+        self.assertIn(f"The module '{self.model.__class__.__name__}' is group offloaded", cm.output[0])
 
     def test_error_raised_if_streams_used_and_no_accelerator_device(self):
         torch_accelerator_module = getattr(torch, torch_device, torch.cuda)
         original_is_available = torch_accelerator_module.is_available
         torch_accelerator_module.is_available = lambda: False
-        with pytest.raises(ValueError):
+        with self.assertRaises(ValueError):
             self.model.enable_group_offload(
                 onload_device=torch.device(torch_device), offload_type="leaf_level", use_stream=True
             )
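The caplog fixture is pytest-only, so the warning checks in this hunk move to unittest's assertLogs context manager, which records emitted records as strings on cm.output. A self-contained sketch of the same pattern (the logger name below is illustrative, not the diffusers one):

import logging
import unittest


class WarningLogTests(unittest.TestCase):
    def test_warning_is_logged(self):
        logger = logging.getLogger("example.module")  # stand-in for get_logger("diffusers...")
        with self.assertLogs(logger, level="WARNING") as cm:
            logger.warning("The module 'DummyModel' is group offloaded")
        # cm.output holds entries like "WARNING:example.module:...".
        self.assertIn("is group offloaded", cm.output[0])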
@@ -328,31 +333,31 @@ class TestGroupOffload:
     def test_error_raised_if_supports_group_offloading_false(self):
         self.model._supports_group_offloading = False
-        with pytest.raises(ValueError, match="does not support group offloading"):
+        with self.assertRaisesRegex(ValueError, "does not support group offloading"):
             self.model.enable_group_offload(onload_device=torch.device(torch_device))
 
     def test_error_raised_if_model_offloading_applied_on_group_offloaded_module(self):
         pipe = DummyPipeline(self.model)
         pipe.model.enable_group_offload(torch_device, offload_type="block_level", num_blocks_per_group=3)
-        with pytest.raises(ValueError, match="You are trying to apply model/sequential CPU offloading"):
+        with self.assertRaisesRegex(ValueError, "You are trying to apply model/sequential CPU offloading"):
             pipe.enable_model_cpu_offload()
 
     def test_error_raised_if_sequential_offloading_applied_on_group_offloaded_module(self):
         pipe = DummyPipeline(self.model)
         pipe.model.enable_group_offload(torch_device, offload_type="block_level", num_blocks_per_group=3)
-        with pytest.raises(ValueError, match="You are trying to apply model/sequential CPU offloading"):
+        with self.assertRaisesRegex(ValueError, "You are trying to apply model/sequential CPU offloading"):
             pipe.enable_sequential_cpu_offload()
 
     def test_error_raised_if_group_offloading_applied_on_model_offloaded_module(self):
         pipe = DummyPipeline(self.model)
         pipe.enable_model_cpu_offload()
-        with pytest.raises(ValueError, match="Cannot apply group offloading"):
+        with self.assertRaisesRegex(ValueError, "Cannot apply group offloading"):
             pipe.model.enable_group_offload(torch_device, offload_type="block_level", num_blocks_per_group=3)
 
     def test_error_raised_if_group_offloading_applied_on_sequential_offloaded_module(self):
         pipe = DummyPipeline(self.model)
         pipe.enable_sequential_cpu_offload()
-        with pytest.raises(ValueError, match="Cannot apply group offloading"):
+        with self.assertRaisesRegex(ValueError, "Cannot apply group offloading"):
             pipe.model.enable_group_offload(torch_device, offload_type="block_level", num_blocks_per_group=3)
 
     def test_block_level_stream_with_invocation_order_different_from_initialization_order(self):
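pytest.raises(..., match=...) and TestCase.assertRaisesRegex both treat the pattern as a regular expression searched against the exception message, so the conversions in this hunk are mechanical. A minimal sketch with a hypothetical function standing in for enable_group_offload:

import unittest


def enable_offload(supported: bool) -> None:
    # Hypothetical stand-in for calling enable_group_offload on an unsupported model.
    if not supported:
        raise ValueError("This model does not support group offloading")


class RaisesStyleTests(unittest.TestCase):
    def test_unsupported_model_raises(self):
        # unittest style, as used after this change; the pattern is re.search'd
        # against str(exception), just like pytest.raises(match=...).
        with self.assertRaisesRegex(ValueError, "does not support group offloading"):
            enable_offload(supported=False)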
@@ -371,12 +376,12 @@ class TestGroupOffload:
         context = contextlib.nullcontext()
         if compare_versions("diffusers", "<=", "0.33.0"):
             # Will raise a device mismatch RuntimeError mentioning weights are on CPU but input is on device
-            context = pytest.raises(RuntimeError, match="Expected all tensors to be on the same device")
+            context = self.assertRaisesRegex(RuntimeError, "Expected all tensors to be on the same device")
         with context:
             model(self.input)
 
-    @pytest.mark.parametrize("offload_type", ["block_level", "leaf_level"])
+    @parameterized.expand([("block_level",), ("leaf_level",)])
     def test_block_level_offloading_with_parameter_only_module_group(self, offload_type: str):
         if torch.device(torch_device).type not in ["cuda", "xpu"]:
             return
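@pytest.mark.parametrize only works under the pytest runner, so the parameterized cases switch to parameterized.expand from the parameterized package, which generates one unittest test method per argument tuple. A sketch under the assumption that parameterized is installed:

import unittest

from parameterized import parameterized


class OffloadTypeTests(unittest.TestCase):
    @parameterized.expand([("block_level",), ("leaf_level",)])
    def test_offload_type_is_known(self, offload_type: str):
        # One test per tuple is generated, named something like
        # test_offload_type_is_known_0_block_level.
        self.assertIn(offload_type, {"block_level", "leaf_level"})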
@@ -402,14 +407,14 @@ class TestGroupOffload:
         out_ref = model_ref(x)
         out = model(x)
-        assert torch.allclose(out_ref, out, atol=1e-5), "Outputs do not match."
+        self.assertTrue(torch.allclose(out_ref, out, atol=1e-5), "Outputs do not match.")
 
         num_repeats = 2
         for i in range(num_repeats):
             out_ref = model_ref(x)
             out = model(x)
-            assert torch.allclose(out_ref, out, atol=1e-5), "Outputs do not match after multiple invocations."
+            self.assertTrue(torch.allclose(out_ref, out, atol=1e-5), "Outputs do not match after multiple invocations.")
 
         for (ref_name, ref_module), (name, module) in zip(model_ref.named_modules(), model.named_modules()):
             assert ref_name == name
@@ -423,7 +428,9 @@ class TestGroupOffload:
             absdiff = diff.abs()
             absmax = absdiff.max().item()
             cumulated_absmax += absmax
-            assert cumulated_absmax < 1e-5, f"Output differences for {name} exceeded threshold: {cumulated_absmax:.5f}"
+            self.assertLess(
+                cumulated_absmax, 1e-5, f"Output differences for {name} exceeded threshold: {cumulated_absmax:.5f}"
+            )
 
     def test_vae_like_model_without_streams(self):
         """Test VAE-like model with block-level offloading but without streams."""
@@ -445,7 +452,9 @@ class TestGroupOffload:
         out_ref = model_ref(x).sample
         out = model(x).sample
-        assert torch.allclose(out_ref, out, atol=1e-5), "Outputs do not match for VAE-like model without streams."
+        self.assertTrue(
+            torch.allclose(out_ref, out, atol=1e-5), "Outputs do not match for VAE-like model without streams."
+        )
 
     def test_model_with_only_standalone_layers(self):
         """Test that models with only standalone layers (no ModuleList/Sequential) work with block-level offloading."""
@@ -466,11 +475,12 @@ class TestGroupOffload:
         for i in range(2):
             out_ref = model_ref(x)
             out = model(x)
-            assert torch.allclose(out_ref, out, atol=1e-5), (
-                f"Outputs do not match at iteration {i} for model with standalone layers."
+            self.assertTrue(
+                torch.allclose(out_ref, out, atol=1e-5),
+                f"Outputs do not match at iteration {i} for model with standalone layers.",
             )
 
-    @pytest.mark.parametrize("offload_type", ["block_level", "leaf_level"])
+    @parameterized.expand([("block_level",), ("leaf_level",)])
     def test_standalone_conv_layers_with_both_offload_types(self, offload_type: str):
         """Test that standalone Conv2d layers work correctly with both block-level and leaf-level offloading."""
         if torch.device(torch_device).type not in ["cuda", "xpu"]:
@@ -491,8 +501,9 @@ class TestGroupOffload:
         out_ref = model_ref(x).sample
         out = model(x).sample
-        assert torch.allclose(out_ref, out, atol=1e-5), (
-            f"Outputs do not match for standalone Conv layers with {offload_type}."
+        self.assertTrue(
+            torch.allclose(out_ref, out, atol=1e-5),
+            f"Outputs do not match for standalone Conv layers with {offload_type}.",
         )
 
     def test_multiple_invocations_with_vae_like_model(self):
@@ -515,7 +526,7 @@ class TestGroupOffload:
         for i in range(2):
             out_ref = model_ref(x).sample
             out = model(x).sample
-            assert torch.allclose(out_ref, out, atol=1e-5), f"Outputs do not match at iteration {i}."
+            self.assertTrue(torch.allclose(out_ref, out, atol=1e-5), f"Outputs do not match at iteration {i}.")
 
     def test_nested_container_parameters_offloading(self):
         """Test that parameters from non-computational layers in nested containers are handled correctly."""
@@ -536,8 +547,9 @@ class TestGroupOffload:
         for i in range(2):
             out_ref = model_ref(x)
             out = model(x)
-            assert torch.allclose(out_ref, out, atol=1e-5), (
-                f"Outputs do not match at iteration {i} for nested parameters."
+            self.assertTrue(
+                torch.allclose(out_ref, out, atol=1e-5),
+                f"Outputs do not match at iteration {i} for nested parameters.",
             )
 
     def get_autoencoder_kl_config(self, block_out_channels=None, norm_num_groups=None):
@@ -590,7 +602,7 @@ class DummyModelWithConditionalModules(ModelMixin):
         return x
 
 
-class TestConditionalModuleGroupOffload(TestGroupOffload):
+class ConditionalModuleGroupOffloadTests(GroupOffloadTests):
    """Tests for conditionally-executed modules under group offloading with streams.
 
    Regression tests for the case where a module is not executed during the first forward pass
@@ -608,10 +620,10 @@ class TestConditionalModuleGroupOffload(TestGroupOffload):
             num_layers=self.num_layers,
         )
 
-    @pytest.mark.parametrize("offload_type", ["leaf_level", "block_level"])
-    @pytest.mark.skipif(
+    @parameterized.expand([("leaf_level",), ("block_level",)])
+    @unittest.skipIf(
         torch.device(torch_device).type not in ["cuda", "xpu"],
-        reason="Test requires a CUDA or XPU device.",
+        "Test requires a CUDA or XPU device.",
     )
     def test_conditional_modules_with_stream(self, offload_type: str):
         """Regression test: conditionally-executed modules must not cause device mismatch when using streams.
@@ -658,20 +670,23 @@ class TestConditionalModuleGroupOffload(TestGroupOffload):
         # execution order is traced. optional_proj_1/2 are NOT in the traced order.
         out_ref_no_opt = model_ref(x, optional_input=None)
         out_no_opt = model(x, optional_input=None)
-        assert torch.allclose(out_ref_no_opt, out_no_opt, atol=1e-5), (
-            f"[{offload_type}] Outputs do not match on first pass (no optional_input)."
+        self.assertTrue(
+            torch.allclose(out_ref_no_opt, out_no_opt, atol=1e-5),
+            f"[{offload_type}] Outputs do not match on first pass (no optional_input).",
         )
 
         # Second forward pass WITH optional_input — optional_proj_1/2 ARE now called.
         out_ref_with_opt = model_ref(x, optional_input=optional_input)
         out_with_opt = model(x, optional_input=optional_input)
-        assert torch.allclose(out_ref_with_opt, out_with_opt, atol=1e-5), (
-            f"[{offload_type}] Outputs do not match on second pass (with optional_input)."
+        self.assertTrue(
+            torch.allclose(out_ref_with_opt, out_with_opt, atol=1e-5),
+            f"[{offload_type}] Outputs do not match on second pass (with optional_input).",
         )
 
         # Third pass again without optional_input — verify stable behavior.
         out_ref_no_opt2 = model_ref(x, optional_input=None)
         out_no_opt2 = model(x, optional_input=None)
-        assert torch.allclose(out_ref_no_opt2, out_no_opt2, atol=1e-5), (
-            f"[{offload_type}] Outputs do not match on third pass (back to no optional_input)."
+        self.assertTrue(
+            torch.allclose(out_ref_no_opt2, out_no_opt2, atol=1e-5),
+            f"[{offload_type}] Outputs do not match on third pass (back to no optional_input).",
         )