try fix for tests

new_forward support
2025-12-11 06:54:32 +08:00 · 2025-02-21 09:49:42 +01:00 · 2025-02-21 08:41:11 +01:00 · 2025-02-21 06:18:13 +01:00 · 2025-02-21 06:00:30 +01:00
5 changed files with 180 additions and 2 deletions
--- a/src/diffusers/hooks/group_offloading.py
+++ b/src/diffusers/hooks/group_offloading.py
@@ -124,6 +124,7 @@ class GroupOffloadingHook(ModelHook):
        group: ModuleGroup,
        next_group: Optional[ModuleGroup] = None,
    ) -> None:
        super().__init__()
        self.group = group
        self.next_group = next_group
@@ -168,6 +169,7 @@ class LazyPrefetchGroupOffloadingHook(ModelHook):
    _is_stateful = False
    def __init__(self):
        super().__init__()
        self.execution_order: List[Tuple[str, torch.nn.Module]] = []
        self._layer_execution_tracker_module_names = set()
@@ -253,6 +255,7 @@ class LayerExecutionTrackerHook(ModelHook):
    _is_stateful = False
    def __init__(self, execution_order_update_callback):
        r"""
        Initialize the base hook state and keep a reference to the supplied callback.

        Args:
            execution_order_update_callback:
                Stored unchanged as `self.execution_order_update_callback`. Presumably a callable that is invoked
                when the tracked layer runs -- confirm against the code that reads this attribute.
        """
        super().__init__()
        self.execution_order_update_callback = execution_order_update_callback
    def pre_forward(self, module, *args, **kwargs):
--- a/src/diffusers/hooks/hooks.py
+++ b/src/diffusers/hooks/hooks.py
@@ -32,6 +32,7 @@ class ModelHook:
    def __init__(self):
        r"""
        Set up the state every hook starts with: no function reference yet, and the hook enabled.
        """
        # Starts as None; a `HookFunctionReference` is presumably attached when the hook is registered -- TODO confirm.
        self.fn_ref: "HookFunctionReference" = None
        # Read by the wrapped forward: when False, the original forward is called and this hook is bypassed.
        self._is_enabled = True
    def initialize_hook(self, module: torch.nn.Module) -> torch.nn.Module:
        r"""
@@ -142,8 +143,10 @@ class HookRegistry:
        self._module_ref = hook.initialize_hook(self._module_ref)
-        def create_new_forward(function_reference: HookFunctionReference):
+        def create_new_forward(hook: ModelHook, function_reference: HookFunctionReference):
            def new_forward(module, *args, **kwargs):
                if not hook._is_enabled:
                    return function_reference.original_forward(*args, **kwargs)
                args, kwargs = function_reference.pre_forward(module, *args, **kwargs)
                output = function_reference.forward(*args, **kwargs)
                return function_reference.post_forward(module, output)
@@ -155,6 +158,7 @@ class HookRegistry:
        fn_ref = HookFunctionReference()
        fn_ref.pre_forward = hook.pre_forward
        fn_ref.post_forward = hook.post_forward
        fn_ref.original_forward = forward
        fn_ref.forward = forward
        if hasattr(hook, "new_forward"):
@@ -163,7 +167,7 @@ class HookRegistry:
                functools.partial(hook.new_forward, self._module_ref), hook.new_forward
            )
-        rewritten_forward = create_new_forward(fn_ref)
+        rewritten_forward = create_new_forward(hook, fn_ref)
        self._module_ref.forward = functools.update_wrapper(
            functools.partial(rewritten_forward, self._module_ref), rewritten_forward
        )
@@ -234,3 +238,19 @@ class HookRegistry:
            if i < len(self._hook_order) - 1:
                registry_repr += "\n"
        return f"HookRegistry(\n{registry_repr}\n)"
 def _set_hook_state(module: torch.nn.Module, name: str, value: bool) -> None:
    r"""
    Set the `_is_enabled` flag of the hook called `name` on every module yielded by `module.modules()`.

    Modules without a `_diffusers_hook` registry, and registries whose `get_hook(name)` returns `None`, are left
    untouched.

    Args:
        module (`torch.nn.Module`):
            Root module whose `modules()` iterator is walked.
        name (`str`):
            Name the hook was registered under.
        value (`bool`):
            New value for the hook's `_is_enabled` flag.
    """
    for child in module.modules():
        # Nothing to toggle on modules that never had a hook registry attached.
        if not hasattr(child, "_diffusers_hook"):
            continue
        target_hook = child._diffusers_hook.get_hook(name)
        if target_hook is None:
            continue
        target_hook._is_enabled = value
 def _remove_all_hooks(module: torch.nn.Module):
    r"""
    Remove every registered hook from each module yielded by `module.modules()` and drop the hook registry itself.

    Args:
        module (`torch.nn.Module`):
            Root module whose `modules()` iterator is walked.
    """
    for child in module.modules():
        if not hasattr(child, "_diffusers_hook"):
            continue
        # Snapshot the names up front so that removing hooks cannot disturb the iteration.
        registered_names = list(child._diffusers_hook.hooks.keys())
        for registered_name in registered_names:
            child._diffusers_hook.remove_hook(registered_name, recurse=False)
        # With all hooks gone, detach the registry attribute from the module as well.
        del child._diffusers_hook
--- a/src/diffusers/hooks/layerwise_casting.py
+++ b/src/diffusers/hooks/layerwise_casting.py
@@ -52,6 +52,8 @@ class LayerwiseCastingHook(ModelHook):
    _is_stateful = False
    def __init__(self, storage_dtype: torch.dtype, compute_dtype: torch.dtype, non_blocking: bool) -> None:
        super().__init__()
        self.storage_dtype = storage_dtype
        self.compute_dtype = compute_dtype
        self.non_blocking = non_blocking
--- a/src/diffusers/models/modeling_utils.py
+++ b/src/diffusers/models/modeling_utils.py
@@ -1755,6 +1755,44 @@ class ModelMixin(torch.nn.Module, PushToHubMixin):
                state_dict[f"{path}.to_out.0.bias"] = state_dict.pop(f"{path}.proj_attn.bias")
        return state_dict
    def _enable_hook(self, name: str) -> None:
        r"""
        Re-enable the hook registered under `name` on this model and on all of its submodules.

        Args:
            name (`str`):
                Name the hook was registered with.

        Note: this is a private helper. It is not backwards compatible and may change in future versions.
        """
        # Imported lazily, inside the method, exactly as the original does.
        from ..hooks.hooks import _set_hook_state

        _set_hook_state(self, name, value=True)
    def _disable_hook(self, name: str) -> None:
        r"""
        Switch off the hook registered under `name` on this model and on all of its submodules.

        Args:
            name (`str`):
                Name the hook was registered with.

        Note: this is a private helper. It is not backwards compatible and may change in future versions.
        """
        # Imported lazily, inside the method, exactly as the original does.
        from ..hooks.hooks import _set_hook_state

        _set_hook_state(self, name, value=False)
    def _remove_all_hooks(self) -> None:
        r"""
        Strip every hook from this model and from all of its submodules.

        Note: this is a private helper. It is not backwards compatible and may change in future versions.
        """
        # Aliased on import so the module-level helper is not confused with this method of the same name.
        from ..hooks.hooks import _remove_all_hooks as _strip_hooks

        _strip_hooks(self)
 class LegacyModelMixin(ModelMixin):
    r"""
--- a/tests/hooks/test_hooks.py
+++ b/tests/hooks/test_hooks.py
@@ -17,7 +17,9 @@ import unittest
 import torch
 from diffusers.configuration_utils import ConfigMixin
 from diffusers.hooks import HookRegistry, ModelHook
 from diffusers.models.modeling_utils import ModelMixin
 from diffusers.training_utils import free_memory
 from diffusers.utils.logging import get_logger
 from diffusers.utils.testing_utils import CaptureLogger, torch_device
@@ -61,6 +63,26 @@ class DummyModel(torch.nn.Module):
        return x
 class DummyModelWithMixin(ModelMixin, ConfigMixin):
    r"""
    Small test model built on `ModelMixin`: an input projection, a ReLU, `num_layers` `DummyBlock`s and an output
    projection, applied in that order.
    """

    def __init__(self, in_features: int, hidden_features: int, out_features: int, num_layers: int) -> None:
        super().__init__()

        # Submodules are created in the same order as they are applied in `forward`.
        self.linear_1 = torch.nn.Linear(in_features, hidden_features)
        self.activation = torch.nn.ReLU()
        stacked_blocks = [DummyBlock(hidden_features, hidden_features, hidden_features) for _ in range(num_layers)]
        self.blocks = torch.nn.ModuleList(stacked_blocks)
        self.linear_2 = torch.nn.Linear(hidden_features, out_features)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        hidden = self.activation(self.linear_1(x))
        for layer in self.blocks:
            hidden = layer(hidden)
        return self.linear_2(hidden)
 class AddHook(ModelHook):
    def __init__(self, value: int):
        super().__init__()
@@ -380,3 +402,96 @@ class HookTests(unittest.TestCase):
            .replace("\n", "")
        )
        self.assertEqual(output, expected_invocation_order_log)
 class ModelMixinHookTests(unittest.TestCase):
    r"""
    Checks the private hook helpers on a `ModelMixin` model (`_enable_hook`, `_disable_hook`, `_remove_all_hooks`)
    by comparing the mean of the model output before and after toggling or removing hooks.
    """

    in_features = 4
    hidden_features = 8
    out_features = 4
    num_layers = 2

    def setUp(self):
        self.model = DummyModelWithMixin(**self.get_module_parameters())
        self.model.to(torch_device)

    def tearDown(self):
        super().tearDown()

        del self.model
        gc.collect()
        free_memory()

    def get_module_parameters(self):
        return dict(
            in_features=self.in_features,
            hidden_features=self.hidden_features,
            out_features=self.out_features,
            num_layers=self.num_layers,
        )

    def get_generator(self):
        return torch.manual_seed(0)

    def _sample_input(self):
        # Seeded through `get_generator`, so every test draws the same input tensor.
        return torch.randn(1, 4, device=torch_device, generator=self.get_generator())

    def _mean_output(self, sample):
        # Reduce the model output to one Python float so runs can be compared with plain equality.
        return self.model(sample).mean().detach().cpu().item()

    def test_enable_disable_hook(self):
        registry = HookRegistry.check_if_exists_or_initialize(self.model)
        registry.register_hook(AddHook(1), "add_hook")
        registry.register_hook(MultiplyHook(2), "multiply_hook")

        sample = self._sample_input()
        output1 = self._mean_output(sample)

        self.model._disable_hook("multiply_hook")
        output2 = self._mean_output(sample)

        self.model._enable_hook("multiply_hook")
        output3 = self._mean_output(sample)

        # Disabling must change the result; re-enabling must restore it.
        self.assertNotEqual(output1, output2)
        self.assertEqual(output1, output3)

    def test_enable_disable_hook_containing_new_forward(self):
        registry = HookRegistry.check_if_exists_or_initialize(self.model)
        registry.register_hook(AddHook(1), "add_hook")
        # Hooks on the inner blocks are registered between the two model-level hooks, as in the original.
        for inner_block in self.model.blocks:
            inner_registry = HookRegistry.check_if_exists_or_initialize(inner_block)
            inner_registry.register_hook(SkipLayerHook(skip_layer=True), "skip_layer_hook")
        registry.register_hook(MultiplyHook(2), "multiply_hook")

        sample = self._sample_input()
        output1 = self._mean_output(sample)

        self.model._disable_hook("skip_layer_hook")
        output2 = self._mean_output(sample)

        self.model._disable_hook("add_hook")
        output3 = self._mean_output(sample)

        self.model._enable_hook("skip_layer_hook")
        self.model._enable_hook("add_hook")
        output4 = self._mean_output(sample)

        self.assertNotEqual(output1, output2)
        self.assertNotEqual(output2, output3)
        self.assertEqual(output1, output4)

    def test_remove_all_hooks(self):
        registry = HookRegistry.check_if_exists_or_initialize(self.model)
        registry.register_hook(AddHook(1), "add_hook")
        registry.register_hook(MultiplyHook(2), "multiply_hook")

        sample = self._sample_input()
        output1 = self._mean_output(sample)

        self.model._disable_hook("add_hook")
        self.model._disable_hook("multiply_hook")
        output2 = self._mean_output(sample)

        self.model._remove_all_hooks()
        output3 = self._mean_output(sample)

        # No module may keep a hook registry after removal.
        for submodule in self.model.modules():
            self.assertFalse(hasattr(submodule, "_diffusers_hook"))
        self.assertNotEqual(output1, output3)
        self.assertEqual(output2, output3)
Author	SHA1	Message	Date
Aryan	2bff2d5eb1	try fix for tests	2025-02-21 09:49:42 +01:00
Aryan	d080379e94	try fix for tests	2025-02-21 08:41:11 +01:00
Aryan	8546c9ed29	new_forward support	2025-02-21 06:18:13 +01:00
Aryan	e08285ef9c	update	2025-02-21 06:00:30 +01:00