Source code for cw.lib.models.sd15_controlnet

#!/usr/bin/env python3
"""
Stable Diffusion 1.5 ControlNet model implementation.

Combines a StableDiffusion 1.5 base model with a ControlNet conditioning model
to generate images guided by structural control signals (edges, depth, line art).
"""

import logging

import torch
from diffusers import ControlNetModel, StableDiffusionControlNetPipeline

from .base import BaseModel
from .mixins import CompelPromptMixin

logger = logging.getLogger(__name__)



[docs]
class SD15ControlNetModel(CompelPromptMixin, BaseModel):
    """SD 1.5 + ControlNet implementation for structure-guided generation.

    A ControlNet is loaded from ``settings["controlnet_path"]`` and attached to
    a ``StableDiffusionControlNetPipeline`` built from ``model_path``. The
    remaining hooks translate generation params into pipeline keyword
    arguments, record ControlNet details in the metadata, and re-cast the VAE
    to float32 on MPS devices around LoRA load/unload.
    """

    # Maps a key in the generation ``params`` to the pipeline keyword argument
    # it is forwarded as. Order matches the order the kwargs are inserted.
    _CONTROLNET_PARAM_TO_KWARG = (
        ("control_image", "image"),
        ("conditioning_scale", "controlnet_conditioning_scale"),
        ("guidance_end", "control_guidance_end"),
    )

    def __init__(self, model_config: dict, model_path: str) -> None:
        """Initialise the base model and remember where the ControlNet lives.

        Args:
            model_config: Model configuration, forwarded to the base class.
            model_path: Location of the SD 1.5 base model, forwarded to the
                base class.
        """
        super().__init__(model_config, model_path)
        # NOTE(review): ``self.settings`` is presumably populated by the base
        # initialiser from ``model_config`` -- confirm against BaseModel.
        # Falls back to an empty string when the setting is absent.
        self.controlnet_path = self.settings.get("controlnet_path", "")

    def _create_pipeline(self):
        """Load SD 1.5 pipeline with ControlNet.

        Returns:
            The ``StableDiffusionControlNetPipeline`` loaded from
            ``self.model_path`` with the ControlNet from
            ``self.controlnet_path`` attached, both using ``self.dtype``.
        """
        if not self.controlnet_path:
            # Surface the misconfiguration explicitly; the load below is still
            # attempted so the exception behaviour is unchanged.
            logger.warning(
                "No 'controlnet_path' configured in settings; "
                "loading the ControlNet is likely to fail"
            )

        logger.info("Loading ControlNet from: %s", self.controlnet_path)
        controlnet = ControlNetModel.from_pretrained(
            self.controlnet_path,
            torch_dtype=self.dtype,
        )

        logger.info("Loading SD 1.5 base model from: %s", self.model_path)
        return StableDiffusionControlNetPipeline.from_pretrained(
            self.model_path,
            controlnet=controlnet,
            torch_dtype=self.dtype,
        )

    def _build_pipeline_kwargs(self, params, progress_callback):
        """Add ControlNet-specific kwargs (control image, conditioning scale).

        Args:
            params: Generation parameters. The optional keys
                ``control_image``, ``conditioning_scale`` and ``guidance_end``
                are forwarded when present.
            progress_callback: Passed through unchanged to the base class.

        Returns:
            The kwargs built by the base class, extended with ``image``,
            ``controlnet_conditioning_scale`` and ``control_guidance_end`` for
            whichever of the corresponding params were supplied.
        """
        kwargs = super()._build_pipeline_kwargs(params, progress_callback)

        # Only forward values the caller actually supplied, so that the
        # pipeline's own defaults apply to everything else.
        for param_key, pipeline_key in self._CONTROLNET_PARAM_TO_KWARG:
            if param_key in params:
                kwargs[pipeline_key] = params[param_key]

        return kwargs

    def _build_metadata(self, params):
        """Add ControlNet info to generation metadata.

        Args:
            params: Generation parameters; ``conditioning_scale`` and
                ``guidance_end`` are recorded as ``None`` when absent.

        Returns:
            The base-class metadata with an added ``"controlnet"`` entry.
        """
        metadata = super()._build_metadata(params)
        metadata["controlnet"] = {
            "path": self.controlnet_path,
            "conditioning_scale": params.get("conditioning_scale"),
            "guidance_end": params.get("guidance_end"),
        }
        return metadata

    def _force_vae_float32_on_mps(self, stage: str) -> None:
        """Cast the pipeline VAE to float32 when running on an MPS device.

        Does nothing when no device is set, the device is not MPS, or the
        pipeline has no ``vae`` attribute.

        Args:
            stage: Word appended to the log message naming the LoRA operation
                that just finished (``"load"`` or ``"unload"``).
        """
        on_mps = self.device and self.device.type == "mps"
        if on_mps and hasattr(self.pipeline, "vae"):
            logger.info(
                "[SD15-CN MPS Fix] Re-applying VAE float32 after LoRA %s", stage
            )
            # NOTE(review): presumably the LoRA operation can leave the VAE in
            # a different dtype -- confirm against the base-class MPS fix.
            self.pipeline.vae = self.pipeline.vae.to(dtype=torch.float32)

    def _post_lora_load_fixes(self) -> None:
        """Re-apply MPS VAE fix after LoRA loading."""
        self._force_vae_float32_on_mps("load")

    def _post_lora_unload_fixes(self) -> None:
        """Re-apply MPS VAE fix after LoRA unloading."""
        self._force_vae_float32_on_mps("unload")