Modular Diffusers: bloques modulares para pipelines de difusión

Cargando...

Modular Diffusers: bloques modulares para pipelines de difusión | Keryc

import torch
from diffusers import ModularPipeline

# Build the full modular pipeline from the Hub repo, load its components in
# bfloat16 and move everything to the GPU.
flux_repo = "black-forest-labs/FLUX.2-klein-4B"
pipe = ModularPipeline.from_pretrained(flux_repo)
pipe.load_components(torch_dtype=torch.bfloat16)
pipe.to("cuda")

# Run a 4-step generation and keep the first image of the result.
generation = pipe(
    prompt="a serene landscape at sunset",
    num_inference_steps=4,
)
image = generation.images[0]
image.save("output.png")

# Take the text-encoder block out of the pipeline and run it separately.
repo_id = "black-forest-labs/FLUX.2-klein-4B"
text_blocks = pipe.blocks.sub_blocks.pop("text_encoder")
text_pipe = text_blocks.init_pipeline(repo_id)
text_pipe.load_components(torch_dtype=torch.bfloat16)
text_pipe.to("cuda")
text_result = text_pipe(prompt="a serene landscape at sunset")
prompt_embeds = text_result.prompt_embeds

# Build a second pipeline from the blocks still held by `pipe.blocks` and feed
# it the embeddings computed above instead of a raw prompt.
remaining_blocks = pipe.blocks
remaining_pipe = remaining_blocks.init_pipeline(repo_id)
remaining_pipe.load_components(torch_dtype=torch.bfloat16)
remaining_pipe.to("cuda")
remaining_result = remaining_pipe(
    prompt_embeds=prompt_embeds,
    num_inference_steps=4,
)
image = remaining_result.images[0]

class DepthProcessorBlock(ModularPipelineBlocks):
    """Pipeline block that converts input image(s) into depth map(s).

    Reads ``image`` from the block state, runs it through the
    ``depth_processor`` component and stores the result in the block state
    as ``control_image``.
    """

    @property
    def expected_components(self):
        """List the components this block needs: a single ``depth_processor``."""
        depth_spec = ComponentSpec(
            "depth_processor",
            DepthPreprocessor,
            pretrained_model_name_or_path="depth-anything/Depth-Anything-V2-Large-hf",
        )
        return [depth_spec]

    @property
    def inputs(self):
        """List the block inputs: a required ``image``."""
        image_param = InputParam(
            "image",
            required=True,
            description="Image(s) to extract depth maps from",
        )
        return [image_param]

    @property
    def intermediate_outputs(self):
        """List the values this block produces: ``control_image``."""
        control_param = OutputParam(
            "control_image",
            type_hint=torch.Tensor,
            description="Depth map(s) of input image(s)",
        )
        return [control_param]

    @torch.no_grad()
    def __call__(self, components, state):
        """Compute the depth map and write it to the state as ``control_image``.

        Runs with gradient tracking disabled.

        Args:
            components: Object exposing the ``depth_processor`` component.
            state: Pipeline state the block state is read from and written to.

        Returns:
            The ``(components, state)`` pair, with ``state`` updated.
        """
        block_state = self.get_block_state(state)

        raw_depth = components.depth_processor(block_state.image)
        # NOTE(review): `device` is read from the block state but is not
        # declared in `inputs` -- confirm that the framework provides it.
        depth_on_device = raw_depth.to(block_state.device)
        block_state.control_image = depth_on_device

        self.set_block_state(state, block_state)
        return components, state

{
  "transformer": ["diffusers", "Flux2Transformer2DModel", {"pretrained_model_name_or_path": "diffusers/flux2-bnb-4bit-modular", "subfolder": "transformer"}],
  "vae": ["diffusers", "AutoencoderKLFlux2", {"pretrained_model_name_or_path": "black-forest-labs/FLUX.2-dev", "subfolder": "vae"}]
}

Qué es Modular Diffusers y por qué importa

Cómo funciona — ejemplo práctico y conceptos técnicos

Flujo de trabajo por bloques

Crear bloques personalizados

Repos modulares y publicación en el Hub

Integración visual: Mellon

Casos de uso y ejemplos de la comunidad

Consideraciones prácticas y recomendaciones

Reflexión final

Fuente original

¡Mantente al día!

Modular Diffusers: bloques modulares para pipelines de difusión