Thanks to visit codestin.com
Credit goes to github.com

Skip to content

feat: add refresh cache context api#542

Merged
DefTruth merged 18 commits into main from dev
Dec 9, 2025
Merged

feat: add refresh cache context api#542
DefTruth merged 18 commits into main from dev

Conversation

@DefTruth
Copy link
Member

@DefTruth DefTruth commented Dec 8, 2025

Fixes #540: adds a refresh-cache-context API to reduce the dependency on num_inference_steps.

Qwen-Image

import cache_dit
from cache_dit import DBCacheConfig
from diffusers import DiffusionPipeline

# Init cache context with num_inference_steps=None (default).
# The step count is supplied later via cache_dit.refresh_context().
pipe = DiffusionPipeline.from_pretrained("Qwen/Qwen-Image")
pipe = cache_dit.enable_cache(pipe.transformer, cache_config=DBCacheConfig(num_inference_steps=None))

# Assume num_inference_steps is 28, and we want to refresh the context.
# NOTE: fixed — the original example passed an undefined name `transformer`;
# the cached module is `pipe.transformer`.
cache_dit.refresh_context(pipe.transformer, num_inference_steps=28, verbose=True)
output = pipe(...)  # Just call the pipe as normal.
stats = cache_dit.summary(pipe.transformer)  # Then, get the summary

# Update the cache context with new num_inference_steps=50.
cache_dit.refresh_context(pipe.transformer, num_inference_steps=50, verbose=True)
output = pipe(...)  # Just call the pipe as normal.
stats = cache_dit.summary(pipe.transformer)  # Then, get the summary

# Update the cache context with an entirely new cache_config.
cache_dit.refresh_context(
    pipe.transformer,
    cache_config=DBCacheConfig(
        residual_diff_threshold=0.1,
        max_warmup_steps=10,
        max_cached_steps=20,
        max_continuous_cached_steps=4,
        num_inference_steps=50,
    ),
    verbose=True,
)
output = pipe(...)  # Just call the pipe as normal.
stats = cache_dit.summary(pipe.transformer)  # Then, get the summary

Wan 2.2 T2V

# NOTE: fixed — the original snippet used `os.environ`, `torch.bfloat16`
# and `torch.cuda` without importing `os` or `torch`.
import os

import torch

import diffusers
from diffusers import WanPipeline, AutoencoderKLWan, WanTransformer3DModel
import cache_dit

# `args` and `GiB()` are assumed to be defined elsewhere in the full
# example script (argument parsing / GPU-memory helper) — TODO confirm.
pipe = WanPipeline.from_pretrained(
    (
        args.model_path
        if args.model_path is not None
        else os.environ.get(
            "WAN_2_2_DIR",
            "Wan-AI/Wan2.2-T2V-A14B-Diffusers",
        )
    ),
    torch_dtype=torch.bfloat16,
    # https://huggingface.co/docs/diffusers/main/en/tutorials/inference_with_big_models#device-placement
    device_map=("balanced" if (torch.cuda.device_count() > 1 and GiB() <= 48) else None),
)

if args.cache:
    from cache_dit import (
        BlockAdapter,
        ForwardPattern,
        ParamsModifier,
        DBCacheConfig,
    )

    assert isinstance(pipe.transformer, WanTransformer3DModel)
    assert isinstance(pipe.transformer_2, WanTransformer3DModel)

    # Dual transformer caching with transformer-only api in cache-dit.
    cache_dit.enable_cache(
        BlockAdapter(
            transformer=[
                pipe.transformer,
                pipe.transformer_2,
            ],
            blocks=[
                pipe.transformer.blocks,
                pipe.transformer_2.blocks,
            ],
            forward_pattern=[
                ForwardPattern.Pattern_2,
                ForwardPattern.Pattern_2,
            ],
            params_modifiers=[
                # high-noise transformer only have 30% steps
                ParamsModifier(
                    cache_config=DBCacheConfig().reset(
                        max_warmup_steps=4,
                        max_cached_steps=8,
                    ),
                ),
                ParamsModifier(
                    cache_config=DBCacheConfig().reset(
                        max_warmup_steps=2,
                        max_cached_steps=20,
                    ),
                ),
            ],
            has_separate_cfg=True,
        ),
        cache_config=DBCacheConfig(
            Fn_compute_blocks=args.Fn,
            Bn_compute_blocks=args.Bn,
            max_warmup_steps=args.max_warmup_steps,
            max_cached_steps=args.max_cached_steps,
            max_continuous_cached_steps=args.max_continuous_cached_steps,
            residual_diff_threshold=args.rdt,
            # NOTE: num_inference_steps can be None here, we will
            # set it properly during cache refreshing.
            num_inference_steps=None,
        ),
    )

def split_inference_steps(num_inference_steps: int = 30) -> tuple[int, int]:
    """Partition the total step count into (high-noise, low-noise) steps.

    High-noise steps (timestep >= boundary) are served by ``pipe.transformer``;
    the remainder are low-noise steps for ``pipe.transformer_2``. When the
    pipeline config has no ``boundary_ratio``, all steps count as low-noise.
    Side effect: calls ``pipe.scheduler.set_timesteps`` on device "cuda".
    """
    boundary_timestep = None
    if pipe.config.boundary_ratio is not None:
        boundary_timestep = (
            pipe.config.boundary_ratio * pipe.scheduler.config.num_train_timesteps
        )
    pipe.scheduler.set_timesteps(num_inference_steps, device="cuda")
    if boundary_timestep is None:
        num_high_noise_steps = 0
    else:
        # Count timesteps at or above the boundary (high-noise phase).
        num_high_noise_steps = sum(
            1 for t in pipe.scheduler.timesteps if t >= boundary_timestep
        )
    return num_high_noise_steps, num_inference_steps - num_high_noise_steps


def run_pipe(steps: int = 30):
    """Generate a video with `steps` inference steps and return its frames.

    When caching is enabled, each transformer's cache context is refreshed
    first so it knows exactly how many steps it will execute.
    """
    if args.cache:
        # Re-sync each cached transformer with its share of the step budget.
        high_steps, low_steps = split_inference_steps(num_inference_steps=steps)
        for module, module_steps in (
            (pipe.transformer, high_steps),
            (pipe.transformer_2, low_steps),
        ):
            cache_dit.refresh_context(
                module,
                num_inference_steps=module_steps,
                verbose=True,
            )

    result = pipe(
        prompt=prompt,
        height=height,
        width=width,
        num_frames=81,
        num_inference_steps=steps,
        generator=torch.Generator("cpu").manual_seed(0),
    )
    return result.frames[0]

@DefTruth DefTruth self-assigned this Dec 8, 2025
@DefTruth DefTruth merged commit b583763 into main Dec 9, 2025
@DefTruth DefTruth deleted the dev branch December 9, 2025 03:03
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment

Labels

None yet

Projects

None yet

Development

Successfully merging this pull request may close these issues.

[feature request] Improve transformer-only cache-dit to reduce dependency on num_inference_steps

1 participant