Skip to content

Commit 5d0ee1e

Browse files
committed
feat(diffusers/pipelines): add SkyReels-V2 pipelines from diffusers master
1 parent 46ff896 commit 5d0ee1e

22 files changed

+6292
-1
lines changed

mindone/diffusers/__init__.py

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -70,6 +70,7 @@
7070
"SD3ControlNetModel",
7171
"SD3MultiControlNetModel",
7272
"SD3Transformer2DModel",
73+
"SkyReelsV2Transformer3DModel",
7374
"SparseControlNetModel",
7475
"StableAudioDiTModel",
7576
"StableCascadeUNet",
@@ -219,6 +220,11 @@
219220
"SemanticStableDiffusionPipeline",
220221
"ShapEImg2ImgPipeline",
221222
"ShapEPipeline",
223+
"SkyReelsV2DiffusionForcingImageToVideoPipeline",
224+
"SkyReelsV2DiffusionForcingPipeline",
225+
"SkyReelsV2DiffusionForcingVideoToVideoPipeline",
226+
"SkyReelsV2ImageToVideoPipeline",
227+
"SkyReelsV2Pipeline",
222228
"StableAudioPipeline",
223229
"StableAudioProjectionModel",
224230
"StableCascadeCombinedPipeline",
@@ -399,6 +405,7 @@
399405
SD3ControlNetModel,
400406
SD3MultiControlNetModel,
401407
SD3Transformer2DModel,
408+
SkyReelsV2Transformer3DModel,
402409
SparseControlNetModel,
403410
StableAudioDiTModel,
404411
StableCascadeUNet,
@@ -547,6 +554,11 @@
547554
SemanticStableDiffusionPipeline,
548555
ShapEImg2ImgPipeline,
549556
ShapEPipeline,
557+
SkyReelsV2DiffusionForcingImageToVideoPipeline,
558+
SkyReelsV2DiffusionForcingPipeline,
559+
SkyReelsV2DiffusionForcingVideoToVideoPipeline,
560+
SkyReelsV2ImageToVideoPipeline,
561+
SkyReelsV2Pipeline,
550562
StableAudioPipeline,
551563
StableAudioProjectionModel,
552564
StableCascadeCombinedPipeline,

mindone/diffusers/loaders/__init__.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -76,6 +76,7 @@ def text_encoder_attn_modules(text_encoder):
7676
"Lumina2LoraLoaderMixin",
7777
"WanLoraLoaderMixin",
7878
"HiDreamImageLoraLoaderMixin",
79+
"SkyReelsV2LoraLoaderMixin",
7980
],
8081
"peft": ["PeftAdapterMixin"],
8182
"single_file": ["FromSingleFileMixin"],
@@ -100,6 +101,7 @@ def text_encoder_attn_modules(text_encoder):
100101
Mochi1LoraLoaderMixin,
101102
SanaLoraLoaderMixin,
102103
SD3LoraLoaderMixin,
104+
SkyReelsV2LoraLoaderMixin,
103105
StableDiffusionLoraLoaderMixin,
104106
StableDiffusionXLLoraLoaderMixin,
105107
WanLoraLoaderMixin,

mindone/diffusers/loaders/lora_pipeline.py

Lines changed: 371 additions & 0 deletions
Large diffs are not rendered by default.

mindone/diffusers/models/__init__.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -78,6 +78,7 @@
7878
"transformers.transformer_mochi": ["MochiTransformer3DModel"],
7979
"transformers.transformer_omnigen": ["OmniGenTransformer2DModel"],
8080
"transformers.transformer_sd3": ["SD3Transformer2DModel"],
81+
"transformers.transformer_skyreels_v2": ["SkyReelsV2Transformer3DModel"],
8182
"transformers.transformer_temporal": ["TransformerTemporalModel"],
8283
"transformers.transformer_wan": ["WanTransformer3DModel"],
8384
"unets.unet_1d": ["UNet1DModel"],
@@ -154,6 +155,7 @@
154155
PriorTransformer,
155156
SanaTransformer2DModel,
156157
SD3Transformer2DModel,
158+
SkyReelsV2Transformer3DModel,
157159
StableAudioDiTModel,
158160
T5FilmDecoder,
159161
Transformer2DModel,

mindone/diffusers/models/embeddings.py

Lines changed: 6 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -327,7 +327,7 @@ def get_2d_sincos_pos_embed_from_grid(embed_dim, grid, output_type="np"):
327327
return emb
328328

329329

330-
def get_1d_sincos_pos_embed_from_grid(embed_dim, pos, output_type="np"):
330+
def get_1d_sincos_pos_embed_from_grid(embed_dim, pos, output_type="np", flip_sin_to_cos=False):
331331
"""
332332
This function generates 1D positional embeddings from a grid.
333333
@@ -360,6 +360,11 @@ def get_1d_sincos_pos_embed_from_grid(embed_dim, pos, output_type="np"):
360360
emb_cos = mint.cos(out) # (M, D/2)
361361

362362
emb = mint.concat([emb_sin, emb_cos], dim=1) # (M, D)
363+
364+
# flip sine and cosine embeddings
365+
if flip_sin_to_cos:
366+
emb = mint.cat([emb[:, embed_dim // 2 :], emb[:, : embed_dim // 2]], dim=1)
367+
363368
return emb
364369

365370

mindone/diffusers/models/transformers/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -26,5 +26,6 @@
2626
from .transformer_mochi import MochiTransformer3DModel
2727
from .transformer_omnigen import OmniGenTransformer2DModel
2828
from .transformer_sd3 import SD3Transformer2DModel
29+
from .transformer_skyreels_v2 import SkyReelsV2Transformer3DModel
2930
from .transformer_temporal import TransformerTemporalModel
3031
from .transformer_wan import WanTransformer3DModel

0 commit comments

Comments
 (0)