Skip to content
Draft
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions QEfficient/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -30,6 +30,7 @@
from QEfficient.compile.compile_helper import compile
from QEfficient.diffusers.pipelines.flux.pipeline_flux import QEffFluxPipeline
from QEfficient.diffusers.pipelines.wan.pipeline_wan import QEffWanPipeline
from QEfficient.diffusers.pipelines.qwen_image.pipeline_qwenimage import QEFFQwenImagePipeline
from QEfficient.exporter.export_hf_to_cloud_ai_100 import qualcomm_efficient_converter
from QEfficient.generation.text_generation_inference import cloud_ai_100_exec_kv
from QEfficient.peft import QEffAutoPeftModelForCausalLM
Expand Down Expand Up @@ -57,6 +58,7 @@
"QEFFCommonLoader",
"QEffFluxPipeline",
"QEffWanPipeline",
"QEFFQwenImagePipeline",
]


Expand Down
13 changes: 13 additions & 0 deletions QEfficient/diffusers/models/pytorch_transforms.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@
#
# -----------------------------------------------------------------------------

from diffusers.models.attention_processor import Attention
from diffusers.models.normalization import AdaLayerNormContinuous, AdaLayerNormZero, AdaLayerNormZeroSingle, RMSNorm
from diffusers.models.transformers.transformer_flux import (
FluxAttention,
Expand All @@ -13,6 +14,10 @@
FluxTransformer2DModel,
FluxTransformerBlock,
)
from diffusers.models.transformers.transformer_qwenimage import (
QwenDoubleStreamAttnProcessor2_0,
QwenImageTransformer2DModel,
)
from diffusers.models.transformers.transformer_wan import WanAttention, WanAttnProcessor, WanTransformer3DModel
from torch import nn

Expand All @@ -30,6 +35,11 @@
QEffFluxTransformer2DModel,
QEffFluxTransformerBlock,
)
from QEfficient.diffusers.models.transformers.transformer_qwenimage import (
QEffQwenDoubleStreamAttnProcessor2_0,
QEffQwenImageAttention,
QEffQwenImageTransformer2DModel,
)
from QEfficient.diffusers.models.transformers.transformer_wan import (
QEffWanAttention,
QEffWanAttnProcessor,
Expand All @@ -54,6 +64,9 @@ class AttentionTransform(ModuleMappingTransform):
WanAttnProcessor: QEffWanAttnProcessor,
WanAttention: QEffWanAttention,
WanTransformer3DModel: QEffWanTransformer3DModel,
QwenImageTransformer2DModel: QEffQwenImageTransformer2DModel,
QwenDoubleStreamAttnProcessor2_0: QEffQwenDoubleStreamAttnProcessor2_0,
Attention: QEffQwenImageAttention,
}


Expand Down
Loading
Loading