| 
136 | 136 |     Qwen2Model,  | 
137 | 137 |     Qwen2RMSNorm,  | 
138 | 138 | )  | 
 | 139 | +from transformers.models.qwen2_5_vl.modeling_qwen2_5_vl import (  | 
 | 140 | +    Qwen2_5_VLAttention,  | 
 | 141 | +    Qwen2_5_VLDecoderLayer,  | 
 | 142 | +    Qwen2_5_VLForConditionalGeneration,  | 
 | 143 | +    Qwen2_5_VLModel,  | 
 | 144 | +)  | 
 | 145 | +from transformers.models.qwen2_5_vl.modeling_qwen2_5_vl import (  | 
 | 146 | +    Qwen2RMSNorm as Qwen2_5RMSNorm,  | 
 | 147 | +)  | 
139 | 148 | from transformers.models.starcoder2.modeling_starcoder2 import (  | 
140 | 149 |     Starcoder2Attention,  | 
141 | 150 |     Starcoder2DecoderLayer,  | 
 | 
303 | 312 |     QEffQwen2ForCausalLM,  | 
304 | 313 |     QEffQwen2Model,  | 
305 | 314 | )  | 
 | 315 | +from QEfficient.transformers.models.qwen2_5_vl.modeling_qwen2_5_vl import (  | 
 | 316 | +    QEffQwen2_5_VLAttention,  | 
 | 317 | +    QEffQwen2_5_VLDecoderLayer,  | 
 | 318 | +    QEffQwen2_5_VLModel,  | 
 | 319 | +    QEffQwen_2_5_vl_ForConditionalGeneration,  | 
 | 320 | +)  | 
306 | 321 | from QEfficient.transformers.models.starcoder2.modeling_starcoder2 import (  | 
307 | 322 |     QEffStarcoder2Attention,  | 
308 | 323 |     QEFFStarcoder2DecoderLayer,  | 
@@ -335,6 +350,7 @@ class CustomOpsTransform(ModuleMappingTransform):  | 
335 | 350 |         MixtralRMSNorm: CustomRMSNormAIC,  | 
336 | 351 |         Phi3RMSNorm: CustomRMSNormAIC,  | 
337 | 352 |         Qwen2RMSNorm: CustomRMSNormAIC,  | 
 | 353 | +        Qwen2_5RMSNorm: CustomRMSNormAIC,  | 
338 | 354 |         MllamaTextRMSNorm: CustomRMSNormAIC,  | 
339 | 355 |         GraniteRMSNorm: CustomRMSNormAIC,  | 
340 | 356 |         GraniteMoeRMSNorm: CustomRMSNormAIC,  | 
@@ -452,6 +468,11 @@ class KVCacheTransform(ModuleMappingTransform):  | 
452 | 468 |         Qwen2DecoderLayer: QEffQwen2DecoderLayer,  | 
453 | 469 |         Qwen2Model: QEffQwen2Model,  | 
454 | 470 |         Qwen2ForCausalLM: QEffQwen2ForCausalLM,  | 
 | 471 | +        # Qwen2.5 VL  | 
 | 472 | +        Qwen2_5_VLForConditionalGeneration: QEffQwen_2_5_vl_ForConditionalGeneration,  | 
 | 473 | +        Qwen2_5_VLModel: QEffQwen2_5_VLModel,  | 
 | 474 | +        Qwen2_5_VLAttention: QEffQwen2_5_VLAttention,  | 
 | 475 | +        Qwen2_5_VLDecoderLayer: QEffQwen2_5_VLDecoderLayer,  | 
455 | 476 |         # Starcoder2  | 
456 | 477 |         Starcoder2Attention: QEffStarcoder2Attention,  | 
457 | 478 |         Starcoder2DecoderLayer: QEFFStarcoder2DecoderLayer,  | 
 | 
0 commit comments