|
136 | 136 | Qwen2Model,
|
137 | 137 | Qwen2RMSNorm,
|
138 | 138 | )
|
| 139 | +from transformers.models.qwen2_5_vl.modeling_qwen2_5_vl import ( |
| 140 | + Qwen2_5_VLAttention, |
| 141 | + Qwen2_5_VLDecoderLayer, |
| 142 | + Qwen2_5_VLForConditionalGeneration, |
| 143 | + Qwen2_5_VLModel, |
| 144 | +) |
| 145 | +from transformers.models.qwen2_5_vl.modeling_qwen2_5_vl import ( |
| 146 | + Qwen2RMSNorm as Qwen2_5RMSNorm, |
| 147 | +) |
139 | 148 | from transformers.models.starcoder2.modeling_starcoder2 import (
|
140 | 149 | Starcoder2Attention,
|
141 | 150 | Starcoder2DecoderLayer,
|
|
303 | 312 | QEffQwen2ForCausalLM,
|
304 | 313 | QEffQwen2Model,
|
305 | 314 | )
|
| 315 | +from QEfficient.transformers.models.qwen2_5_vl.modeling_qwen2_5_vl import ( |
| 316 | + QEffQwen2_5_VLAttention, |
| 317 | + QEffQwen2_5_VLDecoderLayer, |
| 318 | + QEffQwen2_5_VLModel, |
| 319 | + QEffQwen_2_5_vl_ForConditionalGeneration, |
| 320 | +) |
306 | 321 | from QEfficient.transformers.models.starcoder2.modeling_starcoder2 import (
|
307 | 322 | QEffStarcoder2Attention,
|
308 | 323 | QEFFStarcoder2DecoderLayer,
|
@@ -335,6 +350,7 @@ class CustomOpsTransform(ModuleMappingTransform):
|
335 | 350 | MixtralRMSNorm: CustomRMSNormAIC,
|
336 | 351 | Phi3RMSNorm: CustomRMSNormAIC,
|
337 | 352 | Qwen2RMSNorm: CustomRMSNormAIC,
|
| 353 | + Qwen2_5RMSNorm: CustomRMSNormAIC, |
338 | 354 | MllamaTextRMSNorm: CustomRMSNormAIC,
|
339 | 355 | GraniteRMSNorm: CustomRMSNormAIC,
|
340 | 356 | GraniteMoeRMSNorm: CustomRMSNormAIC,
|
@@ -452,6 +468,11 @@ class KVCacheTransform(ModuleMappingTransform):
|
452 | 468 | Qwen2DecoderLayer: QEffQwen2DecoderLayer,
|
453 | 469 | Qwen2Model: QEffQwen2Model,
|
454 | 470 | Qwen2ForCausalLM: QEffQwen2ForCausalLM,
|
| 471 | + # Qwen2.5 VL |
| 472 | + Qwen2_5_VLForConditionalGeneration: QEffQwen_2_5_vl_ForConditionalGeneration, |
| 473 | + Qwen2_5_VLModel: QEffQwen2_5_VLModel, |
| 474 | + Qwen2_5_VLAttention: QEffQwen2_5_VLAttention, |
| 475 | + Qwen2_5_VLDecoderLayer: QEffQwen2_5_VLDecoderLayer, |
455 | 476 | # Starcoder2
|
456 | 477 | Starcoder2Attention: QEffStarcoder2Attention,
|
457 | 478 | Starcoder2DecoderLayer: QEFFStarcoder2DecoderLayer,
|
|
0 commit comments