|
401 | 401 | # Text generation models |
402 | 402 | "SmolLM3ForCausalLM": ("transformers", "TransformersForCausalLM"), |
403 | 403 | # Multimodal models |
404 | | - "Emu3ForConditionalGeneration": ("transformers", "TransformersForMultimodalLM"), # noqa: E501 |
| 404 | + "Emu3ForConditionalGeneration": ( |
| 405 | + "transformers", |
| 406 | + "TransformersMultiModalForCausalLM", |
| 407 | + ), |
405 | 408 | } |
406 | 409 |
|
407 | 410 | _TRANSFORMERS_BACKEND_MODELS = { |
| 411 | + # Text generation models |
408 | 412 | "TransformersForCausalLM": ("transformers", "TransformersForCausalLM"), |
409 | | - "TransformersForMultimodalLM": ("transformers", "TransformersForMultimodalLM"), # noqa: E501 |
410 | | - "TransformersMoEForCausalLM": ("transformers_moe", "TransformersMoEForCausalLM"), # noqa: E501 |
411 | | - "TransformersMoEForMultimodalLM": ( |
412 | | - "transformers_moe", |
413 | | - "TransformersMoEForMultimodalLM", |
| 413 | + "TransformersMoEForCausalLM": ("transformers", "TransformersMoEForCausalLM"), |
| 414 | + # Multimodal models |
| 415 | + "TransformersMultiModalForCausalLM": ( |
| 416 | + "transformers", |
| 417 | + "TransformersMultiModalForCausalLM", |
| 418 | + ), |
| 419 | + "TransformersMultiModalMoEForCausalLM": ( |
| 420 | + "transformers", |
| 421 | + "TransformersMultiModalMoEForCausalLM", |
414 | 422 | ), |
415 | | - "TransformersEmbeddingModel": ( |
416 | | - "transformers_pooling", |
417 | | - "TransformersEmbeddingModel", |
| 423 | + # Embedding models |
| 424 | + "TransformersEmbeddingModel": ("transformers", "TransformersEmbeddingModel"), |
| 425 | + "TransformersMoEEmbeddingModel": ("transformers", "TransformersMoEEmbeddingModel"), |
| 426 | + "TransformersMultiModalEmbeddingModel": ( |
| 427 | + "transformers", |
| 428 | + "TransformersMultiModalEmbeddingModel", |
418 | 429 | ), |
| 430 | + # Sequence classification models |
419 | 431 | "TransformersForSequenceClassification": ( |
420 | | - "transformers_pooling", |
| 432 | + "transformers", |
421 | 433 | "TransformersForSequenceClassification", |
422 | 434 | ), |
423 | 435 | "TransformersMoEForSequenceClassification": ( |
424 | | - "transformers_pooling", |
| 436 | + "transformers", |
425 | 437 | "TransformersMoEForSequenceClassification", |
426 | 438 | ), |
427 | | - "TransformersMoEEmbeddingModel": ( |
428 | | - "transformers_pooling", |
429 | | - "TransformersMoEEmbeddingModel", |
| 439 | + "TransformersMultiModalForSequenceClassification": ( |
| 440 | + "transformers", |
| 441 | + "TransformersMultiModalForSequenceClassification", |
430 | 442 | ), |
431 | 443 | } |
432 | 444 |
|
|
0 commit comments