Make text generation work with the Ministral model. (#13395)

A template is still needed before text generation works properly.
2026-04-13 17:43:57 -07:00
parent 402ff1cdb7
commit 722bc73319
1 changed file with 2 additions and 1 deletion
@@ -82,6 +82,7 @@ class Ministral3_3BConfig:
    rope_scale = None
    final_norm: bool = True
    lm_head: bool = False
+    stop_tokens = [2]

@dataclass
 class Qwen25_3BConfig:
@@ -969,7 +970,7 @@ class Mistral3Small24B(BaseLlama, torch.nn.Module):
        self.model = Llama2_(config, device=device, dtype=dtype, ops=operations)
        self.dtype = dtype

-class Ministral3_3B(BaseLlama, torch.nn.Module):
+class Ministral3_3B(BaseLlama, BaseQwen3, BaseGenerate, torch.nn.Module):
    def __init__(self, config_dict, dtype, device, operations):
        super().__init__()
        config = Ministral3_3BConfig(**config_dict)