Skip to content

Commit 7607d80

Browse files
Add AutoTokenizer mapping for mistral3 and ministral (#42198)
* WIP
* WIP
1 parent 32a58e3 commit 7607d80

File tree

1 file changed

+18
-0
lines changed

1 file changed

+18
-0
lines changed

src/transformers/models/auto/tokenization_auto.py

Lines changed: 18 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -442,6 +442,15 @@
442442
"GPT2TokenizerFast" if is_tokenizers_available() else None,
443443
),
444444
),
445+
(
446+
"ministral",
447+
(
448+
"MistralCommonTokenizer"
449+
if is_mistral_common_available()
450+
else ("LlamaTokenizer" if is_sentencepiece_available() else None),
451+
"LlamaTokenizerFast" if is_tokenizers_available() and not is_mistral_common_available() else None,
452+
),
453+
),
445454
(
446455
"mistral",
447456
(
@@ -451,6 +460,15 @@
451460
"LlamaTokenizerFast" if is_tokenizers_available() and not is_mistral_common_available() else None,
452461
),
453462
),
463+
(
464+
"mistral3",
465+
(
466+
"MistralCommonTokenizer"
467+
if is_mistral_common_available()
468+
else ("LlamaTokenizer" if is_sentencepiece_available() else None),
469+
"LlamaTokenizerFast" if is_tokenizers_available() and not is_mistral_common_available() else None,
470+
),
471+
),
454472
(
455473
"mixtral",
456474
(

0 commit comments

Comments (0)