-
-
Notifications
You must be signed in to change notification settings - Fork 14.6k
Add Mistral Large 3 and Ministral 3 #29757
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
a4d3772
2ce6f4e
ad31919
ff4fd5c
cd27b30
51a5b0f
1a30121
c0d78d2
943e82f
397788d
e65b9af
4750d9f
1e7fdcc
e4ea260
0553462
ffaf85b
e74fdf8
a330734
52ef28a
efa0e6d
97a24fc
ce02e1f
09a8941
32f0bbc
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -358,6 +358,9 @@ def check_available_online( | |
| trust_remote_code=True, | ||
| ), | ||
| "MistralForCausalLM": _HfExamplesInfo("mistralai/Mistral-7B-Instruct-v0.1"), | ||
| "MistralLarge3ForCausalLM": _HfExamplesInfo( | ||
| "mistralai/Mistral-Large-3-675B-Instruct-2512-NVFP4", is_available_online=False | ||
| ), | ||
| "MixtralForCausalLM": _HfExamplesInfo( | ||
| "mistralai/Mixtral-8x7B-Instruct-v0.1", | ||
| {"tiny": "TitanML/tiny-mixtral"}, | ||
|
|
@@ -770,7 +773,13 @@ def check_available_online( | |
| ), | ||
| "PixtralForConditionalGeneration": _HfExamplesInfo( | ||
| "mistralai/Pixtral-12B-2409", | ||
| extras={ | ||
| "mistral-large-3": "mistralai/Mistral-Large-3-675B-Instruct-2512-NVFP4", | ||
| "ministral-3": "mistralai/Ministral-3-3B-Instruct-2512", | ||
| }, | ||
| tokenizer_mode="mistral", | ||
| # TODO: revert once Mistral-Large-3 and Ministral-3 are publicly available. | ||
| is_available_online=False, | ||
|
Comment on lines
+781
to
+782
Member
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. We should flip this before 0.12 goes out @khluu
Member
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. I think it's okay to leave this as is since we're cutting a branch today |
||
| ), | ||
| "QwenVLForConditionalGeneration": _HfExamplesInfo( | ||
| "Qwen/Qwen-VL", | ||
|
|
@@ -870,6 +879,11 @@ def check_available_online( | |
| use_original_num_layers=True, | ||
| max_model_len=10240, | ||
| ), | ||
| "EagleMistralLarge3ForCausalLM": _HfExamplesInfo( | ||
| "mistralai/Mistral-Large-3-675B-Instruct-2512", | ||
| speculative_model="mistralai/Mistral-Large-3-675B-Instruct-2512-Eagle", | ||
| is_available_online=False, | ||
| ), | ||
| "LlamaForCausalLMEagle3": _HfExamplesInfo( | ||
| "Qwen/Qwen3-8B", | ||
| trust_remote_code=True, | ||
|
|
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -80,7 +80,7 @@ def __init__(self, tokenizer: TokenizerLike): | |
| self.tool_call_regex = re.compile(r"\[{.*}\]", re.DOTALL) | ||
| if _is_fn_name_regex_support(self.model_tokenizer): | ||
| self.fn_name_regex = re.compile( | ||
| r"([a-zA-Z0-9_-]+)(\{[\s\S]*?\})(?=\s*$|,|\s)", re.DOTALL | ||
| r"([a-zA-Z0-9_-]+)(\{[\s\S]*?\})(?=\s*$|,|\s)?", re.DOTALL | ||
|
Contributor
Author
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Had to add this to make sure tool calls worked as expected for some examples; I will rerun some experiments to check that I didn't break anything there, as we didn't author this.
Contributor
Author
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Looks good on the examples I launched, so this looks benign |
||
| ) | ||
| else: | ||
| self.fn_name_regex = None | ||
|
|
||
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
lmk @mgoin if this is what you had in mind here.