Skip to content

Commit

Permalink
Add Mistral-Large-Instruct-2411 (#1876)
Browse files Browse the repository at this point in the history
  • Loading branch information
ysjprojects authored Dec 21, 2024
1 parent 7b26d35 commit 7e12d64
Show file tree
Hide file tree
Showing 2 changed files with 21 additions and 0 deletions.
20 changes: 20 additions & 0 deletions litgpt/config.py
Original file line number Diff line number Diff line change
Expand Up @@ -1663,6 +1663,26 @@ def norm_class(self) -> Type:
intermediate_size=28672,
)
)
# Register the Mistral-Large-Instruct-2411 entry (Hugging Face org "mistralai").
# Reference: https://huggingface.co/mistralai/Mistral-Large-Instruct-2411/blob/main/config.json
# NOTE(review): the values below are presumably transcribed from the linked
# config.json -- confirm block_size and whether a non-default RoPE base is
# required before relying on long-context behaviour.
configs.append(
    {
        "name": "Mistral-Large-Instruct-2411",
        "hf_config": {"org": "mistralai", "name": "Mistral-Large-Instruct-2411"},
        "padded_vocab_size": 32768,
        "block_size": 32768,
        "n_layer": 88,
        "n_head": 96,
        "n_embd": 12288,
        "n_query_groups": 8,
        "rotary_percentage": 1.0,
        "parallel_residual": False,
        "bias": False,
        "norm_class_name": "RMSNorm",
        "norm_eps": 1e-05,
        "mlp_class_name": "LLaMAMLP",
        "intermediate_size": 28672,
    }
)


############
Expand Down
1 change: 1 addition & 0 deletions tutorials/download_model_weights.md
Original file line number Diff line number Diff line change
Expand Up @@ -171,6 +171,7 @@ mistralai/Mistral-7B-Instruct-v0.3
mistralai/Mistral-7B-v0.1
mistralai/Mistral-7B-v0.3
mistralai/Mistral-Large-Instruct-2407
mistralai/Mistral-Large-Instruct-2411
mistralai/Mixtral-8x7B-Instruct-v0.1
mistralai/Mixtral-8x7B-v0.1
mistralai/Mixtral-8x22B-Instruct-v0.1
Expand Down

0 comments on commit 7e12d64

Please sign in to comment.