diff --git a/src/build_model.py b/src/build_model.py
index 12bfa0c..bebd73c 100644
--- a/src/build_model.py
+++ b/src/build_model.py
@@ -168,9 +168,10 @@ def build_model(
     quant_config: QuantConfig,
     offload_config: OffloadConfig,
     state_path: str,
+    # Defaults to the checkpoint that used to be hard-coded in the body, so existing callers keep working.
+    model_name: str = "mistralai/Mixtral-8x7B-Instruct-v0.1",
 ):
-    model_name = "mistralai/Mixtral-8x7B-Instruct-v0.1"
 
     state_dict_00 = load_00_expert_state_dict(state_path, device)
 
     def _make_module():