From c515282f5c844670e712cc3d793d513271f797d4 Mon Sep 17 00:00:00 2001 From: 81300 <105078168+81300@users.noreply.github.com> Date: Wed, 1 Feb 2023 19:47:26 +0200 Subject: [PATCH] no_split_module_classes not needed --- server.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/server.py b/server.py index 844d5e66..692c84b9 100644 --- a/server.py +++ b/server.py @@ -178,7 +178,7 @@ def load_model(model_name): # DeepSpeed ZeRO-3 elif args.deepspeed: - model = AutoModelForCausalLM.from_pretrained(Path(f"models/{model_name}", no_split_module_classes=["GPTJBlock"])) + model = AutoModelForCausalLM.from_pretrained(Path(f"models/{model_name}")) model = deepspeed.initialize(model=model, config_params=ds_config, model_parameters=None,