Pārlūkot izejas kodu

no_split_module_classes not needed

81300 3 gadi atpakaļ
vecāks
revīzija
c515282f5c
1 mainīts fails ar 1 papildinājumu un 1 dzēšanu
  1. 1 1
      server.py

+ 1 - 1
server.py

@@ -178,7 +178,7 @@ def load_model(model_name):
 
 
     # DeepSpeed ZeRO-3
     # DeepSpeed ZeRO-3
     elif args.deepspeed:
     elif args.deepspeed:
-        model = AutoModelForCausalLM.from_pretrained(Path(f"models/{model_name}", no_split_module_classes=["GPTJBlock"]))
+        model = AutoModelForCausalLM.from_pretrained(Path(f"models/{model_name}"))
         model = deepspeed.initialize(model=model,
         model = deepspeed.initialize(model=model,
                                      config_params=ds_config,
                                      config_params=ds_config,
                                      model_parameters=None,
                                      model_parameters=None,