oobabooga 2 года назад
Родитель
Commit
706a03b2cb
2 изменённых файла: 3 добавлено и 17 удалено
  1. 3 5
      modules/models.py
  2. 0 12
      presets/LLaMA-Default.txt

+ 3 - 5
modules/models.py

@@ -104,13 +104,11 @@ def load_model(model_name):
         elif path_to_model.name.lower().startswith('llama-65b'):
             pt_model = 'llama-65b-4bit.pt'
         else:
-            print(f"Could not find the .pt model for {model_name}, exiting...")
-            exit()
+            pt_model = f'{model_name}-4bit.pt'
 
-        # check root of models folder, and model path root
-        paths = [  f"{path_to_model}/{pt_model}", f"models/{pt_model}" ]
+        # Try to find the .pt both in models/ and in the subfolder
         pt_path = None
-        for path in [ Path(p) for p in paths ]:
+        for path in [Path(p) for p in [f"models/{pt_model}", f"{path_to_model}/{pt_model}"]]:
             if path.exists():
                 pt_path = path
 

+ 0 - 12
presets/LLaMA-Default.txt

@@ -1,12 +0,0 @@
-do_sample=False
-temperature=0.7
-top_p=0
-typical_p=1
-repetition_penalty=1.15
-top_k=40
-num_beams=1
-penalty_alpha=0
-min_length=0
-length_penalty=1
-no_repeat_ngram_size=0
-early_stopping=True