Compare commits
1 Commits
state_as_f
...
new-qwop
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
8781c84287 |
@@ -15,7 +15,7 @@ from modelutils import find_layers
|
||||
from quant import make_quant
|
||||
|
||||
|
||||
def _load_quant(model, checkpoint, wbits, groupsize=-1, faster_kernel=False, exclude_layers=['lm_head'], kernel_switch_threshold=128):
|
||||
def _load_quant(model, checkpoint, wbits, groupsize=-1, exclude_layers=['lm_head']):
|
||||
config = AutoConfig.from_pretrained(model)
|
||||
def noop(*args, **kwargs):
|
||||
pass
|
||||
@@ -33,16 +33,16 @@ def _load_quant(model, checkpoint, wbits, groupsize=-1, faster_kernel=False, exc
|
||||
for name in exclude_layers:
|
||||
if name in layers:
|
||||
del layers[name]
|
||||
make_quant(model, layers, wbits, groupsize, faster=faster_kernel, kernel_switch_threshold=kernel_switch_threshold)
|
||||
make_quant(model, layers, wbits, groupsize)
|
||||
|
||||
del layers
|
||||
|
||||
print('Loading model ...')
|
||||
if checkpoint.endswith('.safetensors'):
|
||||
from safetensors.torch import load_file as safe_load
|
||||
model.load_state_dict(safe_load(checkpoint))
|
||||
model.load_state_dict(safe_load(checkpoint), strict = False)
|
||||
else:
|
||||
model.load_state_dict(torch.load(checkpoint))
|
||||
model.load_state_dict(torch.load(checkpoint), strict = False)
|
||||
model.seqlen = 2048
|
||||
print('Done.')
|
||||
|
||||
@@ -110,8 +110,7 @@ def load_quantized(model_name):
|
||||
if shared.args.pre_layer:
|
||||
model = load_quant(str(path_to_model), str(pt_path), shared.args.wbits, shared.args.groupsize, shared.args.pre_layer)
|
||||
else:
|
||||
threshold = False if model_type == 'gptj' else 128
|
||||
model = load_quant(str(path_to_model), str(pt_path), shared.args.wbits, shared.args.groupsize, kernel_switch_threshold=threshold)
|
||||
model = load_quant(str(path_to_model), str(pt_path), shared.args.wbits, shared.args.groupsize)
|
||||
|
||||
# accelerate offload (doesn't work properly)
|
||||
if shared.args.gpu_memory:
|
||||
|
||||
Reference in New Issue
Block a user