Fix safetensors kwarg usage in AutoAWQ

2024-10-01 01:26:03 -04:00 · 2023-10-10 19:03:09 -07:00 · 2023-10-10 19:03:09 -07:00 · f63361568c
commit f63361568c
parent 39f16ff83d
1 changed files with 13 additions and 13 deletions
--- a/modules/models.py
+++ b/modules/models.py
@@ -277,24 +277,24 @@ def ctransformers_loader(model_name):
    model, tokenizer = ctrans.from_pretrained(model_file)
    return model, tokenizer
 def AutoAWQ_loader(model_name):
-   from awq import AutoAWQForCausalLM
+    from awq import AutoAWQForCausalLM
-   model_dir = Path(f'{shared.args.model_dir}/{model_name}')
+    model_dir = Path(f'{shared.args.model_dir}/{model_name}')
-   if shared.args.deepspeed:
+    model = AutoAWQForCausalLM.from_quantized(
-       logger.warn("AutoAWQ is incompatible with deepspeed")
+                quant_path=model_dir,
+                max_new_tokens=shared.args.max_seq_len,
+                trust_remote_code=shared.args.trust_remote_code,
+                fuse_layers=not shared.args.no_inject_fused_attention,
+                max_memory=get_max_memory_dict(),
+                batch_size=shared.args.n_batch,
+                safetensors=any(model_dir.glob('*.safetensors')),
+            )
-   model = AutoAWQForCausalLM.from_quantized(
+    return model
-       quant_path=model_dir,
-       max_new_tokens=shared.args.max_seq_len,
-       trust_remote_code=shared.args.trust_remote_code,
-       fuse_layers=not shared.args.no_inject_fused_attention,
-       max_memory=get_max_memory_dict(),
-       batch_size=shared.args.n_batch,
-       safetensors=not shared.args.trust_remote_code)
-   return model
 def GPTQ_loader(model_name):