From 47d7e6ea37bfd7f8d519e8632dabe2dc87fee72a Mon Sep 17 00:00:00 2001 From: Main Date: Sat, 19 Oct 2024 18:12:35 +0000 Subject: [PATCH] v13 --- app/models/qwen.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/app/models/qwen.py b/app/models/qwen.py index 219af6f..4b3de92 100644 --- a/app/models/qwen.py +++ b/app/models/qwen.py @@ -25,7 +25,7 @@ class Qwen(BaseModel): self.model = AutoModelForCausalLM.from_pretrained( model_path, torch_dtype=torch.float16, - # quantization_config=quantization_config, + quantization_config=quantization_config, device_map="auto", # low_cpu_mem_usage=True )