robinhad committed on
Commit
d6b4766
·
verified ·
1 Parent(s): 156f98f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -23,10 +23,10 @@ quant_config = BitsAndBytesConfig(
23
  tokenizer = LlamaTokenizer.from_pretrained(model_name)
24
  model = LlamaForCausalLM.from_pretrained(
25
  model_name,
26
- #quantization_config=quant_config
27
  )
28
 
29
- model = PeftModel.from_pretrained(model, lora_name, torch_device="cpu")
30
 
31
  model = model.to("cuda")
32
 
 
23
  tokenizer = LlamaTokenizer.from_pretrained(model_name)
24
  model = LlamaForCausalLM.from_pretrained(
25
  model_name,
26
+ quantization_config=quant_config
27
  )
28
 
29
+ model = PeftModel.from_pretrained(model, lora_name)
30
 
31
  model = model.to("cuda")
32