binqiangliu committed on
Commit
dbb6c49
1 Parent(s): ab440a4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -35,7 +35,7 @@ def load_quantized_model(model_name: str):
35
  #bnb_4bit_use_double_quant=True,
36
  bnb_4bit_use_double_quant=False,
37
  bnb_4bit_quant_type="nf4",
38
- bnb_4bit_compute_dtype=torch.bfloat16
39
  )
40
 
41
  model = AutoModelForCausalLM.from_pretrained(
 
35
  #bnb_4bit_use_double_quant=True,
36
  bnb_4bit_use_double_quant=False,
37
  bnb_4bit_quant_type="nf4",
38
+ #bnb_4bit_compute_dtype=torch.bfloat16
39
  )
40
 
41
  model = AutoModelForCausalLM.from_pretrained(