zhaozitian committed on
Commit
23063a1
1 Parent(s): a1fbbe4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -27,7 +27,7 @@ except:
27
  if device == "cuda":
28
  model = LlamaForCausalLM.from_pretrained(
29
  BASE_MODEL,
30
- load_in_8bit=False,
31
  torch_dtype=torch.float16,
32
  device_map="auto",
33
  )
@@ -72,7 +72,8 @@ def generate_prompt(instruction, input=None):
72
  ### Response:"""
73
 
74
  if device != "cpu":
75
- model.half()
 
76
  model.eval()
77
  if torch.__version__ >= "2":
78
  model = torch.compile(model)
 
27
  if device == "cuda":
28
  model = LlamaForCausalLM.from_pretrained(
29
  BASE_MODEL,
30
+ load_in_8bit=True,
31
  torch_dtype=torch.float16,
32
  device_map="auto",
33
  )
 
72
  ### Response:"""
73
 
74
  if device != "cpu":
75
+ pass
76
+ #model.half()
77
  model.eval()
78
  if torch.__version__ >= "2":
79
  model = torch.compile(model)