Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -104,6 +104,7 @@ model = AutoModelForCausalLM.from_pretrained(
|
|
104 |
device_map="auto",
|
105 |
#quantization_config=quantization_config,
|
106 |
attn_implementation="flash_attention_2",
|
|
|
107 |
)
|
108 |
|
109 |
# Create Gradio interface
|
|
|
104 |
device_map="auto",
|
105 |
#quantization_config=quantization_config,
|
106 |
attn_implementation="flash_attention_2",
|
107 |
+
dtype=torch.bfloat16
|
108 |
)
|
109 |
|
110 |
# Create Gradio interface
|