mlabonne committed on
Commit 6d73c80 · 1 Parent(s): 40ad7d4

Update app.py

Files changed (1)
  1. app.py +2 -5
app.py CHANGED
@@ -4,6 +4,8 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
 from transformers import StoppingCriteria, StoppingCriteriaList, TextIteratorStreamer
 from threading import Thread
 
+torch.set_default_device("cuda")
+
 # Loading the tokenizer and model from Hugging Face's model hub.
 tokenizer = AutoTokenizer.from_pretrained(
     "mlabonne/phixtral-2x2_8",
@@ -16,11 +18,6 @@ model = AutoModelForCausalLM.from_pretrained(
     trust_remote_code=True
 )
 
-# using CUDA for an optimal experience
-device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
-model = model.to(device)
-
-
 # Defining a custom stopping criteria class for the model's text generation.
 class StopOnTokens(StoppingCriteria):
     def __call__(self, input_ids: torch.LongTensor, scores: torch.FloatTensor, **kwargs) -> bool:
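
For reference, a minimal sketch of what the loading path looks like after this commit. The from_pretrained keyword arguments are abbreviated here, the trust_remote_code=True on the tokenizer call is an assumption (the diff only shows it for the model), and torch.set_default_device requires PyTorch 2.0 or newer:

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

# With a default device set, newly created tensors and module parameters are
# allocated on the GPU, which is why the explicit model.to(device) call was removed.
torch.set_default_device("cuda")  # assumes a CUDA-capable GPU is available

tokenizer = AutoTokenizer.from_pretrained(
    "mlabonne/phixtral-2x2_8",
    trust_remote_code=True  # assumption: mirrors the model call shown in the diff
)
model = AutoModelForCausalLM.from_pretrained(
    "mlabonne/phixtral-2x2_8",
    trust_remote_code=True
)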