anslin-raj's picture
Update README.md
f01a66e
|
raw
history blame
369 Bytes
metadata
license: cc-by-nc-4.0
language:
  - en
library_name: transformers
# Usage example: load the 8-bit quantized Llama-2-7b-chat checkpoint and its
# tokenizer from the Hugging Face Hub.
from transformers import AutoTokenizer, AutoModelForCausalLM

HF_MODEL_REPO = "anslin-raj/Llama-2-7b-chat-hf-8-bit"

# Placement strategy handed to `device_map` below. "auto" lets the library
# decide where to put the weights; replace it with an explicit target such as
# "cuda:0" to pin the model to one device.
device = "auto"

# The tokenizer is loaded without any device argument: it holds no model
# weights, so placement only applies to the model below.
tokenizer = AutoTokenizer.from_pretrained(HF_MODEL_REPO)

# NOTE(review): `load_in_8bit=True` relies on the optional `bitsandbytes` and
# `accelerate` packages being installed - confirm against the installed
# transformers version, which may prefer an explicit quantization config.
model = AutoModelForCausalLM.from_pretrained(HF_MODEL_REPO, device_map=device, load_in_8bit=True)