jaymojnidar committed on
Commit
5bfa3aa
1 Parent(s): 1cb615a

trying out the sharded version

Browse files
Files changed (1) hide show
  1. model.py +2 -1
model.py CHANGED
@@ -7,7 +7,8 @@ from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer, TextIt
7
  from huggingface_hub import login
8
 
9
  # model_id = 'meta-llama/Llama-2-13b-chat-hf'
10
- model_id = 'meta-llama/Llama-2-7b-chat-hf'
 
11
 
12
  if torch.cuda.is_available():
13
  tok = os.environ['HF_TOKEN']
 
7
  from huggingface_hub import login
8
 
9
  # model_id = 'meta-llama/Llama-2-13b-chat-hf'
10
+ #model_id = 'meta-llama/Llama-2-7b-chat-hf'
11
+ model_id = 'Trelis/Llama-2-7b-chat-hf-sharded-bf16'
12
 
13
  if torch.cuda.is_available():
14
  tok = os.environ['HF_TOKEN']