Update README.md
Browse files
README.md
CHANGED
@@ -14,27 +14,28 @@ This is a fine-tuned version of LLAMA2 (7b) trained on spider, sql-create-context
|
|
14 |
|
15 |
To initialize the model:
|
16 |
|
17 |
-
|
|
|
18 |
load_in_4bit=use_4bit,
|
19 |
bnb_4bit_quant_type=bnb_4bit_quant_type,
|
20 |
bnb_4bit_compute_dtype=compute_dtype,
|
21 |
bnb_4bit_use_double_quant=use_nested_quant,
|
22 |
)
|
23 |
|
24 |
-
model = AutoModelForCausalLM.from_pretrained(
|
25 |
model_name,
|
26 |
quantization_config=bnb_config,
|
27 |
device_map=device_map,
|
28 |
trust_remote_code=True
|
29 |
)
|
30 |
-
|
31 |
|
32 |
Use the tokenizer:
|
33 |
|
34 |
|
35 |
-
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
|
36 |
-
tokenizer.pad_token = tokenizer.eos_token
|
37 |
-
tokenizer.padding_side = "right"
|
38 |
|
39 |
To get the prompt:
|
40 |
dataset = dataset.map(
|
|
|
14 |
|
15 |
To initialize the model:
|
16 |
|
17 |
+
|
18 |
+
bnb_config = BitsAndBytesConfig(
|
19 |
load_in_4bit=use_4bit,
|
20 |
bnb_4bit_quant_type=bnb_4bit_quant_type,
|
21 |
bnb_4bit_compute_dtype=compute_dtype,
|
22 |
bnb_4bit_use_double_quant=use_nested_quant,
|
23 |
)
|
24 |
|
25 |
+
model = AutoModelForCausalLM.from_pretrained(
|
26 |
model_name,
|
27 |
quantization_config=bnb_config,
|
28 |
device_map=device_map,
|
29 |
trust_remote_code=True
|
30 |
)
|
31 |
+
|
32 |
|
33 |
Use the tokenizer:
|
34 |
|
35 |
|
36 |
+
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
|
37 |
+
tokenizer.pad_token = tokenizer.eos_token
|
38 |
+
tokenizer.padding_side = "right"
|
39 |
|
40 |
To get the prompt:
|
41 |
dataset = dataset.map(
|