nm-autobot committed
Commit 5289db3
Parent: 25b8339

Upload folder using huggingface_hub

config.json CHANGED
@@ -51,7 +51,7 @@
     "quantization_status": "compressed",
     "sparsity_config": {
       "format": "dense",
-      "global_sparsity": 0.14375328644374685,
+      "global_sparsity": 0.14329888201729718,
       "ignore": [],
       "registry_requires_subclass": false,
       "sparsity_structure": "unstructured",
@@ -63,7 +63,7 @@
   "rope_theta": 10000.0,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.46.3",
+  "transformers_version": "4.47.0",
   "use_cache": true,
   "vocab_size": 32000
 }
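The substantive change here is the recomputed global_sparsity; the transformers_version bump just reflects the tooling used for the re-upload. global_sparsity reports the fraction of zero-valued parameter elements; below is a minimal sketch of that definition over a safetensors file. Note this is a sketch of the metric only: the checkpoint stores packed W4A16 weights, so the on-disk tensors will not reproduce the pre-compression figure exactly.

# Rough illustration of global_sparsity as the fraction of zero-valued
# elements across all tensors in a safetensors file. Only indicative for
# this repo, since the stored weights are already compressed.
from safetensors import safe_open

zeros, total = 0, 0
with safe_open("model.safetensors", framework="pt") as f:
    for name in f.keys():
        t = f.get_tensor(name)
        zeros += int((t == 0).sum())
        total += t.numel()

print(f"fraction of zero elements: {zeros / total:.6f}")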
generation_config.json CHANGED
@@ -3,5 +3,5 @@
   "eos_token_id": 2,
   "max_length": 2048,
   "pad_token_id": 0,
-  "transformers_version": "4.46.3"
+  "transformers_version": "4.47.0"
 }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:892873b79abcf66508b526a74179177e303de9b4b1464a6177096348faa7fd76
+oid sha256:f3c99c37708043eee70aa1961dcda6621a800fe68feaa47f280f1083e5b2a53f
 size 761968800
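Only the LFS oid changes; the payload size is byte-identical. The oid in a git-lfs pointer is the SHA-256 digest of the file contents, so a downloaded file can be checked directly against the pointer:

# Verify a downloaded model.safetensors against its git-lfs pointer:
# the pointer's oid is the SHA-256 digest of the actual file contents.
import hashlib

def file_sha256(path: str, chunk_size: int = 1 << 20) -> str:
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(chunk_size), b""):
            h.update(chunk)
    return h.hexdigest()

expected = "f3c99c37708043eee70aa1961dcda6621a800fe68feaa47f280f1083e5b2a53f"
assert file_sha256("model.safetensors") == expected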
recipe.yaml CHANGED
@@ -1,6 +1,6 @@
 DEFAULT_stage:
   DEFAULT_modifiers:
     GPTQModifier:
+      scheme: W4A16
       targets: Linear
       ignore: [lm_head]
-      scheme: W4A16
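The diff only reorders keys: scheme: W4A16 moves above targets/ignore, and the GPTQ recipe itself is unchanged. For context, a recipe of this shape is consumed by llm-compressor's one-shot path; a hedged sketch follows, assuming the llmcompressor package's oneshot entry point, with model and calibration dataset names as placeholders rather than values taken from this repo:

# Sketch only: applying a GPTQ W4A16 recipe with llm-compressor.
# The recipe string mirrors recipe.yaml; model/dataset names are placeholders.
from llmcompressor.transformers import oneshot

recipe = """
DEFAULT_stage:
  DEFAULT_modifiers:
    GPTQModifier:
      scheme: W4A16
      targets: Linear
      ignore: [lm_head]
"""

oneshot(
    model="TinyLlama/TinyLlama-1.1B-Chat-v1.0",  # placeholder base model
    dataset="open_platypus",                     # placeholder calibration set
    recipe=recipe,
    max_seq_length=2048,
    num_calibration_samples=512,
    output_dir="./model-w4a16",
)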
tokenizer_config.json CHANGED
@@ -32,6 +32,7 @@
   "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "</s>",
+  "extra_special_tokens": {},
   "legacy": false,
   "model_max_length": 2048,
   "pad_token": "</s>",