zeio committed
Commit 7d05f73
1 Parent(s): b56465e

feat(pytorch): added pytorch model

Files changed (4):
  1. config.json +14 -23
  2. pytorch_model.bin +3 -0
  3. tokenizer.model +2 -2
  4. tokenizer_config.json +5 -50
config.json CHANGED
@@ -1,25 +1,16 @@
 {
-  "_name_or_path": "imone/Mistral_7B_with_EOT_token",
-  "architectures": [
-    "MistralForCausalLM"
-  ],
-  "bos_token_id": 1,
-  "eos_token_id": 32000,
-  "hidden_act": "silu",
-  "hidden_size": 4096,
-  "initializer_range": 0.02,
+  "architecture": "llama",
+  "block_size": 8192,
+  "vocab_size": 32002,
+  "n_layer": 32,
+  "n_head": 32,
+  "dim": 4096,
   "intermediate_size": 14336,
-  "max_position_embeddings": 8192,
-  "model_type": "mistral",
-  "num_attention_heads": 32,
-  "num_hidden_layers": 32,
-  "num_key_value_heads": 8,
-  "rms_norm_eps": 1e-05,
-  "rope_theta": 10000.0,
-  "sliding_window": 4096,
-  "tie_word_embeddings": false,
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.34.1",
-  "use_cache": true,
-  "vocab_size": 32002
-}
+  "hidden_act": "silu",
+  "rope_type": "norm",
+  "mlp_gate": true,
+  "layernorm": false,
+  "n_local_heads": 8,
+  "norm_eps": 9.999999747378752e-06,
+  "rope_base": 10000.0
+}
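The commit replaces the Hugging Face `transformers` config with a flat layout: `hidden_size` becomes `dim`, `num_hidden_layers` becomes `n_layer`, `num_key_value_heads` becomes `n_local_heads`, `max_position_embeddings` becomes `block_size`, `rms_norm_eps` becomes `norm_eps`, and `rope_theta` becomes `rope_base`. This resembles the flat `ModelArgs` style used by lightweight PyTorch inference codebases such as gpt-fast. A minimal sketch of how such a config might be consumed; the `ModelArgs` dataclass below is illustrative, not part of this commit:

```python
# Sketch (illustrative, not from this repository): read the flat
# config into a dataclass. Field names are taken from the diff above.
import json
from dataclasses import dataclass

@dataclass
class ModelArgs:
    architecture: str
    block_size: int        # maximum sequence length
    vocab_size: int
    n_layer: int           # number of transformer blocks
    n_head: int            # attention heads
    dim: int               # hidden size
    intermediate_size: int
    hidden_act: str
    rope_type: str
    mlp_gate: bool
    layernorm: bool        # false here, i.e. RMSNorm rather than LayerNorm
    n_local_heads: int     # key/value heads (grouped-query attention)
    norm_eps: float
    rope_base: float

with open("config.json") as f:
    args = ModelArgs(**json.load(f))

assert args.dim % args.n_head == 0  # head_dim = 4096 / 32 = 128
```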
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e2f2dc7a51f04dd8e1cdd20cb409a2877f31c914a8c1e6ded3bbefc34b82c791
+size 7695315862
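What is committed is a Git LFS pointer, not the weights themselves: `oid` is the SHA-256 of the actual `pytorch_model.bin` and `size` is its byte count (about 7.7 GB). A small sketch for verifying a downloaded copy against this pointer:

```python
# Sketch (not part of the commit): verify a downloaded
# pytorch_model.bin against the LFS pointer above.
import hashlib
import os

EXPECTED_OID = "e2f2dc7a51f04dd8e1cdd20cb409a2877f31c914a8c1e6ded3bbefc34b82c791"
EXPECTED_SIZE = 7695315862  # bytes, ~7.7 GB

def sha256_of(path: str, chunk_size: int = 1 << 20) -> str:
    """Stream the file in 1 MiB chunks so it never sits fully in memory."""
    h = hashlib.sha256()
    with open(path, "rb") as f:
        while chunk := f.read(chunk_size):
            h.update(chunk)
    return h.hexdigest()

path = "pytorch_model.bin"
assert os.path.getsize(path) == EXPECTED_SIZE, "size mismatch"
assert sha256_of(path) == EXPECTED_OID, "checksum mismatch"
```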
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
-size 493443
+oid sha256:59f006be56d8a743f6d39f22abe25d3e6556f95334953fe93ce038f54957470f
+size 556731
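The tokenizer blob itself was swapped out (new checksum, 493,443 → 556,731 bytes). For Llama/Mistral-family checkpoints, `tokenizer.model` is normally a SentencePiece model; a sketch for inspecting it, assuming that format holds here:

```python
# Sketch: inspect the updated tokenizer, assuming it is a SentencePiece
# model as is usual for Llama/Mistral checkpoints (the diff only shows
# the LFS pointer changing, so the format is an assumption).
from sentencepiece import SentencePieceProcessor

sp = SentencePieceProcessor(model_file="tokenizer.model")
print(sp.vocab_size())             # base vocab; config.json declares 32002 incl. added tokens
print(sp.encode("Hello, world!"))  # -> list of token ids
```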
tokenizer_config.json CHANGED
@@ -1,62 +1,17 @@
 {
+  "bos_token": "<s>",
+  "eos_token": "<|end_of_turn|>",
+  "unk_token": "<unk>",
   "add_bos_token": true,
   "add_eos_token": false,
   "added_tokens_decoder": {
-    "0": {
-      "content": "<unk>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
     "1": {
       "content": "<s>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
       "special": true
     },
     "2": {
       "content": "</s>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "32000": {
-      "content": "<|end_of_turn|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "32001": {
-      "content": "<|pad_0|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
       "special": true
     }
-  },
-  "additional_special_tokens": [
-    "<|end_of_turn|>",
-    "<|pad_0|>"
-  ],
-  "bos_token": "<s>",
-  "chat_template": "{{ bos_token }}{% for message in messages %}{{ 'GPT4 Correct ' + message['role'].title() + ': ' + message['content'] + '<|end_of_turn|>'}}{% endfor %}{% if add_generation_prompt %}{{ 'GPT4 Correct Assistant:' }}{% endif %}",
-  "clean_up_tokenization_spaces": false,
-  "eos_token": "<|end_of_turn|>",
-  "legacy": true,
-  "model_max_length": 1000000000000000019884624838656,
-  "pad_token": null,
-  "sp_model_kwargs": {},
-  "spaces_between_special_tokens": false,
-  "tokenizer_class": "LlamaTokenizer",
-  "unk_token": "<unk>",
-  "use_default_system_prompt": true
-}
+  }
+}
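Note that this commit also drops the `chat_template` (the OpenChat "GPT4 Correct" format) and the `<|end_of_turn|>` / `<|pad_0|>` entries from `added_tokens_decoder`, even though `<|end_of_turn|>` remains the declared `eos_token`, so prompt formatting now has to happen outside the tokenizer config. For reference, a plain-Python rendering of the removed Jinja template:

```python
# Sketch: plain-Python equivalent of the chat_template removed in this
# commit (the "GPT4 Correct" format shown in the old config above).
def render(messages, add_generation_prompt=True, bos_token="<s>"):
    out = bos_token
    for m in messages:
        out += f"GPT4 Correct {m['role'].title()}: {m['content']}<|end_of_turn|>"
    if add_generation_prompt:
        out += "GPT4 Correct Assistant:"
    return out

print(render([{"role": "user", "content": "Hi!"}]))
# <s>GPT4 Correct User: Hi!<|end_of_turn|>GPT4 Correct Assistant:
```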