p208p2002 committed on
Commit
706d7c5
1 Parent(s): 8b18fe7
config.json CHANGED
@@ -13,11 +13,15 @@
13
  "model_type": "llama",
14
  "num_attention_heads": 12,
15
  "num_hidden_layers": 12,
 
16
  "pad_token_id": 0,
 
17
  "rms_norm_eps": 1e-06,
 
 
18
  "tie_word_embeddings": false,
19
  "torch_dtype": "float32",
20
- "transformers_version": "4.28.1",
21
  "use_cache": true,
22
  "vocab_size": 32000
23
  }
 
13
  "model_type": "llama",
14
  "num_attention_heads": 12,
15
  "num_hidden_layers": 12,
16
+ "num_key_value_heads": 12,
17
  "pad_token_id": 0,
18
+ "pretraining_tp": 1,
19
  "rms_norm_eps": 1e-06,
20
+ "rope_scaling": null,
21
+ "rope_theta": 10000.0,
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "float32",
24
+ "transformers_version": "4.33.2",
25
  "use_cache": true,
26
  "vocab_size": 32000
27
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.28.1"
7
  }
 
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.33.2"
7
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d9e5b44f147b96f452cffb8a6ae0f0f43dfadcd14a530f2af9db23b08b1337a
3
- size 479841145
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8502db988d77aeaa3b6ac39557e536f6eafe9d1291bdb86e9812f06470cef255
3
+ size 479835785
tokenizer.json CHANGED
@@ -77,10 +77,16 @@
77
  "type_id": 0
78
  }
79
  },
 
 
 
 
 
 
80
  {
81
  "Sequence": {
82
  "id": "B",
83
- "type_id": 0
84
  }
85
  }
86
  ],
 
77
  "type_id": 0
78
  }
79
  },
80
+ {
81
+ "SpecialToken": {
82
+ "id": "<s>",
83
+ "type_id": 1
84
+ }
85
+ },
86
  {
87
  "Sequence": {
88
  "id": "B",
89
+ "type_id": 1
90
  }
91
  }
92
  ],
tokenizer_config.json CHANGED
@@ -1,6 +1,4 @@
1
  {
2
- "add_bos_token": true,
3
- "add_eos_token": false,
4
  "bos_token": {
5
  "__type": "AddedToken",
6
  "content": "<s>",
@@ -29,5 +27,6 @@
29
  "normalized": true,
30
  "rstrip": false,
31
  "single_word": false
32
- }
 
33
  }
 
1
  {
 
 
2
  "bos_token": {
3
  "__type": "AddedToken",
4
  "content": "<s>",
 
27
  "normalized": true,
28
  "rstrip": false,
29
  "single_word": false
30
+ },
31
+ "use_default_system_prompt": true
32
  }