smallsuper committed on
Commit
23a03f3
·
verified ·
1 Parent(s): 8c5349e

Upload 10 files

Browse files
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_name_or_path": "TinyLlama/TinyLlama-1.1B-intermediate-step-955k-token-2T",
3
  "architectures": [
4
- "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
@@ -22,7 +22,7 @@
22
  "rope_theta": 10000.0,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
- "transformers_version": "4.37.2",
26
  "use_cache": true,
27
  "vocab_size": 32000
28
  }
 
1
  {
2
  "_name_or_path": "TinyLlama/TinyLlama-1.1B-intermediate-step-955k-token-2T",
3
  "architectures": [
4
+ "LlamaModel"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
 
22
  "rope_theta": 10000.0,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.39.3",
26
  "use_cache": true,
27
  "vocab_size": 32000
28
  }
loftq_init/README.md CHANGED
@@ -201,4 +201,4 @@ Carbon emissions can be estimated using the [Machine Learning Impact calculator]
201
 
202
  ### Framework versions
203
 
204
- - PEFT 0.8.2
 
201
 
202
  ### Framework versions
203
 
204
+ - PEFT 0.10.0
loftq_init/adapter_config.json CHANGED
@@ -1,18 +1,19 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "./model_zoo/loftq/TinyLlama-1.1B-intermediate-step-955k-token-2T-2bit-32rank",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
  "init_lora_weights": true,
 
9
  "layers_pattern": null,
10
  "layers_to_transform": null,
11
  "loftq_config": {
12
- "loftq_bits": 2,
13
- "loftq_iter": 1
14
  },
15
- "lora_alpha": 32,
16
  "lora_dropout": 0.1,
17
  "megatron_config": null,
18
  "megatron_core": "megatron.core",
@@ -22,14 +23,15 @@
22
  "rank_pattern": {},
23
  "revision": null,
24
  "target_modules": [
25
- "v_proj",
26
- "down_proj",
27
- "k_proj",
28
- "o_proj",
29
  "up_proj",
 
30
  "gate_proj",
31
- "q_proj"
 
 
 
32
  ],
33
- "task_type": "CAUSAL_LM",
 
34
  "use_rslora": false
35
  }
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "model/TinyLlama-1.1B-intermediate-step-955k-token-2T-4bit-32rank",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
8
  "init_lora_weights": true,
9
+ "layer_replication": null,
10
  "layers_pattern": null,
11
  "layers_to_transform": null,
12
  "loftq_config": {
13
+ "loftq_bits": 4,
14
+ "loftq_iter": 5
15
  },
16
+ "lora_alpha": 16,
17
  "lora_dropout": 0.1,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
 
 
 
26
  "up_proj",
27
+ "v_proj",
28
  "gate_proj",
29
+ "o_proj",
30
+ "k_proj",
31
+ "q_proj",
32
+ "down_proj"
33
  ],
34
+ "task_type": "FEATURE_EXTRACTION",
35
+ "use_dora": false,
36
  "use_rslora": false
37
  }
loftq_init/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6998c79c86a7f55e325290220aa34b178ff38d3c609b0539856077dcd0418a75
3
- size 50569626
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca4828527e72c13b096312181fc2540a0746f73c8040c0f6bf80dc56ebf79895
3
+ size 50567834
loftq_init/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21f195928f9255a4060fd7d29ea61e5dd07751f12e81ddcd1e7a22e9352a6a85
3
- size 50503848
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c01262a21ac913f1e6039f23e4ea0d0b26f70a995617bca32641cb9041102249
3
+ size 50502000
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d72c89fa2c153a8e77c34b2e6bafca749e40d5b75832ff046ad061f7fd048ac
3
- size 2200119864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46388a7344044c733d14289b9398c8e5e8f55d0c6d5f62fcc0d1f46eac4fae5d
3
+ size 2069046544
tokenizer_config.json CHANGED
@@ -35,6 +35,7 @@
35
  "pad_token": null,
36
  "padding_side": "right",
37
  "sp_model_kwargs": {},
 
38
  "tokenizer_class": "LlamaTokenizer",
39
  "unk_token": "<unk>",
40
  "use_default_system_prompt": false
 
35
  "pad_token": null,
36
  "padding_side": "right",
37
  "sp_model_kwargs": {},
38
+ "task_type": "feature_extraction",
39
  "tokenizer_class": "LlamaTokenizer",
40
  "unk_token": "<unk>",
41
  "use_default_system_prompt": false