dyang415 committed on
Commit
a69b3aa
1 Parent(s): 195852c

Training in progress, epoch 0

Browse files
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "mistralai/Mixtral-8x7B-v0.1",
5
  "bias": "none",
6
  "fan_in_fan_out": null,
7
  "inference_mode": true,
@@ -19,10 +19,10 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "k_proj",
23
  "v_proj",
 
24
  "o_proj",
25
- "q_proj"
26
  ],
27
  "task_type": "CAUSAL_LM"
28
  }
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "mistralai/Mixtral-8x7B-Instruct-v0.1",
5
  "bias": "none",
6
  "fan_in_fan_out": null,
7
  "inference_mode": true,
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
22
  "v_proj",
23
+ "q_proj",
24
  "o_proj",
25
+ "k_proj"
26
  ],
27
  "task_type": "CAUSAL_LM"
28
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2e92d127847669a6d0d26e91056cea2134b7f6b0c2fa5db00d4b8074b8dbe8a
3
  size 27297032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:663a26f1f1a3b4fcfd581184eee642fd42fda734b67a37de0e0427b6782aa593
3
  size 27297032
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "mistralai/Mixtral-8x7B-v0.1",
3
  "architectures": [
4
  "MixtralForCausalLM"
5
  ],
 
1
  {
2
+ "_name_or_path": "mistralai/Mixtral-8x7B-Instruct-v0.1",
3
  "architectures": [
4
  "MixtralForCausalLM"
5
  ],
runs/Feb29_16-54-10_azure-jap/events.out.tfevents.1709225652.azure-jap.95906.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df6ae3d20bfd54d4a2789ce08479c8e2166a58c811cf9ded6be641706c491bc8
3
+ size 10584
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83ad7b64c51d461b9b4bb1de4956d35ef77a860375b5f95b565353c6148fd684
3
  size 4859
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c59c6a5f88064305dd076a6acaf260003a37a4382f71c6a289edbc23a6aece0
3
  size 4859