bstraehle committed on
Commit
244ab57
1 Parent(s): 9625a05

Training in progress, step 1

Browse files
config.json CHANGED
@@ -1,16 +1,12 @@
1
  {
2
- "_name_or_path": "meta-llama/Meta-Llama-3.1-8B-Instruct",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
- "eos_token_id": [
10
- 128001,
11
- 128008,
12
- 128009
13
- ],
14
  "hidden_act": "silu",
15
  "hidden_size": 4096,
16
  "initializer_range": 0.02,
 
1
  {
2
+ "_name_or_path": "meta-llama/Meta-Llama-3.1-8B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
+ "eos_token_id": 128001,
 
 
 
 
10
  "hidden_act": "silu",
11
  "hidden_size": 4096,
12
  "initializer_range": 0.02,
model-00001-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e0c5179f6a0f6659b11c4ec1e0929c863acee319982d1dadc6fef10a393ac2a
3
  size 4886466168
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16d59efba58dce68f5268681c75754e0bd437c19d4515417f989a795e89c49af
3
  size 4886466168
model-00002-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a26040058026a6c614208bc7bf303236af4b1a19afd84084a5a34473b722a8e3
3
  size 4832007448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f604610bfc91adc42cd602ce63f1246dc0823f396708b8fdc9148f99acc6bffd
3
  size 4832007448
model-00003-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80b8ddbfd1eed67e2f9b220f1df577de69da14a3e665195f734dcedbf6883375
3
  size 4999813112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:364287fdee2fc229fb7ef73249b1c554eec5b49ebaaa5258c8a072344ab7284a
3
  size 4999813112
model-00004-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed15c0a1bdd1cefa7fea24f5501882a89d3566fe599c2624c331c3512bcf6c90
3
  size 4999813128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13a45ab992a1d2cf4dbd79231787d6265b466b113972262946eba4963cceefce
3
  size 4999813128
model-00005-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fc1c88984ffd545e0dc1c40ceec497b8ef57936e9ea1769ed4dca95bffc0f23
3
  size 4832007496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2949b7d26e22ed5720d6902cca5566c6ba8f9358dc77febe8292b1b82b18dcf5
3
  size 4832007496
model-00006-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:817de131f47f1cb5427f6274fb6cd4150d544296a93006deb2910da282eb91a6
3
  size 4999813120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95b9613ae2f1c34680e1fb79755b995ad190a8a6a033a061d0d8ca600c04a7c5
3
  size 4999813120
model-00007-of-00007.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a00db3d8defd4479be4e6c5288db021b0f1aab58467a51f701c424f1f6b229a7
3
  size 2571158184
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5af63c7b8068e15b5167439fbe4e8dc56d40d2006e60cf22107d9da86809d4be
3
  size 2571158184
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25024f1eb783a07b3c9ec25e3e2129648f4fde5ef22a43417121c1ca396e8ae9
3
- size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38255cda766a708a3a8d69e60e43ab91758f374ef5a0c4b5c19b09f3c182ca89
3
+ size 5368