leonardlin committed on
Commit
fa53998
1 Parent(s): 8372256

Replace FP32 w/ BF16 weights

Browse files
This view is limited to 50 files because the commit contains too many changes. See raw diff
Files changed (50) hide show
  1. config.json +2 -2
  2. model-00001-of-00062.safetensors → model-00001-of-00030.safetensors +2 -2
  3. model-00002-of-00062.safetensors → model-00002-of-00030.safetensors +2 -2
  4. model-00003-of-00062.safetensors → model-00003-of-00030.safetensors +2 -2
  5. model-00004-of-00062.safetensors → model-00004-of-00030.safetensors +2 -2
  6. model-00005-of-00030.safetensors +3 -0
  7. model-00005-of-00062.safetensors +0 -3
  8. model-00006-of-00030.safetensors +3 -0
  9. model-00006-of-00062.safetensors +0 -3
  10. model-00007-of-00030.safetensors +3 -0
  11. model-00007-of-00062.safetensors +0 -3
  12. model-00008-of-00030.safetensors +3 -0
  13. model-00008-of-00062.safetensors +0 -3
  14. model-00009-of-00030.safetensors +3 -0
  15. model-00009-of-00062.safetensors +0 -3
  16. model-00010-of-00030.safetensors +3 -0
  17. model-00010-of-00062.safetensors +0 -3
  18. model-00011-of-00030.safetensors +3 -0
  19. model-00011-of-00062.safetensors +0 -3
  20. model-00012-of-00030.safetensors +3 -0
  21. model-00012-of-00062.safetensors +0 -3
  22. model-00013-of-00030.safetensors +3 -0
  23. model-00013-of-00062.safetensors +0 -3
  24. model-00014-of-00030.safetensors +3 -0
  25. model-00014-of-00062.safetensors +0 -3
  26. model-00015-of-00030.safetensors +3 -0
  27. model-00015-of-00062.safetensors +0 -3
  28. model-00016-of-00030.safetensors +3 -0
  29. model-00016-of-00062.safetensors +0 -3
  30. model-00017-of-00030.safetensors +3 -0
  31. model-00017-of-00062.safetensors +0 -3
  32. model-00018-of-00030.safetensors +3 -0
  33. model-00018-of-00062.safetensors +0 -3
  34. model-00019-of-00030.safetensors +3 -0
  35. model-00019-of-00062.safetensors +0 -3
  36. model-00020-of-00030.safetensors +3 -0
  37. model-00020-of-00062.safetensors +0 -3
  38. model-00021-of-00030.safetensors +3 -0
  39. model-00021-of-00062.safetensors +0 -3
  40. model-00022-of-00030.safetensors +3 -0
  41. model-00022-of-00062.safetensors +0 -3
  42. model-00023-of-00030.safetensors +3 -0
  43. model-00023-of-00062.safetensors +0 -3
  44. model-00024-of-00030.safetensors +3 -0
  45. model-00024-of-00062.safetensors +0 -3
  46. model-00025-of-00030.safetensors +3 -0
  47. model-00025-of-00062.safetensors +0 -3
  48. model-00026-of-00030.safetensors +3 -0
  49. model-00026-of-00062.safetensors +0 -3
  50. model-00027-of-00030.safetensors +3 -0
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "outputs/basemodel-llama3-70b",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
@@ -21,7 +21,7 @@
21
  "rope_scaling": null,
22
  "rope_theta": 500000.0,
23
  "tie_word_embeddings": false,
24
- "torch_dtype": "float32",
25
  "transformers_version": "4.40.2",
26
  "use_cache": false,
27
  "vocab_size": 128256
 
1
  {
2
+ "_name_or_path": "shisa-v1-llama3-70b",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
21
  "rope_scaling": null,
22
  "rope_theta": 500000.0,
23
  "tie_word_embeddings": false,
24
+ "torch_dtype": "bfloat16",
25
  "transformers_version": "4.40.2",
26
  "use_cache": false,
27
  "vocab_size": 128256
model-00001-of-00062.safetensors → model-00001-of-00030.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01cf66c97514aba3f46785e5e6062d8819ea97cae1d265bad3ecdee109ae4d2c
3
- size 4806672984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b20106aad8348a6e34bf6b81bfa568c201587c283bad01c2c70b3da5495cd098
3
+ size 4584408808
model-00002-of-00062.safetensors → model-00002-of-00030.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b62ee649035e0b7388f1b24854a04f198640294a995f7a744da1caec8ec03b92
3
- size 4362142864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2ee00a0ea5bf261ae719829cab8891d8ed45f42063041017c12d27eb7dd0446
3
+ size 4664167376
model-00003-of-00062.safetensors → model-00003-of-00030.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3d8eefde0ef6cae563c90ef1877800dcdb1bd1968d5b01d61ea659a85b58b70
3
- size 4362142864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6da500c956c587325dc0d266670085e35e8923722b74ec5d490096e8a055bde7
3
+ size 4999711704
model-00004-of-00062.safetensors → model-00004-of-00030.safetensors RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40fc9b683b95472af35e7ebbcf0dd6e224a444c5cf33d3c797f62405b1e2d65d
3
- size 4966188864
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4394fe80f91a5cdad14ac0e15adf42f3a568daba122a6b46acd0dbc6e9d2abd
3
+ size 4966157032
model-00005-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c574c88b7fcffea1b1a725fba0db3e39bac088aa9577e21173473af9d25a4e9
3
+ size 4664134408
model-00005-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a408ab6709d975b33e0453beccde172b5b8460e9a2bd722fc514eea002254385
3
- size 4362142864
 
 
 
 
model-00006-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acb926e3171e2a8ebfacf8b78489f41c49540cee9299db7de7c923d1547af7b1
3
+ size 4664167408
model-00006-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:91124ca99209c2b0a77923c84dfa2e9a6cfdfdf14bd1eaec121da55fbe961839
3
- size 4362142864
 
 
 
 
model-00007-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b5411e7649dd183fe34ad341e6e5bce66ab5454088d232be20843d3a11663d2
3
+ size 4664167408
model-00007-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9513b736b54849e9fbe34c0857ea54d50492761b393e8ba1a289a396353f686
3
- size 4966188864
 
 
 
 
model-00008-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eacbc9fc56b14be49968dca772bde2b1098a614cb2493ba71fd6e318d01be008
3
+ size 4999711728
model-00008-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a1b5ee69fdb0aaa5326486137b9bea583fe587e2c9025e5e06b9ed10d7e282b
3
- size 4362142864
 
 
 
 
model-00009-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09e3bb0b7a891696be2c00b54aa6dc34b2db0482e35008943b4e6f415b17b10f
3
+ size 4966157056
model-00009-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3244ecd67bab8a038f100e8c0206f3fd5bb80a6375bda516bc16707be14d4545
3
- size 4362142880
 
 
 
 
model-00010-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63b402445b5f8aad2398613cd48e94f229617b7d43eac1457d059196c2d2fec1
3
+ size 4664134408
model-00010-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a91efcfacee117004b9c2d8bdc272748eb2afe3d2719601303e329cd89fbd8e0
3
- size 4966188880
 
 
 
 
model-00011-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2aaa1ef82343d1663cf63648f85e285b59011a4ff6673818d854916c753adc3
3
+ size 4664167408
model-00011-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5ea4accf1e8731c88b4abcba638242a30dce0b883c27c7a925bafd05f482522
3
- size 4362142872
 
 
 
 
model-00012-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c255711407f5117eeaac7be56472458136f4d7c45997fa8b8fa92bdfd4ebd0a0
3
+ size 4664167408
model-00012-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:50b9fda66dc46f4717abd0ab30dd5b64b2cca3b3528ec0f199a144ecd1408de2
3
- size 4362142872
 
 
 
 
model-00013-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd4c0a174c1aaa800046c71720e808004a8156e0891093a6bf098939db405fe0
3
+ size 4999711728
model-00013-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:90cb95544841ed18f9d05df1115bb2c7fd12508a948dceadf8b71bfa0d5041d4
3
- size 4966188880
 
 
 
 
model-00014-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8370523d7031a6778c7e7fcdf6986ebcdb96f230a0a8779a7468dd7c0aa0ae97
3
+ size 4966157056
model-00014-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7bce48749a63bb03fbdbefb45fc4eb2628293bb9b45de5a624250b17df346df2
3
- size 4362142872
 
 
 
 
model-00015-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3334f9991f3ff8e684bfab002e0f8febdcb9a65d831c05757227b66120af026d
3
+ size 4664134408
model-00015-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:85f336aae14b3b6c8f07c04bd82d2ddae050fef4c36f7d42e5f52acbc28e0940
3
- size 4362142872
 
 
 
 
model-00016-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce8392fdca7090e4d83a71d7698ee649c0fee511fa987aff9521807a6c724ddd
3
+ size 4664167408
model-00016-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f31e7623f9dfe1c79555c5d9ff1fbcda784e489a657ac4d83bd89ec28e5d49a5
3
- size 4966188880
 
 
 
 
model-00017-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1e15347c57fde67269dc066bcfb2bb4d432b4b80303a1b8420872e20f60bf38
3
+ size 4664167408
model-00017-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b1fbcf948bf401eb37b6091d3c67bc9973a4dc6d81bc70005f45061d1e6ddf0
3
- size 4362142872
 
 
 
 
model-00018-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce6fe2a8304e7d42b138c0f26d3538c8a120dc676a6cdef13fcf53038669958c
3
+ size 4999711728
model-00018-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0afb4882107bf0e422a4e7f79b1f254d12a1fb3e3eb80fda0641d9ce005ed8a1
3
- size 4362142872
 
 
 
 
model-00019-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:257460fc0e900e6a7d947971dc8c2b963c7c12529272715fcf615e0c97c8d4f6
3
+ size 4966157056
model-00019-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:271feaf7fe5b8aaf772c5e376db460c0fdd6578aad57e36b1f6180481ba927b6
3
- size 4966188880
 
 
 
 
model-00020-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db2b65b4f95c6948563acc67f8c42776d2a580c3ecfbf385fecf8d6de1c4b2da
3
+ size 4664134408
model-00020-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:471818ad2685bef5b119973c47aef9e28460a5200185e0a00b18b3b7dbf10c14
3
- size 4362142872
 
 
 
 
model-00021-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:787b8b9b6f645685142bed96b203d011e50c99de3bfbbedf9ae01690e2baa4be
3
+ size 4664167408
model-00021-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:01aea7d2aa17ec78ade5c4f0c4471bb6b94c5ee42aa394f706651abbb2e9d61e
3
- size 4362142872
 
 
 
 
model-00022-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6ba9c4aaf3e426bafc083fae07777f7c4a714a135b3afa2210381d5341f33d7
3
+ size 4664167408
model-00022-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:bea04cc81dc12032c266d18fa3082d1d763b2f1aa7d7c24e7d7e0611fb7f8f70
3
- size 4966188880
 
 
 
 
model-00023-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d91824a919c7a25f6964716ed2356802becf599215410e2ede8ca319e89cbfe7
3
+ size 4999711728
model-00023-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:669d8fa715990f7b876529f88976fad057511fd064ad8d71245854879258502c
3
- size 4362142872
 
 
 
 
model-00024-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f3a28d6e89ec98a58e66cce87084ccb2ba0854dba976d62cdf144f0cf8962c0
3
+ size 4966157056
model-00024-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d7d4748d212bfc63c86b7e0b0570f36e80d74a8edf68adfb277c3039b806087
3
- size 4362142872
 
 
 
 
model-00025-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7957e5684b4368df1179374dbb78d034e44e5d47dc9ddb07b90274a4d70e219f
3
+ size 4664134408
model-00025-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbe649e36c4a6d9e6e08d8635ecc95fd4db3709b1f3081c47c05fb6ec9dceb1e
3
- size 4966188880
 
 
 
 
model-00026-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:936520d664a3446d3419a6d872d2d986f06ffce6e0be29b713a67a9a2fd5c5ea
3
+ size 4664167408
model-00026-of-00062.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:32b85f3ef121521ab28114aeac0a80cfe51cb97e2109c747425de1490e6e7a9f
3
- size 4362142872
 
 
 
 
model-00027-of-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ed83c9ee4afcefb547b0dc16df5167aba3e9cd869777796e2124849f95b3938
3
+ size 4664167408