OpenSourceRonin committed on
Commit
e320be1
1 Parent(s): d9cec79

Upload model Meta-Llama-3.1-405B-Instruct-v8-k65536-65536-woft

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. README.md +38 -0
  3. config.json +0 -0
  4. generation_config.json +13 -0
  5. model-00001-of-00044.safetensors +3 -0
  6. model-00002-of-00044.safetensors +3 -0
  7. model-00003-of-00044.safetensors +3 -0
  8. model-00004-of-00044.safetensors +3 -0
  9. model-00005-of-00044.safetensors +3 -0
  10. model-00006-of-00044.safetensors +3 -0
  11. model-00007-of-00044.safetensors +3 -0
  12. model-00008-of-00044.safetensors +3 -0
  13. model-00009-of-00044.safetensors +3 -0
  14. model-00010-of-00044.safetensors +3 -0
  15. model-00011-of-00044.safetensors +3 -0
  16. model-00012-of-00044.safetensors +3 -0
  17. model-00013-of-00044.safetensors +3 -0
  18. model-00014-of-00044.safetensors +3 -0
  19. model-00015-of-00044.safetensors +3 -0
  20. model-00016-of-00044.safetensors +3 -0
  21. model-00017-of-00044.safetensors +3 -0
  22. model-00018-of-00044.safetensors +3 -0
  23. model-00019-of-00044.safetensors +3 -0
  24. model-00020-of-00044.safetensors +3 -0
  25. model-00021-of-00044.safetensors +3 -0
  26. model-00022-of-00044.safetensors +3 -0
  27. model-00023-of-00044.safetensors +3 -0
  28. model-00024-of-00044.safetensors +3 -0
  29. model-00025-of-00044.safetensors +3 -0
  30. model-00026-of-00044.safetensors +3 -0
  31. model-00027-of-00044.safetensors +3 -0
  32. model-00028-of-00044.safetensors +3 -0
  33. model-00029-of-00044.safetensors +3 -0
  34. model-00030-of-00044.safetensors +3 -0
  35. model-00031-of-00044.safetensors +3 -0
  36. model-00032-of-00044.safetensors +3 -0
  37. model-00033-of-00044.safetensors +3 -0
  38. model-00034-of-00044.safetensors +3 -0
  39. model-00035-of-00044.safetensors +3 -0
  40. model-00036-of-00044.safetensors +3 -0
  41. model-00037-of-00044.safetensors +3 -0
  42. model-00038-of-00044.safetensors +3 -0
  43. model-00039-of-00044.safetensors +3 -0
  44. model-00040-of-00044.safetensors +3 -0
  45. model-00041-of-00044.safetensors +3 -0
  46. model-00042-of-00044.safetensors +3 -0
  47. model-00043-of-00044.safetensors +3 -0
  48. model-00044-of-00044.safetensors +3 -0
  49. model.safetensors.index.json +0 -0
  50. special_tokens_map.json +16 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ---
3
+ license: llama3.1
4
+ base_model:
5
+ - meta-llama/Llama-3.1-405B-Instruct
6
+ base_model_relation: quantized
7
+ tags:
8
+ - VPTQ
9
+ - Quantized
10
+ - Quantization
11
+ ---
12
+ **Disclaimer**:
13
+
14
+ The model is reproduced based on the paper *VPTQ: Extreme Low-bit Vector Post-Training Quantization for Large Language Models* ([GitHub](https://github.com/microsoft/vptq), [arXiv](https://arxiv.org/abs/2409.17066)).
15
+
16
+ The model itself is sourced from a community release.
17
+
18
+ It is intended only for experimental purposes.
19
+
20
+ Users are responsible for any consequences arising from the use of this model.
21
+
22
+ **Note**:
23
+
24
+ The PPL test results are for reference only and were collected using the GPTQ testing script.
25
+
26
+ ```json
27
+ {
28
+ "ctx_2048": {
29
+ "wikitext2": 1.9966317415237427
30
+ },
31
+ "ctx_4096": {
32
+ "wikitext2": 1.8661881685256958
33
+ },
34
+ "ctx_8192": {
35
+ "wikitext2": 1.8048142194747925
36
+ }
37
+ }
38
+ ```
config.json ADDED
The diff for this file is too large to render. See raw diff
 
generation_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "attn_implementation": "flash_attention_2",
3
+ "bos_token_id": 128000,
4
+ "do_sample": true,
5
+ "eos_token_id": [
6
+ 128001,
7
+ 128008,
8
+ 128009
9
+ ],
10
+ "temperature": 0.6,
11
+ "top_p": 0.9,
12
+ "transformers_version": "4.45.2"
13
+ }
model-00001-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e64bb430319d52e8f07a26f51cd1a8aaf2bcb7e4d4e9987d1c48a06a20c340d4
3
+ size 4935192536
model-00002-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1a9a03c637dde5e50226314bb7784cccfbc438e237245857a73fa5e56ce7e1d
3
+ size 4828487008
model-00003-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f48a81667167bc915f613a35426696992088d1f7bfe6ac3d440dc8bdd48f2366
3
+ size 4828487008
model-00004-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eec0e64f4aaf25c9771ff617bbef1d49739e210d214338325e818b783d39231f
3
+ size 4828487008
model-00005-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03e7bf18a4a68ec953316528fdb52b0713fb0c53cc89c71ed6b85b08e0307a00
3
+ size 4828487128
model-00006-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b00e374551d570ff85acf129fdd1ad38590e6ecbb00f4192635bfdf409b04d9
3
+ size 4828487136
model-00007-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fac61068e6b91837c76fbe6c914f1497a13d90703cdf787ccaaa381727a59dfc
3
+ size 4828487136
model-00008-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e8b7974dcfac90190760bc754ba486687236e96bd24a3fa01faf81b8aed07c4
3
+ size 4828487136
model-00009-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:095c35d2945e5615e9e453b1b94deca83715ed96c4be0fb5d3a8bb9593a34fc1
3
+ size 4828487136
model-00010-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f460d4b620d0d05ce57a433ee96f8167e13cf2f5e46c4c6569f4ee4f83f44b5
3
+ size 4828487136
model-00011-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e0c4748207dbe7a730b864ed55c6335ecfc52bb835efd0afc369a7f319fe8b5
3
+ size 4828487136
model-00012-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a983fb4f4e4033e011c6c81b442883e1426c49551a43531d3ca098d2eac3ff3
3
+ size 4828487136
model-00013-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f859c418f726af6a757f949e8fb6f4205bbd02560e6ca4fce89afc6f221f91a6
3
+ size 4828487136
model-00014-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ec78fd18414df686b86871ff404b305e5418e7de9cc40ca9a3b291df3d8a21d
3
+ size 4828487136
model-00015-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40dd45dceed77b8c0020f663f1492b2f5894c0ebb4886d614c5983aa5d77591a
3
+ size 4828487136
model-00016-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8061b14be84e109333f5b5cbff93cb4934c6b98bea88d9b850e92f2cbfc31a7a
3
+ size 4828487136
model-00017-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b752515de1890a278626e11e078ce3533d894713d26c084d579ed7ce2504fe05
3
+ size 4828487136
model-00018-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ea30a42d78d79fd4770ae1a4e6ebc51e170cfcdc4284c6dd0e642748c45cdbe
3
+ size 4828487136
model-00019-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09a8cb39f4176a2142bf70976a484fa3568b05e4c4fbff83ce95774ae5921043
3
+ size 4828487136
model-00020-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a2dc1ec004dfd62693511442564f2ad9e3ff1dbc48aaa4935ff9eb38e92b7f5
3
+ size 4828487136
model-00021-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1545d0e0cced85060e4938fca8757a80edc693fb86b977d3d736dea28b6b3a7c
3
+ size 4828487136
model-00022-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d3b87e26db4fe86522a65c993e97b0d5eb036f54fa0f44f70a00bab84470525
3
+ size 4828487136
model-00023-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:427cc7e7e9c2a23019445b7dce9d98731d0415e6ee47aea1a61c687f1b5ec9a7
3
+ size 4828487136
model-00024-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:070eb3f3256a6361c2909786c65e7ab8fde3a91db9198233a8bf5d1058cde8dc
3
+ size 4828487136
model-00025-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f6525e0d90947a5425d96759b27404e1b4fce59415932922920bcc5daead70e
3
+ size 4828487136
model-00026-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59dac12b3e51f0cb0843337b2b1d5465f62dacdb94b433819b81275965982dec
3
+ size 4828487136
model-00027-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee363eb2cbdda57fff7e0779e7d0a777a816162b8ef0b6fa4b4f7b8d7d020a72
3
+ size 4828487136
model-00028-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3be91c30d7103331e9db26ad98a8c8124acd0dc5714f4283e17a6b7fe1c86693
3
+ size 4828487136
model-00029-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd14cb918c43b2929354c99eac53cb5454b9242db059f1b1b3588c7a86c93a73
3
+ size 4828487136
model-00030-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:787b3b36d29dc542497b649588bc1ec6e6c095d8db258e2cfedbd65bb260c321
3
+ size 4828487136
model-00031-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a5c9cf4c31851fd9b257704441f2e05138c72461550819e83e753e0997376a7
3
+ size 4828487136
model-00032-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:174a7b0c25c54381e69c19227ef5bf8ea2c0bc78363df26e2cb6b4b655ab3a10
3
+ size 4828487136
model-00033-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e88ff0d10f57c7fb9355dc6737cfc8e3a1f31b5df615a72ab476c05def48afc3
3
+ size 4828487136
model-00034-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84afaf085ed0d184036ca896cda0b8a95f29cb431ec7fedebafa30e4ea320c80
3
+ size 4828487136
model-00035-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13544a252387c38cc6c34c4c4e8e8af7b1fd3692647972cb6523069e921a598b
3
+ size 4828487256
model-00036-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0db1ea30a1112fd84f28e3ca474efd0fc32af2febfa39fde18517532244ae3df
3
+ size 4828487272
model-00037-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e2bb141a601553026689ef0536cf50848ecfe75d1a5db4e05a1ae17d639fd05
3
+ size 4828487272
model-00038-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8b9aaaec761b0034a9567cc909e496acc4ea2dc7d5d6d62e4a6ef2b7926731d
3
+ size 4828487272
model-00039-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3364ac3eaf1c1dc5a57b425a6cda09c430b764d6f265770a6eef3c2a0611b98e
3
+ size 4828487272
model-00040-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab1cbf788859a7410c88dfe1ee3d77315b8934602602dd2bf4c779ef86e0db37
3
+ size 4828487272
model-00041-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08ab0a61d0a223a546ef6d11aa2a2f58556a7e325b34a8d9d9aa8039a8384eb9
3
+ size 4828487272
model-00042-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1393292f9e6724c0210fade389941d5687bde1491c938c1e4ad22d9a8b582640
3
+ size 4828487272
model-00043-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f36c183e21e7b057e0473ad995943be82fd52e021eec2085308bd1d5527d1710
3
+ size 4096020264
model-00044-of-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71b079a02069ebe5a5f4f8135815f136afb1d6fc4423620dcb2a14fa399cdf12
3
+ size 4202692736
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<|begin_of_text|>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|eot_id|>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ }
16
+ }