l3utterfly
committed on
Commit
·
0a235fc
1
Parent(s):
73d9cf8
Add PTE files for context sizes 2048, 4096, 8192
Browse files
- .gitattributes +1 -0
- llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx2048.pte → Meta-Llama-3-8B-Instruct_kv2_sdpa_xnn_qe_4_32_ctx2048.pte +2 -2
- llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx4096.pte → Meta-Llama-3-8B-Instruct_kv2_sdpa_xnn_qe_4_32_ctx4096.pte +2 -2
- llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx8192.pte → Meta-Llama-3-8B-Instruct_kv2_sdpa_xnn_qe_4_32_ctx8192.pte +2 -2
.gitattributes
CHANGED
@@ -36,3 +36,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
36 |
llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx2048.pte filter=lfs diff=lfs merge=lfs -text
|
37 |
llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx4096.pte filter=lfs diff=lfs merge=lfs -text
|
38 |
llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx8192.pte filter=lfs diff=lfs merge=lfs -text
|
|
|
|
36 |
llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx2048.pte filter=lfs diff=lfs merge=lfs -text
|
37 |
llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx4096.pte filter=lfs diff=lfs merge=lfs -text
|
38 |
llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx8192.pte filter=lfs diff=lfs merge=lfs -text
|
39 |
+
*.pte filter=lfs diff=lfs merge=lfs -text
|
llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx2048.pte → Meta-Llama-3-8B-Instruct_kv2_sdpa_xnn_qe_4_32_ctx2048.pte
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25d4434362e898e9dee8f3c1d143f08c2ea12556afd81c4dae55809738b08fad
|
3 |
+
size 4169560736
|
llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx4096.pte → Meta-Llama-3-8B-Instruct_kv2_sdpa_xnn_qe_4_32_ctx4096.pte
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5213fe235a75bb901a8d6ec06a94753fd79ce887f623617dae0d2979f0b0423f
|
3 |
+
size 4171657888
|
llama3_instruct_kv_sdpa_xnn_qe_4_32_ctx8192.pte → Meta-Llama-3-8B-Instruct_kv2_sdpa_xnn_qe_4_32_ctx8192.pte
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8db901a0de48c943d8dd197a778caae765058dc6e1ae44dab21d397aebb9a16
|
3 |
+
size 4175852192
|