CPU only requirement

- requirements.txt +5 -39
- requirements_amd.txt +0 -51
- requirements_amd_noavx2.txt +0 -49
- requirements_apple_intel.txt +0 -41
- requirements_apple_silicon.txt +0 -43
- requirements_cpu_only.txt +0 -38
- requirements_cpu_only_noavx2.txt +0 -38
- requirements_noavx2.txt +0 -72
- requirements_nowheels.txt +0 -32
requirements.txt
CHANGED
@@ -1,6 +1,4 @@
 accelerate==0.27.*
-aqlm[gpu,cpu]==1.1.3; platform_system == "Linux"
-bitsandbytes==0.43.*
 colorama
 datasets
 einops
@@ -23,7 +21,7 @@ safetensors==0.4.*
 scipy
 sentencepiece
 tensorboard
-transformers==4.
+transformers==4.40.*
 tqdm
 wandb
 
@@ -34,39 +32,7 @@ sse-starlette==1.6.5
 tiktoken
 
 # llama-cpp-python (CPU only, AVX2)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.
-
-# llama-cpp-python (CUDA, no tensor cores)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.61+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.61+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.61+cu121-cp311-cp311-manylinux_2_31_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.61+cu121-cp310-cp310-manylinux_2_31_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-
-# llama-cpp-python (CUDA, tensor cores)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.61+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.61+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.61+cu121-cp311-cp311-manylinux_2_31_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.61+cu121-cp310-cp310-manylinux_2_31_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-
-# CUDA wheels
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+cu121-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+cu121-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.18/exllamav2-0.0.18+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.18/exllamav2-0.0.18+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.18/exllamav2-0.0.18+cu121-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.18/exllamav2-0.0.18+cu121-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.18/exllamav2-0.0.18-py3-none-any.whl; platform_system == "Linux" and platform_machine != "x86_64"
-https://github.com/oobabooga/flash-attention/releases/download/v2.5.6/flash_attn-2.5.6+cu122torch2.2.0cxx11abiFALSE-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/flash-attention/releases/download/v2.5.6/flash_attn-2.5.6+cu122torch2.2.0cxx11abiFALSE-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/Dao-AILab/flash-attention/releases/download/v2.5.6/flash_attn-2.5.6+cu122torch2.2cxx11abiFALSE-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/Dao-AILab/flash-attention/releases/download/v2.5.6/flash_attn-2.5.6+cu122torch2.2cxx11abiFALSE-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+cu121-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+cu121-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-autoawq==0.2.3; platform_system == "Linux" or platform_system == "Windows"
+https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
+https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
+https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
+https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
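Every wheel URL in the diff above carries a PEP 508 environment marker after the semicolon; pip installs a given line only when that marker evaluates to true for the running interpreter, which is how one requirements file serves several platforms at once. A minimal Python sketch of that selection logic, using the packaging library (a dependency of pip itself) with the marker copied from the Linux/CPython 3.11 wheel line above:

# Evaluate a PEP 508 environment marker the way pip does for requirements lines.
from packaging.markers import Marker

marker = Marker(
    'platform_system == "Linux" and platform_machine == "x86_64" '
    'and python_version == "3.11"'
)

print(marker.evaluate())  # True only on 64-bit Linux under CPython 3.11

# An explicit environment can be supplied to test another platform:
print(marker.evaluate({
    "platform_system": "Windows",
    "platform_machine": "AMD64",
    "python_version": "3.10",
}))
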
requirements_amd.txt
DELETED
@@ -1,51 +0,0 @@
-accelerate==0.27.*
-colorama
-datasets
-einops
-gradio==4.26.*
-hqq==0.1.5
-jinja2==3.1.2
-lm_eval==0.3.0
-markdown
-numba==0.59.*
-numpy==1.26.*
-optimum==1.17.*
-pandas
-peft==0.8.*
-Pillow>=9.5.0
-psutil
-pyyaml
-requests
-rich
-safetensors==0.4.*
-scipy
-sentencepiece
-tensorboard
-transformers==4.40.*
-tqdm
-wandb
-
-# API
-SpeechRecognition==3.10.0
-flask_cloudflared==0.0.14
-sse-starlette==1.6.5
-tiktoken
-
-# llama-cpp-python (CPU only, AVX2)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-
-# AMD wheels
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/rocm/llama_cpp_python_cuda-0.2.65+rocm5.6.1-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/rocm/llama_cpp_python_cuda-0.2.65+rocm5.6.1-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+rocm5.6-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+rocm5.6-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19+rocm5.6-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19+rocm5.6-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19-py3-none-any.whl; platform_system != "Darwin" and platform_machine != "x86_64"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+rocm5.6-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+rocm5.6-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/casper-hansen/AutoAWQ/releases/download/v0.2.3/autoawq-0.2.3+rocm561-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/casper-hansen/AutoAWQ/releases/download/v0.2.3/autoawq-0.2.3+rocm561-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
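The deleted AMD file pinned ROCm builds as direct wheel URLs, so beyond the marker check pip also verifies that the wheel filename's tags (cp311-cp311-linux_x86_64 and so on) are compatible with the running interpreter. A minimal sketch of that compatibility test with the packaging library, using a filename taken from the file above:

# Parse a wheel filename and test its tags against what this interpreter supports.
from packaging.tags import sys_tags
from packaging.utils import parse_wheel_filename

name, version, build, tags = parse_wheel_filename(
    "exllamav2-0.0.19+rocm5.6-cp311-cp311-linux_x86_64.whl"
)
supported = set(sys_tags())
print(any(tag in supported for tag in tags))  # True on 64-bit Linux + CPython 3.11
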
requirements_amd_noavx2.txt
DELETED
@@ -1,49 +0,0 @@
-accelerate==0.27.*
-colorama
-datasets
-einops
-gradio==4.26.*
-hqq==0.1.5
-jinja2==3.1.2
-lm_eval==0.3.0
-markdown
-numba==0.59.*
-numpy==1.26.*
-optimum==1.17.*
-pandas
-peft==0.8.*
-Pillow>=9.5.0
-psutil
-pyyaml
-requests
-rich
-safetensors==0.4.*
-scipy
-sentencepiece
-tensorboard
-transformers==4.40.*
-tqdm
-wandb
-
-# API
-SpeechRecognition==3.10.0
-flask_cloudflared==0.0.14
-sse-starlette==1.6.5
-tiktoken
-
-# llama-cpp-python (CPU only, no AVX2)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-
-# AMD wheels
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+rocm5.6-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+rocm5.6-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19+rocm5.6-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19+rocm5.6-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19-py3-none-any.whl; platform_system != "Darwin" and platform_machine != "x86_64"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+rocm5.6-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+rocm5.6-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/casper-hansen/AutoAWQ/releases/download/v0.2.3/autoawq-0.2.3+rocm561-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/casper-hansen/AutoAWQ/releases/download/v0.2.3/autoawq-0.2.3+rocm561-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
requirements_apple_intel.txt
DELETED
@@ -1,41 +0,0 @@
-accelerate==0.27.*
-colorama
-datasets
-einops
-gradio==4.26.*
-hqq==0.1.5
-jinja2==3.1.2
-lm_eval==0.3.0
-markdown
-numba==0.59.*
-numpy==1.26.*
-optimum==1.17.*
-pandas
-peft==0.8.*
-Pillow>=9.5.0
-psutil
-pyyaml
-requests
-rich
-safetensors==0.4.*
-scipy
-sentencepiece
-tensorboard
-transformers==4.40.*
-tqdm
-wandb
-
-# API
-SpeechRecognition==3.10.0
-flask_cloudflared==0.0.14
-sse-starlette==1.6.5
-tiktoken
-
-# Mac wheels
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp311-cp311-macosx_11_0_x86_64.whl; platform_system == "Darwin" and platform_release >= "20.0.0" and platform_release < "21.0.0" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp310-cp310-macosx_11_0_x86_64.whl; platform_system == "Darwin" and platform_release >= "20.0.0" and platform_release < "21.0.0" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp311-cp311-macosx_12_0_x86_64.whl; platform_system == "Darwin" and platform_release >= "21.0.0" and platform_release < "22.0.0" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp310-cp310-macosx_12_0_x86_64.whl; platform_system == "Darwin" and platform_release >= "21.0.0" and platform_release < "22.0.0" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp311-cp311-macosx_14_0_x86_64.whl; platform_system == "Darwin" and platform_release >= "23.0.0" and platform_release < "24.0.0" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp310-cp310-macosx_14_0_x86_64.whl; platform_system == "Darwin" and platform_release >= "23.0.0" and platform_release < "24.0.0" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19-py3-none-any.whl
requirements_apple_silicon.txt
DELETED
@@ -1,43 +0,0 @@
-accelerate==0.27.*
-colorama
-datasets
-einops
-gradio==4.26.*
-hqq==0.1.5
-jinja2==3.1.2
-lm_eval==0.3.0
-markdown
-numba==0.59.*
-numpy==1.26.*
-optimum==1.17.*
-pandas
-peft==0.8.*
-Pillow>=9.5.0
-psutil
-pyyaml
-requests
-rich
-safetensors==0.4.*
-scipy
-sentencepiece
-tensorboard
-transformers==4.40.*
-tqdm
-wandb
-
-# API
-SpeechRecognition==3.10.0
-flask_cloudflared==0.0.14
-sse-starlette==1.6.5
-tiktoken
-
-# Mac wheels
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp311-cp311-macosx_11_0_arm64.whl; platform_system == "Darwin" and platform_release >= "20.0.0" and platform_release < "21.0.0" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp310-cp310-macosx_11_0_arm64.whl; platform_system == "Darwin" and platform_release >= "20.0.0" and platform_release < "21.0.0" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp311-cp311-macosx_12_0_arm64.whl; platform_system == "Darwin" and platform_release >= "21.0.0" and platform_release < "22.0.0" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp310-cp310-macosx_12_0_arm64.whl; platform_system == "Darwin" and platform_release >= "21.0.0" and platform_release < "22.0.0" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp311-cp311-macosx_13_0_arm64.whl; platform_system == "Darwin" and platform_release >= "22.0.0" and platform_release < "23.0.0" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp310-cp310-macosx_13_0_arm64.whl; platform_system == "Darwin" and platform_release >= "22.0.0" and platform_release < "23.0.0" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp311-cp311-macosx_14_0_arm64.whl; platform_system == "Darwin" and platform_release >= "23.0.0" and platform_release < "24.0.0" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/metal/llama_cpp_python-0.2.65-cp310-cp310-macosx_14_0_arm64.whl; platform_system == "Darwin" and platform_release >= "23.0.0" and platform_release < "24.0.0" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19-py3-none-any.whl
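The Mac wheels in both deleted Apple files are gated on platform_release, which reports the Darwin kernel version rather than the macOS marketing version, so each ">= X, < X+1" pair pins one OS generation (Darwin 20 is macOS 11, through Darwin 23 for macOS 14). A minimal sketch of the value those markers compare against; the offset of 9 is an observation that holds for Darwin 20 through 23:

# On macOS, platform.release() returns the Darwin kernel version, e.g. "23.4.0".
import platform

major = int(platform.release().split(".")[0])
print(f"Darwin {major} ~ macOS {major - 9}")  # valid for Darwin 20 (macOS 11) to 23 (macOS 14)
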
requirements_cpu_only.txt
DELETED
@@ -1,38 +0,0 @@
-accelerate==0.27.*
-colorama
-datasets
-einops
-gradio==4.26.*
-hqq==0.1.5
-jinja2==3.1.2
-lm_eval==0.3.0
-markdown
-numba==0.59.*
-numpy==1.26.*
-optimum==1.17.*
-pandas
-peft==0.8.*
-Pillow>=9.5.0
-psutil
-pyyaml
-requests
-rich
-safetensors==0.4.*
-scipy
-sentencepiece
-tensorboard
-transformers==4.40.*
-tqdm
-wandb
-
-# API
-SpeechRecognition==3.10.0
-flask_cloudflared==0.0.14
-sse-starlette==1.6.5
-tiktoken
-
-# llama-cpp-python (CPU only, AVX2)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx2-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
requirements_cpu_only_noavx2.txt
DELETED
@@ -1,38 +0,0 @@
-accelerate==0.27.*
-colorama
-datasets
-einops
-gradio==4.26.*
-hqq==0.1.5
-jinja2==3.1.2
-lm_eval==0.3.0
-markdown
-numba==0.59.*
-numpy==1.26.*
-optimum==1.17.*
-pandas
-peft==0.8.*
-Pillow>=9.5.0
-psutil
-pyyaml
-requests
-rich
-safetensors==0.4.*
-scipy
-sentencepiece
-tensorboard
-transformers==4.40.*
-tqdm
-wandb
-
-# API
-SpeechRecognition==3.10.0
-flask_cloudflared==0.0.14
-sse-starlette==1.6.5
-tiktoken
-
-# llama-cpp-python (CPU only, no AVX2)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
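The two deleted CPU files differ only in the wheel build tag: +cpuavx2 requires a CPU with AVX2, while +cpuavx is the fallback for older processors. A quick Linux-only sketch for checking the host CPU (it reads /proc/cpuinfo, so it does not apply to Windows or macOS):

# Report whether the CPU advertises AVX2, which the "cpuavx2" wheels require.
def has_avx2(cpuinfo_path="/proc/cpuinfo"):
    with open(cpuinfo_path) as f:
        for line in f:
            if line.startswith("flags"):
                return "avx2" in line.split()
    return False

print(has_avx2())
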
requirements_noavx2.txt
DELETED
@@ -1,72 +0,0 @@
-accelerate==0.27.*
-aqlm[gpu,cpu]==1.1.3; platform_system == "Linux"
-bitsandbytes==0.43.*
-colorama
-datasets
-einops
-gradio==4.26.*
-hqq==0.1.5
-jinja2==3.1.2
-lm_eval==0.3.0
-markdown
-numba==0.59.*
-numpy==1.26.*
-optimum==1.17.*
-pandas
-peft==0.8.*
-Pillow>=9.5.0
-psutil
-pyyaml
-requests
-rich
-safetensors==0.4.*
-scipy
-sentencepiece
-tensorboard
-transformers==4.40.*
-tqdm
-wandb
-
-# API
-SpeechRecognition==3.10.0
-flask_cloudflared==0.0.14
-sse-starlette==1.6.5
-tiktoken
-
-# llama-cpp-python (CPU only, no AVX2)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.65+cpuavx-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-
-# llama-cpp-python (CUDA, no tensor cores)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.65+cu121avx-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.65+cu121avx-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.65+cu121avx-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.65+cu121avx-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-
-# llama-cpp-python (CUDA, tensor cores)
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.65+cu121avx-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.65+cu121avx-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.65+cu121avx-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.65+cu121avx-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-
-# CUDA wheels
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+cu121-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/jllllll/AutoGPTQ/releases/download/v0.6.0/auto_gptq-0.6.0+cu121-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19+cu121-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19+cu121-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/turboderp/exllamav2/releases/download/v0.0.19/exllamav2-0.0.19-py3-none-any.whl; platform_system == "Linux" and platform_machine != "x86_64"
-https://github.com/oobabooga/flash-attention/releases/download/v2.5.6/flash_attn-2.5.6+cu122torch2.2.0cxx11abiFALSE-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/oobabooga/flash-attention/releases/download/v2.5.6/flash_attn-2.5.6+cu122torch2.2.0cxx11abiFALSE-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/Dao-AILab/flash-attention/releases/download/v2.5.6/flash_attn-2.5.6+cu122torch2.2cxx11abiFALSE-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/Dao-AILab/flash-attention/releases/download/v2.5.6/flash_attn-2.5.6+cu122torch2.2cxx11abiFALSE-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+cu121-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
-https://github.com/jllllll/GPTQ-for-LLaMa-CUDA/releases/download/0.1.1/gptq_for_llama-0.1.1+cu121-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
-autoawq==0.2.3; platform_system == "Linux" or platform_system == "Windows"
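requirements_noavx2.txt shipped two CUDA variants of llama-cpp-python, a plain build and a _tensorcores build; tensor cores exist on NVIDIA GPUs of compute capability 7.0 (Volta) and newer. A sketch of that check, assuming a CUDA-enabled PyTorch install (PyTorch itself is not listed in these files, so this is illustrative only):

# Pick between the tensor-core and plain CUDA builds by GPU compute capability.
import torch

if torch.cuda.is_available():
    cap = torch.cuda.get_device_capability(0)  # (major, minor), e.g. (8, 6)
    build = "tensorcores" if cap >= (7, 0) else "plain CUDA"
    print(f"compute capability {cap[0]}.{cap[1]}: use the {build} build")
else:
    print("no CUDA device detected")
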
requirements_nowheels.txt
DELETED
@@ -1,32 +0,0 @@
-accelerate==0.27.*
-colorama
-datasets
-einops
-gradio==4.26.*
-hqq==0.1.5
-jinja2==3.1.2
-lm_eval==0.3.0
-markdown
-numba==0.59.*
-numpy==1.26.*
-optimum==1.17.*
-pandas
-peft==0.8.*
-Pillow>=9.5.0
-psutil
-pyyaml
-requests
-rich
-safetensors==0.4.*
-scipy
-sentencepiece
-tensorboard
-transformers==4.40.*
-tqdm
-wandb
-
-# API
-SpeechRecognition==3.10.0
-flask_cloudflared==0.0.14
-sse-starlette==1.6.5
-tiktoken