2024-08-20 04:34:10 +02:00
|
|
|
accelerate==0.33.*
|
2024-06-28 02:13:02 +02:00
|
|
|
aqlm[gpu,cpu]==1.1.6; platform_system == "Linux"
|
2024-09-28 01:59:30 +02:00
|
|
|
bitsandbytes==0.44.*
|
2024-04-30 14:11:31 +02:00
|
|
|
colorama
|
|
|
|
datasets
|
|
|
|
einops
|
2024-09-07 03:47:25 +02:00
|
|
|
fastapi==0.112.4
|
2024-04-30 14:11:31 +02:00
|
|
|
gradio==4.26.*
|
2024-07-23 04:53:56 +02:00
|
|
|
hqq==0.1.7.post3
|
2024-06-28 02:12:39 +02:00
|
|
|
jinja2==3.1.4
|
2024-04-30 14:11:31 +02:00
|
|
|
lm_eval==0.3.0
|
|
|
|
markdown
|
|
|
|
numba==0.59.*
|
|
|
|
numpy==1.26.*
|
|
|
|
optimum==1.17.*
|
|
|
|
pandas
|
2024-08-20 04:33:56 +02:00
|
|
|
peft==0.12.*
|
2024-04-30 14:11:31 +02:00
|
|
|
Pillow>=9.5.0
|
|
|
|
psutil
|
2024-09-07 03:47:25 +02:00
|
|
|
pydantic==2.8.2
|
2024-04-30 14:11:31 +02:00
|
|
|
pyyaml
|
|
|
|
requests
|
|
|
|
rich
|
|
|
|
safetensors==0.4.*
|
|
|
|
scipy
|
|
|
|
sentencepiece
|
|
|
|
tensorboard
|
2024-09-26 20:55:51 +02:00
|
|
|
transformers==4.45.*
|
2024-04-30 14:11:31 +02:00
|
|
|
tqdm
|
|
|
|
wandb
|
|
|
|
|
|
|
|
# API
|
|
|
|
SpeechRecognition==3.10.0
|
|
|
|
flask_cloudflared==0.0.14
|
|
|
|
sse-starlette==1.6.5
|
|
|
|
tiktoken
|
|
|
|
|
|
|
|
# llama-cpp-python (CPU only, no AVX2)
|
2024-09-28 00:06:31 +02:00
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.3.0+cpuavx-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.3.0+cpuavx-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.3.0+cpuavx-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.3.0+cpuavx-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
2024-04-30 14:11:31 +02:00
|
|
|
|
|
|
|
# llama-cpp-python (CUDA 12.1, no tensor cores, AVX builds)
|
2024-09-28 00:06:31 +02:00
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.3.0+cu121avx-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.3.0+cu121avx-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.3.0+cu121avx-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.3.0+cu121avx-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|
2024-07-23 03:05:11 +02:00
|
|
|
|
|
|
|
# llama-cpp-python (CUDA 12.1, tensor cores, AVX builds)
|
2024-09-28 00:06:31 +02:00
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.3.0+cu121avx-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.3.0+cu121avx-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.3.0+cu121avx-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.3.0+cu121avx-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|
2024-04-30 14:11:31 +02:00
|
|
|
|
|
|
|
# CUDA wheels: exllamav2 and flash-attn (plus the py3-none-any exllamav2 wheel for non-x86_64 Linux)
|
2024-09-28 18:44:08 +02:00
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.2.2/exllamav2-0.2.2+cu121.torch2.4.1-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.2.2/exllamav2-0.2.2+cu121.torch2.4.1-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.2.2/exllamav2-0.2.2+cu121.torch2.4.1-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.2.2/exllamav2-0.2.2+cu121.torch2.4.1-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|
2024-09-28 00:04:08 +02:00
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.2.2/exllamav2-0.2.2-py3-none-any.whl; platform_system == "Linux" and platform_machine != "x86_64"
|
2024-09-28 18:44:08 +02:00
|
|
|
https://github.com/oobabooga/flash-attention/releases/download/v2.6.3/flash_attn-2.6.3+cu122torch2.4.1cxx11abiFALSE-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/flash-attention/releases/download/v2.6.3/flash_attn-2.6.3+cu122torch2.4.1cxx11abiFALSE-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
|
|
|
https://github.com/Dao-AILab/flash-attention/releases/download/v2.6.3/flash_attn-2.6.3+cu123torch2.4cxx11abiFALSE-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/Dao-AILab/flash-attention/releases/download/v2.6.3/flash_attn-2.6.3+cu123torch2.4cxx11abiFALSE-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|