2024-07-11 18:56:42 -04:00
|
|
|
accelerate==0.32.*
|
2024-06-27 20:13:02 -04:00
|
|
|
aqlm[gpu,cpu]==1.1.6; platform_system == "Linux"
|
2024-05-21 12:32:02 -04:00
|
|
|
auto-gptq==0.7.1
|
2024-03-10 11:30:53 -04:00
|
|
|
bitsandbytes==0.43.*
|
2023-04-16 22:26:52 -04:00
|
|
|
colorama
|
2023-04-02 19:34:25 -04:00
|
|
|
datasets
|
2023-05-29 09:20:18 -04:00
|
|
|
einops
|
2024-04-11 01:24:53 -04:00
|
|
|
gradio==4.26.*
|
2024-07-22 22:53:56 -04:00
|
|
|
hqq==0.1.7.post3
|
2024-06-27 20:12:39 -04:00
|
|
|
jinja2==3.1.4
|
2023-12-24 12:22:31 -05:00
|
|
|
lm_eval==0.3.0
|
2023-03-15 11:40:03 -04:00
|
|
|
markdown
|
2024-03-10 19:13:29 -04:00
|
|
|
numba==0.59.*
|
2024-02-13 14:26:35 -05:00
|
|
|
numpy==1.26.*
|
2024-02-19 17:15:21 -05:00
|
|
|
optimum==1.17.*
|
2023-04-20 23:20:33 -04:00
|
|
|
pandas
|
2024-03-05 05:56:37 -05:00
|
|
|
peft==0.8.*
|
2023-04-08 17:48:46 -04:00
|
|
|
Pillow>=9.5.0
|
2024-04-06 22:02:20 -04:00
|
|
|
psutil
|
2023-04-20 23:20:33 -04:00
|
|
|
pyyaml
|
2023-03-11 12:47:30 -05:00
|
|
|
requests
|
2023-12-20 00:58:36 -05:00
|
|
|
rich
|
2024-02-04 21:40:25 -05:00
|
|
|
safetensors==0.4.*
|
2023-05-25 22:26:25 -04:00
|
|
|
scipy
|
2023-07-19 22:31:19 -04:00
|
|
|
sentencepiece
|
2023-07-12 10:53:31 -04:00
|
|
|
tensorboard
|
2024-07-23 17:06:34 -04:00
|
|
|
transformers==4.43.*
|
2023-07-19 22:31:19 -04:00
|
|
|
tqdm
|
|
|
|
wandb
|
2023-08-09 11:07:55 -04:00
|
|
|
|
2024-03-04 02:46:39 -05:00
|
|
|
# API dependencies
|
|
|
|
SpeechRecognition==3.10.0
|
|
|
|
flask_cloudflared==0.0.14
|
2024-04-18 14:05:00 -04:00
|
|
|
sse-starlette==1.6.5
|
2024-03-04 02:46:39 -05:00
|
|
|
tiktoken
|
|
|
|
|
2024-04-30 08:11:31 -04:00
|
|
|
# llama-cpp-python (CPU only, AVX2)
|
2024-07-22 21:05:11 -04:00
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.83+cpuavx2-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.83+cpuavx2-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.83+cpuavx2-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/cpu/llama_cpp_python-0.2.83+cpuavx2-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
2024-04-30 08:11:31 -04:00
|
|
|
|
|
|
|
# llama-cpp-python (CUDA, no tensor cores)
|
2024-07-22 21:05:11 -04:00
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.83+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.83+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.83+cu121-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda-0.2.83+cu121-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|
|
|
|
|
|
|
|
# llama-cpp-python (CUDA, tensor cores)
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.83+cu121-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.83+cu121-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.83+cu121-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/llama-cpp-python-cuBLAS-wheels/releases/download/textgen-webui/llama_cpp_python_cuda_tensorcores-0.2.83+cu121-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|
2024-04-30 08:11:31 -04:00
|
|
|
|
2023-09-24 08:58:29 -04:00
|
|
|
# CUDA wheels (exllamav2, flash-attn)
|
2024-07-11 15:33:46 -04:00
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.1.7/exllamav2-0.1.7+cu121.torch2.2.2-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.1.7/exllamav2-0.1.7+cu121.torch2.2.2-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.1.7/exllamav2-0.1.7+cu121.torch2.2.2-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.1.7/exllamav2-0.1.7+cu121.torch2.2.2-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|
|
|
|
https://github.com/oobabooga/exllamav2/releases/download/v0.1.7/exllamav2-0.1.7-py3-none-any.whl; platform_system == "Linux" and platform_machine != "x86_64"
|
2024-07-12 23:16:11 -04:00
|
|
|
https://github.com/oobabooga/flash-attention/releases/download/v2.6.1/flash_attn-2.6.1+cu122torch2.2.2cxx11abiFALSE-cp311-cp311-win_amd64.whl; platform_system == "Windows" and python_version == "3.11"
|
|
|
|
https://github.com/oobabooga/flash-attention/releases/download/v2.6.1/flash_attn-2.6.1+cu122torch2.2.2cxx11abiFALSE-cp310-cp310-win_amd64.whl; platform_system == "Windows" and python_version == "3.10"
|
|
|
|
https://github.com/Dao-AILab/flash-attention/releases/download/v2.6.1/flash_attn-2.6.1+cu123torch2.2cxx11abiFALSE-cp311-cp311-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.11"
|
|
|
|
https://github.com/Dao-AILab/flash-attention/releases/download/v2.6.1/flash_attn-2.6.1+cu123torch2.2cxx11abiFALSE-cp310-cp310-linux_x86_64.whl; platform_system == "Linux" and platform_machine == "x86_64" and python_version == "3.10"
|
2024-05-21 12:32:02 -04:00
|
|
|
autoawq==0.2.5; platform_system == "Linux" or platform_system == "Windows"
|