Install exllama (#83)

* Install exllama
* Handle updating exllama
2024-12-25 13:58:56 +01:00 · 2023-06-17 17:10:36 -05:00 · 2023-06-17 17:10:36 -05:00 · b1d05cbbf6
commit b1d05cbbf6
parent 657049d7d0
1 changed files with 10 additions and 1 deletions
--- a/webui.py
+++ b/webui.py
@@ -167,8 +167,17 @@ def update_dependencies():
    if not os.path.exists("repositories/"):
        os.mkdir("repositories")
    # Install GPTQ-for-LLaMa which enables 4bit CUDA quantization
    os.chdir("repositories")
    # Install or update exllama as needed
    if not os.path.exists("exllama/"):
        run_cmd("git clone https://github.com/turboderp/exllama.git", environment=True)
    else:
        os.chdir("exllama")
        run_cmd("git pull", environment=True)
        os.chdir("..")
    # Install GPTQ-for-LLaMa which enables 4bit CUDA quantization
    if not os.path.exists("GPTQ-for-LLaMa/"):
        run_cmd("git clone https://github.com/oobabooga/GPTQ-for-LLaMa.git -b cuda", assert_success=True, environment=True)