mirror of
https://github.com/oobabooga/text-generation-webui.git
synced 2024-11-22 08:07:56 +01:00
parent
b15f510154
commit
f0f6d9bdf9
@ -413,12 +413,8 @@ def ExLlamav2_HF_loader(model_name):
|
|||||||
|
|
||||||
|
|
||||||
def HQQ_loader(model_name):
|
def HQQ_loader(model_name):
|
||||||
try:
|
from hqq.core.quantize import HQQBackend, HQQLinear
|
||||||
from hqq.core.quantize import HQQBackend, HQQLinear
|
from hqq.engine.hf import HQQModelForCausalLM
|
||||||
from hqq.engine.hf import HQQModelForCausalLM
|
|
||||||
except ModuleNotFoundError:
|
|
||||||
logger.error("HQQ is not installed. You can install it with:\n\npip install hqq")
|
|
||||||
return None
|
|
||||||
|
|
||||||
logger.info(f"Loading HQQ model with backend: {shared.args.hqq_backend}")
|
logger.info(f"Loading HQQ model with backend: {shared.args.hqq_backend}")
|
||||||
|
|
||||||
|
@ -4,6 +4,7 @@ datasets
|
|||||||
einops
|
einops
|
||||||
exllamav2==0.0.11; platform_system != "Darwin" and platform_machine != "x86_64"
|
exllamav2==0.0.11; platform_system != "Darwin" and platform_machine != "x86_64"
|
||||||
gradio==3.50.*
|
gradio==3.50.*
|
||||||
|
hqq==0.1.1.post1
|
||||||
markdown
|
markdown
|
||||||
numpy==1.24.*
|
numpy==1.24.*
|
||||||
optimum==1.16.*
|
optimum==1.16.*
|
||||||
|
@ -4,6 +4,7 @@ datasets
|
|||||||
einops
|
einops
|
||||||
exllamav2==0.0.11; platform_system == "Windows" or python_version < "3.10" or python_version > "3.11" or platform_machine != "x86_64"
|
exllamav2==0.0.11; platform_system == "Windows" or python_version < "3.10" or python_version > "3.11" or platform_machine != "x86_64"
|
||||||
gradio==3.50.*
|
gradio==3.50.*
|
||||||
|
hqq==0.1.1.post1
|
||||||
markdown
|
markdown
|
||||||
numpy==1.24.*
|
numpy==1.24.*
|
||||||
optimum==1.16.*
|
optimum==1.16.*
|
||||||
|
@ -4,6 +4,7 @@ datasets
|
|||||||
einops
|
einops
|
||||||
exllamav2==0.0.11; platform_system == "Windows" or python_version < "3.10" or python_version > "3.11" or platform_machine != "x86_64"
|
exllamav2==0.0.11; platform_system == "Windows" or python_version < "3.10" or python_version > "3.11" or platform_machine != "x86_64"
|
||||||
gradio==3.50.*
|
gradio==3.50.*
|
||||||
|
hqq==0.1.1.post1
|
||||||
markdown
|
markdown
|
||||||
numpy==1.24.*
|
numpy==1.24.*
|
||||||
optimum==1.16.*
|
optimum==1.16.*
|
||||||
|
@ -4,6 +4,7 @@ datasets
|
|||||||
einops
|
einops
|
||||||
exllamav2==0.0.11
|
exllamav2==0.0.11
|
||||||
gradio==3.50.*
|
gradio==3.50.*
|
||||||
|
hqq==0.1.1.post1
|
||||||
markdown
|
markdown
|
||||||
numpy==1.24.*
|
numpy==1.24.*
|
||||||
optimum==1.16.*
|
optimum==1.16.*
|
||||||
|
@ -4,6 +4,7 @@ datasets
|
|||||||
einops
|
einops
|
||||||
exllamav2==0.0.11
|
exllamav2==0.0.11
|
||||||
gradio==3.50.*
|
gradio==3.50.*
|
||||||
|
hqq==0.1.1.post1
|
||||||
markdown
|
markdown
|
||||||
numpy==1.24.*
|
numpy==1.24.*
|
||||||
optimum==1.16.*
|
optimum==1.16.*
|
||||||
|
@ -4,6 +4,7 @@ datasets
|
|||||||
einops
|
einops
|
||||||
exllamav2==0.0.11
|
exllamav2==0.0.11
|
||||||
gradio==3.50.*
|
gradio==3.50.*
|
||||||
|
hqq==0.1.1.post1
|
||||||
markdown
|
markdown
|
||||||
numpy==1.24.*
|
numpy==1.24.*
|
||||||
optimum==1.16.*
|
optimum==1.16.*
|
||||||
|
@ -4,6 +4,7 @@ datasets
|
|||||||
einops
|
einops
|
||||||
exllamav2==0.0.11
|
exllamav2==0.0.11
|
||||||
gradio==3.50.*
|
gradio==3.50.*
|
||||||
|
hqq==0.1.1.post1
|
||||||
markdown
|
markdown
|
||||||
numpy==1.24.*
|
numpy==1.24.*
|
||||||
optimum==1.16.*
|
optimum==1.16.*
|
||||||
|
@ -4,6 +4,7 @@ datasets
|
|||||||
einops
|
einops
|
||||||
exllamav2==0.0.11; platform_system != "Darwin" and platform_machine != "x86_64"
|
exllamav2==0.0.11; platform_system != "Darwin" and platform_machine != "x86_64"
|
||||||
gradio==3.50.*
|
gradio==3.50.*
|
||||||
|
hqq==0.1.1.post1
|
||||||
markdown
|
markdown
|
||||||
numpy==1.24.*
|
numpy==1.24.*
|
||||||
optimum==1.16.*
|
optimum==1.16.*
|
||||||
|
@ -4,6 +4,7 @@ datasets
|
|||||||
einops
|
einops
|
||||||
exllamav2==0.0.11
|
exllamav2==0.0.11
|
||||||
gradio==3.50.*
|
gradio==3.50.*
|
||||||
|
hqq==0.1.1.post1
|
||||||
markdown
|
markdown
|
||||||
numpy==1.24.*
|
numpy==1.24.*
|
||||||
optimum==1.16.*
|
optimum==1.16.*
|
||||||
|
Loading…
Reference in New Issue
Block a user