diff --git a/modules/exllama.py b/modules/exllama.py index 150a6e82..69eccbf2 100644 --- a/modules/exllama.py +++ b/modules/exllama.py @@ -48,7 +48,7 @@ class ExllamaModel: result.model = model result.cache = cache result.tokenizer = tokenizer - self.generator = generator + result.generator = generator return result, result def generate_with_streaming(self, prompt, state):