Fix memory leak in new streaming (second attempt)

2024-11-22 08:07:56 +01:00 · 2023-03-11 23:14:49 -03:00 · 2023-03-11 23:14:49 -03:00 · 37f0166b2d
commit 37f0166b2d
parent 92fe947721
2 changed files with 4 additions and 2 deletions
--- a/modules/callbacks.py
+++ b/modules/callbacks.py
@@ -49,7 +49,7 @@ class Iteratorize:
    def __init__(self, func, kwargs={}, callback=None):
        self.mfunc=func
        self.c_callback=callback
-        self.q = Queue(maxsize=1)
+        self.q = Queue()
        self.sentinel = object()
        self.kwargs = kwargs

@@ -73,3 +73,6 @@ class Iteratorize:
            raise StopIteration
        else:
            return obj
+
+    def __del__(self):
+        pass
--- a/modules/text_generation.py
+++ b/modules/text_generation.py
@@ -187,7 +187,6 @@ def generate_reply(question, max_new_tokens, do_sample, temperature, top_p, typi

        yield formatted_outputs(original_question, shared.model_name)
        for output in eval(f"generate_with_streaming({', '.join(generate_params)})"):
-            print(print('Used vram in gib:', torch.cuda.memory_allocated() / 1024**3))
            if shared.soft_prompt:
                output = torch.cat((input_ids[0], output[filler_input_ids.shape[1]:]))
            reply = decode(output)