Proper way to free the cuda cache

2024-11-22 16:17:57 +01:00 · 2023-02-25 15:50:29 -03:00 · 2023-02-25 15:50:29 -03:00 · fa58fd5559
commit fa58fd5559
parent 03d25c1c61
1 changed file with 4 additions and 1 deletion
--- a/modules/text_generation.py
+++ b/modules/text_generation.py
@@ -1,3 +1,4 @@
 import gc
 import re
 import time
@@ -73,6 +74,8 @@ def formatted_outputs(reply, model_name):
        return reply
 def generate_reply(question, max_new_tokens, do_sample, temperature, top_p, typical_p, repetition_penalty, top_k, min_length, no_repeat_ngram_size, num_beams, penalty_alpha, length_penalty, early_stopping, eos_token=None, stopping_string=None):
    gc.collect()
    if not shared.args.cpu:
        torch.cuda.empty_cache()
    original_question = question