mirror of
https://github.com/oobabooga/text-generation-webui.git
synced 2024-11-25 17:29:22 +01:00
Don't stream at more than 24 fps
This is a performance optimization
This commit is contained in:
parent
a160230893
commit
b6c407f51d
@@ -188,7 +188,19 @@ def _generate_reply(question, state, eos_token=None, stopping_strings=None, is_c
|
|||||||
shared.stop_everything = False
|
shared.stop_everything = False
|
||||||
clear_torch_cache()
|
clear_torch_cache()
|
||||||
seed = set_manual_seed(state['seed'])
|
seed = set_manual_seed(state['seed'])
|
||||||
|
is_stream = state['stream']
|
||||||
|
last_update = -1
|
||||||
|
reply = ''
|
||||||
for reply in generate_func(question, original_question, seed, state, eos_token, stopping_strings, is_chat=is_chat):
|
for reply in generate_func(question, original_question, seed, state, eos_token, stopping_strings, is_chat=is_chat):
|
||||||
|
if is_stream:
|
||||||
|
cur_time = time.time()
|
||||||
|
if cur_time - last_update > 0.041666666666666664: # Limit streaming to 24 fps
|
||||||
|
last_update = cur_time
|
||||||
|
yield reply
|
||||||
|
else:
|
||||||
|
yield reply
|
||||||
|
|
||||||
|
if is_stream:
|
||||||
yield reply
|
yield reply
|
||||||
|
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user