text-generation-webui/modules/extensions.py

208 lines
7.0 KiB
Python
Raw Normal View History

2023-03-24 20:51:27 +01:00
import traceback
2023-04-24 01:32:22 +02:00
from functools import partial
from inspect import signature
2023-03-24 20:51:27 +01:00
2023-03-15 19:11:16 +01:00
import gradio as gr
import extensions
2023-02-23 18:41:42 +01:00
import modules.shared as shared
from modules.logging_colors import logger
2023-02-24 14:01:21 +01:00
state = {}
available_extensions = []
setup_called = set()
def apply_settings(extension, name):
if not hasattr(extension, 'params'):
return
for param in extension.params:
_id = f"{name}-{param}"
if _id not in shared.settings:
continue
extension.params[param] = shared.settings[_id]
2023-02-23 18:49:02 +01:00
def load_extensions():
2023-04-07 17:20:57 +02:00
global state, setup_called
2023-02-24 14:01:21 +01:00
for i, name in enumerate(shared.args.extensions):
if name in available_extensions:
if name != 'api':
logger.info(f'Loading the extension "{name}"...')
2023-03-16 03:29:56 +01:00
try:
exec(f"import extensions.{name}.script")
extension = getattr(extensions, name).script
apply_settings(extension, name)
2023-04-07 17:20:57 +02:00
if extension not in setup_called and hasattr(extension, "setup"):
setup_called.add(extension)
extension.setup()
2023-04-25 05:10:21 +02:00
2023-03-16 03:29:56 +01:00
state[name] = [True, i]
except:
logger.error(f'Failed to load the extension "{name}".')
2023-03-24 20:51:27 +01:00
traceback.print_exc()
2023-02-23 18:49:02 +01:00
2023-04-07 17:20:57 +02:00
# This iterator returns the extensions in the order specified in the command-line
2023-02-24 14:01:21 +01:00
def iterator():
for name in sorted(state, key=lambda x: state[x][1]):
2023-04-07 05:52:02 +02:00
if state[name][0]:
yield getattr(extensions, name).script, name
2023-02-24 14:01:21 +01:00
2023-04-07 17:20:57 +02:00
# Extension functions that map string -> string
def _apply_string_extensions(function_name, text, state):
2023-02-24 14:01:21 +01:00
for extension, _ in iterator():
2023-04-24 01:32:22 +02:00
if hasattr(extension, function_name):
func = getattr(extension, function_name)
if len(signature(func).parameters) == 2:
text = func(text, state)
else:
text = func(text)
2023-04-25 05:10:21 +02:00
return text
# Extension functions that map string -> string
def _apply_chat_input_extensions(text, visible_text, state):
2023-04-24 01:32:22 +02:00
for extension, _ in iterator():
if hasattr(extension, 'chat_input_modifier'):
text, visible_text = extension.chat_input_modifier(text, visible_text, state)
2023-04-25 05:10:21 +02:00
2023-04-24 01:32:22 +02:00
return text, visible_text
# custom_generate_chat_prompt handling - currently only the first one will work
2023-04-24 01:32:22 +02:00
def _apply_custom_generate_chat_prompt(text, state, **kwargs):
for extension, _ in iterator():
if hasattr(extension, 'custom_generate_chat_prompt'):
return extension.custom_generate_chat_prompt(text, state, **kwargs)
2023-04-25 05:10:21 +02:00
2023-04-24 01:32:22 +02:00
return None
# Extension that modifies the input parameters before they are used
def _apply_state_modifier_extensions(state):
for extension, _ in iterator():
if hasattr(extension, "state_modifier"):
state = getattr(extension, "state_modifier")(state)
return state
2023-05-10 03:49:39 +02:00
2023-05-21 18:24:54 +02:00
# Extension that modifies the chat history before it is used
def _apply_history_modifier_extensions(history):
for extension, _ in iterator():
if hasattr(extension, "history_modifier"):
history = getattr(extension, "history_modifier")(history)
return history
# Extension functions that override the default tokenizer output - The order of execution is not defined
2023-04-24 01:32:22 +02:00
def _apply_tokenizer_extensions(function_name, state, prompt, input_ids, input_embeds):
for extension, _ in iterator():
if hasattr(extension, function_name):
prompt, input_ids, input_embeds = getattr(extension, function_name)(state, prompt, input_ids, input_embeds)
2023-04-25 05:10:21 +02:00
2023-04-24 01:32:22 +02:00
return prompt, input_ids, input_embeds
# Allow extensions to add their own logits processors to the stack being run.
# Each extension would call `processor_list.append({their LogitsProcessor}())`.
def _apply_logits_processor_extensions(function_name, processor_list, input_ids):
for extension, _ in iterator():
if hasattr(extension, function_name):
result = getattr(extension, function_name)(processor_list, input_ids)
if type(result) is list:
processor_list = result
return processor_list
# Get prompt length in tokens after applying extension functions which override the default tokenizer output
# currently only the first one will work
def _apply_custom_tokenized_length(prompt):
for extension, _ in iterator():
if hasattr(extension, 'custom_tokenized_length'):
return getattr(extension, 'custom_tokenized_length')(prompt)
2023-05-10 03:49:39 +02:00
return None
# Custom generate reply handling - currently only the first one will work
def _apply_custom_generate_reply():
for extension, _ in iterator():
if hasattr(extension, 'custom_generate_reply'):
return getattr(extension, 'custom_generate_reply')
return None
def _apply_custom_css():
all_css = ''
for extension, _ in iterator():
if hasattr(extension, 'custom_css'):
all_css += getattr(extension, 'custom_css')()
return all_css
def _apply_custom_js():
all_js = ''
for extension, _ in iterator():
if hasattr(extension, 'custom_js'):
all_js += getattr(extension, 'custom_js')()
return all_js
2023-05-17 06:25:01 +02:00
def create_extensions_block():
to_display = []
for extension, name in iterator():
if hasattr(extension, "ui") and not (hasattr(extension, 'params') and extension.params.get('is_tab', False)):
to_display.append((extension, name))
# Creating the extension ui elements
if len(to_display) > 0:
with gr.Column(elem_id="extensions"):
for row in to_display:
extension, name = row
display_name = getattr(extension, 'params', {}).get('display_name', name)
gr.Markdown(f"\n### {display_name}")
extension.ui()
def create_extensions_tabs():
for extension, name in iterator():
if hasattr(extension, "ui") and (hasattr(extension, 'params') and extension.params.get('is_tab', False)):
display_name = getattr(extension, 'params', {}).get('display_name', name)
with gr.Tab(display_name, elem_classes="extension-tab"):
extension.ui()
2023-04-24 01:32:22 +02:00
EXTENSION_MAP = {
"input": partial(_apply_string_extensions, "input_modifier"),
"output": partial(_apply_string_extensions, "output_modifier"),
"chat_input": _apply_chat_input_extensions,
"state": _apply_state_modifier_extensions,
2023-05-21 18:24:54 +02:00
"history": _apply_history_modifier_extensions,
2023-04-24 01:32:22 +02:00
"bot_prefix": partial(_apply_string_extensions, "bot_prefix_modifier"),
"tokenizer": partial(_apply_tokenizer_extensions, "tokenizer_modifier"),
'logits_processor': partial(_apply_logits_processor_extensions, 'logits_processor_modifier'),
"custom_generate_chat_prompt": _apply_custom_generate_chat_prompt,
"custom_generate_reply": _apply_custom_generate_reply,
"tokenized_length": _apply_custom_tokenized_length,
"css": _apply_custom_css,
"js": _apply_custom_js
2023-04-24 01:32:22 +02:00
}
def apply_extensions(typ, *args, **kwargs):
if typ not in EXTENSION_MAP:
raise ValueError(f"Invalid extension type {typ}")
2023-04-25 05:10:21 +02:00
2023-04-24 01:32:22 +02:00
return EXTENSION_MAP[typ](*args, **kwargs)