Add context_instruct to API. Load default model instruction template … (#2688)

2024-11-22 08:07:56 +01:00 · 2023-07-12 04:01:03 +01:00 · 2023-07-12 04:01:03 +01:00 · d9fabdde40
commit d9fabdde40
parent 324e45b848
6 changed files with 37 additions and 32 deletions
--- a/api-examples/api-example-chat-stream.py
+++ b/api-examples/api-example-chat-stream.py
@@ -23,7 +23,8 @@ async def run(user_input, history):
        'history': history,
        'mode': 'instruct',  # Valid options: 'chat', 'chat-instruct', 'instruct'
        'character': 'Example',
-        'instruction_template': 'Vicuna-v1.1',
+        'instruction_template': 'Vicuna-v1.1',  # Will get autodetected if unset
+        # 'context_instruct': '',  # Optional
        'your_name': 'You',

        'regenerate': False,
--- a/api-examples/api-example-chat.py
+++ b/api-examples/api-example-chat.py
@@ -17,7 +17,8 @@ def run(user_input, history):
        'history': history,
        'mode': 'instruct',  # Valid options: 'chat', 'chat-instruct', 'instruct'
        'character': 'Example',
-        'instruction_template': 'Vicuna-v1.1',
+        'instruction_template': 'Vicuna-v1.1',  # Will get autodetected if unset
+        # 'context_instruct': '',  # Optional
        'your_name': 'You',

        'regenerate': False,
--- a/api-examples/api-example-model.py
+++ b/api-examples/api-example-model.py
@@ -4,6 +4,7 @@ import requests

 HOST = '0.0.0.0:5000'

+
 def generate(prompt, tokens=200):
    request = {'prompt': prompt, 'max_new_tokens': tokens}
    response = requests.post(f'http://{HOST}/api/v1/generate', json=request)
@@ -124,7 +125,6 @@ def complex_model_load(model):
        else:
            req['args']['rwkv_strategy'] = 'cuda f16'  # 24GB

-
    return model_api(req)


--- a/extensions/api/util.py
+++ b/extensions/api/util.py
@@ -59,7 +59,10 @@ def build_parameters(body, chat=False):

    if chat:
        character = body.get('character')
-        instruction_template = body.get('instruction_template')
+        instruction_template = body.get('instruction_template', shared.settings['instruction_template'])
+        if str(instruction_template) == "None":
+            instruction_template = "Vicuna-v1.1"
+
        name1, name2, _, greeting, context, _ = load_character_memoized(character, str(body.get('your_name', shared.settings['name1'])), shared.settings['name2'], instruct=False)
        name1_instruct, name2_instruct, _, _, context_instruct, turn_template = load_character_memoized(instruction_template, '', '', instruct=True)
        generate_params.update({
@@ -72,7 +75,7 @@ def build_parameters(body, chat=False):
            'greeting': greeting,
            'name1_instruct': name1_instruct,
            'name2_instruct': name2_instruct,
-            'context_instruct': context_instruct,
+            'context_instruct': body.get('context_instruct',  context_instruct),
            'turn_template': turn_template,
            'chat-instruct_command': str(body.get('chat-instruct_command', shared.settings['chat-instruct_command'])),
            'history': body.get('history', {'internal': [], 'visible': []})