Fixes for API server - chat mode and integer temperature

This commit is contained in:
Maya Eary 2023-03-28 20:57:16 +03:00
parent cac577d99f
commit d1377c37af

View File

@@ -43,14 +43,14 @@ class Handler(BaseHTTPRequestHandler):
 generator = generate_reply(
 question = prompt,
-max_new_tokens = body.get('max_length', 200),
+max_new_tokens = int(body.get('max_length', 200)),
 do_sample=True,
-temperature=body.get('temperature', 0.5),
+temperature=float(body.get('temperature', 0.5)),
-top_p=body.get('top_p', 1),
+top_p=float(body.get('top_p', 1)),
-typical_p=body.get('typical', 1),
+typical_p=float(body.get('typical', 1)),
-repetition_penalty=body.get('rep_pen', 1.1),
+repetition_penalty=float(body.get('rep_pen', 1.1)),
 encoder_repetition_penalty=1,
-top_k=body.get('top_k', 0),
+top_k=int(body.get('top_k', 0)),
 min_length=0,
 no_repeat_ngram_size=0,
 num_beams=1,
@@ -62,6 +62,9 @@ class Handler(BaseHTTPRequestHandler):
 answer = ''
 for a in generator:
+if isinstance(a, str):
+answer = a
+else:
 answer = a[0]
 response = json.dumps({