mirror of
https://github.com/oobabooga/text-generation-webui.git
synced 2024-11-23 08:28:21 +01:00
Added model load logic for chat Completions
This commit is contained in:
parent
cc8c7ed209
commit
768124c4b0
@ -119,6 +119,18 @@ async def openai_completions(request: Request, request_data: CompletionRequest):
|
|||||||
|
|
||||||
@app.post('/v1/chat/completions', response_model=ChatCompletionResponse, dependencies=check_key)
|
@app.post('/v1/chat/completions', response_model=ChatCompletionResponse, dependencies=check_key)
|
||||||
async def openai_chat_completions(request: Request, request_data: ChatCompletionRequest):
|
async def openai_chat_completions(request: Request, request_data: ChatCompletionRequest):
|
||||||
|
requested_model = request_data.model
|
||||||
|
payload = OAImodels.get_current_model_info()
|
||||||
|
current_model = payload["model_name"]
|
||||||
|
if not current_model == requested_model:
|
||||||
|
requested_model_dict = {"model_name": requested_model}
|
||||||
|
try:
|
||||||
|
OAImodels._load_model(requested_model_dict)
|
||||||
|
except:
|
||||||
|
traceback.print_exc()
|
||||||
|
return HTTPException(status_code=400, detail="Failed to load the model.")
|
||||||
|
|
||||||
|
|
||||||
path = request.url.path
|
path = request.url.path
|
||||||
is_legacy = "/generate" in path
|
is_legacy = "/generate" in path
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user