mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-03 17:51:09 +01:00
fa8a809a91
* server: ci: windows build and tests * server: ci: remove tmp push branch * server: ci: EOF EOL * Use builti Co-authored-by: Jared Van Bortel <cebtenzzre@gmail.com> * server: tests: server graceful shutdown, then kill, then hard kill * server: tests: remove python2 unicode string * server: tests: remove wrong comment on server starting, close_fds is always true * server: tests: server kill, if pid exists * server: tests: remove dependency to killall * server: tests: ci windows: pid exists better handling --------- Co-authored-by: Jared Van Bortel <cebtenzzre@gmail.com>
101 lines
3.2 KiB
Python
101 lines
3.2 KiB
Python
import errno
|
|
import os
|
|
import socket
|
|
import subprocess
|
|
import time
|
|
from contextlib import closing
|
|
import signal
|
|
|
|
|
|
def before_scenario(context, scenario):
    """Prepare the test context before a scenario starts.

    Presumably a behave environment hook (the signature matches) -- confirm
    against the test runner configuration.

    Sets ``context.debug`` to True only when the ``DEBUG`` environment
    variable is exactly ``'ON'``, announces the scenario name, and refuses to
    continue if something is already accepting connections on the server
    port (``PORT`` environment variable, default 8080) of localhost.

    Raises:
        AssertionError: if a server is already listening on the port.
        ValueError: if ``PORT`` is set but is not a valid integer.
    """
    context.debug = os.environ.get('DEBUG') == 'ON'
    if context.debug:
        print("DEBUG=ON\n")
    print(f"\x1b[33;42mStarting new scenario: {scenario.name}!\x1b[0m\n")

    port = int(os.environ.get('PORT', 8080))
    if is_server_listening("localhost", port):
        # Raised explicitly rather than via `assert False` so the guard is
        # still enforced when Python runs with -O (which strips asserts).
        raise AssertionError("Server already started")
|
|
|
|
|
|
def after_scenario(context, scenario):
    """Report failures and tear down the server after a scenario.

    Does nothing when ``context.server_process`` is None. When the scenario
    failed, dumps ``llama.log`` (only if ``GITHUB_ACTIONS`` is present in the
    environment and the file exists) and reports whether the server stopped
    listening. Then requests a graceful shutdown and keeps killing the
    process until neither its pid nor its listening socket remain.

    Raises:
        AssertionError: if the server process is no longer running when
            teardown starts.
    """
    if context.server_process is None:
        return

    if scenario.status == "failed":
        if 'GITHUB_ACTIONS' in os.environ:
            print(f"\x1b[33;101mSCENARIO FAILED: {scenario.name} server logs:\x1b[0m\n\n")
            if os.path.isfile('llama.log'):
                # File objects are context managers; no closing() wrapper needed.
                with open('llama.log', 'r') as f:
                    for line in f:
                        print(line)
        if not is_server_listening(context.server_fqdn, context.server_port):
            print("\x1b[33;101mERROR: Server stopped listening\x1b[0m\n")

    if not pid_exists(context.server_process.pid):
        # Raised explicitly rather than via `assert False` so the check is
        # still enforced when Python runs with -O (which strips asserts).
        raise AssertionError(f"Server not running pid={context.server_process.pid} ...")

    server_graceful_shutdown(context)

    # Wait briefly for the socket to free up
    time.sleep(0.05)

    # Escalate: regular kill on every pass, plus a hard kill once more than
    # five attempts have been made.
    # NOTE(review): this loop has no upper bound; it only ends when the pid
    # is gone and the port no longer accepts connections.
    attempts = 0
    while pid_exists(context.server_process.pid) or is_server_listening(context.server_fqdn, context.server_port):
        server_kill(context)
        time.sleep(0.1)
        attempts += 1
        if attempts > 5:
            server_kill_hard(context)
|
|
|
|
|
|
def server_graceful_shutdown(context):
    """Ask the server process to stop by sending it an interrupt.

    Sends ``signal.CTRL_C_EVENT`` when ``os.name`` is ``'nt'`` and
    ``signal.SIGINT`` otherwise, targeting ``context.server_process.pid``.
    """
    target_pid = context.server_process.pid
    print(f"shutting down server pid={target_pid} ...\n")
    # The conditional expression is lazy, so CTRL_C_EVENT (a Windows-only
    # attribute of the signal module) is only looked up on Windows.
    interrupt = signal.CTRL_C_EVENT if os.name == 'nt' else signal.SIGINT
    os.kill(target_pid, interrupt)
|
|
|
|
|
|
def server_kill(context):
    """Log the server pid, then call ``kill()`` on ``context.server_process``."""
    server = context.server_process
    print(f"killing server pid={server.pid} ...\n")
    server.kill()
|
|
|
|
|
|
def server_kill_hard(context):
    """Forcefully terminate a server that survived the regular kill.

    On Windows (``os.name == 'nt'``) runs ``taskkill /F /pid <pid>`` and
    prints its output. Elsewhere sends ``SIGKILL`` to the negated pid.
    """
    server_pid = context.server_process.pid
    server_path = context.server_path

    print(f"Server dangling exits, hard killing force {server_pid}={server_path}...\n")

    if os.name != 'nt':
        # A negative pid makes kill(2) target the process group with that id.
        os.kill(-server_pid, signal.SIGKILL)
        return

    taskkill_cmd = ['taskkill', '/F', '/pid', str(server_pid)]
    taskkill_output = subprocess.check_output(taskkill_cmd).decode()
    print(taskkill_output)
|
|
|
|
|
|
def is_server_listening(server_fqdn, server_port):
    """Return True when a TCP connection to the given host and port succeeds.

    Opens a temporary IPv4 stream socket, attempts to connect, and always
    closes the socket afterwards. Prints a notice when the connection
    succeeds.
    """
    probe = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
    try:
        # connect_ex returns 0 on success and an error code otherwise.
        listening = probe.connect_ex((server_fqdn, server_port)) == 0
        if listening:
            print(f"server is listening on {server_fqdn}:{server_port}...\n")
        return listening
    finally:
        probe.close()
|
|
|
|
|
|
def pid_exists(pid):
    """Check whether pid exists in the current process table.

    Negative pids are never considered to exist. On Windows
    (``os.name == 'nt'``) the answer comes from the output of
    ``TASKLIST /FI "pid eq <pid>"``, which is also printed. Elsewhere the
    process is probed with signal 0.
    """
    if pid < 0:
        return False

    if os.name != 'nt':
        try:
            # Signal 0 delivers nothing; it only performs the existence and
            # permission checks.
            os.kill(pid, 0)
        except OSError as err:
            # EPERM means a process is there but we may not signal it;
            # any other error is treated as "no such process".
            return err.errno == errno.EPERM
        return True

    listing = subprocess.check_output(['TASKLIST', '/FI', f'pid eq {pid}']).decode()
    print(listing)
    return "No tasks are running" not in listing
|