mirror of
				https://github.com/ggml-org/llama.cpp.git
				synced 2025-10-30 08:42:00 +00:00 
			
		
		
		
	 fa8a809a91
			
		
	
	fa8a809a91
	
	
	
		
			
			* server: ci: windows build and tests * server: ci: remove tmp push branch * server: ci: EOF EOL * Use builti Co-authored-by: Jared Van Bortel <cebtenzzre@gmail.com> * server: tests: server graceful shutdown, then kill, then hard kill * server: tests: remove python2 unicode string * server: tests: remove wrong comment on server starting, close_fds is always true * server: tests: server kill, if pid exists * server: tests: remove dependency to killall * server: tests: ci windows: pid exists better handling --------- Co-authored-by: Jared Van Bortel <cebtenzzre@gmail.com>
		
			
				
	
	
		
			101 lines
		
	
	
		
			3.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			101 lines
		
	
	
		
			3.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| import errno
 | |
| import os
 | |
| import socket
 | |
| import subprocess
 | |
| import time
 | |
| from contextlib import closing
 | |
| import signal
 | |
| 
 | |
| 
 | |
| def before_scenario(context, scenario):
 | |
|     context.debug = 'DEBUG' in os.environ and os.environ['DEBUG'] == 'ON'
 | |
|     if context.debug:
 | |
|         print("DEBUG=ON\n")
 | |
|     print(f"\x1b[33;42mStarting new scenario: {scenario.name}!\x1b[0m\n")
 | |
|     port = 8080
 | |
|     if 'PORT' in os.environ:
 | |
|         port = int(os.environ['PORT'])
 | |
|     if is_server_listening("localhost", port):
 | |
|         assert False, "Server already started"
 | |
| 
 | |
| 
 | |
| def after_scenario(context, scenario):
 | |
|     if context.server_process is None:
 | |
|         return
 | |
|     if scenario.status == "failed":
 | |
|         if 'GITHUB_ACTIONS' in os.environ:
 | |
|             print(f"\x1b[33;101mSCENARIO FAILED: {scenario.name} server logs:\x1b[0m\n\n")
 | |
|             if os.path.isfile('llama.log'):
 | |
|                 with closing(open('llama.log', 'r')) as f:
 | |
|                     for line in f:
 | |
|                         print(line)
 | |
|         if not is_server_listening(context.server_fqdn, context.server_port):
 | |
|             print("\x1b[33;101mERROR: Server stopped listening\x1b[0m\n")
 | |
| 
 | |
|     if not pid_exists(context.server_process.pid):
 | |
|         assert False, f"Server not running pid={context.server_process.pid} ..."
 | |
| 
 | |
|     server_graceful_shutdown(context)
 | |
| 
 | |
|     # Wait few for socket to free up
 | |
|     time.sleep(0.05)
 | |
| 
 | |
|     attempts = 0
 | |
|     while pid_exists(context.server_process.pid) or is_server_listening(context.server_fqdn, context.server_port):
 | |
|         server_kill(context)
 | |
|         time.sleep(0.1)
 | |
|         attempts += 1
 | |
|         if attempts > 5:
 | |
|             server_kill_hard(context)
 | |
| 
 | |
| 
 | |
| def server_graceful_shutdown(context):
 | |
|     print(f"shutting down server pid={context.server_process.pid} ...\n")
 | |
|     if os.name == 'nt':
 | |
|         os.kill(context.server_process.pid, signal.CTRL_C_EVENT)
 | |
|     else:
 | |
|         os.kill(context.server_process.pid, signal.SIGINT)
 | |
| 
 | |
| 
 | |
| def server_kill(context):
 | |
|     print(f"killing server pid={context.server_process.pid} ...\n")
 | |
|     context.server_process.kill()
 | |
| 
 | |
| 
 | |
| def server_kill_hard(context):
 | |
|     pid = context.server_process.pid
 | |
|     path = context.server_path
 | |
| 
 | |
|     print(f"Server dangling exits, hard killing force {pid}={path}...\n")
 | |
|     if os.name == 'nt':
 | |
|         process = subprocess.check_output(['taskkill', '/F', '/pid', str(pid)]).decode()
 | |
|         print(process)
 | |
|     else:
 | |
|         os.kill(-pid, signal.SIGKILL)
 | |
| 
 | |
| 
 | |
| def is_server_listening(server_fqdn, server_port):
 | |
|     with closing(socket.socket(socket.AF_INET, socket.SOCK_STREAM)) as sock:
 | |
|         result = sock.connect_ex((server_fqdn, server_port))
 | |
|         _is_server_listening = result == 0
 | |
|         if _is_server_listening:
 | |
|             print(f"server is listening on {server_fqdn}:{server_port}...\n")
 | |
|         return _is_server_listening
 | |
| 
 | |
| 
 | |
| def pid_exists(pid):
 | |
|     """Check whether pid exists in the current process table."""
 | |
|     if pid < 0:
 | |
|         return False
 | |
|     if os.name == 'nt':
 | |
|         output = subprocess.check_output(['TASKLIST', '/FI', f'pid eq {pid}']).decode()
 | |
|         print(output)
 | |
|         return "No tasks are running" not in output
 | |
|     else:
 | |
|         try:
 | |
|             os.kill(pid, 0)
 | |
|         except OSError as e:
 | |
|             return e.errno == errno.EPERM
 | |
|         else:
 | |
|             return True
 |