From 68ec6cfa3750758f470b6635dfa58022939e6f56 Mon Sep 17 00:00:00 2001 From: Nicolas Patry Date: Thu, 16 May 2024 15:58:22 +0000 Subject: [PATCH] Fixing signals. Taking the signal handlers later, so that during loads regular signal handling is done; we only need to handle SIGINT and SIGTERM during real loads to get more graceful shutdowns when queries are in flight. --- server/text_generation_server/server.py | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/server/text_generation_server/server.py b/server/text_generation_server/server.py index 92126fe6..7c06822f 100644 --- a/server/text_generation_server/server.py +++ b/server/text_generation_server/server.py @@ -35,9 +35,6 @@ class SignalHandler: self.KEEP_PROCESSING = False -signal_handler = SignalHandler() - - class TextGenerationService(generate_pb2_grpc.TextGenerationServiceServicer): def __init__( self, @@ -251,7 +248,7 @@ def serve( await server.start() logger.info("Server started at {}".format(local_url)) - + signal_handler = SignalHandler() while signal_handler.KEEP_PROCESSING: await asyncio.sleep(0.5)