1111import zmq
1212
1313from vllm .utils .collection_utils import ThreadSafeDict
14- from vllm .v1 .engine .core_client import ClientGuard
14+ from vllm .v1 .engine .core_client import ClientSentinel
1515from vllm .v1 .engine .utils import FaultHandler , FaultInfo
1616
1717FAULT_RECEIVER_ADDR = "tcp://127.0.0.1:8844"
@@ -31,59 +31,59 @@ def create_test_thread_safe_dict(initial_data=None):
3131 return tsd
3232
3333
34- def create_client_guard (
34+ def create_client_sentinel (
3535 engine_exception_q : queue .Queue , engine_status_dict : ThreadSafeDict [int , str ]
3636):
37- return ClientGuard (
37+ return ClientSentinel (
3838 fault_receiver_addr = FAULT_RECEIVER_ADDR ,
3939 cmd_addr = CMD_ADDR ,
40- engine_registry = [ b"engine_identity" ] ,
40+ engine_registry = { 0 : b"engine_identity" } ,
4141 engine_exception_q = engine_exception_q ,
4242 fault_pub_addr = FAULT_PUB_ADDR ,
4343 engine_status_dict = engine_status_dict ,
4444 )
4545
4646
47- def test_client_guard_initialization ():
47+ def test_client_sentinel_initialization ():
4848 engine_exception_q : queue .Queue [FaultInfo ] = queue .Queue ()
4949 engine_status_dict = create_test_thread_safe_dict ({1 : "Healthy" })
50- guard = create_client_guard (engine_exception_q , engine_status_dict )
50+ sentinel = create_client_sentinel (engine_exception_q , engine_status_dict )
5151
52- assert guard .engine_registry == [ b"engine_identity" ]
53- assert not guard . client_guard_dead
54- assert isinstance (guard .fault_handler , FaultHandler )
55- assert guard .engine_exception_q is engine_exception_q
52+ assert sentinel .engine_registry [ 0 ] == b"engine_identity"
53+ assert not sentinel . client_sentinel_dead
54+ assert isinstance (sentinel .fault_handler , FaultHandler )
55+ assert sentinel .engine_exception_q is engine_exception_q
5656
57- assert guard .fault_receiver_socket .type == zmq .ROUTER
58- assert guard .cmd_socket .type == zmq .ROUTER
59- assert guard .fault_pub_socket .type == zmq .PUB
57+ assert sentinel .fault_receiver_socket .type == zmq .ROUTER
58+ assert sentinel .cmd_socket .type == zmq .ROUTER
59+ assert sentinel .fault_pub_socket .type == zmq .PUB
6060
61- guard . shutdown_guard ()
61+ sentinel . shutdown_sentinel ()
6262
6363
6464@pytest .mark .asyncio
6565async def test_handle_fault ():
6666 engine_exception_q : queue .Queue [FaultInfo ] = queue .Queue ()
6767 engine_status_dict = create_test_thread_safe_dict ({1 : "Healthy" })
68- guard = create_client_guard (engine_exception_q , engine_status_dict )
68+ sentinel = create_client_sentinel (engine_exception_q , engine_status_dict )
6969
7070 engine_exception_q .put_nowait (
7171 FaultInfo (engine_id = "1" , message = "test exception" , type = "test" )
7272 )
7373
74- guard .fault_handler .handle_fault = AsyncMock (return_value = True )
74+ sentinel .fault_handler .handle_fault = AsyncMock (return_value = True )
7575
76- result = await guard .handle_fault ("pause" , 5 )
76+ result = await sentinel .handle_fault ("pause" , 5 )
7777 assert result is True
78- guard .fault_handler .handle_fault .assert_awaited_once_with ("pause" , 5 )
78+ sentinel .fault_handler .handle_fault .assert_awaited_once_with ("pause" , 5 )
7979
80- guard . shutdown_guard ()
80+ sentinel . shutdown_sentinel ()
8181
8282
8383def test_fault_receiver ():
8484 engine_exception_q : queue .Queue [FaultInfo ] = queue .Queue ()
8585 engine_status_dict = create_test_thread_safe_dict ({1 : "Healthy" })
86- guard = create_client_guard (engine_exception_q , engine_status_dict )
86+ sentinel = create_client_sentinel (engine_exception_q , engine_status_dict )
8787
8888 def send_test_message ():
8989 ctx = zmq .Context ()
@@ -125,13 +125,13 @@ def check_published_message():
125125
126126 assert engine_status_dict [1 ] == "Dead"
127127
128- guard . shutdown_guard ()
128+ sentinel . shutdown_sentinel ()
129129
130130
131131def test_fault_receiver_unhealthy ():
132132 engine_exception_q : queue .Queue [FaultInfo ] = queue .Queue ()
133133 engine_status_dict = create_test_thread_safe_dict ({1 : "Healthy" })
134- guard = create_client_guard (engine_exception_q , engine_status_dict )
134+ sentinel = create_client_sentinel (engine_exception_q , engine_status_dict )
135135
136136 def send_unhealthy_message ():
137137 ctx = zmq .Context ()
@@ -149,22 +149,22 @@ def send_unhealthy_message():
149149
150150 assert engine_status_dict [1 ] == "Unhealthy"
151151
152- guard . shutdown_guard ()
152+ sentinel . shutdown_sentinel ()
153153
154154
155- def test_shutdown_guard ():
155+ def test_shutdown_sentinel ():
156156 engine_exception_q : queue .Queue [FaultInfo ] = queue .Queue ()
157157 engine_status_dict = create_test_thread_safe_dict ({1 : "Healthy" })
158- guard = create_client_guard (engine_exception_q , engine_status_dict )
158+ sentinel = create_client_sentinel (engine_exception_q , engine_status_dict )
159159
160- original_fault_sock = guard .fault_receiver_socket
161- original_cmd_sock = guard .cmd_socket
162- original_pub_sock = guard .fault_pub_socket
163- original_ctx = guard .zmq_ctx
160+ original_fault_sock = sentinel .fault_receiver_socket
161+ original_cmd_sock = sentinel .cmd_socket
162+ original_pub_sock = sentinel .fault_pub_socket
163+ original_ctx = sentinel .zmq_ctx
164164
165- guard . shutdown_guard ()
165+ sentinel . shutdown_sentinel ()
166166
167- assert guard . client_guard_dead is True
167+ assert sentinel . client_sentinel_dead is True
168168
169169 with pytest .raises (zmq .ZMQError ):
170170 original_fault_sock .recv ()
@@ -182,7 +182,7 @@ def test_shutdown_guard():
182182async def test_handle_fault_async ():
183183 engine_exception_q : queue .Queue [FaultInfo ] = queue .Queue ()
184184 engine_status_dict = create_test_thread_safe_dict ({0 : "Unhealthy" })
185- guard = create_client_guard (engine_exception_q , engine_status_dict )
185+ sentinel = create_client_sentinel (engine_exception_q , engine_status_dict )
186186
187187 time .sleep (0.1 )
188188 ctx = zmq .Context ().instance ()
@@ -213,11 +213,11 @@ def response_cmd(cmd_socket):
213213 threading .Thread (target = receive_cmd , args = (cmd_socket ,), daemon = True ).start ()
214214 threading .Thread (target = response_cmd , args = (cmd_socket ,), daemon = True ).start ()
215215
216- result = await guard .handle_fault ("retry" , 3 )
216+ result = await sentinel .handle_fault ("retry" , 3 )
217217
218218 assert result is True
219219 assert engine_status_dict [0 ] == "Healthy"
220220
221221 cmd_socket .close ()
222222 ctx .term ()
223- guard . shutdown_guard ()
223+ sentinel . shutdown_sentinel ()
0 commit comments