File tree Expand file tree Collapse file tree 2 files changed +4
-2
lines changed Expand file tree Collapse file tree 2 files changed +4
-2
lines changed Original file line number Diff line number Diff line change @@ -298,7 +298,8 @@ async def multi_round_request(self,
298298
299299        if  check_match_count :
300300            assert  ctx_match_count  >  0 
301-             assert  gen_match_count  >=  ctx_match_count 
301+             assert  gen_match_count  >  0 
302+             assert  gen_match_count  >=  ctx_match_count  or  gen_evicted 
302303        return  request ["prompt" ]
303304
304305    async  def  test_multi_round_request (self ,
@@ -310,6 +311,8 @@ async def test_multi_round_request(self,
310311                for  prompt  in  init_prompts 
311312            ]
312313            prompts  =  await  asyncio .gather (* chat_threads )
314+             # send a request to flush events 
315+             await  self .multi_round_request (session , init_prompts [0 ], 1 , False )
313316            await  asyncio .gather (* [
314317                self .multi_round_request (session , prompt , 1 , True )
315318                for  prompt  in  prompts 
Original file line number Diff line number Diff line change @@ -287,7 +287,6 @@ test_e2e.py::test_ptp_quickstart_advanced[Llama3.1-70B-FP8-llama-3.1-model/Llama
287287accuracy/test_llm_api_pytorch.py::TestMistralSmall24B::test_auto_dtype SKIP (https://nvbugs/5454875)
288288examples/test_llm_api_with_mpi.py::test_llm_api_single_gpu_with_mpirun[TinyLlama-1.1B-Chat-v1.0] SKIP (https://nvbugs/5434372)
289289triton_server/test_triton.py::test_gpt_ib[gpt-ib] SKIP (https://nvbugs/5431116)
290- disaggregated/test_workers.py::test_workers_kv_cache_events[TinyLlama-1.1B-Chat-v1.0] SKIP (https://nvbugs/5457504)
291290accuracy/test_llm_api.py::TestMistralNemo12B::test_fp8 SKIP (https://nvbugs/5413197)
292291triton_server/test_triton.py::test_gpt_ib_streaming[gpt-ib-streaming] SKIP (https://nvbugs/5371349)
293292triton_server/test_triton.py::test_gpt_ib_ptuning[gpt-ib-ptuning] SKIP (https://nvbugs/5445624)
 
 
   
 
     
   
   
          
    
    
     
    
      
     
     
    You can’t perform that action at this time.
  
 
    
  
    
      
        
     
       
      
     
   
 
    
    
  
 
  
 
     
    
0 commit comments