@@ -127,7 +127,7 @@ def test_jetstream_llama2_seed(self):
127127 decode_state = engine .init_decode_state ()
128128 slot = 0
129129 # pylint: disable-next=all
130- prefill_result = engine .prefill (
130+ prefill_result , _ = engine .prefill (
131131 params = params , padded_tokens = padded_tokens , true_length = true_length
132132 )
133133
@@ -193,7 +193,7 @@ def _llama_e2e(self, env, model_arg):
193193 decode_state = engine .init_decode_state ()
194194 slot = 0
195195 # pylint: disable-next=all
196- prefill_result = engine .prefill (
196+ prefill_result , _ = engine .prefill (
197197 params = params , padded_tokens = padded_tokens , true_length = true_length
198198 )
199199
@@ -278,7 +278,7 @@ def test_llama_e2e_two_addtional_tokens(self):
278278 slot = 0
279279
280280 # pylint: disable-next=all
281- prefill_result = engine .prefill (
281+ prefill_result , _ = engine .prefill (
282282 params = params , padded_tokens = padded_tokens , true_length = true_length
283283 )
284284
@@ -350,7 +350,7 @@ def test_llama_e2e_four_addtional_tokens(self):
350350 slot = 0
351351
352352 # pylint: disable-next=all
353- prefill_result = engine .prefill (
353+ prefill_result , _ = engine .prefill (
354354 params = params , padded_tokens = padded_tokens , true_length = true_length
355355 )
356356
@@ -416,7 +416,7 @@ def test_llama_with_original_prefill_decode_32(self):
416416 # pylint: disable-next=all
417417 decode_state = engine .init_decode_state ()
418418 # pylint: disable-next=all
419- prefill_result = engine .prefill (
419+ prefill_result , _ = engine .prefill (
420420 params = params , padded_tokens = padded_tokens , true_length = true_length
421421 )
422422 out_tokens = prefill_result .token
@@ -491,7 +491,7 @@ def test_llama_with_original_prefill_decode(self):
491491 # pylint: disable-next=all
492492 decode_state = engine .init_decode_state ()
493493 # pylint: disable-next=all
494- prefill_result = engine .prefill (
494+ prefill_result , _ = engine .prefill (
495495 params = params , padded_tokens = padded_tokens , true_length = true_length
496496 )
497497 out_tokens = prefill_result .token
0 commit comments