from serving_cast.request import Request
from serving_cast.utils import summarize
def test_output_throughput_summary_contains_key(cast_model, capfd):
assert cast_model["model_id"]
assert cast_model["op_meta"]
req = Request(num_input_tokens=10, num_output_tokens=10)
req.leaves_client_time = 0.0
req.arrives_server_time = 0.1
req.prefill_done_time = 0.6
req.decode_done_time = 1.6
summarize([req])
out, _ = capfd.readouterr()
assert "output_token_throughput(tok/s)" in out