diff --git a/cpp/serve/engine_state.cc b/cpp/serve/engine_state.cc index 4304ca48af..7847f53fd5 100644 --- a/cpp/serve/engine_state.cc +++ b/cpp/serve/engine_state.cc @@ -12,10 +12,10 @@ namespace serve { String EngineStats::AsJSON() const { picojson::object config; - config["single_token_prefill_latency"] = - picojson::value(total_prefill_length > 0 ? request_total_prefill_time / total_prefill_length : 0.0); - config["single_token_decode_latency"] = - picojson::value(total_decode_length > 0 ? request_total_decode_time / total_decode_length : 0.0); + config["single_token_prefill_latency"] = picojson::value( + total_prefill_length > 0 ? request_total_prefill_time / total_prefill_length : 0.0); + config["single_token_decode_latency"] = picojson::value( + total_decode_length > 0 ? request_total_decode_time / total_decode_length : 0.0); config["engine_total_prefill_time"] = picojson::value(engine_total_prefill_time); config["engine_total_decode_time"] = picojson::value(engine_total_decode_time); config["total_prefill_tokens"] = picojson::value(total_prefill_length); diff --git a/python/mlc_llm/serve/engine_base.py b/python/mlc_llm/serve/engine_base.py index 2b24d8f1c4..7f3f7e1331 100644 --- a/python/mlc_llm/serve/engine_base.py +++ b/python/mlc_llm/serve/engine_base.py @@ -1120,6 +1120,7 @@ def _debug_call_func_on_all_worker(self, func_name: str) -> None: self._ffi["debug_call_func_on_all_worker"](func_name) def stats(self): + """Get the engine stats.""" return self._ffi["stats"]()