feat: Log LLM response token usage (prompt/completion/total, content_len, finish_reason)

This commit is contained in:
jlightner 2026-03-30 06:15:24 +00:00
parent 17347da87e
commit 0b0ca598b4

View file

@@ -140,6 +140,13 @@ class LLMClient:
**kwargs,
)
raw = response.choices[0].message.content or ""
usage = getattr(response, "usage", None)
if usage:
logger.info(
"LLM response: prompt_tokens=%s, completion_tokens=%s, total=%s, content_len=%d, finish=%s",
usage.prompt_tokens, usage.completion_tokens, usage.total_tokens,
len(raw), response.choices[0].finish_reason,
)
if modality == "thinking":
raw = strip_think_tags(raw)
return raw
@@ -161,6 +168,13 @@ class LLMClient:
**kwargs,
)
raw = response.choices[0].message.content or ""
usage = getattr(response, "usage", None)
if usage:
logger.info(
"LLM response (fallback): prompt_tokens=%s, completion_tokens=%s, total=%s, content_len=%d, finish=%s",
usage.prompt_tokens, usage.completion_tokens, usage.total_tokens,
len(raw), response.choices[0].finish_reason,
)
if modality == "thinking":
raw = strip_think_tags(raw)
return raw