Server-side usage data from llama-server (via stream_options.include_usage).
| 99 | |
| 100 | /** Server-side usage data from llama-server (via stream_options.include_usage): three required token counts plus optional prompt-cache fields. */ |
| 101 | interface ServerUsage { |
| 102 | prompt_tokens: number; |
| 103 | completion_tokens: number; |
| 104 | total_tokens: number; |
| 105 | // External prompt-cache fields, all optional (see _build_usage_chunk in |
| 106 | // external_provider.py); cache_creation_input_tokens is Anthropic-only. |
| 107 | prompt_tokens_details?: { |
| 108 | cached_tokens?: number; |
| 109 | }; |
| 110 | cache_creation_input_tokens?: number; |
| 111 | cache_read_input_tokens?: number; |
| 112 | } |
| 113 | |
| 114 | /** Server-side timing data from llama-server's timings object. */ |
| 115 | interface ServerTimings { |
nothing calls this directly
no outgoing calls
no test coverage detected