@@ -149,14 +149,13 @@ func (h *Handler) handleNonStreamGenerateContent(w http.ResponseWriter, resp *ht
149149 cleanVisibleOutput (result .Thinking , stripReferenceMarkers ),
150150 cleanVisibleOutput (result .Text , stripReferenceMarkers ),
151151 toolNames ,
152- result .OutputTokens ,
153152 ))
154153}
155154
156155//nolint:unused // retained for native Gemini non-stream handling path.
157- func buildGeminiGenerateContentResponse (model , finalPrompt , finalThinking , finalText string , toolNames []string , outputTokens int ) map [string ]any {
156+ func buildGeminiGenerateContentResponse (model , finalPrompt , finalThinking , finalText string , toolNames []string ) map [string ]any {
158157 parts := buildGeminiPartsFromFinal (finalText , finalThinking , toolNames )
159- usage := buildGeminiUsage (finalPrompt , finalThinking , finalText , outputTokens )
158+ usage := buildGeminiUsage (finalPrompt , finalThinking , finalText )
160159 return map [string ]any {
161160 "candidates" : []map [string ]any {
162161 {
@@ -174,14 +173,10 @@ func buildGeminiGenerateContentResponse(model, finalPrompt, finalThinking, final
174173}
175174
176175//nolint:unused // retained for native Gemini non-stream handling path.
177- func buildGeminiUsage (finalPrompt , finalThinking , finalText string , outputTokens int ) map [string ]any {
176+ func buildGeminiUsage (finalPrompt , finalThinking , finalText string ) map [string ]any {
178177 promptTokens := util .EstimateTokens (finalPrompt )
179178 reasoningTokens := util .EstimateTokens (finalThinking )
180179 completionTokens := util .EstimateTokens (finalText )
181- if outputTokens > 0 {
182- completionTokens = outputTokens
183- reasoningTokens = 0
184- }
185180 return map [string ]any {
186181 "promptTokenCount" : promptTokens ,
187182 "candidatesTokenCount" : reasoningTokens + completionTokens ,
0 commit comments