openclaw/src/llm/providers/google-shared.ts

/**
 * Shared utilities for Google Generative AI and Google Vertex providers.
 */

import {
  type Content,
  FinishReason,
  FunctionCallingConfigMode,
  type GenerateContentConfig,
  type GenerateContentParameters,
  type GenerateContentResponse,
  type Part,
  type ThinkingConfig,
} from "@google/genai";
import { calculateCost, clampThinkingLevel } from "../model-utils.js";
import type {
  Api,
  AssistantMessage,
  Context,
  ImageContent,
  Model,
  SimpleStreamOptions,
  StopReason,
  TextContent,
  ThinkingBudgets,
  ThinkingContent,
  ThinkingLevel as AgentThinkingLevel,
  Tool,
  ToolCall,
  StreamOptions,
} from "../types.js";
import type { AssistantMessageEventStream } from "../utils/event-stream.js";
import { sanitizeSurrogates } from "../utils/sanitize-unicode.js";
import { transformMessages } from "./transform-messages.js";

export type GoogleApiType = "google-generative-ai" | "google-vertex";

/**
 * Thinking level for Gemini 3 models.
 * Mirrors Google's ThinkingLevel enum values.
 */
export type GoogleThinkingLevel =
  | "THINKING_LEVEL_UNSPECIFIED"
  | "MINIMAL"
  | "LOW"
  | "MEDIUM"
  | "HIGH";

export type GoogleToolChoice = "auto" | "none" | "any";

export type GoogleThinkingOptions = {
  enabled: boolean;
  budgetTokens?: number;
  level?: GoogleThinkingLevel;
};

export type GoogleProviderOptions = StreamOptions & {
  toolChoice?: GoogleToolChoice;
  thinking?: GoogleThinkingOptions;
};

type GoogleGenerateContentClient = {
  models: {
    generateContentStream(
      params: GenerateContentParameters,
    ): Promise<AsyncIterable<GenerateContentResponse>> | AsyncIterable<GenerateContentResponse>;
  };
};

type ClampedGoogleThinkingLevel = Exclude<AgentThinkingLevel, "xhigh" | "max">;

/**
 * Determines whether a streamed Gemini `Part` should be treated as "thinking".
 *
 * Protocol note (Gemini / Vertex AI thought signatures):
 * - `thought: true` is the definitive marker for thinking content (thought summaries).
 * - `thoughtSignature` is an encrypted representation of the model's internal thought process
 *   used to preserve reasoning context across multi-turn interactions.
 * - `thoughtSignature` can appear on ANY part type (text, functionCall, etc.) - it does NOT
 *   indicate the part itself is thinking content.
 * - For non-functionCall responses, the signature appears on the last part for context replay.
 * - When persisting/replaying model outputs, signature-bearing parts must be preserved as-is;
 *   do not merge/move signatures across parts.
 *
 * See: https://ai.google.dev/gemini-api/docs/thought-signatures
 */
export function isThinkingPart(part: Pick<Part, "thought" | "thoughtSignature">): boolean {
  return part.thought === true;
}

/**
 * Retain thought signatures during streaming.
 *
 * Some backends only send `thoughtSignature` on the first delta for a given part/block; later deltas may omit it.
 * This helper preserves the last non-empty signature for the current block.
 *
 * Note: this does NOT merge or move signatures across distinct response parts. It only prevents
 * a signature from being overwritten with `undefined` within the same streamed block.
 */
export function retainThoughtSignature(
  existing: string | undefined,
  incoming: string | undefined,
): string | undefined {
  if (typeof incoming === "string" && incoming.length > 0) {
    return incoming;
  }
  return existing;
}

// Thought signatures must be base64 for Google APIs (TYPE_BYTES).
const base64SignaturePattern = /^[A-Za-z0-9+/]+={0,2}$/;

function isValidThoughtSignature(signature: string | undefined): boolean {
  if (!signature) {
    return false;
  }
  if (signature.length % 4 !== 0) {
    return false;
  }
  return base64SignaturePattern.test(signature);
}

/**
 * Only keep signatures from the same provider/model and with valid base64.
 */
function resolveThoughtSignature(
  isSameProviderAndModel: boolean,
  signature: string | undefined,
): string | undefined {
  return isSameProviderAndModel && isValidThoughtSignature(signature) ? signature : undefined;
}

/**
 * Models via Google APIs that require explicit tool call IDs in function calls/responses.
 */
export function requiresToolCallId(modelId: string): boolean {
  return modelId.startsWith("claude-") || modelId.startsWith("gpt-oss-");
}

function getGeminiMajorVersion(modelId: string): number | undefined {
  const match = modelId.toLowerCase().match(/^gemini(?:-live)?-(\d+)/);
  if (!match) {
    return undefined;
  }
  return Number.parseInt(match[1], 10);
}

function supportsMultimodalFunctionResponse(modelId: string): boolean {
  const geminiMajorVersion = getGeminiMajorVersion(modelId);
  if (geminiMajorVersion !== undefined) {
    return geminiMajorVersion >= 3;
  }
  return true;
}

/**
 * Convert internal messages to Gemini Content[] format.
 */
export function convertMessages<T extends GoogleApiType>(
  model: Model<T>,
  context: Context,
): Content[] {
  const contents: Content[] = [];
  const normalizeToolCallId = (id: string): string => {
    if (!requiresToolCallId(model.id)) {
      return id;
    }
    return id.replace(/[^a-zA-Z0-9_-]/g, "_").slice(0, 64);
  };

  const transformedMessages = transformMessages(context.messages, model, normalizeToolCallId);

  for (const msg of transformedMessages) {
    if (msg.role === "user") {
      if (typeof msg.content === "string") {
        contents.push({
          role: "user",
          parts: [{ text: sanitizeSurrogates(msg.content) }],
        });
      } else {
        const parts: Part[] = msg.content.map((item) => {
          if (item.type === "text") {
            return { text: sanitizeSurrogates(item.text) };
          }
          return {
            inlineData: {
              mimeType: item.mimeType,
              data: item.data,
            },
          };
        });
        if (parts.length === 0) {
          continue;
        }
        contents.push({
          role: "user",
          parts,
        });
      }
    } else if (msg.role === "assistant") {
      const parts: Part[] = [];
      // Check if message is from same provider and model - only then keep thinking blocks
      const isSameProviderAndModel = msg.provider === model.provider && msg.model === model.id;

      for (const block of msg.content) {
        if (block.type === "text") {
          // Skip empty text blocks
          if (!block.text || block.text.trim() === "") {
            continue;
          }
          const thoughtSignature = resolveThoughtSignature(
            isSameProviderAndModel,
            block.textSignature,
          );
          parts.push({
            text: sanitizeSurrogates(block.text),
            ...(thoughtSignature && { thoughtSignature }),
          });
        } else if (block.type === "thinking") {
          // Skip empty thinking blocks
          if (!block.thinking || block.thinking.trim() === "") {
            continue;
          }
          // Only keep as thinking block if same provider AND same model
          // Otherwise convert to plain text (no tags to avoid model mimicking them)
          if (isSameProviderAndModel) {
            const thoughtSignature = resolveThoughtSignature(
              isSameProviderAndModel,
              block.thinkingSignature,
            );
            parts.push({
              thought: true,
              text: sanitizeSurrogates(block.thinking),
              ...(thoughtSignature && { thoughtSignature }),
            });
          } else {
            parts.push({
              text: sanitizeSurrogates(block.thinking),
            });
          }
        } else if (block.type === "toolCall") {
          const thoughtSignature = resolveThoughtSignature(
            isSameProviderAndModel,
            block.thoughtSignature,
          );
          const part: Part = {
            functionCall: {
              name: block.name,
              args: block.arguments ?? {},
              ...(requiresToolCallId(model.id) ? { id: block.id } : {}),
            },
            ...(thoughtSignature && { thoughtSignature }),
          };
          parts.push(part);
        }
      }

      if (parts.length === 0) {
        continue;
      }
      contents.push({
        role: "model",
        parts,
      });
    } else if (msg.role === "toolResult") {
      // Extract text and image content
      const textContent = msg.content.filter((c): c is TextContent => c.type === "text");
      const textResult = textContent.map((c) => c.text).join("\n");
      const imageContent = model.input.includes("image")
        ? msg.content.filter((c): c is ImageContent => c.type === "image")
        : [];

      const hasText = textResult.length > 0;
      const hasImages = imageContent.length > 0;

      // Gemini 3+ models support multimodal function responses with images nested inside
      // functionResponse.parts. Claude and other non-Gemini models behind Cloud Code Assist /
      // Gemini < 3 still needs a separate user image turn.
      const modelSupportsMultimodalFunctionResponse = supportsMultimodalFunctionResponse(model.id);

      // Use "output" key for success, "error" key for errors as per SDK documentation
      const responseValue = hasText
        ? sanitizeSurrogates(textResult)
        : hasImages
          ? "(see attached image)"
          : "";

      const imageParts: Part[] = imageContent.map((imageBlock) => ({
        inlineData: {
          mimeType: imageBlock.mimeType,
          data: imageBlock.data,
        },
      }));

      const includeId = requiresToolCallId(model.id);
      const functionResponsePart: Part = {
        functionResponse: {
          name: msg.toolName,
          response: msg.isError ? { error: responseValue } : { output: responseValue },
          ...(hasImages && modelSupportsMultimodalFunctionResponse && { parts: imageParts }),
          ...(includeId ? { id: msg.toolCallId } : {}),
        },
      };

      // Cloud Code Assist API requires all function responses to be in a single user turn.
      // Check if the last content is already a user turn with function responses and merge.
      const lastContent = contents[contents.length - 1];
      if (lastContent?.role === "user" && lastContent.parts?.some((p) => p.functionResponse)) {
        lastContent.parts.push(functionResponsePart);
      } else {
        contents.push({
          role: "user",
          parts: [functionResponsePart],
        });
      }

      // For Gemini < 3, add images in a separate user message
      if (hasImages && !modelSupportsMultimodalFunctionResponse) {
        contents.push({
          role: "user",
          parts: [{ text: "Tool result image:" }, ...imageParts],
        });
      }
    }
  }

  return contents;
}

const JSON_SCHEMA_META_DECLARATIONS = new Set([
  "$schema",
  "$id",
  "$anchor",
  "$dynamicAnchor",
  "$vocabulary",
  "$comment",
  "$defs",
  "definitions", // pre-draft-2019-09 equivalent of $defs
]);
const MAX_GOOGLE_TOOL_SCHEMA_DEPTH = 64;
const MAX_GOOGLE_TOOL_SCHEMA_NODES = 10_000;

/**
 * Strip meta-declarations from a schema obj
 */
function sanitizeForOpenApi(schema: unknown): unknown {
  return materializeGoogleToolSchema(schema, { stripMetaDeclarations: true });
}

function materializeGoogleToolSchema(
  schema: unknown,
  options: { stripMetaDeclarations: boolean },
): unknown {
  const state = { nodes: 0 };
  return materializeGoogleToolSchemaValue(schema, options, state, 0, new Set<object>());
}

function materializeGoogleToolSchemaValue(
  schema: unknown,
  options: { stripMetaDeclarations: boolean },
  state: { nodes: number },
  depth: number,
  stack: Set<object>,
): unknown {
  if (depth > MAX_GOOGLE_TOOL_SCHEMA_DEPTH) {
    throw new Error("Google tool schema exceeds maximum supported depth");
  }
  if (++state.nodes > MAX_GOOGLE_TOOL_SCHEMA_NODES) {
    throw new Error("Google tool schema exceeds maximum supported size");
  }
  if (typeof schema !== "object" || schema === null) {
    return schema;
  }
  if (stack.has(schema)) {
    throw new Error("Google tool schema contains a cycle");
  }

  stack.add(schema);
  try {
    if (Array.isArray(schema)) {
      return schema.map((item) =>
        materializeGoogleToolSchemaValue(item, options, state, depth + 1, stack),
      );
    }

    const result: Record<string, unknown> = {};
    for (const [key, value] of Object.entries(schema)) {
      if (options.stripMetaDeclarations && JSON_SCHEMA_META_DECLARATIONS.has(key)) {
        continue;
      }
      Object.defineProperty(result, key, {
        value: materializeGoogleToolSchemaValue(value, options, state, depth + 1, stack),
        enumerable: true,
        configurable: true,
        writable: true,
      });
    }
    return result;
  } finally {
    stack.delete(schema);
  }
}

function buildGoogleFunctionDeclaration(
  tool: Tool,
  useParameters: boolean,
): Record<string, unknown> | undefined {
  try {
    const name = tool.name;
    const description = tool.description;
    const parameters = useParameters
      ? sanitizeForOpenApi(tool.parameters)
      : materializeGoogleToolSchema(tool.parameters, { stripMetaDeclarations: false });
    return {
      name,
      description,
      ...(useParameters ? { parameters } : { parametersJsonSchema: parameters }),
    };
  } catch {
    return undefined;
  }
}

/**
 * Convert tools to Gemini function declarations format.
 *
 * By default uses `parametersJsonSchema` which supports full JSON Schema (including
 * anyOf, oneOf, const, etc.). Set `useParameters` to true to use the legacy `parameters`
 * field instead (OpenAPI 3.03 Schema). This is needed for Cloud Code Assist with Claude
 * models, where the API translates `parameters` into Anthropic's `input_schema`.
 */
export function convertTools(
  tools: Tool[],
  useParameters = false,
): { functionDeclarations: Record<string, unknown>[] }[] | undefined {
  if (tools.length === 0) {
    return undefined;
  }
  const functionDeclarations = tools.flatMap((tool) => {
    const declaration = buildGoogleFunctionDeclaration(tool, useParameters);
    return declaration ? [declaration] : [];
  });
  if (functionDeclarations.length === 0) {
    return undefined;
  }
  return [
    {
      functionDeclarations,
    },
  ];
}

/**
 * Map tool choice string to Gemini FunctionCallingConfigMode.
 */
export function mapToolChoice(choice: string): FunctionCallingConfigMode {
  switch (choice) {
    case "auto":
      return FunctionCallingConfigMode.AUTO;
    case "none":
      return FunctionCallingConfigMode.NONE;
    case "any":
      return FunctionCallingConfigMode.ANY;
    default:
      return FunctionCallingConfigMode.AUTO;
  }
}

function requiresGoogleToolChoice(choice: GoogleProviderOptions["toolChoice"]): boolean {
  return choice === "any";
}

export function createGoogleAssistantOutput<T extends GoogleApiType>(
  model: Model<T>,
  api: Api = model.api,
): AssistantMessage {
  return {
    role: "assistant",
    content: [],
    api,
    provider: model.provider,
    model: model.id,
    usage: {
      input: 0,
      output: 0,
      cacheRead: 0,
      cacheWrite: 0,
      totalTokens: 0,
      cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0, total: 0 },
    },
    stopReason: "stop",
    timestamp: Date.now(),
  };
}

export async function runGoogleGenerateContentLifecycle<T extends GoogleApiType>(params: {
  stream: AssistantMessageEventStream;
  model: Model<T>;
  output: AssistantMessage;
  options?: Pick<StreamOptions, "signal" | "onPayload">;
  createClient: () => GoogleGenerateContentClient;
  buildParams: () => GenerateContentParameters;
  nextToolCallId: (name: string | undefined) => string;
}): Promise<void> {
  const { stream, model, output, options } = params;

  try {
    const client = params.createClient();
    let requestParams = params.buildParams();
    const nextParams = await options?.onPayload?.(requestParams, model);
    if (nextParams !== undefined) {
      requestParams = nextParams as GenerateContentParameters;
    }
    const googleStream = await client.models.generateContentStream(requestParams);
    await consumeGoogleGenerateContentStream({
      chunks: googleStream,
      model,
      output,
      stream,
      signal: options?.signal,
      nextToolCallId: params.nextToolCallId,
    });
  } catch (error) {
    for (const block of output.content) {
      if ("index" in block) {
        delete (block as { index?: number }).index;
      }
    }
    output.stopReason = options?.signal?.aborted ? "aborted" : "error";
    output.errorMessage = error instanceof Error ? error.message : JSON.stringify(error);
    stream.push({ type: "error", reason: output.stopReason, error: output });
    stream.end();
  }
}

export function buildGoogleGenerateContentParams<T extends GoogleApiType>(
  model: Model<T>,
  context: Context,
  options: GoogleProviderOptions = {},
  configHooks?: {
    mapThinkingLevel?: (level: GoogleThinkingLevel) => ThinkingConfig["thinkingLevel"];
    getDisabledThinkingConfig?: (model: Model<T>) => ThinkingConfig;
  },
): GenerateContentParameters {
  const contents = convertMessages(model, context);

  const generationConfig: GenerateContentConfig = {};
  if (options.temperature !== undefined) {
    generationConfig.temperature = options.temperature;
  }
  if (options.maxTokens !== undefined) {
    generationConfig.maxOutputTokens = options.maxTokens;
  }
  if (options.stop !== undefined && options.stop.length > 0) {
    generationConfig.stopSequences = options.stop;
  }

  const tools = context.tools && context.tools.length > 0 ? convertTools(context.tools) : undefined;
  if (!tools && context.tools?.length && requiresGoogleToolChoice(options.toolChoice)) {
    throw new Error("Google tool choice requires at least one valid tool declaration");
  }
  const config: GenerateContentConfig = {
    ...(Object.keys(generationConfig).length > 0 && generationConfig),
    ...(context.systemPrompt && { systemInstruction: sanitizeSurrogates(context.systemPrompt) }),
    ...(tools && { tools }),
  };

  if (tools && options.toolChoice) {
    config.toolConfig = {
      functionCallingConfig: {
        mode: mapToolChoice(options.toolChoice),
      },
    };
  } else {
    config.toolConfig = undefined;
  }

  if (options.thinking?.enabled && model.reasoning) {
    const thinkingConfig: ThinkingConfig = { includeThoughts: true };
    if (options.thinking.level !== undefined) {
      thinkingConfig.thinkingLevel = configHooks?.mapThinkingLevel
        ? configHooks.mapThinkingLevel(options.thinking.level)
        : (options.thinking.level as ThinkingConfig["thinkingLevel"]);
    } else if (options.thinking.budgetTokens !== undefined) {
      thinkingConfig.thinkingBudget = options.thinking.budgetTokens;
    }
    config.thinkingConfig = thinkingConfig;
  } else if (model.reasoning && options.thinking && !options.thinking.enabled) {
    config.thinkingConfig = configHooks?.getDisabledThinkingConfig
      ? configHooks.getDisabledThinkingConfig(model)
      : getDisabledGoogleThinkingConfig(model);
  }

  if (options.signal) {
    if (options.signal.aborted) {
      throw new Error("Request aborted");
    }
    config.abortSignal = options.signal;
  }

  return {
    model: model.id,
    contents,
    config,
  };
}

export function buildGoogleSimpleThinking<T extends GoogleApiType>(
  model: Model<T>,
  options: SimpleStreamOptions | undefined,
  config?: {
    includeGemma4ThinkingLevel?: boolean;
    useFlashLiteBudgets?: boolean;
  },
): GoogleThinkingOptions {
  if (!options?.reasoning) {
    return { enabled: false };
  }

  const clampedReasoning = clampThinkingLevel(model, options.reasoning);
  const effort = (
    clampedReasoning === "off" || clampedReasoning === "max" ? "high" : clampedReasoning
  ) as ClampedGoogleThinkingLevel;

  if (
    isGemini3ProModel(model) ||
    isGemini3FlashModel(model) ||
    (config?.includeGemma4ThinkingLevel && isGemma4Model(model))
  ) {
    return {
      enabled: true,
      level: getGoogleThinkingLevel(effort, model, {
        includeGemma4: config?.includeGemma4ThinkingLevel,
      }),
    };
  }

  return {
    enabled: true,
    budgetTokens: getGoogleBudget(model, effort, options.thinkingBudgets, {
      useFlashLiteBudgets: config?.useFlashLiteBudgets,
    }),
  };
}

export function getDisabledGoogleThinkingConfig<T extends GoogleApiType>(
  model: Model<T>,
  config?: {
    includeGemma4?: boolean;
    mapThinkingLevel?: (level: GoogleThinkingLevel) => ThinkingConfig["thinkingLevel"];
  },
): ThinkingConfig {
  const mapThinkingLevel = (level: GoogleThinkingLevel): ThinkingConfig["thinkingLevel"] =>
    config?.mapThinkingLevel
      ? config.mapThinkingLevel(level)
      : (level as ThinkingConfig["thinkingLevel"]);

  // Google docs: Gemini 3.1 Pro cannot disable thinking, and Gemini 3 Flash / Flash-Lite
  // do not support full thinking-off either. For Gemini 3 models, use the lowest supported
  // thinkingLevel without includeThoughts so hidden thinking remains invisible to OpenClaw.
  if (isGemini3ProModel(model)) {
    return { thinkingLevel: mapThinkingLevel("LOW") };
  }
  if (isGemini3FlashModel(model)) {
    return { thinkingLevel: mapThinkingLevel("MINIMAL") };
  }
  if (config?.includeGemma4 && isGemma4Model(model)) {
    return { thinkingLevel: mapThinkingLevel("MINIMAL") };
  }

  // Gemini 2.x supports disabling via thinkingBudget = 0.
  return { thinkingBudget: 0 };
}

export function isGemma4Model<T extends GoogleApiType>(model: Model<T>): boolean {
  return /gemma-?4/.test(model.id.toLowerCase());
}

export function isGemini3ProModel<T extends GoogleApiType>(model: Model<T>): boolean {
  return /gemini-3(?:\.\d+)?-pro/.test(model.id.toLowerCase());
}

export function isGemini3FlashModel<T extends GoogleApiType>(model: Model<T>): boolean {
  return /gemini-3(?:\.\d+)?-flash/.test(model.id.toLowerCase());
}

function getGoogleThinkingLevel<T extends GoogleApiType>(
  effort: ClampedGoogleThinkingLevel,
  model: Model<T>,
  config?: { includeGemma4?: boolean },
): GoogleThinkingLevel {
  if (isGemini3ProModel(model)) {
    switch (effort) {
      case "minimal":
      case "low":
        return "LOW";
      case "medium":
      case "high":
        return "HIGH";
    }
  }
  if (config?.includeGemma4 && isGemma4Model(model)) {
    switch (effort) {
      case "minimal":
      case "low":
        return "MINIMAL";
      case "medium":
      case "high":
        return "HIGH";
    }
  }
  switch (effort) {
    case "minimal":
      return "MINIMAL";
    case "low":
      return "LOW";
    case "medium":
      return "MEDIUM";
    case "high":
      return "HIGH";
  }
  return "HIGH";
}

function getGoogleBudget<T extends GoogleApiType>(
  model: Model<T>,
  effort: ClampedGoogleThinkingLevel,
  customBudgets?: ThinkingBudgets,
  config?: { useFlashLiteBudgets?: boolean },
): number {
  if (customBudgets?.[effort] !== undefined) {
    return customBudgets[effort];
  }

  if (model.id.includes("2.5-pro")) {
    const budgets: Record<ClampedGoogleThinkingLevel, number> = {
      minimal: 128,
      low: 2048,
      medium: 8192,
      high: 32768,
    };
    return budgets[effort];
  }

  if (config?.useFlashLiteBudgets && model.id.includes("2.5-flash-lite")) {
    const budgets: Record<ClampedGoogleThinkingLevel, number> = {
      minimal: 512,
      low: 2048,
      medium: 8192,
      high: 24576,
    };
    return budgets[effort];
  }

  if (model.id.includes("2.5-flash")) {
    const budgets: Record<ClampedGoogleThinkingLevel, number> = {
      minimal: 128,
      low: 2048,
      medium: 8192,
      high: 24576,
    };
    return budgets[effort];
  }

  return -1;
}

/**
 * Map Gemini FinishReason to our StopReason.
 */
export function mapStopReason(reason: FinishReason): StopReason {
  switch (reason) {
    case FinishReason.STOP:
      return "stop";
    case FinishReason.MAX_TOKENS:
      return "length";
    case FinishReason.BLOCKLIST:
    case FinishReason.PROHIBITED_CONTENT:
    case FinishReason.SPII:
    case FinishReason.SAFETY:
    case FinishReason.IMAGE_SAFETY:
    case FinishReason.IMAGE_PROHIBITED_CONTENT:
    case FinishReason.IMAGE_RECITATION:
    case FinishReason.IMAGE_OTHER:
    case FinishReason.RECITATION:
    case FinishReason.FINISH_REASON_UNSPECIFIED:
    case FinishReason.OTHER:
    case FinishReason.LANGUAGE:
    case FinishReason.MALFORMED_FUNCTION_CALL:
    case FinishReason.UNEXPECTED_TOOL_CALL:
    case FinishReason.NO_IMAGE:
      return "error";
    default: {
      const exhaustive: never = reason;
      throw new Error(`Unhandled stop reason: ${String(exhaustive)}`);
    }
  }
}

export async function consumeGoogleGenerateContentStream<T extends GoogleApiType>(params: {
  chunks: AsyncIterable<GenerateContentResponse>;
  model: Model<T>;
  output: AssistantMessage;
  stream: AssistantMessageEventStream;
  signal?: AbortSignal;
  nextToolCallId: (name: string | undefined) => string;
}): Promise<void> {
  params.stream.push({ type: "start", partial: params.output });
  let currentBlock: TextContent | ThinkingContent | null = null;
  const blocks = params.output.content;
  const blockIndex = () => blocks.length - 1;

  const endCurrentBlock = () => {
    if (!currentBlock) {
      return;
    }
    if (currentBlock.type === "text") {
      params.stream.push({
        type: "text_end",
        contentIndex: blockIndex(),
        content: currentBlock.text,
        partial: params.output,
      });
    } else {
      params.stream.push({
        type: "thinking_end",
        contentIndex: blockIndex(),
        content: currentBlock.thinking,
        partial: params.output,
      });
    }
    currentBlock = null;
  };

  for await (const chunk of params.chunks) {
    params.output.responseId ||= chunk.responseId;
    const candidate = chunk.candidates?.[0];
    if (candidate?.content?.parts) {
      for (const part of candidate.content.parts) {
        if (part.text !== undefined) {
          const isThinking = isThinkingPart(part);
          if (
            !currentBlock ||
            (isThinking && currentBlock.type !== "thinking") ||
            (!isThinking && currentBlock.type !== "text")
          ) {
            endCurrentBlock();
            if (isThinking) {
              currentBlock = { type: "thinking", thinking: "", thinkingSignature: undefined };
              params.output.content.push(currentBlock);
              params.stream.push({
                type: "thinking_start",
                contentIndex: blockIndex(),
                partial: params.output,
              });
            } else {
              currentBlock = { type: "text", text: "" };
              params.output.content.push(currentBlock);
              params.stream.push({
                type: "text_start",
                contentIndex: blockIndex(),
                partial: params.output,
              });
            }
          }
          if (currentBlock.type === "thinking") {
            currentBlock.thinking += part.text;
            currentBlock.thinkingSignature = retainThoughtSignature(
              currentBlock.thinkingSignature,
              part.thoughtSignature,
            );
            params.stream.push({
              type: "thinking_delta",
              contentIndex: blockIndex(),
              delta: part.text,
              partial: params.output,
            });
          } else {
            currentBlock.text += part.text;
            currentBlock.textSignature = retainThoughtSignature(
              currentBlock.textSignature,
              part.thoughtSignature,
            );
            params.stream.push({
              type: "text_delta",
              contentIndex: blockIndex(),
              delta: part.text,
              partial: params.output,
            });
          }
        }

        if (part.functionCall) {
          endCurrentBlock();
          const providedId = part.functionCall.id;
          const needsNewId =
            !providedId ||
            params.output.content.some(
              (block) => block.type === "toolCall" && block.id === providedId,
            );
          const toolCall: ToolCall = {
            type: "toolCall",
            id: needsNewId ? params.nextToolCallId(part.functionCall.name) : providedId,
            name: part.functionCall.name || "",
            arguments: (part.functionCall.args as Record<string, unknown>) ?? {},
            ...(part.thoughtSignature && { thoughtSignature: part.thoughtSignature }),
          };

          params.output.content.push(toolCall);
          params.stream.push({
            type: "toolcall_start",
            contentIndex: blockIndex(),
            partial: params.output,
          });
          params.stream.push({
            type: "toolcall_delta",
            contentIndex: blockIndex(),
            delta: JSON.stringify(toolCall.arguments),
            partial: params.output,
          });
          params.stream.push({
            type: "toolcall_end",
            contentIndex: blockIndex(),
            toolCall,
            partial: params.output,
          });
        }
      }
    }

    if (candidate?.finishReason) {
      params.output.stopReason = mapStopReason(candidate.finishReason);
      if (params.output.content.some((block) => block.type === "toolCall")) {
        params.output.stopReason = "toolUse";
      }
    }

    if (chunk.usageMetadata) {
      params.output.usage = {
        input:
          (chunk.usageMetadata.promptTokenCount || 0) -
          (chunk.usageMetadata.cachedContentTokenCount || 0),
        output:
          (chunk.usageMetadata.candidatesTokenCount || 0) +
          (chunk.usageMetadata.thoughtsTokenCount || 0),
        cacheRead: chunk.usageMetadata.cachedContentTokenCount || 0,
        cacheWrite: 0,
        totalTokens: chunk.usageMetadata.totalTokenCount || 0,
        cost: {
          input: 0,
          output: 0,
          cacheRead: 0,
          cacheWrite: 0,
          total: 0,
        },
      };
      calculateCost(params.model, params.output.usage);
    }
  }

  endCurrentBlock();

  if (params.signal?.aborted) {
    throw new Error("Request was aborted");
  }

  if (params.output.stopReason === "aborted" || params.output.stopReason === "error") {
    throw new Error("An unknown error occurred");
  }

  params.stream.push({
    type: "done",
    reason: params.output.stopReason,
    message: params.output,
  });
  params.stream.end();
}

/**
 * Map string finish reason to our StopReason (for raw API responses).
 */
export function mapStopReasonString(reason: string): StopReason {
  switch (reason) {
    case "STOP":
      return "stop";
    case "MAX_TOKENS":
      return "length";
    default:
      return "error";
  }
}