修改： app/client/platforms/bedrock.ts

2024-11-05 10:34:33 +08:00 · 2024-11-05 10:34:33 +08:00 · 0f276f59bb
parent fc391168e9
commit 0f276f59bb
1 changed files with 237 additions and 348 deletions
--- a/app/client/platforms/bedrock.ts
+++ b/app/client/platforms/bedrock.ts
@ -3,22 +3,49 @@ import {
  ChatOptions,
  getHeaders,
  LLMApi,
  LLMModel,
  LLMUsage,
  MultimodalContent,
  SpeechOptions,
 } from "../api";
 import { useAccessStore, useAppConfig } from "../../store";
 import Locale from "../../locales";
 import {
-  getMessageImages,
+  useAccessStore,
-  getMessageTextContent,
+  useAppConfig,
-  isVisionModel,
+  usePluginStore,
-} from "../../utils";
+  useChatStore,
  ChatMessageTool,
 } from "../../store";
 import { getMessageTextContent, isVisionModel } from "../../utils";
 import { fetch } from "../../utils/stream";
 import { preProcessImageContent, stream } from "../../utils/chat";
-const MAX_IMAGE_SIZE = 1024 * 1024 * 4; // 4MB limit
+export type MultiBlockContent = {
  type: "image" | "text";
  source?: {
    type: string;
    media_type: string;
    data: string;
  };
  text?: string;
 };
 export type AnthropicMessage = {
  role: (typeof ClaudeMapper)[keyof typeof ClaudeMapper];
  content: string | MultiBlockContent[];
 };
 const ClaudeMapper = {
  assistant: "assistant",
  user: "user",
  system: "user",
 } as const;
 export class BedrockApi implements LLMApi {
  usage(): Promise<LLMUsage> {
    throw new Error("Method not implemented.");
  }
  models(): Promise<LLMModel[]> {
    throw new Error("Method not implemented.");
  }
  speech(options: SpeechOptions): Promise<ArrayBuffer> {
    throw new Error("Speech not implemented for Bedrock.");
  }
@ -31,154 +58,17 @@ export class BedrockApi implements LLMApi {
    return res;
  }
  async processDocument(
    file: File,
  ): Promise<{ display: string; content: MultimodalContent }> {
    return new Promise((resolve, reject) => {
      const reader = new FileReader();
      reader.onload = async () => {
        try {
          const arrayBuffer = reader.result as ArrayBuffer;
          const format = file.name.split(".").pop()?.toLowerCase();
          if (!format) {
            throw new Error("Could not determine file format");
          }
          // Format file size
          const size = file.size;
          let sizeStr = "";
          if (size < 1024) {
            sizeStr = size + " B";
          } else if (size < 1024 * 1024) {
            sizeStr = (size / 1024).toFixed(2) + " KB";
          } else {
            sizeStr = (size / (1024 * 1024)).toFixed(2) + " MB";
          }
          // Create display text
          const displayText = `Document: ${file.name} (${sizeStr})`;
          // Create actual content
          const content: MultimodalContent = {
            type: "document",
            document: {
              format: format as
                | "pdf"
                | "csv"
                | "doc"
                | "docx"
                | "xls"
                | "xlsx"
                | "html"
                | "txt"
                | "md",
              name: file.name,
              source: {
                bytes: Buffer.from(arrayBuffer).toString("base64"),
              },
            },
          };
          resolve({
            display: displayText,
            content: content,
          });
        } catch (e) {
          reject(e);
        }
      };
      reader.onerror = () => reject(reader.error);
      reader.readAsArrayBuffer(file);
    });
  }
  async processImage(url: string): Promise<MultimodalContent> {
    if (url.startsWith("data:")) {
      const base64Match = url.match(/^data:image\/([a-zA-Z]*);base64,([^"]*)/);
      if (base64Match) {
        const format = base64Match[1].toLowerCase();
        const base64Data = base64Match[2];
        // Check base64 size
        const binarySize = atob(base64Data).length;
        if (binarySize > MAX_IMAGE_SIZE) {
          throw new Error(
            `Image size (${(binarySize / (1024 * 1024)).toFixed(
              2,
            )}MB) exceeds maximum allowed size of 4MB`,
          );
        }
        return {
          type: "image_url",
          image_url: {
            url: url,
          },
        };
      }
      throw new Error("Invalid data URL format");
    }
    // For non-data URLs, fetch and convert to base64
    try {
      const response = await fetch(url);
      if (!response.ok) {
        throw new Error(`Failed to fetch image: ${response.statusText}`);
      }
      const blob = await response.blob();
      if (blob.size > MAX_IMAGE_SIZE) {
        throw new Error(
          `Image size (${(blob.size / (1024 * 1024)).toFixed(
            2,
          )}MB) exceeds maximum allowed size of 4MB`,
        );
      }
      const reader = new FileReader();
      const base64 = await new Promise<string>((resolve, reject) => {
        reader.onloadend = () => resolve(reader.result as string);
        reader.onerror = () => reject(new Error("Failed to read image data"));
        reader.readAsDataURL(blob);
      });
      return {
        type: "image_url",
        image_url: {
          url: base64,
        },
      };
    } catch (error) {
      console.error("[Bedrock] Image processing error:", error);
      throw error;
    }
  }
  async chat(options: ChatOptions): Promise<void> {
    const visionModel = isVisionModel(options.config.model);
    const accessStore = useAccessStore.getState();
    const shouldStream = !!options.config.stream;
    const modelConfig = {
      ...useAppConfig.getState().modelConfig,
-      ...options.config,
+      ...useChatStore.getState().currentSession().mask.modelConfig,
      ...{
        model: options.config.model,
      },
    };
    if (
      !accessStore.awsRegion ||
      !accessStore.awsAccessKeyId ||
      !accessStore.awsSecretAccessKey
    ) {
      console.log("AWS credentials are not set");
      let responseText = "";
      const responseTexts = [responseText];
      responseTexts.push(Locale.Error.Unauthorized);
      responseText = responseTexts.join("\n\n");
      options.onFinish(responseText);
      return;
    }
    const controller = new AbortController();
    options.onController?.(controller);
    const headers: Record<string, string> = {
      ...getHeaders(),
      "X-Region": accessStore.awsRegion,
@ -186,200 +76,212 @@ export class BedrockApi implements LLMApi {
      "X-Secret-Key": accessStore.awsSecretAccessKey,
    };
-    if (accessStore.awsSessionToken) {
+    // try get base64image from local cache image_url
-      headers["X-Session-Token"] = accessStore.awsSessionToken;
+    const messages: ChatOptions["messages"] = [];
    for (const v of options.messages) {
      const content = await preProcessImageContent(v.content);
      messages.push({ role: v.role, content });
    }
-    try {
+    const keys = ["system", "user"];
      // Process messages to handle multimodal content
      const messages = await Promise.all(
        options.messages.map(async (msg) => {
          if (Array.isArray(msg.content)) {
            // For vision models, include both text and images
            if (isVisionModel(options.config.model)) {
              const images = getMessageImages(msg);
              const content: MultimodalContent[] = [];
-              // Process documents first
+    // roles must alternate between "user" and "assistant" in claude, so add a fake assistant message between two user messages
-              for (const item of msg.content) {
+    for (let i = 0; i < messages.length - 1; i++) {
-                // Check for document content
+      const message = messages[i];
-                if (item && typeof item === "object") {
+      const nextMessage = messages[i + 1];
-                  if ("file" in item && item.file instanceof File) {
+
-                    try {
+      if (keys.includes(message.role) && keys.includes(nextMessage.role)) {
-                      console.log(
+        messages[i] = [
-                        "[Bedrock] Processing document:",
+          message,
-                        item.file.name,
+          {
-                      );
+            role: "assistant",
-                      const { content: docContent } =
+            content: ";",
-                        await this.processDocument(item.file);
+          },
-                      content.push(docContent);
+        ] as any;
                    } catch (e) {
                      console.error("[Bedrock] Failed to process document:", e);
                    }
                  } else if ("document" in item && item.document) {
                    // If document content is already processed, include it directly
                    content.push(item as MultimodalContent);
                  }
      }
    }
-              // Add text content if it's not a document display text
+    const prompt = messages
-              const text = getMessageTextContent(msg);
+      .flat()
-              if (text && !text.startsWith("Document: ")) {
+      .filter((v) => {
-                content.push({ type: "text", text });
+        if (!v.content) return false;
-              }
+        if (typeof v.content === "string" && !v.content.trim()) return false;
        return true;
      })
      .map((v) => {
        const { role, content } = v;
        const insideRole = ClaudeMapper[role] ?? "user";
-              // Process images with size check and error handling
+        if (!visionModel || typeof content === "string") {
-              for (const url of images) {
+          return {
-                try {
+            role: insideRole,
-                  const imageContent = await this.processImage(url);
+            content: getMessageTextContent(v),
-                  content.push(imageContent);
+          };
                } catch (e) {
                  console.error("[Bedrock] Failed to process image:", e);
                  // Add error message as text content
                  content.push({
                    type: "text",
                    text: `Error processing image: ${e}`,
                  });
        }
        return {
          role: insideRole,
          content: content
            .filter((v) => v.image_url || v.text)
            .map(({ type, text, image_url }) => {
              if (type === "text") {
                return {
                  type,
                  text: text!,
                };
              }
              const { url = "" } = image_url || {};
              const colonIndex = url.indexOf(":");
              const semicolonIndex = url.indexOf(";");
              const comma = url.indexOf(",");
-              // Only return content if there is any
+              const mimeType = url.slice(colonIndex + 1, semicolonIndex);
-              if (content.length > 0) {
+              const encodeType = url.slice(semicolonIndex + 1, comma);
-                return { ...msg, content };
+              const data = url.slice(comma + 1);
-              }
+
-            }
+              return {
-            // For non-vision models, only include text
+                type: "image" as const,
-            return { ...msg, content: getMessageTextContent(msg) };
+                source: {
-          }
+                  type: encodeType,
-          return msg;
+                  media_type: mimeType,
                  data,
                },
              };
            }),
-      );
+        };
      // Filter out empty messages
      const filteredMessages = messages.filter((msg) => {
        if (Array.isArray(msg.content)) {
          return msg.content.length > 0;
        }
        return msg.content !== "";
      });
    if (prompt[0]?.role === "assistant") {
      prompt.unshift({
        role: "user",
        content: ";",
      });
    }
    const [tools, funcs] = usePluginStore
      .getState()
      .getAsTools(useChatStore.getState().currentSession().mask?.plugin || []);
    const requestBody = {
        messages: filteredMessages,
      modelId: options.config.model,
      messages: messages.filter((msg) => msg.content.length > 0),
      inferenceConfig: {
        maxTokens: modelConfig.max_tokens,
        temperature: modelConfig.temperature,
        topP: modelConfig.top_p,
        stopSequences: [],
      },
      toolConfig:
        Array.isArray(tools) && tools.length > 0
          ? {
              tools: tools.map((tool: any) => ({
                toolSpec: {
                  name: tool?.function?.name,
                  description: tool?.function?.description,
                  inputSchema: {
                    json: tool?.function?.parameters,
                  },
                },
              })),
              toolChoice: { auto: {} },
            }
          : undefined,
    };
      console.log(
        "[Bedrock] Request body:",
        JSON.stringify(
          {
            ...requestBody,
            messages: requestBody.messages.map((msg) => ({
              ...msg,
              content: Array.isArray(msg.content)
                ? msg.content.map((c) => ({
                    type: c.type,
                    ...(c.document
                      ? {
                          document: {
                            format: c.document.format,
                            name: c.document.name,
                          },
                        }
                      : {}),
                    ...(c.image_url ? { image_url: { url: "[BINARY]" } } : {}),
                    ...(c.text ? { text: c.text } : {}),
                  }))
                : msg.content,
            })),
          },
          null,
          2,
        ),
      );
      const shouldStream = !!options.config.stream;
    const conversePath = `${ApiPath.Bedrock}/converse`;
    const controller = new AbortController();
    options.onController?.(controller);
    if (shouldStream) {
-        let response = await fetch(conversePath, {
+      let currentToolUse: ChatMessageTool | null = null;
-          method: "POST",
+      return stream(
-          headers: {
+        conversePath,
-            ...headers,
+        requestBody,
-            "X-Stream": "true",
+        headers,
-          },
+        Array.isArray(tools)
-          body: JSON.stringify(requestBody),
+          ? tools.map((tool: any) => ({
-          signal: controller.signal,
+              name: tool?.function?.name,
-        });
+              description: tool?.function?.description,
-
+              input_schema: tool?.function?.parameters,
-        if (!response.ok) {
+            }))
-          const error = await response.text();
+          : [],
-          throw new Error(`Bedrock API error: ${error}`);
+        funcs,
-        }
+        controller,
-
+        // parseSSE
-        let buffer = "";
+        (text: string, runTools: ChatMessageTool[]) => {
-        const reader = response.body?.getReader();
+          const event = JSON.parse(text);
        if (!reader) {
          throw new Error("No response body reader available");
        }
        let currentContent = "";
        let isFirstMessage = true;
        while (true) {
          const { done, value } = await reader.read();
          if (done) break;
          // Convert the chunk to text and add to buffer
          const chunk = new TextDecoder().decode(value);
          buffer += chunk;
          // Process complete messages from buffer
          let newlineIndex;
          while ((newlineIndex = buffer.indexOf("\n")) !== -1) {
            const line = buffer.slice(0, newlineIndex).trim();
            buffer = buffer.slice(newlineIndex + 1);
            if (line.startsWith("data: ")) {
              try {
                const event = JSON.parse(line.slice(6));
          if (event.type === "messageStart") {
-                  if (isFirstMessage) {
+            return "";
                    isFirstMessage = false;
          }
-                  continue;
+
          if (event.type === "contentBlockStart" && event.start?.toolUse) {
            const { toolUseId, name } = event.start.toolUse;
            currentToolUse = {
              id: toolUseId,
              type: "function",
              function: {
                name,
                arguments: "",
              },
            };
            runTools.push(currentToolUse);
            return "";
          }
          if (event.type === "text" && event.content) {
-                  currentContent += event.content;
+            return event.content;
                  options.onUpdate?.(currentContent, event.content);
          }
-                if (event.type === "messageStop") {
+          if (
-                  options.onFinish(currentContent);
+            event.type === "toolUse" &&
-                  return;
+            event.input &&
            currentToolUse?.function
          ) {
            currentToolUse.function.arguments += event.input;
            return "";
          }
          if (event.type === "error") {
            throw new Error(event.message || "Unknown error");
          }
              } catch (e) {
                console.error("[Bedrock] Failed to parse stream event:", e);
              }
            }
          }
        }
-        // If we reach here without a messageStop event, finish with current content
+          return "";
-        options.onFinish(currentContent);
+        },
        // processToolMessage
        (requestPayload: any, toolCallMessage: any, toolCallResult: any[]) => {
          currentToolUse = null;
          requestPayload?.messages?.splice(
            requestPayload?.messages?.length,
            0,
            {
              role: "assistant",
              content: toolCallMessage.tool_calls.map(
                (tool: ChatMessageTool) => ({
                  type: "tool_use",
                  id: tool.id,
                  name: tool?.function?.name,
                  input: tool?.function?.arguments
                    ? JSON.parse(tool?.function?.arguments)
                    : {},
                }),
              ),
            },
            ...toolCallResult.map((result) => ({
              role: "user",
              content: [
                {
                  type: "tool_result",
                  tool_use_id: result.tool_call_id,
                  content: result.content,
                },
              ],
            })),
          );
        },
        options,
      );
    } else {
      try {
        const response = await fetch(conversePath, {
          method: "POST",
          headers,
@ -395,23 +297,10 @@ export class BedrockApi implements LLMApi {
        const responseBody = await response.json();
        const content = this.extractMessage(responseBody);
        options.onFinish(content);
-      }
+      } catch (e: any) {
    } catch (e) {
        console.error("[Bedrock] Chat error:", e);
-      options.onError?.(e as Error);
+        throw e;
      }
    }
  async usage(): Promise<LLMUsage> {
    // Bedrock usage is tracked through AWS billing
    return {
      used: 0,
      total: 0,
    };
  }
  async models() {
    // Return empty array as models are configured through AWS console
    return [];
  }
 }