feat(server): use faster model in ci test (#13038)

fix AI-329
2026-02-13 12:55:00 +00:00 · 2025-07-09 22:21:30 +08:00
parent 38537bf310
commit c4c11da976
17 changed files with 121 additions and 61 deletions
--- a/packages/backend/server/src/tests/copilot-provider.spec.ts
+++ b/packages/backend/server/src/tests/copilot-provider.spec.ts
@@ -369,7 +369,7 @@ The term **“CRDT”** was first introduced by Marc Shapiro, Nuno Preguiça, Ca
              .map(c => JSON.parse(c.citationJson).type)
              .filter(type => ['attachment', 'doc'].includes(type)).length ===
              0,
-          'should not have citation'
+          `should not have citation: ${JSON.stringify(c, null, 2)}`
        );
      });
    },
--- a/packages/backend/server/src/plugins/copilot/embedding/client.ts
+++ b/packages/backend/server/src/plugins/copilot/embedding/client.ts
@@ -112,11 +112,14 @@ class ProductionEmbeddingClient extends EmbeddingClient {
    );

    try {
-      return ranks.map((score, chunk) => ({
-        chunk,
-        targetId: this.getTargetId(embeddings[chunk]),
-        score,
-      }));
+      return ranks.map((score, i) => {
+        const chunk = embeddings[i];
+        return {
+          chunk: chunk.chunk,
+          targetId: this.getTargetId(chunk),
+          score: Math.max(score, 1 - (chunk.distance || -Infinity)),
+        };
+      });
    } catch (error) {
      this.logger.error('Failed to parse rerank results', error);
      // silent error, will fallback to default sorting in parent method
@@ -148,7 +151,7 @@ class ProductionEmbeddingClient extends EmbeddingClient {

    const chunks = sortedEmbeddings.reduce(
      (acc, e) => {
-        const targetId = 'docId' in e ? e.docId : 'fileId' in e ? e.fileId : '';
+        const targetId = this.getTargetId(e);
        const key = `${targetId}:${e.chunk}`;
        acc[key] = e;
        return acc;
@@ -179,7 +182,10 @@ class ProductionEmbeddingClient extends EmbeddingClient {
        .filter(Boolean);

      this.logger.verbose(
-        `ReRank completed: ${highConfidenceChunks.length} high-confidence results found`
+        `ReRank completed: ${highConfidenceChunks.length} high-confidence results found, total ${sortedEmbeddings.length} embeddings`,
+        highConfidenceChunks.length !== sortedEmbeddings.length
+          ? JSON.stringify(ranks)
+          : undefined
      );
      return highConfidenceChunks.slice(0, topK);
    } catch (error) {
--- a/packages/backend/server/src/plugins/copilot/prompt/prompts.ts
+++ b/packages/backend/server/src/plugins/copilot/prompt/prompts.ts
@@ -338,7 +338,7 @@ Convert a multi-speaker audio recording into a structured JSON format by transcr
  {
    name: 'Rerank results',
    action: 'Rerank results',
-    model: 'gpt-4.1-mini',
+    model: 'gpt-4.1',
    messages: [
      {
        role: 'system',
@@ -1677,7 +1677,7 @@ This sentence contains information from the first source[^1]. This sentence refe
 Before starting Tool calling, you need to follow:
 - DO NOT explain what operation you will perform.
 - DO NOT embed a tool call mid-sentence.
- When searching for unknown information or keyword, prioritize searching the user's workspace.
+- When searching for unknown information, personal information or keyword, prioritize searching the user's workspace rather than the web.
 - Depending on the complexity of the question and the information returned by the search tools, you can call different tools multiple times to search.
 </tool-calling-guidelines>

--- a/packages/backend/server/src/plugins/copilot/prompt/service.ts
+++ b/packages/backend/server/src/plugins/copilot/prompt/service.ts
@@ -53,8 +53,11 @@ export class PromptService implements OnApplicationBootstrap {
   * @returns prompt messages
   */
  async get(name: string): Promise<ChatPrompt | null> {
-    const cached = this.cache.get(name);
-    if (cached) return cached;
+    // skip cache in dev mode to ensure the latest prompt is always fetched
+    if (!env.dev) {
+      const cached = this.cache.get(name);
+      if (cached) return cached;
+    }

    const prompt = await this.db.aiPrompt.findUnique({
      where: {
--- a/packages/backend/server/src/plugins/copilot/providers/anthropic/anthropic.ts
+++ b/packages/backend/server/src/plugins/copilot/providers/anthropic/anthropic.ts
@@ -62,6 +62,7 @@ export abstract class AnthropicProvider<T> extends CopilotProvider<T> {

    try {
      metrics.ai.counter('chat_text_calls').add(1, { model: model.id });
+
      const [system, msgs] = await chatToGPTMessage(messages, true, true);

      const modelInstance = this.instance(model.id);
--- a/packages/backend/server/src/plugins/copilot/providers/gemini/gemini.ts
+++ b/packages/backend/server/src/plugins/copilot/providers/gemini/gemini.ts
@@ -88,6 +88,12 @@ export abstract class GeminiProvider<T> extends CopilotProvider<T> {
        system,
        messages: msgs,
        abortSignal: options.signal,
+        providerOptions: {
+          google: this.getGeminiOptions(options, model.id),
+        },
+        tools: await this.getTools(options, model.id),
+        maxSteps: this.MAX_STEPS,
+        experimental_continueSteps: true,
      });

      if (!text) throw new Error('Failed to generate text');
@@ -254,16 +260,16 @@ export abstract class GeminiProvider<T> extends CopilotProvider<T> {
  ) {
    const [system, msgs] = await chatToGPTMessage(messages);
    const { fullStream } = streamText({
-      model: this.instance(model.id, {
-        useSearchGrounding: this.useSearchGrounding(options),
-      }),
+      model: this.instance(model.id),
      system,
      messages: msgs,
      abortSignal: options.signal,
-      maxSteps: this.MAX_STEPS,
      providerOptions: {
        google: this.getGeminiOptions(options, model.id),
      },
+      tools: await this.getTools(options, model.id),
+      maxSteps: this.MAX_STEPS,
+      experimental_continueSteps: true,
    });
    return fullStream;
  }
@@ -282,8 +288,4 @@ export abstract class GeminiProvider<T> extends CopilotProvider<T> {
  private isReasoningModel(model: string) {
    return model.startsWith('gemini-2.5');
  }
-
-  private useSearchGrounding(options: CopilotChatOptions) {
-    return options?.tools?.includes('webSearch');
-  }
 }
--- a/packages/backend/server/src/plugins/copilot/providers/openai.ts
+++ b/packages/backend/server/src/plugins/copilot/providers/openai.ts
@@ -274,9 +274,11 @@ export class OpenAIProvider extends CopilotProvider<OpenAIConfig> {
  override getProviderSpecificTools(
    toolName: CopilotChatTools,
    model: string
-  ): [string, Tool] | undefined {
+  ): [string, Tool?] | undefined {
    if (toolName === 'webSearch' && !this.isReasoningModel(model)) {
      return ['web_search_preview', openai.tools.webSearchPreview()];
+    } else if (toolName === 'docEdit') {
+      return ['doc_edit', undefined];
    }
    return;
  }
--- a/packages/backend/server/src/plugins/copilot/providers/provider.ts
+++ b/packages/backend/server/src/plugins/copilot/providers/provider.ts
@@ -126,7 +126,7 @@ export abstract class CopilotProvider<C = any> {
  protected getProviderSpecificTools(
    _toolName: CopilotChatTools,
    _model: string
-  ): [string, Tool] | undefined {
+  ): [string, Tool?] | undefined {
    return;
  }

@@ -143,7 +143,10 @@ export abstract class CopilotProvider<C = any> {
      for (const tool of options.tools) {
        const toolDef = this.getProviderSpecificTools(tool, model);
        if (toolDef) {
-          tools[toolDef[0]] = toolDef[1];
+          // allow provider prevent tool creation
+          if (toolDef[1]) {
+            tools[toolDef[0]] = toolDef[1];
+          }
          continue;
        }
        switch (tool) {
--- a/packages/backend/server/src/plugins/copilot/tools/doc-semantic-search.ts
+++ b/packages/backend/server/src/plugins/copilot/tools/doc-semantic-search.ts
@@ -58,7 +58,7 @@ export const createDocSemanticSearchTool = (
 ) => {
  return tool({
    description:
-      'Retrieve conceptually related passages by performing vector-based semantic similarity search across embedded documents; use this tool only when exact keyword search fails or the user explicitly needs meaning-level matches (e.g., paraphrases, synonyms, broader concepts).',
+      'Retrieve conceptually related passages by performing vector-based semantic similarity search across embedded documents; use this tool only when exact keyword search fails or the user explicitly needs meaning-level matches (e.g., paraphrases, synonyms, broader concepts, recent documents).',
    parameters: z.object({
      query: z
        .string()