perf: quote response

2023-07-17 16:12:51 +08:00
parent 60a9dfb55f
commit 53a4d9db05
20 changed files with 215 additions and 173 deletions
--- a/client/src/pages/api/openapi/modules/chat/gpt.ts
+++ b/client/src/pages/api/openapi/modules/chat/gpt.ts
@@ -128,7 +128,6 @@ export async function chatCompletion({

  const adaptMessages = adaptChatItem_openAI({ messages: filterMessages, reserveId: false });
  const chatAPI = getOpenAIApi();
-  console.log(adaptMessages);

  /* count response max token */
  const promptsToken = modelToolMap.countTokens({
--- a/client/src/pages/api/openapi/modules/kb/search.ts
+++ b/client/src/pages/api/openapi/modules/kb/search.ts
@@ -3,13 +3,14 @@ import { jsonRes } from '@/service/response';
 import { PgClient } from '@/service/pg';
 import { withNextCors } from '@/service/utils/tools';
 import type { ChatItemType } from '@/types/chat';
-import { ChatRoleEnum } from '@/constants/chat';
+import { ChatRoleEnum, rawSearchKey } from '@/constants/chat';
 import { modelToolMap } from '@/utils/plugin';
 import { getVector } from '../../plugin/vector';
 import { countModelPrice, pushTaskBillListItem } from '@/service/events/pushBill';
 import { getModel } from '@/service/utils/data';

 export type QuoteItemType = {
+  kb_id: string;
  id: string;
  q: string;
  a: string;
@@ -26,7 +27,7 @@ type Props = {
  billId?: string;
 };
 type Response = {
-  rawSearch: QuoteItemType[];
+  [rawSearchKey]: QuoteItemType[];
  isEmpty?: boolean;
  quotePrompt?: string;
 };
@@ -85,7 +86,7 @@ export async function kbSearch({
    PgClient.query(
      `BEGIN;
    SET LOCAL ivfflat.probes = ${global.systemEnv.pgIvfflatProbe || 10};
-    select id,q,a,source from modelData where kb_id IN (${kb_ids
+    select kb_id,id,q,a,source from modelData where kb_id IN (${kb_ids
      .map((item) => `'${item}'`)
      .join(',')}) AND vector <#> '[${vectors[0]}]' < -${similarity} order by vector <#> '[${
        vectors[0]
--- a/client/src/pages/api/openapi/text/gptMessagesSlice.ts
+++ b/client/src/pages/api/openapi/text/gptMessagesSlice.ts
@@ -42,11 +42,11 @@ export default async function handler(req: NextApiRequest, res: NextApiResponse)

 export function gpt_chatItemTokenSlice({
  messages,
-  model,
+  model = 'gpt-3.5-turbo',
  maxToken
 }: {
  messages: ChatItemType[];
-  model: ModelType;
+  model?: ModelType;
  maxToken: number;
 }) {
  let result: ChatItemType[] = [];
--- a/client/src/pages/api/openapi/v1/chat/completions.ts
+++ b/client/src/pages/api/openapi/v1/chat/completions.ts
@@ -94,6 +94,8 @@ export default withNextCors(async function handler(req: NextApiRequest, res: Nex
      getChatHistory({ historyId, userId })
    ]);

+    const isOwner = !shareId && userId === String(app.userId);
+
    const prompts = history.concat(gptMessage2ChatType(messages));
    if (prompts[prompts.length - 1].obj === 'AI') {
      prompts.pop();
@@ -143,24 +145,30 @@ export default withNextCors(async function handler(req: NextApiRequest, res: Nex
            _id: messages[messages.length - 1]._id,
            obj: ChatRoleEnum.AI,
            value: answerText,
-            responseData
+            ...responseData
          }
        ],
        userId
      });
    }

+    console.log(`finish time: ${(Date.now() - startTime) / 100}s`);
+
    if (stream) {
      sseResponse({
        res,
        event: sseResponseEventEnum.answer,
        data: '[DONE]'
      });
-      sseResponse({
-        res,
-        event: sseResponseEventEnum.appStreamResponse,
-        data: JSON.stringify(responseData)
-      });
+
+      if (isOwner) {
+        sseResponse({
+          res,
+          event: sseResponseEventEnum.appStreamResponse,
+          data: JSON.stringify(responseData)
+        });
+      }
+
      res.end();
    } else {
      res.json({
@@ -189,7 +197,6 @@ export default withNextCors(async function handler(req: NextApiRequest, res: Nex
    delTaskBill(billId);

    if (stream) {
-      res.status(500);
      sseErrRes(res, err);
      res.end();
    } else {