Optimize the structure and naming of projects (#335)

2025-08-02 12:48:30 +00:00 · 2023-09-21 14:49:56 +08:00
parent a3c77480f7
commit 823f4b7ad1
97 changed files with 882 additions and 821 deletions
--- a/client/src/utils/app.ts
+++ b/client/src/utils/app.ts
@@ -7,14 +7,14 @@ import {
  SpecialInputKeyEnum
 } from '@/constants/flow';
 import { SystemInputEnum } from '@/constants/app';
-import type { SelectedKbType } from '@/types/plugin';
+import type { SelectedDatasetType } from '@/types/core/dataset';
 import { FlowInputItemType } from '@/types/flow';
 import type { AIChatProps } from '@/types/core/aiChat';

 export type EditFormType = {
  chatModel: AIChatProps;
  kb: {
-    list: SelectedKbType;
+    list: SelectedDatasetType;
    searchSimilarity: number;
    searchLimit: number;
    searchEmptyText: string;
--- a/client/src/utils/common/file/index.tsx
+++ b/client/src/utils/common/file/index.tsx
@@ -1,7 +0,0 @@
-import { getFileViewUrl } from '@/api/support/file';
-
-export async function getFileAndOpen(fileId: string) {
-  const url = await getFileViewUrl(fileId);
-  const asPath = `${location.origin}${url}`;
-  window.open(asPath, '_blank');
-}
--- a/client/src/utils/file.ts
+++ b/client/src/utils/file.ts
@@ -1,179 +1,6 @@
-import mammoth from 'mammoth';
-import Papa from 'papaparse';
 import { getErrText } from './tools';
-import { uploadImg, postUploadFiles } from '@/api/support/file';
 import { countPromptTokens } from './common/tiktoken';

-/**
- * upload file to mongo gridfs
- */
-export const uploadFiles = (
-  files: File[],
-  metadata: Record<string, any> = {},
-  percentListen?: (percent: number) => void
-) => {
-  const form = new FormData();
-  form.append('metadata', JSON.stringify(metadata));
-  files.forEach((file) => {
-    form.append('file', file, encodeURIComponent(file.name));
-  });
-  return postUploadFiles(form, (e) => {
-    if (!e.total) return;
-
-    const percent = Math.round((e.loaded / e.total) * 100);
-    percentListen && percentListen(percent);
-  });
-};
-
-/**
- * 读取 txt 文件内容
- */
-export const readTxtContent = (file: File) => {
-  return new Promise((resolve: (_: string) => void, reject) => {
-    try {
-      const reader = new FileReader();
-      reader.onload = () => {
-        resolve(reader.result as string);
-      };
-      reader.onerror = (err) => {
-        console.log('error txt read:', err);
-        reject('读取 txt 文件失败');
-      };
-      reader.readAsText(file);
-    } catch (error) {
-      reject('浏览器不支持文件内容读取');
-    }
-  });
-};
-
-/**
- * 读取 pdf 内容
- */
-export const readPdfContent = (file: File) =>
-  new Promise<string>((resolve, reject) => {
-    try {
-      const pdfjsLib = window['pdfjs-dist/build/pdf'];
-      pdfjsLib.workerSrc = '/js/pdf.worker.js';
-
-      const readPDFPage = async (doc: any, pageNo: number) => {
-        const page = await doc.getPage(pageNo);
-        const tokenizedText = await page.getTextContent();
-
-        const pageText = tokenizedText.items
-          .map((token: any) => token.str)
-          .filter((item: string) => item)
-          .join('');
-        return pageText;
-      };
-
-      let reader = new FileReader();
-      reader.readAsArrayBuffer(file);
-      reader.onload = async (event) => {
-        if (!event?.target?.result) return reject('解析 PDF 失败');
-        try {
-          const doc = await pdfjsLib.getDocument(event.target.result).promise;
-          const pageTextPromises = [];
-          for (let pageNo = 1; pageNo <= doc.numPages; pageNo++) {
-            pageTextPromises.push(readPDFPage(doc, pageNo));
-          }
-          const pageTexts = await Promise.all(pageTextPromises);
-          resolve(pageTexts.join('\n'));
-        } catch (err) {
-          console.log(err, 'pdf load error');
-          reject('解析 PDF 失败');
-        }
-      };
-      reader.onerror = (err) => {
-        console.log(err, 'pdf load error');
-        reject('解析 PDF 失败');
-      };
-    } catch (error) {
-      reject('浏览器不支持文件内容读取');
-    }
-  });
-
-/**
- * 读取doc
- */
-export const readDocContent = (file: File) =>
-  new Promise<string>((resolve, reject) => {
-    try {
-      const reader = new FileReader();
-      reader.readAsArrayBuffer(file);
-      reader.onload = async ({ target }) => {
-        if (!target?.result) return reject('读取 doc 文件失败');
-        try {
-          const res = await mammoth.extractRawText({
-            arrayBuffer: target.result as ArrayBuffer
-          });
-          resolve(res?.value);
-        } catch (error) {
-          window.umami?.track('wordReadError', {
-            err: error?.toString()
-          });
-          console.log('error doc read:', error);
-
-          reject('读取 doc 文件失败, 请转换成 PDF');
-        }
-      };
-      reader.onerror = (err) => {
-        window.umami?.track('wordReadError', {
-          err: err?.toString()
-        });
-        console.log('error doc read:', err);
-
-        reject('读取 doc 文件失败');
-      };
-    } catch (error) {
-      reject('浏览器不支持文件内容读取');
-    }
-  });
-
-/**
- * 读取csv
- */
-export const readCsvContent = async (file: File) => {
-  try {
-    const textArr = await readTxtContent(file);
-    const csvArr = Papa.parse(textArr).data as string[][];
-    if (csvArr.length === 0) {
-      throw new Error('csv 解析失败');
-    }
-    return {
-      header: csvArr.shift() as string[],
-      data: csvArr.map((item) => item)
-    };
-  } catch (error) {
-    return Promise.reject('解析 csv 文件失败');
-  }
-};
-
-/**
- * file download
- */
-export const fileDownload = ({
-  text,
-  type,
-  filename
-}: {
-  text: string;
-  type: string;
-  filename: string;
-}) => {
-  // 导出为文件
-  const blob = new Blob([`\uFEFF${text}`], { type: `${type};charset=utf-8;` });
-
-  // 创建下载链接
-  const downloadLink = document.createElement('a');
-  downloadLink.href = window.URL.createObjectURL(blob);
-  downloadLink.download = filename;
-
-  // 添加链接到页面并触发下载
-  document.body.appendChild(downloadLink);
-  downloadLink.click();
-  document.body.removeChild(downloadLink);
-};
-
 /**
 * text split into chunks
 * maxLen - one chunk len. max: 3500
@@ -217,89 +44,6 @@ export const splitText2Chunks = ({ text, maxLen }: { text: string; maxLen: numbe
  }
 };

-export const fileToBase64 = (file: File) => {
-  return new Promise((resolve, reject) => {
-    const reader = new FileReader();
-    reader.readAsDataURL(file);
-    reader.onload = () => resolve(reader.result);
-    reader.onerror = (error) => reject(error);
-  });
-};
-
-/**
- * compress image. response base64
- * @param maxSize The max size of the compressed image
- */
-export const compressImg = ({
-  file,
-  maxW = 200,
-  maxH = 200,
-  maxSize = 1024 * 100
-}: {
-  file: File;
-  maxW?: number;
-  maxH?: number;
-  maxSize?: number;
-}) =>
-  new Promise<string>((resolve, reject) => {
-    const reader = new FileReader();
-    reader.readAsDataURL(file);
-    reader.onload = async () => {
-      const img = new Image();
-      // @ts-ignore
-      img.src = reader.result;
-      img.onload = async () => {
-        let width = img.width;
-        let height = img.height;
-
-        if (width > height) {
-          if (width > maxW) {
-            height *= maxW / width;
-            width = maxW;
-          }
-        } else {
-          if (height > maxH) {
-            width *= maxH / height;
-            height = maxH;
-          }
-        }
-
-        const canvas = document.createElement('canvas');
-        canvas.width = width;
-        canvas.height = height;
-        const ctx = canvas.getContext('2d');
-
-        if (!ctx) {
-          return reject('压缩图片异常');
-        }
-
-        ctx.drawImage(img, 0, 0, width, height);
-        const compressedDataUrl = canvas.toDataURL(file.type, 0.8);
-        // 移除 canvas 元素
-        canvas.remove();
-
-        if (compressedDataUrl.length > maxSize) {
-          return reject('图片太大了');
-        }
-
-        const src = await (async () => {
-          try {
-            const src = await uploadImg(compressedDataUrl);
-            return src;
-          } catch (error) {
-            return compressedDataUrl;
-          }
-        })();
-
-        resolve(src);
-      };
-    };
-    reader.onerror = (err) => {
-      console.log(err);
-      reject('压缩图片异常');
-    };
-  });
-
 /* simple text, remove chinese space and extra \n */
 export const simpleText = (text: string) => {
  text = text.replace(/([\u4e00-\u9fa5])\s+([\u4e00-\u9fa5])/g, '$1$2');
--- a/client/src/utils/tools.ts
+++ b/client/src/utils/tools.ts
@@ -1,44 +1,5 @@
 import crypto from 'crypto';
-import { useToast } from '@/hooks/useToast';
 import dayjs from 'dayjs';
-import { useTranslation } from 'react-i18next';
-
-/**
- * copy text data
- */
-export const useCopyData = () => {
-  const { t } = useTranslation();
-  const { toast } = useToast();
-
-  return {
-    copyData: async (
-      data: string,
-      title: string | null = t('common.Copy Successful'),
-      duration = 1000
-    ) => {
-      try {
-        if (navigator.clipboard) {
-          await navigator.clipboard.writeText(data);
-        } else {
-          throw new Error('');
-        }
-      } catch (error) {
-        const textarea = document.createElement('textarea');
-        textarea.value = data;
-        document.body.appendChild(textarea);
-        textarea.select();
-        document.execCommand('copy');
-        document.body.removeChild(textarea);
-      }
-
-      toast({
-        title,
-        status: 'success',
-        duration
-      });
-    }
-  };
-};

 /**
 * 密码加密
@@ -138,35 +99,6 @@ export const formatFileSize = (bytes: number): string => {
  return parseFloat((bytes / Math.pow(k, i)).toFixed(2)) + ' ' + sizes[i];
 };

-export const hasVoiceApi = typeof window !== 'undefined' && 'speechSynthesis' in window;
-/**
- * voice broadcast
- */
-export const voiceBroadcast = ({ text }: { text: string }) => {
-  window.speechSynthesis?.cancel();
-  const msg = new SpeechSynthesisUtterance(text);
-  const voices = window.speechSynthesis?.getVoices?.(); // 获取语言包
-  const voice = voices.find((item) => {
-    return item.name === 'Microsoft Yaoyao - Chinese (Simplified, PRC)';
-  });
-  if (voice) {
-    msg.voice = voice;
-  }
-
-  window.speechSynthesis?.speak(msg);
-
-  msg.onerror = (e) => {
-    console.log(e);
-  };
-
-  return {
-    cancel: () => window.speechSynthesis?.cancel()
-  };
-};
-export const cancelBroadcast = () => {
-  window.speechSynthesis?.cancel();
-};
-
 export const getErrText = (err: any, def = '') => {
  const msg: string = typeof err === 'string' ? err : err?.message || def || '';
  msg && console.log('error =>', msg);
--- a/client/src/utils/web/core/dataset.ts
+++ b/client/src/utils/web/core/dataset.ts
@@ -0,0 +1,48 @@
+import { postChunks2Dataset } from '@/api/core/dataset/data';
+import { TrainingModeEnum } from '@/constants/plugin';
+import type { DatasetDataItemType } from '@/types/core/dataset/data';
+import { delay } from '@/utils/tools';
+
+export async function chunksUpload({
+  kbId,
+  mode,
+  chunks,
+  prompt,
+  rate = 200,
+  onUploading
+}: {
+  kbId: string;
+  mode: `${TrainingModeEnum}`;
+  chunks: DatasetDataItemType[];
+  prompt?: string;
+  rate?: number;
+  onUploading?: (insertLen: number, total: number) => void;
+}) {
+  async function upload(data: DatasetDataItemType[]) {
+    return postChunks2Dataset({
+      kbId,
+      data,
+      mode,
+      prompt
+    });
+  }
+
+  let successInsert = 0;
+  let retryTimes = 10;
+  for (let i = 0; i < chunks.length; i += rate) {
+    try {
+      const { insertLen } = await upload(chunks.slice(i, i + rate));
+      onUploading && onUploading(i + rate, chunks.length);
+      successInsert += insertLen;
+    } catch (error) {
+      if (retryTimes === 0) {
+        return Promise.reject(error);
+      }
+      await delay(1000);
+      retryTimes--;
+      i -= rate;
+    }
+  }
+
+  return { insertLen: successInsert };
+}
--- a/client/src/utils/web/file.ts
+++ b/client/src/utils/web/file.ts
@@ -0,0 +1,261 @@
+import mammoth from 'mammoth';
+import Papa from 'papaparse';
+import { uploadImg, postUploadFiles, getFileViewUrl } from '@/api/support/file';
+/**
+ * upload file to mongo gridfs
+ */
+export const uploadFiles = (
+  files: File[],
+  metadata: Record<string, any> = {},
+  percentListen?: (percent: number) => void
+) => {
+  const form = new FormData();
+  form.append('metadata', JSON.stringify(metadata));
+  files.forEach((file) => {
+    form.append('file', file, encodeURIComponent(file.name));
+  });
+  return postUploadFiles(form, (e) => {
+    if (!e.total) return;
+
+    const percent = Math.round((e.loaded / e.total) * 100);
+    percentListen && percentListen(percent);
+  });
+};
+
+/**
+ * 读取 txt 文件内容
+ */
+export const readTxtContent = (file: File) => {
+  return new Promise((resolve: (_: string) => void, reject) => {
+    try {
+      const reader = new FileReader();
+      reader.onload = () => {
+        resolve(reader.result as string);
+      };
+      reader.onerror = (err) => {
+        console.log('error txt read:', err);
+        reject('读取 txt 文件失败');
+      };
+      reader.readAsText(file);
+    } catch (error) {
+      reject('浏览器不支持文件内容读取');
+    }
+  });
+};
+
+/**
+ * 读取 pdf 内容
+ */
+export const readPdfContent = (file: File) =>
+  new Promise<string>((resolve, reject) => {
+    try {
+      const pdfjsLib = window['pdfjs-dist/build/pdf'];
+      pdfjsLib.workerSrc = '/js/pdf.worker.js';
+
+      const readPDFPage = async (doc: any, pageNo: number) => {
+        const page = await doc.getPage(pageNo);
+        const tokenizedText = await page.getTextContent();
+
+        const pageText = tokenizedText.items
+          .map((token: any) => token.str)
+          .filter((item: string) => item)
+          .join('');
+        return pageText;
+      };
+
+      let reader = new FileReader();
+      reader.readAsArrayBuffer(file);
+      reader.onload = async (event) => {
+        if (!event?.target?.result) return reject('解析 PDF 失败');
+        try {
+          const doc = await pdfjsLib.getDocument(event.target.result).promise;
+          const pageTextPromises = [];
+          for (let pageNo = 1; pageNo <= doc.numPages; pageNo++) {
+            pageTextPromises.push(readPDFPage(doc, pageNo));
+          }
+          const pageTexts = await Promise.all(pageTextPromises);
+          resolve(pageTexts.join('\n'));
+        } catch (err) {
+          console.log(err, 'pdf load error');
+          reject('解析 PDF 失败');
+        }
+      };
+      reader.onerror = (err) => {
+        console.log(err, 'pdf load error');
+        reject('解析 PDF 失败');
+      };
+    } catch (error) {
+      reject('浏览器不支持文件内容读取');
+    }
+  });
+
+/**
+ * 读取doc
+ */
+export const readDocContent = (file: File) =>
+  new Promise<string>((resolve, reject) => {
+    try {
+      const reader = new FileReader();
+      reader.readAsArrayBuffer(file);
+      reader.onload = async ({ target }) => {
+        if (!target?.result) return reject('读取 doc 文件失败');
+        try {
+          const res = await mammoth.extractRawText({
+            arrayBuffer: target.result as ArrayBuffer
+          });
+          resolve(res?.value);
+        } catch (error) {
+          window.umami?.track('wordReadError', {
+            err: error?.toString()
+          });
+          console.log('error doc read:', error);
+
+          reject('读取 doc 文件失败, 请转换成 PDF');
+        }
+      };
+      reader.onerror = (err) => {
+        window.umami?.track('wordReadError', {
+          err: err?.toString()
+        });
+        console.log('error doc read:', err);
+
+        reject('读取 doc 文件失败');
+      };
+    } catch (error) {
+      reject('浏览器不支持文件内容读取');
+    }
+  });
+
+/**
+ * 读取csv
+ */
+export const readCsvContent = async (file: File) => {
+  try {
+    const textArr = await readTxtContent(file);
+    const csvArr = Papa.parse(textArr).data as string[][];
+    if (csvArr.length === 0) {
+      throw new Error('csv 解析失败');
+    }
+    return {
+      header: csvArr.shift() as string[],
+      data: csvArr.map((item) => item)
+    };
+  } catch (error) {
+    return Promise.reject('解析 csv 文件失败');
+  }
+};
+
+/**
+ * file download
+ */
+export const fileDownload = ({
+  text,
+  type,
+  filename
+}: {
+  text: string;
+  type: string;
+  filename: string;
+}) => {
+  // 导出为文件
+  const blob = new Blob([`\uFEFF${text}`], { type: `${type};charset=utf-8;` });
+
+  // 创建下载链接
+  const downloadLink = document.createElement('a');
+  downloadLink.href = window.URL.createObjectURL(blob);
+  downloadLink.download = filename;
+
+  // 添加链接到页面并触发下载
+  document.body.appendChild(downloadLink);
+  downloadLink.click();
+  document.body.removeChild(downloadLink);
+};
+
+export async function getFileAndOpen(fileId: string) {
+  const url = await getFileViewUrl(fileId);
+  const asPath = `${location.origin}${url}`;
+  window.open(asPath, '_blank');
+}
+
+export const fileToBase64 = (file: File) => {
+  return new Promise((resolve, reject) => {
+    const reader = new FileReader();
+    reader.readAsDataURL(file);
+    reader.onload = () => resolve(reader.result);
+    reader.onerror = (error) => reject(error);
+  });
+};
+
+/**
+ * compress image. response base64
+ * @param maxSize The max size of the compressed image
+ */
+export const compressImg = ({
+  file,
+  maxW = 200,
+  maxH = 200,
+  maxSize = 1024 * 100
+}: {
+  file: File;
+  maxW?: number;
+  maxH?: number;
+  maxSize?: number;
+}) =>
+  new Promise<string>((resolve, reject) => {
+    const reader = new FileReader();
+    reader.readAsDataURL(file);
+    reader.onload = async () => {
+      const img = new Image();
+      // @ts-ignore
+      img.src = reader.result;
+      img.onload = async () => {
+        let width = img.width;
+        let height = img.height;
+
+        if (width > height) {
+          if (width > maxW) {
+            height *= maxW / width;
+            width = maxW;
+          }
+        } else {
+          if (height > maxH) {
+            width *= maxH / height;
+            height = maxH;
+          }
+        }
+
+        const canvas = document.createElement('canvas');
+        canvas.width = width;
+        canvas.height = height;
+        const ctx = canvas.getContext('2d');
+
+        if (!ctx) {
+          return reject('压缩图片异常');
+        }
+
+        ctx.drawImage(img, 0, 0, width, height);
+        const compressedDataUrl = canvas.toDataURL(file.type, 0.8);
+        // 移除 canvas 元素
+        canvas.remove();
+
+        if (compressedDataUrl.length > maxSize) {
+          return reject('图片太大了');
+        }
+
+        const src = await (async () => {
+          try {
+            const src = await uploadImg(compressedDataUrl);
+            return src;
+          } catch (error) {
+            return compressedDataUrl;
+          }
+        })();
+
+        resolve(src);
+      };
+    };
+    reader.onerror = (err) => {
+      console.log(err);
+      reject('压缩图片异常');
+    };
+  });
--- a/client/src/utils/web/i18n.ts
+++ b/client/src/utils/web/i18n.ts
--- a/client/src/utils/web/voice.ts
+++ b/client/src/utils/web/voice.ts
@@ -0,0 +1,28 @@
+export const hasVoiceApi = typeof window !== 'undefined' && 'speechSynthesis' in window;
+/**
+ * voice broadcast
+ */
+export const voiceBroadcast = ({ text }: { text: string }) => {
+  window.speechSynthesis?.cancel();
+  const msg = new SpeechSynthesisUtterance(text);
+  const voices = window.speechSynthesis?.getVoices?.(); // 获取语言包
+  const voice = voices.find((item) => {
+    return item.name === 'Microsoft Yaoyao - Chinese (Simplified, PRC)';
+  });
+  if (voice) {
+    msg.voice = voice;
+  }
+
+  window.speechSynthesis?.speak(msg);
+
+  msg.onerror = (e) => {
+    console.log(e);
+  };
+
+  return {
+    cancel: () => window.speechSynthesis?.cancel()
+  };
+};
+export const cancelBroadcast = () => {
+  window.speechSynthesis?.cancel();
+};