mirror of
https://github.com/labring/FastGPT.git
synced 2025-07-22 12:20:34 +00:00

* Training status (#4424) * dataset data training state (#4311) * dataset data training state * fix * fix ts * fix * fix api format * fix * fix * perf: count training * format * fix: dataset training state (#4417) * fix * add test * fix * fix * fix test * fix test * perf: training count * count * loading status --------- Co-authored-by: heheer <heheer@sealos.io> * doc * website sync feature (#4429) * perf: introduce BullMQ for website sync (#4403) * perf: introduce BullMQ for website sync * feat: new redis module * fix: remove graceful shutdown * perf: improve UI in dataset detail - Updated the "change" icon SVG file. - Modified i18n strings. - Added new i18n string "immediate_sync". - Improved UI in dataset detail page, including button icons and background colors. * refactor: Add chunkSettings to DatasetSchema * perf: website sync ux * env template * fix: clean up website dataset when updating chunk settings (#4420) * perf: check setting updated * perf: worker currency * feat: init script for website sync refactor (#4425) * website feature doc --------- Co-authored-by: a.e. <49438478+I-Info@users.noreply.github.com> * pro migration (#4388) (#4433) * pro migration * reuse customPdfParseType Co-authored-by: gggaaallleee <91131304+gggaaallleee@users.noreply.github.com> * perf: remove loading ui * feat: config chat file expired time * Redis cache (#4436) * perf: add Redis cache for vector counting (#4432) * feat: cache * perf: get cache key --------- Co-authored-by: a.e. 
<49438478+I-Info@users.noreply.github.com> * perf: mobile voice input (#4437) * update:Mobile voice interaction (#4362) * Add files via upload * Add files via upload * Update ollama.md * Update ollama.md * Add files via upload * Update useSpeech.ts * Update ChatInput.tsx * Update useSpeech.ts * Update ChatInput.tsx * Update useSpeech.ts * Update constants.ts * Add files via upload * Update ChatInput.tsx * Update useSpeech.ts * Update useSpeech.ts * Update useSpeech.ts * Update ChatInput.tsx * Add files via upload * Update common.json * Update VoiceInput.tsx * Update ChatInput.tsx * Update VoiceInput.tsx * Update useSpeech.ts * Update useSpeech.ts * Update common.json * Update common.json * Update common.json * Update VoiceInput.tsx * Update VoiceInput.tsx * Update ChatInput.tsx * Update VoiceInput.tsx * Update ChatInput.tsx * Update VoiceInput.tsx * Update ChatInput.tsx * Update useSpeech.ts * Update common.json * Update chat.json * Update common.json * Update chat.json * Update common.json * Update chat.json * Update VoiceInput.tsx * Update ChatInput.tsx * Update useSpeech.ts * Update VoiceInput.tsx * speech ui * 优化语音输入组件,调整输入框显示逻辑,修复语音输入遮罩层样式,更新画布背景透明度,增强用户交互体验。 (#4435) * perf: mobil voice input --------- Co-authored-by: dreamer6680 <1468683855@qq.com> * Test completion v2 (#4438) * add v2 completions (#4364) * add v2 completions * completion config * config version * fix * frontend * doc * fix * fix: completions v2 api --------- Co-authored-by: heheer <heheer@sealos.io> * package * Test mongo log (#4443) * feat: mongodb-log (#4426) * perf: mongo log * feat: completions stop reasoner * mongo db log --------- Co-authored-by: Finley Ge <32237950+FinleyGe@users.noreply.github.com> * update doc * Update doc * fix external var ui (#4444) * action * fix: ts (#4458) * preview doc action add docs preview permission update preview action udpate action * update doc (#4460) * update preview action * update doc * remove * update * schema * update mq export;perf: redis cache 
(#4465) * perf: redis cache * update mq export * perf: website sync error tip * add error worker * website sync ui (#4466) * Updated the dynamic display of the voice input pop-up (#4469) * Update VoiceInput.tsx * Update VoiceInput.tsx * Update VoiceInput.tsx * fix: voice input --------- Co-authored-by: heheer <heheer@sealos.io> Co-authored-by: a.e. <49438478+I-Info@users.noreply.github.com> Co-authored-by: gggaaallleee <91131304+gggaaallleee@users.noreply.github.com> Co-authored-by: dreamer6680 <1468683855@qq.com> Co-authored-by: Finley Ge <32237950+FinleyGe@users.noreply.github.com>
143 lines
3.0 KiB
TypeScript
143 lines
3.0 KiB
TypeScript
import { connectionMongo, getMongoModel } from '../../../common/mongo';
|
|
const { Schema } = connectionMongo;
|
|
import { DatasetCollectionSchemaType } from '@fastgpt/global/core/dataset/type.d';
|
|
import { DatasetCollectionTypeMap } from '@fastgpt/global/core/dataset/constants';
|
|
import { ChunkSettings, DatasetCollectionName } from '../schema';
|
|
import {
|
|
TeamCollectionName,
|
|
TeamMemberCollectionName
|
|
} from '@fastgpt/global/support/user/team/constant';
|
|
|
|
/**
 * Name under which the dataset-collection model is registered.
 * Within this file it is passed to `getMongoModel` and used as the `ref`
 * target of the schema's self-referencing `parentId` field.
 */
export const DatasetColCollectionName = 'dataset_collections';
|
|
|
|
/**
 * Mongoose schema describing one collection inside a dataset.
 *
 * Field groups, in declaration order:
 *  - ownership / hierarchy references (parentId, teamId, tmbId, datasetId)
 *  - basic info (type, name, tags, createTime, updateTime)
 *  - source metadata (file / link / api / external identifiers, raw text info)
 *  - flags and scheduling (forbid, nextSyncTime)
 *  - parse settings (customPdfParse)
 *  - chunk settings, spread in from the shared `ChunkSettings` definition
 */
const DatasetCollectionSchema = new Schema({
  // Self-reference to another document of this same model; defaults to null.
  // NOTE(review): null presumably marks a top-level collection — confirm with callers.
  parentId: {
    type: Schema.Types.ObjectId,
    ref: DatasetColCollectionName,
    default: null
  },
  // Owning team (required).
  teamId: {
    type: Schema.Types.ObjectId,
    ref: TeamCollectionName,
    required: true
  },
  // Team member associated with the collection (required).
  tmbId: {
    type: Schema.Types.ObjectId,
    ref: TeamMemberCollectionName,
    required: true
  },
  // Dataset this collection belongs to (required).
  datasetId: {
    type: Schema.Types.ObjectId,
    ref: DatasetCollectionName,
    required: true
  },

  // Basic info
  // Must be one of the keys of DatasetCollectionTypeMap.
  type: {
    type: String,
    enum: Object.keys(DatasetCollectionTypeMap),
    required: true
  },
  name: {
    type: String,
    required: true
  },
  tags: {
    type: [String],
    default: []
  },

  // Both timestamps default to the moment the document is created.
  // This schema only sets a default for updateTime; nothing here refreshes it on update.
  createTime: {
    type: Date,
    default: () => new Date()
  },
  updateTime: {
    type: Date,
    default: () => new Date()
  },

  // Metadata
  // Local file collection
  fileId: {
    type: Schema.Types.ObjectId,
    ref: 'dataset.files'
  },
  // Web link collection
  rawLink: String,
  // API collection
  apiFileId: String,
  // External collection (abandoned)
  externalFileId: String,
  externalFileUrl: String, // external import url

  rawTextLength: Number,
  hashRawText: String,
  // Free-form metadata object; defaults to an empty object.
  metadata: {
    type: Object,
    default: {}
  },

  forbid: Boolean,
  // Next sync time
  nextSyncTime: Date,

  // Parse settings
  customPdfParse: Boolean,

  // Chunk settings (field definitions shared via ../schema)
  ...ChunkSettings
});
|
|
|
|
/**
 * Virtual populate field `dataset`: matches this document's `datasetId`
 * against `_id` of the model named by `DatasetCollectionName`, yielding a
 * single document (`justOne`) instead of an array when populated.
 */
DatasetCollectionSchema.virtual('dataset', {
  ref: DatasetCollectionName,
  localField: 'datasetId',
  foreignField: '_id',
  justOne: true
});
|
|
|
|
// Index declarations. Any error thrown while declaring them is logged and
// swallowed so that loading this module does not fail.
try {
  // Auth file
  DatasetCollectionSchema.index({ teamId: 1, fileId: 1 });

  // List collection; deep find collections
  DatasetCollectionSchema.index({
    teamId: 1,
    datasetId: 1,
    parentId: 1,
    updateTime: -1
  });

  // Tag filter
  DatasetCollectionSchema.index({ teamId: 1, datasetId: 1, tags: 1 });
  // Create time filter
  DatasetCollectionSchema.index({ teamId: 1, datasetId: 1, createTime: 1 });

  // Next sync time filter.
  // Partial index: only documents that have a nextSyncTime field are indexed.
  DatasetCollectionSchema.index(
    { type: 1, nextSyncTime: -1 },
    {
      partialFilterExpression: {
        nextSyncTime: { $exists: true }
      }
    }
  );

  // Get collection by external file id.
  // Unique per (datasetId, externalFileId), enforced only for documents
  // that actually have an externalFileId.
  DatasetCollectionSchema.index(
    { datasetId: 1, externalFileId: 1 },
    {
      unique: true,
      partialFilterExpression: {
        externalFileId: { $exists: true }
      }
    }
  );
} catch (error) {
  console.log(error);
}
|
|
|
|
/**
 * Model for dataset collections, built by `getMongoModel` from the
 * collection name and schema declared in this file and typed with
 * `DatasetCollectionSchemaType`.
 * NOTE(review): `getMongoModel` is defined in common/mongo; presumably it
 * registers or reuses the Mongoose model — confirm there.
 */
export const MongoDatasetCollection = getMongoModel<DatasetCollectionSchemaType>(
  DatasetColCollectionName,
  DatasetCollectionSchema
);
|