perf: 知识库范围

This commit is contained in:
archer
2023-04-06 23:43:34 +08:00
parent fc7edcb54f
commit 1409916bd0
2 changed files with 16 additions and 34 deletions

View File

@@ -1,7 +1,6 @@
import type { NextApiRequest, NextApiResponse } from 'next'; import type { NextApiRequest, NextApiResponse } from 'next';
import { createParser, ParsedEvent, ReconnectInterval } from 'eventsource-parser';
import { connectToDatabase } from '@/service/mongo'; import { connectToDatabase } from '@/service/mongo';
import { getOpenAIApi, authChat } from '@/service/utils/chat'; import { authChat } from '@/service/utils/chat';
import { httpsAgent, openaiChatFilter, systemPromptFilter } from '@/service/utils/tools'; import { httpsAgent, openaiChatFilter, systemPromptFilter } from '@/service/utils/tools';
import { ChatCompletionRequestMessage, ChatCompletionRequestMessageRoleEnum } from 'openai'; import { ChatCompletionRequestMessage, ChatCompletionRequestMessageRoleEnum } from 'openai';
import { ChatItemType } from '@/types/chat'; import { ChatItemType } from '@/types/chat';
@@ -13,8 +12,7 @@ import { pushChatBill } from '@/service/events/pushBill';
import { connectRedis } from '@/service/redis'; import { connectRedis } from '@/service/redis';
import { VecModelDataPrefix } from '@/constants/redis'; import { VecModelDataPrefix } from '@/constants/redis';
import { vectorToBuffer } from '@/utils/tools'; import { vectorToBuffer } from '@/utils/tools';
import { openaiCreateEmbedding } from '@/service/utils/openai'; import { openaiCreateEmbedding, gpt35StreamResponse } from '@/service/utils/openai';
import { gpt35StreamResponse } from '@/service/utils/openai';
/* 发送提示词 */ /* 发送提示词 */
export default async function handler(req: NextApiRequest, res: NextApiResponse) { export default async function handler(req: NextApiRequest, res: NextApiResponse) {
@@ -73,7 +71,6 @@ export default async function handler(req: NextApiRequest, res: NextApiResponse)
`@modelId:{${String( `@modelId:{${String(
chat.modelId._id chat.modelId._id
)}} @vector:[VECTOR_RANGE 0.24 $blob]=>{$YIELD_DISTANCE_AS: score}`, )}} @vector:[VECTOR_RANGE 0.24 $blob]=>{$YIELD_DISTANCE_AS: score}`,
// `@modelId:{${String(chat.modelId._id)}}=>[KNN 10 @vector $blob AS score]`,
'RETURN', 'RETURN',
'1', '1',
'text', 'text',
@@ -90,17 +87,14 @@ export default async function handler(req: NextApiRequest, res: NextApiResponse)
'2' '2'
]); ]);
const formatRedisPrompt: string[] = [];
// 格式化响应值,获取 qa // 格式化响应值,获取 qa
const formatRedisPrompt = [2, 4, 6, 8, 10, 12, 14, 16, 18, 20] for (let i = 2; i < 42; i += 2) {
.map((i) => { const text = redisData[i]?.[1];
if (!redisData[i]) return ''; if (text) {
const text = (redisData[i][1] as string) || ''; formatRedisPrompt.push(text);
}
if (!text) return ''; }
return text;
})
.filter((item) => item);
if (formatRedisPrompt.length === 0) { if (formatRedisPrompt.length === 0) {
throw new Error('对不起,我没有找到你的问题'); throw new Error('对不起,我没有找到你的问题');

View File

@@ -132,9 +132,7 @@ export default async function handler(req: NextApiRequest, res: NextApiResponse)
const redisData: any[] = await redis.sendCommand([ const redisData: any[] = await redis.sendCommand([
'FT.SEARCH', 'FT.SEARCH',
`idx:${VecModelDataPrefix}:hash`, `idx:${VecModelDataPrefix}:hash`,
`@modelId:{${String( `@modelId:{${String(model._id)}}=>[KNN 20 @vector $blob AS score]`,
model._id
)}} @vector:[VECTOR_RANGE 0.25 $blob]=>{$YIELD_DISTANCE_AS: score}`,
'RETURN', 'RETURN',
'1', '1',
'text', 'text',
@@ -144,27 +142,17 @@ export default async function handler(req: NextApiRequest, res: NextApiResponse)
'2', '2',
'blob', 'blob',
vectorToBuffer(promptVector), vectorToBuffer(promptVector),
'LIMIT',
'0',
'20',
'DIALECT', 'DIALECT',
'2' '2'
]); ]);
// 格式化响应值,获取 qa // 格式化响应值,获取 qa
const formatRedisPrompt = [2, 4, 6, 8, 10, 12, 14, 16, 18, 20] const formatRedisPrompt: string[] = [];
.map((i) => { for (let i = 2; i < 42; i += 2) {
if (!redisData[i]) return ''; const text = redisData[i]?.[1];
const text = (redisData[i][1] as string) || ''; if (text) {
formatRedisPrompt.push(text);
if (!text) return ''; }
return text;
})
.filter((item) => item);
if (formatRedisPrompt.length === 0) {
throw new Error('对不起,我没有找到你的问题');
} }
// textArr 筛选,最多 3200 tokens // textArr 筛选,最多 3200 tokens