import { batchRun } from '../system/utils'; import { getNanoid, simpleText } from './tools'; import type { ImageType } from '../../../service/worker/readFile/type'; /* Delete redundant text in markdown */ export const simpleMarkdownText = (rawText: string) => { rawText = simpleText(rawText); // Remove a line feed from a hyperlink or picture rawText = rawText.replace(/\[([^\]]+)\]\((.+?)\)/g, (match, linkText, url) => { const cleanedLinkText = linkText.replace(/\n/g, ' ').trim(); if (!url) { return ''; } return `[${cleanedLinkText}](${url})`; }); // replace special #\.* …… const reg1 = /\\([#`!*()+-_\[\]{}\\.])/g; if (reg1.test(rawText)) { rawText = rawText.replace(reg1, '$1'); } // replace \\n rawText = rawText.replace(/\\\\n/g, '\\n'); // Remove headings and code blocks front spaces ['####', '###', '##', '#', '```', '~~~'].forEach((item, i) => { const reg = new RegExp(`\\n\\s*${item}`, 'g'); if (reg.test(rawText)) { rawText = rawText.replace(new RegExp(`(\\n)( *)(${item})`, 'g'), '$1$3'); } }); return rawText.trim(); }; export const htmlTable2Md = (content: string): string => { return content.replace(/
]*\/>| | ]*>.*?<\/td>/g) || []; cells.forEach((cell) => { while (tableData[rowIndex][colIndex]) { colIndex++; } const colspan = parseInt(cell.match(/colspan="(\d+)"/)?.[1] || '1'); const rowspan = parseInt(cell.match(/rowspan="(\d+)"/)?.[1] || '1'); let content = ''; if (cell.endsWith('/>')) { content = ''; } else { content = cell.replace(/ | ]*>|<\/td>/g, '').trim();
}
for (let i = 0; i < rowspan; i++) {
for (let j = 0; j < colspan; j++) {
if (!tableData[rowIndex + i]) {
tableData[rowIndex + i] = [];
}
tableData[rowIndex + i][colIndex + j] = i === 0 && j === 0 ? content : '^^';
}
}
colIndex += colspan;
maxColumns = Math.max(maxColumns, colIndex);
});
for (let i = 0; i < maxColumns; i++) {
if (!tableData[rowIndex][i]) {
tableData[rowIndex][i] = ' ';
}
}
});
const chunks: string[] = [];
const headerCells = tableData[0]
.slice(0, maxColumns)
.map((cell) => (cell === '^^' ? ' ' : cell || ' '));
const headerRow = '| ' + headerCells.join(' | ') + ' |';
chunks.push(headerRow);
const separator = '| ' + Array(headerCells.length).fill('---').join(' | ') + ' |';
chunks.push(separator);
tableData.slice(1).forEach((row) => {
const paddedRow = row
.slice(0, maxColumns)
.map((cell) => (cell === '^^' ? ' ' : cell || ' '));
while (paddedRow.length < maxColumns) {
paddedRow.push(' ');
}
chunks.push('| ' + paddedRow.join(' | ') + ' |');
});
return chunks.join('\n');
} catch (error) {
return htmlTable;
}
});
};
/**
* format markdown
* 1. upload base64
* 2. replace \
*/
export const uploadMarkdownBase64 = async ({
rawText,
uploadImgController
}: {
rawText: string;
uploadImgController?: (base64: string) => Promise |