External dataset (#1497)

* perf: read rawText and chunk code

* perf: read raw text

* perf: read rawtext

* perf: token count

* log
This commit is contained in:
Archer
2024-05-16 11:47:53 +08:00
committed by GitHub
parent d5073f98ab
commit c6d9b15897
36 changed files with 531 additions and 267 deletions

View File

@@ -123,7 +123,9 @@ export async function checkInvalidDatasetData(start: Date, end: Date) {
continue;
}
} catch (error) {}
- console.log(++index);
+ if (++index % 100 === 0) {
+ console.log(index);
+ }
}
}