V4.6.6-2 (#673)
This commit is contained in:
13
projects/app/src/service/common/string/jieba.ts
Normal file
13
projects/app/src/service/common/string/jieba.ts
Normal file
@@ -0,0 +1,13 @@
|
||||
import { cut } from '@node-rs/jieba';
|
||||
import { stopWords } from '@fastgpt/global/common/string/jieba';
|
||||
|
||||
/**
 * Segments `text` with jieba's `cut` and returns the cleaned tokens as a
 * single space-separated string.
 *
 * Every token is stripped of characters other than CJK ideographs in the
 * range U+4E00–U+9FA5, ASCII letters, ASCII digits and whitespace, and is
 * then trimmed. Tokens that end up empty, or that `stopWords` reports via
 * `.has`, are discarded.
 *
 * @param text - The raw string to segment.
 * @returns The surviving tokens joined by one space, or an empty string when
 *   no token survives.
 */
export function jiebaSplit({ text }: { text: string }) {
  const keptWords: string[] = [];

  // NOTE(review): the second argument is presumably jieba's HMM switch —
  // confirm against the @node-rs/jieba `cut` signature.
  for (const rawToken of cut(text, true)) {
    const cleaned = rawToken.replace(/[^\u4e00-\u9fa5a-zA-Z0-9\s]/g, '').trim();

    // Skip tokens that were pure punctuation/whitespace or are stop words.
    if (cleaned === '' || stopWords.has(cleaned)) {
      continue;
    }

    keptWords.push(cleaned);
  }

  // `join` on an empty array already yields '', so no extra fallback is needed.
  return keptWords.join(' ');
}
|
||||
Reference in New Issue
Block a user