refactor(deps): 将jieba分词库替换为rjieba

This commit is contained in:
雅诺狐
2025-10-05 12:08:18 +08:00
parent 1a68365752
commit 413973979c
13 changed files with 85 additions and 29 deletions

View File

@@ -4,7 +4,7 @@ from datetime import datetime
from difflib import SequenceMatcher
from typing import Any
import jieba
import rjieba
import orjson
from json_repair import repair_json
from sklearn.feature_extraction.text import TfidfVectorizer
@@ -535,9 +535,9 @@ class RelationshipManager:
s1 = str(s1)
s2 = str(s2)
# 1. 使用 jieba 进行分词
s1_words = " ".join(jieba.cut(s1))
s2_words = " ".join(jieba.cut(s2))
# 1. 使用 rjieba 进行分词
s1_words = " ".join(rjieba.cut(s1))
s2_words = " ".join(rjieba.cut(s2))
# 2. 将两句话放入一个列表中
corpus = [s1_words, s2_words]