Signed-off-by: kenwoodjw <blackxin55+@gmail.com>
@@ -720,7 +720,17 @@ STOPWORDS = {
"〉",
"〈",
"…",
" ",
"0",
"1",
"2",
"3",
"4",
"5",
"6",
"7",
"8",
"9",
@@ -731,16 +741,6 @@ STOPWORDS = {
"0",
"1",
"2",
"3",
"4",
"5",
"6",
"7",
"8",
"9",
"二",
"三",
"四",
@@ -261,7 +261,7 @@ class OracleVector(BaseVector):
words = pseg.cut(query)
current_entity = ""
for word, pos in words:
if pos in {"nr", "Ng", "eng", "nz", "n", "ORG", "v"}: # nr: 人名, ns: 地名, nt: 机构名
if pos in {"nr", "Ng", "eng", "nz", "n", "ORG", "v"}: # nr: 人名,ns: 地名,nt: 机构名
current_entity += word
else:
if current_entity: