mirror of
https://git.mirrors.martin98.com/https://github.com/infiniflow/ragflow.git
synced 2025-08-12 09:09:00 +08:00
Enable fine-grained tokenization for 3-character words (#2210)
### What problem does this PR solve? ### Type of change - [x] Performance Improvement
This commit is contained in:
parent
21179a9be9
commit
6d232f1bdb
@ -83,7 +83,7 @@ class EsQueryer:
|
||||
), tks
|
||||
|
||||
def need_fine_grained_tokenize(tk):
|
||||
if len(tk) < 4:
|
||||
if len(tk) < 3:
|
||||
return False
|
||||
if re.match(r"[0-9a-z\.\+#_\*-]+$", tk):
|
||||
return False
|
||||
|
Loading…
x
Reference in New Issue
Block a user