mirror of
https://git.mirrors.martin98.com/https://github.com/infiniflow/ragflow.git
synced 2025-08-13 20:05:57 +08:00
fix bug in pdf parser (#986)
### What problem does this PR solve?

#963

### Type of change

- [x] Bug Fix (non-breaking change which fixes an issue)
This commit is contained in:
parent
f077b57f8b
commit
843720f958
@ -392,7 +392,7 @@ class RAGFlowPdfParser:
|
|||||||
b["text"].strip()[-1] in ",;:'\",、‘“;:-",
|
b["text"].strip()[-1] in ",;:'\",、‘“;:-",
|
||||||
len(b["text"].strip()) > 1 and b["text"].strip(
|
len(b["text"].strip()) > 1 and b["text"].strip(
|
||||||
)[-2] in ",;:'\",‘“、;:",
|
)[-2] in ",;:'\",‘“、;:",
|
||||||
b_["text"].strip()[0] in "。;?!?”)),,、:",
|
b_["text"].strip() and b_["text"].strip()[0] in "。;?!?”)),,、:",
|
||||||
]
|
]
|
||||||
# features for not concating
|
# features for not concating
|
||||||
feats = [
|
feats = [
|
||||||
|
Loading…
x
Reference in New Issue
Block a user