diff --git a/deepdoc/vision/table_structure_recognizer.py b/deepdoc/vision/table_structure_recognizer.py index 64ad8b92..470abc3b 100644 --- a/deepdoc/vision/table_structure_recognizer.py +++ b/deepdoc/vision/table_structure_recognizer.py @@ -133,7 +133,7 @@ class TableStructureRecognizer(Recognizer): return "Ot" @staticmethod - def construct_table(boxes, is_english=False, html=False, **kwargs): + def construct_table(boxes, is_english=False, html=True, **kwargs): cap = "" i = 0 while i < len(boxes): diff --git a/rag/app/manual.py b/rag/app/manual.py index 5de782d6..a05670a0 100644 --- a/rag/app/manual.py +++ b/rag/app/manual.py @@ -162,6 +162,8 @@ class Docx(DocxParser): if c.text == r.cells[j].text: span += 1 i = j + else: + break i += 1 html += f"{c.text}" if span == 1 else f"{c.text}" html += ""