Kevin Hu
committed on
Commit
·
fe5404c
1
Parent(s):
d8f8ecb
Fix bug in RAGFlowDocxParser (#1642)
Browse files
### What problem does this PR solve?
#1627
### Type of change
- [x] Bug Fix (non-breaking change which fixes an issue)
deepdoc/parser/docx_parser.py
CHANGED
@@ -127,7 +127,7 @@ class RAGFlowDocxParser:
|
|
127 |
runs_within_single_paragraph.append(run.text) # append run.text first
|
128 |
|
129 |
# wrap page break checker into a static method
|
130 |
-
if
|
131 |
pn += 1
|
132 |
|
133 |
secs.append(("".join(runs_within_single_paragraph), p.style.name)) # then concat run.text as part of the paragraph
|
|
|
127 |
runs_within_single_paragraph.append(run.text) # append run.text first
|
128 |
|
129 |
# wrap page break checker into a static method
|
130 |
+
if 'lastRenderedPageBreak' in run._element.xml:
|
131 |
pn += 1
|
132 |
|
133 |
secs.append(("".join(runs_within_single_paragraph), p.style.name)) # then concat run.text as part of the paragraph
|