Kevin Hu committed on
Commit
fe5404c
·
1 Parent(s): d8f8ecb

Fix bug in RAGFlowDocxParser (#1642)

Browse files

### What problem does this PR solve?

#1627

### Type of change

- [x] Bug Fix (non-breaking change which fixes an issue)

Files changed (1) hide show
  1. deepdoc/parser/docx_parser.py +1 -1
deepdoc/parser/docx_parser.py CHANGED
@@ -127,7 +127,7 @@ class RAGFlowDocxParser:
127
  runs_within_single_paragraph.append(run.text) # append run.text first
128
 
129
  # wrap page break checker into a static method
130
- if RAGFlowDocxParser.has_page_break(run._element.xml):
131
  pn += 1
132
 
133
  secs.append(("".join(runs_within_single_paragraph), p.style.name)) # then concat run.text as part of the paragraph
 
127
  runs_within_single_paragraph.append(run.text) # append run.text first
128
 
129
  # wrap page break checker into a static method
130
+ if 'lastRenderedPageBreak' in run._element.xml:
131
  pn += 1
132
 
133
  secs.append(("".join(runs_within_single_paragraph), p.style.name)) # then concat run.text as part of the paragraph