mirror of
https://github.com/langgenius/dify.git
synced 2024-11-16 19:59:50 +08:00
fix: code block segmentation problem of markdown document (#6465)
This commit is contained in:
parent
16b4f560cd
commit
5e4ac11df3
|
@@ -54,8 +54,16 @@ class MarkdownExtractor(BaseExtractor):
|
||||||
|
|
||||||
current_header = None
|
current_header = None
|
||||||
current_text = ""
|
current_text = ""
|
||||||
|
code_block_flag = False
|
||||||
|
|
||||||
for line in lines:
|
for line in lines:
|
||||||
|
if line.startswith("```"):
|
||||||
|
code_block_flag = not code_block_flag
|
||||||
|
current_text += line + "\n"
|
||||||
|
continue
|
||||||
|
if code_block_flag:
|
||||||
|
current_text += line + "\n"
|
||||||
|
continue
|
||||||
header_match = re.match(r"^#+\s", line)
|
header_match = re.match(r"^#+\s", line)
|
||||||
if header_match:
|
if header_match:
|
||||||
if current_header is not None:
|
if current_header is not None:
|
||||||
|
|
Loading…
Reference in New Issue
Block a user