From 54eae5f9e932d16aa8139a61675056191a28e18c Mon Sep 17 00:00:00 2001 From: qiancai Date: Fri, 29 May 2026 17:41:16 +0800 Subject: [PATCH 1/2] Update merge_by_toc.py --- scripts/merge_by_toc.py | 21 +++++++++++++++++++++ 1 file changed, 21 insertions(+) diff --git a/scripts/merge_by_toc.py b/scripts/merge_by_toc.py index fd05d144fcb2..3a94551dcdaa 100755 --- a/scripts/merge_by_toc.py +++ b/scripts/merge_by_toc.py @@ -192,6 +192,26 @@ def replace_heading(match): return replace_heading +# remove / tags for PDF output +sticky_header_table_pattern = re.compile(r'^\s*\s*$') + +def remove_sticky_header_table(text): + lines = text.split('\n') + result = [] + i = 0 + while i < len(lines): + if sticky_header_table_pattern.match(lines[i]): + prev_blank = len(result) > 0 and result[-1].strip() == '' + next_blank = i + 1 < len(lines) and lines[i + 1].strip() == '' + if prev_blank and next_blank: + i += 2 + else: + i += 1 + else: + result.append(lines[i]) + i += 1 + return '\n'.join(result) + # remove copyable snippet code def remove_copyable(match): return '' @@ -213,6 +233,7 @@ def remove_copyable(match): chapter = replace_variables(chapter, variables) chapter = replace_link_wrap(chapter, name) chapter = copyable_snippet_pattern.sub(remove_copyable, chapter) + chapter = remove_sticky_header_table(chapter) chapter = extract_custom_ids_and_clean(chapter) chapter = replace_custom_id_links(chapter) From ade5a977b75f7b150840f83509cfbd34eed5e387 Mon Sep 17 00:00:00 2001 From: qiancai Date: Fri, 29 May 2026 17:51:37 +0800 Subject: [PATCH 2/2] resolve comments --- scripts/merge_by_toc.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/scripts/merge_by_toc.py b/scripts/merge_by_toc.py index 3a94551dcdaa..ff4941445cdd 100755 --- a/scripts/merge_by_toc.py +++ b/scripts/merge_by_toc.py @@ -193,7 +193,7 @@ def replace_heading(match): return replace_heading # remove / tags for PDF output -sticky_header_table_pattern = re.compile(r'^\s*\s*$') +sticky_header_table_pattern = re.compile(r'^\s*\s*$') def remove_sticky_header_table(text): lines = text.split('\n') @@ -212,6 +212,7 @@ def remove_sticky_header_table(text): i += 1 return '\n'.join(result) + # remove copyable snippet code def remove_copyable(match): return ''