From 0fcea1d021748a8fd8d4168f112f9b873b28f071 Mon Sep 17 00:00:00 2001 From: qiancai Date: Fri, 29 May 2026 17:41:48 +0800 Subject: [PATCH 1/2] Update merge_by_toc.py --- scripts/merge_by_toc.py | 21 +++++++++++++++++++++ 1 file changed, 21 insertions(+) diff --git a/scripts/merge_by_toc.py b/scripts/merge_by_toc.py index 14137f5ca801b..4d01d8ba9a9e1 100755 --- a/scripts/merge_by_toc.py +++ b/scripts/merge_by_toc.py @@ -214,6 +214,26 @@ def replace_heading(match): return replace_heading +# remove / tags for PDF output +sticky_header_table_pattern = re.compile(r'^\s*\s*$') + +def remove_sticky_header_table(text): + lines = text.split('\n') + result = [] + i = 0 + while i < len(lines): + if sticky_header_table_pattern.match(lines[i]): + prev_blank = len(result) > 0 and result[-1].strip() == '' + next_blank = i + 1 < len(lines) and lines[i + 1].strip() == '' + if prev_blank and next_blank: + i += 2 + else: + i += 1 + else: + result.append(lines[i]) + i += 1 + return '\n'.join(result) + # remove copyable snippet code def remove_copyable(match): return "" @@ -233,6 +253,7 @@ def remove_copyable(match): chapter = replace_variables(chapter, variables) chapter = replace_link_wrap(chapter, name) chapter = copyable_snippet_pattern.sub(remove_copyable, chapter) + chapter = remove_sticky_header_table(chapter) chapter = extract_custom_ids_and_clean(chapter) chapter = replace_custom_id_links(chapter) # This block is to filter xxx From 713c130d597b6bcb11214263e35c47609089b002 Mon Sep 17 00:00:00 2001 From: qiancai Date: Fri, 29 May 2026 17:51:48 +0800 Subject: [PATCH 2/2] resolve comments --- scripts/merge_by_toc.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/scripts/merge_by_toc.py b/scripts/merge_by_toc.py index 4d01d8ba9a9e1..adcdbc384af73 100755 --- a/scripts/merge_by_toc.py +++ b/scripts/merge_by_toc.py @@ -215,7 +215,7 @@ def replace_heading(match): # remove / tags for PDF output -sticky_header_table_pattern = re.compile(r'^\s*\s*$') +sticky_header_table_pattern = re.compile(r'^\s*\s*$') def remove_sticky_header_table(text): lines = text.split('\n') @@ -234,6 +234,7 @@ def remove_sticky_header_table(text): i += 1 return '\n'.join(result) + # remove copyable snippet code def remove_copyable(match): return ""