Split PDF export into per-stage wrapper scripts (print, plan, merge) and use them in the example workflow

RainPPR · RainPPR · commit 30e9d89121a6 · 2026-03-04T20:31:13.000+08:00
diff --git a/images/example_workflow.yml b/images/example_workflow.yml
@@ -69,23 +69,20 @@ jobs:
           path: site/
       
       - name: Puppeteer - Print Web to PDF
-        run: |
-          node /app/src/index.js "${{ matrix.book }}"
+        run: export-pdf-1-print "${{ matrix.book }}"
         env:
           CONCURRENCY: 4
       
       - name: Python - Prepare TeX & Planning
-        run: |
-          uv run /app/scripts/processor.py "${{ matrix.book }}.json" --plan-only
+        run: export-pdf-2-plan "${{ matrix.book }}"
           
       - name: LaTeX - Compile Decorations
         uses: docker://ghcr.io/rainppr/texlive-full:latest
         with:
           args: latexmk -xelatex build/*.tex
           
       - name: Python - Final Synthesis & Bookmarks
-        run: |
-          uv run /app/scripts/processor.py "${{ matrix.book }}.json" --merge
+        run: export-pdf-3-merge "${{ matrix.book }}"
           
       - name: Upload Book Product
         uses: actions/upload-artifact@v4
@@ -96,7 +93,7 @@ jobs:
 
   export_publish:
     name: "Publish: Collect and Release"
-    needs: export_compile
+    needs: export_process
     runs-on: ubuntu-latest
     steps:
       - name: Download all compiled PDFs
diff --git a/images/exporter-build/Dockerfile b/images/exporter-build/Dockerfile
@@ -95,4 +95,4 @@ COPY templates/ /app/templates/
 COPY --chmod=755 bin/ /usr/local/bin/
 
 ENTRYPOINT ["/usr/bin/tini", "--"]
-CMD ["export-pdf"]
+CMD ["export-pdf-1-print"]
diff --git a/images/exporter-build/bin/export-pdf b/images/exporter-build/bin/export-pdf
diff --git a/images/exporter-build/bin/export-pdf-1-print b/images/exporter-build/bin/export-pdf-1-print
@@ -0,0 +1,13 @@
+#!/bin/bash
+# First export stage wrapper: runs the Node entry point for a single book.
+#
+# Usage: export-pdf-1-print <book_name>
+#   book_name is forwarded unchanged as the only argument to /app/src/index.js.
+# Exits 1 with a usage message on stderr when book_name is missing or empty.
+set -e
+if [ -z "$1" ]; then
+    echo "Usage: export-pdf-1-print <book_name>" >&2
+    exit 1
+fi
+# exec replaces this shell, so node receives signals directly and its exit status becomes ours.
+exec node /app/src/index.js "$1"
diff --git a/images/exporter-build/bin/export-pdf-2-plan b/images/exporter-build/bin/export-pdf-2-plan
@@ -0,0 +1,14 @@
+#!/bin/bash
+# Second export stage wrapper: runs processor.py with --plan-only for a single book.
+#
+# Usage: export-pdf-2-plan <book_name>
+#   The book description is read from site/build/<book_name>.json, resolved
+#   relative to the current working directory.
+# Exits 1 with a usage message on stderr when book_name is missing or empty.
+set -e
+if [ -z "$1" ]; then
+    echo "Usage: export-pdf-2-plan <book_name>" >&2
+    exit 1
+fi
+# exec replaces this shell, so uv receives signals directly and its exit status becomes ours.
+exec uv run /app/scripts/processor.py "site/build/$1.json" --plan-only
diff --git a/images/exporter-build/bin/export-pdf-3-merge b/images/exporter-build/bin/export-pdf-3-merge
@@ -0,0 +1,14 @@
+#!/bin/bash
+# Third export stage wrapper: runs processor.py with --merge for a single book.
+#
+# Usage: export-pdf-3-merge <book_name>
+#   The book description is read from site/build/<book_name>.json, resolved
+#   relative to the current working directory.
+# Exits 1 with a usage message on stderr when book_name is missing or empty.
+set -e
+if [ -z "$1" ]; then
+    echo "Usage: export-pdf-3-merge <book_name>" >&2
+    exit 1
+fi
+# exec replaces this shell, so uv receives signals directly and its exit status becomes ours.
+exec uv run /app/scripts/processor.py "site/build/$1.json" --merge
diff --git a/images/exporter-build/scripts/processor.py b/images/exporter-build/scripts/processor.py
@@ -37,15 +37,17 @@ def extract_precise_toc(self, doc, offset):
                             # 粗放式匹配：字体大且粗的可能是标题
                             if s["size"] > 12:
                                 text = s["text"].strip()
+                                # Store in the map under a normalized key: the text was stripped above and is lowercased here
                                 if text:
-                                    headings_map[text] = (page_num, s["bbox"][1])
+                                    headings_map[text.lower()] = (page_num, s["bbox"][1])
 
         refined_toc = []
         for entry in raw_toc:
             lvl, title, page, dest = entry
-            # 尝试匹配文本高度
-            if title in headings_map:
-                p_idx, y_coord = headings_map[title]
+            # 尝试匹配文本高度，使用小写标准化匹配
+            match_title = title.strip().lower()
+            if match_title in headings_map:
+                p_idx, y_coord = headings_map[match_title]
                 dest = {"kind": fitz.LINK_GOTO, "to": fitz.Point(0, y_coord)}
                 
             refined_toc.append([lvl, title, page + offset, dest])
@@ -81,7 +83,11 @@ def process(self):
 
             # 插入内容页
             for sub in section["sections"]:
-                content_path = Path("site/build") / sub["path"]
+                # Look next to the book JSON first; otherwise fall back to site/build relative to the working directory
+                content_path = self.book_json_path.parent / sub["path"]
+                if not content_path.exists():
+                     content_path = Path("site/build") / sub["path"]
+                     
                 if content_path.exists():
                     doc = fitz.open(content_path)
                     # 提取并偏移章节内的书签