🎨 PDF files longer than 1024 pages are not included in asset file content searching https://github.com/siyuan-note/siyuan/issues/9053

2026-03-07 05:10:16 +01:00 · 2023-08-27 11:09:19 +08:00 · 2023-08-27 11:09:19 +08:00 · b578506ea5
commit b578506ea5
parent fd32668abc
1 changed files with 5 additions and 2 deletions
--- a/kernel/model/asset_content.go
+++ b/kernel/model/asset_content.go
@@ -748,7 +748,7 @@ func (parser *PdfAssetParser) getTextPageWorker(id int, instance pdfium.Pdfium,

 // Parse will parse a PDF document using PDFium webassembly module using a worker pool
 func (parser *PdfAssetParser) Parse(absPath string) (ret *AssetParseResult) {
-	st := time.Now()
+	now := time.Now()
 	if !strings.HasSuffix(strings.ToLower(absPath), ".pdf") {
 		return
 	}
@@ -850,7 +850,10 @@ func (parser *PdfAssetParser) Parse(absPath string) (ret *AssetParseResult) {
 		}
 	}
 	close(results)
-	logging.LogInfof("convert [%s] PDF with %d pages using %d workers took %s.\n", tmp, pc.PageCount, cores, time.Since(st))
+
+	if 256 < pc.PageCount {
+		logging.LogInfof("convert [%s] PDF with [%d] pages using [%d] workers took [%s]", absPath, pc.PageCount, cores, time.Since(now))
+	}

 	// loop through ordered PDF text pages and join content for asset parse DB result
 	content := ""