From 36bed84802d2fcb6709f5b29600fc4a030fd891f Mon Sep 17 00:00:00 2001 From: Daniel <845765@qq.com> Date: Sun, 7 Apr 2024 11:32:42 +0800 Subject: [PATCH] :art: Database blocks are included in document word count https://github.com/siyuan-note/siyuan/issues/10918 --- kernel/model/file.go | 96 ++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 96 insertions(+) diff --git a/kernel/model/file.go b/kernel/model/file.go index 71def8279..6f2457da6 100644 --- a/kernel/model/file.go +++ b/kernel/model/file.go @@ -17,6 +17,7 @@ package model import ( + "bytes" "errors" "fmt" "os" @@ -448,6 +449,10 @@ func ListDocTree(boxID, listPath string, sortMode int, flashcard, showHidden boo func ContentStat(content string) (ret *util.BlockStatResult) { luteEngine := util.NewLute() + return contentStat(content, luteEngine) +} + +func contentStat(content string, luteEngine *lute.Lute) (ret *util.BlockStatResult) { tree := luteEngine.BlockDOM2Tree(content) runeCnt, wordCnt, linkCnt, imgCnt, refCnt := tree.Root.Stat() return &util.BlockStatResult{ @@ -479,6 +484,10 @@ func BlocksWordCount(ids []string) (ret *util.BlockStatResult) { } node := treenode.GetNodeInTree(tree, id) + if nil == node { + continue + } + runeCnt, wordCnt, linkCnt, imgCnt, refCnt := node.Stat() ret.RuneCount += runeCnt ret.WordCount += wordCnt @@ -497,7 +506,94 @@ func StatTree(id string) (ret *util.BlockStatResult) { return } + var databaseBlockNodes []*ast.Node + ast.Walk(tree.Root, func(n *ast.Node, entering bool) ast.WalkStatus { + if !entering || ast.NodeAttributeView != n.Type { + return ast.WalkContinue + } + + databaseBlockNodes = append(databaseBlockNodes, n) + return ast.WalkContinue + }) + + luteEngine := util.NewLute() + var dbRuneCnt, dbWordCnt, dbLinkCnt, dbImgCnt, dbRefCnt int + for _, n := range databaseBlockNodes { + if "" == n.AttributeViewID { + continue + } + + attrView, _ := av.ParseAttributeView(n.AttributeViewID) + if nil == attrView { + continue + } + + content := bytes.Buffer{} + for _, kValues := range attrView.KeyValues { + for _, v := range kValues.Values { + switch kValues.Key.Type { + case av.KeyTypeURL: + if v.IsEmpty() { + continue + } + + dbLinkCnt++ + content.WriteString(v.URL.Content) + case av.KeyTypeMAsset: + if v.IsEmpty() { + continue + } + + for _, asset := range v.MAsset { + if av.AssetTypeImage == asset.Type { + dbImgCnt++ + } + } + case av.KeyTypeBlock: + if v.IsEmpty() { + continue + } + + if !v.IsDetached { + dbRefCnt++ + } + content.WriteString(v.Block.Content) + case av.KeyTypeText: + if v.IsEmpty() { + continue + } + content.WriteString(v.Text.Content) + case av.KeyTypeNumber: + if v.IsEmpty() { + continue + } + v.Number.FormatNumber() + content.WriteString(v.Number.FormattedContent) + case av.KeyTypeEmail: + if v.IsEmpty() { + continue + } + content.WriteString(v.Email.Content) + case av.KeyTypePhone: + if v.IsEmpty() { + continue + } + content.WriteString(v.Phone.Content) + } + } + } + + dbStat := contentStat(content.String(), luteEngine) + dbRuneCnt += dbStat.RuneCount + dbWordCnt += dbStat.WordCount + } + runeCnt, wordCnt, linkCnt, imgCnt, refCnt := tree.Root.Stat() + runeCnt += dbRuneCnt + wordCnt += dbWordCnt + linkCnt += dbLinkCnt + imgCnt += dbImgCnt + refCnt += dbRefCnt return &util.BlockStatResult{ RuneCount: runeCnt, WordCount: wordCnt,