DocumentModel.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403
  1. package models
  2. import (
  3. "time"
  4. "github.com/beego/i18n"
  5. "fmt"
  6. "strconv"
  7. "bytes"
  8. "os"
  9. "path/filepath"
  10. "strings"
  11. "github.com/PuerkitoBio/goquery"
  12. "github.com/beego/beego/v2/client/orm"
  13. "github.com/beego/beego/v2/core/logs"
  14. "github.com/beego/beego/v2/server/web"
  15. "github.com/mindoc-org/mindoc/cache"
  16. "github.com/mindoc-org/mindoc/conf"
  17. "github.com/mindoc-org/mindoc/utils"
  18. )
  19. // Document struct.
  20. type Document struct {
  21. DocumentId int `orm:"pk;auto;unique;column(document_id)" json:"doc_id"`
  22. DocumentName string `orm:"column(document_name);size(500);description(文档名称)" json:"doc_name"`
  23. Identify string `orm:"column(identify);size(100);index;null;default(null);description(唯一标识)" json:"identify"` // Identify 文档唯一标识
  24. BookId int `orm:"column(book_id);type(int);index;description(关联bools表主键)" json:"book_id"`
  25. ParentId int `orm:"column(parent_id);type(int);index;default(0);description(父级文档)" json:"parent_id"`
  26. OrderSort int `orm:"column(order_sort);default(0);type(int);index;description(排序从小到大排序)" json:"order_sort"`
  27. Markdown string `orm:"column(markdown);type(text);null;description(markdown内容)" json:"markdown"` // Markdown markdown格式文档.
  28. MarkdownTheme string `orm:"column(markdown_theme);size(50);default(theme__light);description(markdown主题)" json:"markdown_theme"`
  29. Release string `orm:"column(release);type(text);null;description(文章内容)" json:"release"` // Release 发布后的Html格式内容.
  30. Content string `orm:"column(content);type(text);null;description(文章内容)" json:"content"` // Content 未发布的 Html 格式内容.
  31. CreateTime time.Time `orm:"column(create_time);type(datetime);auto_now_add;description(创建时间)" json:"create_time"`
  32. MemberId int `orm:"column(member_id);type(int);description(关系用户id)" json:"member_id"`
  33. ModifyTime time.Time `orm:"column(modify_time);type(datetime);auto_now;description(修改时间)" json:"modify_time"`
  34. ModifyAt int `orm:"column(modify_at);type(int);description(修改人id)" json:"-"`
  35. Version int64 `orm:"column(version);type(bigint);description(版本,关联历史文档里的version)" json:"version"`
  36. IsOpen int `orm:"column(is_open);type(int);default(0);description(是否展开子目录 0:阅读时关闭节点 1:阅读时展开节点 2:空目录 单击时会展开下级节点)" json:"is_open"` //是否展开子目录:0 否/1 是 /2 空间节点,单击时展开下一级
  37. ViewCount int `orm:"column(view_count);type(int);description(浏览量)" json:"view_count"`
  38. AttachList []*Attachment `orm:"-" json:"attach"`
  39. //i18n
  40. Lang string `orm:"-"`
  41. }
  42. // 多字段唯一键
  43. func (item *Document) TableUnique() [][]string {
  44. return [][]string{{"book_id", "identify"}}
  45. }
  46. // TableName 获取对应数据库表名.
  47. func (item *Document) TableName() string {
  48. return "documents"
  49. }
  50. // TableEngine 获取数据使用的引擎.
  51. func (item *Document) TableEngine() string {
  52. return "INNODB"
  53. }
  54. func (item *Document) TableNameWithPrefix() string {
  55. return conf.GetDatabasePrefix() + item.TableName()
  56. }
  57. func NewDocument() *Document {
  58. return &Document{
  59. Version: time.Now().Unix(),
  60. }
  61. }
  62. // 根据文档ID查询指定文档.
  63. func (item *Document) Find(id int) (*Document, error) {
  64. if id <= 0 {
  65. return item, ErrInvalidParameter
  66. }
  67. o := orm.NewOrm()
  68. err := o.QueryTable(item.TableNameWithPrefix()).Filter("document_id", id).One(item)
  69. if err == orm.ErrNoRows {
  70. return item, ErrDataNotExist
  71. }
  72. return item, nil
  73. }
  74. // 插入和更新文档.
  75. func (item *Document) InsertOrUpdate(cols ...string) error {
  76. o := orm.NewOrm()
  77. item.DocumentName = utils.StripTags(item.DocumentName)
  78. var err error
  79. if item.DocumentId > 0 {
  80. _, err = o.Update(item, cols...)
  81. } else {
  82. if item.Identify == "" {
  83. book := NewBook()
  84. identify := "docs"
  85. if err := o.QueryTable(book.TableNameWithPrefix()).Filter("book_id", item.BookId).One(book, "identify"); err == nil {
  86. identify = book.Identify
  87. }
  88. item.Identify = fmt.Sprintf("%s-%s", identify, strconv.FormatInt(time.Now().UnixNano(), 32))
  89. }
  90. if item.OrderSort == 0 {
  91. sort, _ := o.QueryTable(item.TableNameWithPrefix()).Filter("book_id", item.BookId).Filter("parent_id", item.ParentId).Count()
  92. item.OrderSort = int(sort) + 1
  93. }
  94. _, err = o.Insert(item)
  95. NewBook().ResetDocumentNumber(item.BookId)
  96. }
  97. if err != nil {
  98. return err
  99. }
  100. return nil
  101. }
  102. // 根据文档识别编号和项目id获取一篇文档
  103. func (item *Document) FindByIdentityFirst(identify string, bookId int) (*Document, error) {
  104. o := orm.NewOrm()
  105. err := o.QueryTable(item.TableNameWithPrefix()).Filter("book_id", bookId).Filter("identify", identify).One(item)
  106. return item, err
  107. }
  108. // 递归删除一个文档.
  109. func (item *Document) RecursiveDocument(docId int) error {
  110. o := orm.NewOrm()
  111. if doc, err := item.Find(docId); err == nil {
  112. o.Delete(doc)
  113. NewDocumentHistory().Clear(doc.DocumentId)
  114. }
  115. var maps []orm.Params
  116. _, err := o.Raw("SELECT document_id FROM " + item.TableNameWithPrefix() + " WHERE parent_id=" + strconv.Itoa(docId)).Values(&maps)
  117. if err != nil {
  118. logs.Error("RecursiveDocument => ", err)
  119. return err
  120. }
  121. for _, param := range maps {
  122. if docId, ok := param["document_id"].(string); ok {
  123. id, _ := strconv.Atoi(docId)
  124. o.QueryTable(item.TableNameWithPrefix()).Filter("document_id", id).Delete()
  125. item.RecursiveDocument(id)
  126. }
  127. }
  128. return nil
  129. }
  130. // 将文档写入缓存
  131. func (item *Document) PutToCache() {
  132. go func(m Document) {
  133. if m.Identify == "" {
  134. if err := cache.Put("Document.Id."+strconv.Itoa(m.DocumentId), m, time.Second*3600); err != nil {
  135. logs.Info("文档缓存失败:", m.DocumentId)
  136. }
  137. } else {
  138. if err := cache.Put(fmt.Sprintf("Document.BookId.%d.Identify.%s", m.BookId, m.Identify), m, time.Second*3600); err != nil {
  139. logs.Info("文档缓存失败:", m.DocumentId)
  140. }
  141. }
  142. }(*item)
  143. }
  144. // 清除缓存
  145. func (item *Document) RemoveCache() {
  146. go func(m Document) {
  147. cache.Put("Document.Id."+strconv.Itoa(m.DocumentId), m, time.Second*3600)
  148. if m.Identify != "" {
  149. cache.Put(fmt.Sprintf("Document.BookId.%d.Identify.%s", m.BookId, m.Identify), m, time.Second*3600)
  150. }
  151. }(*item)
  152. }
  153. // 从缓存获取
  154. func (item *Document) FromCacheById(id int) (*Document, error) {
  155. if err := cache.Get("Document.Id."+strconv.Itoa(id), &item); err == nil && item.DocumentId > 0 {
  156. logs.Info("从缓存中获取文档信息成功 ->", item.DocumentId)
  157. return item, nil
  158. }
  159. if item.DocumentId > 0 {
  160. item.PutToCache()
  161. }
  162. item, err := item.Find(id)
  163. if err == nil {
  164. item.PutToCache()
  165. }
  166. return item, err
  167. }
  168. // 根据文档标识从缓存中查询文档
  169. func (item *Document) FromCacheByIdentify(identify string, bookId int) (*Document, error) {
  170. key := fmt.Sprintf("Document.BookId.%d.Identify.%s", bookId, identify)
  171. if err := cache.Get(key, item); err == nil && item.DocumentId > 0 {
  172. logs.Info("从缓存中获取文档信息成功 ->", key)
  173. return item, nil
  174. }
  175. defer func() {
  176. if item.DocumentId > 0 {
  177. item.PutToCache()
  178. }
  179. }()
  180. return item.FindByIdentityFirst(identify, bookId)
  181. }
  182. // 根据项目ID查询文档列表.
  183. func (item *Document) FindListByBookId(bookId int) (docs []*Document, err error) {
  184. o := orm.NewOrm()
  185. _, err = o.QueryTable(item.TableNameWithPrefix()).Filter("book_id", bookId).OrderBy("order_sort").All(&docs)
  186. return
  187. }
  188. // 判断文章是否存在
  189. func (item *Document) IsExist(documentId int) bool {
  190. o := orm.NewOrm()
  191. return o.QueryTable(item.TableNameWithPrefix()).Filter("document_id", documentId).Exist()
  192. }
  193. // 发布单篇文档
  194. func (item *Document) ReleaseContent() error {
  195. item.Release = strings.TrimSpace(item.Content)
  196. err := item.Processor().InsertOrUpdate("release")
  197. if err != nil {
  198. logs.Error(fmt.Sprintf("发布失败 -> %+v", item), err)
  199. return err
  200. }
  201. //当文档发布后,需要清除已缓存的转换文档和文档缓存
  202. item.RemoveCache()
  203. if err := os.RemoveAll(filepath.Join(conf.WorkingDirectory, "uploads", "books", strconv.Itoa(item.BookId))); err != nil {
  204. logs.Error("删除已缓存的文档目录失败 -> ", filepath.Join(conf.WorkingDirectory, "uploads", "books", strconv.Itoa(item.BookId)))
  205. return err
  206. }
  207. return nil
  208. }
  209. // Processor 调用位置两处:
  210. // 1. 项目发布和文档发布: 处理文档的外链,附件,底部编辑信息等;
  211. // 2. 文档阅读:可以修复存在问题的文档,使其能正常显示附件下载和文档作者信息等。
  212. func (item *Document) Processor() *Document {
  213. if item.Release != "" {
  214. item.Release = utils.SafetyProcessor(item.Release)
  215. } else {
  216. // Release内容为空,直接赋值文档标签,保证附件下载正常
  217. item.Release = "<div class=\"whole-article-wrap\"></div>"
  218. }
  219. // Next: 生成文档的一些附加信息
  220. if docQuery, err := goquery.NewDocumentFromReader(bytes.NewBufferString(item.Release)); err == nil {
  221. //处理附件
  222. if selector := docQuery.Find("div.attach-list").First(); selector.Size() <= 0 {
  223. //处理附件
  224. attachList, err := NewAttachment().FindListByDocumentId(item.DocumentId)
  225. if err == nil && len(attachList) > 0 {
  226. content := bytes.NewBufferString("<div class=\"attach-list\"><strong>" + i18n.Tr(item.Lang, "doc.attachment") + "</strong><ul>")
  227. for _, attach := range attachList {
  228. if strings.HasPrefix(attach.HttpPath, "/") {
  229. attach.HttpPath = strings.TrimSuffix(conf.BaseUrl, "/") + attach.HttpPath
  230. }
  231. li := fmt.Sprintf("<li><a href=\"%s\" target=\"_blank\" title=\"%s\">%s</a></li>", attach.HttpPath, attach.FileName, attach.FileName)
  232. content.WriteString(li)
  233. }
  234. content.WriteString("</ul></div>")
  235. if docQuery == nil {
  236. docQuery, err = goquery.NewDocumentFromReader(content)
  237. if err != nil {
  238. logs.Error("goquery->NewDocumentFromReader err:%+v", err)
  239. }
  240. } else {
  241. if selector := docQuery.Find("div.wiki-bottom").First(); selector.Size() > 0 {
  242. selector.BeforeHtml(content.String()) //This branch should be a compatible branch.
  243. } else if selector := docQuery.Find("div.markdown-article").First(); selector.Size() > 0 {
  244. selector.AppendHtml(content.String()) //The document produced by the editor of Markdown will have this tag.class.
  245. } else if selector := docQuery.Find("div.whole-article-wrap").First(); selector.Size() > 0 {
  246. selector.AppendHtml(content.String()) //All documents should have this tag.
  247. }
  248. }
  249. }
  250. }
  251. //处理了文档底部信息
  252. if selector := docQuery.Find("div.wiki-bottom").First(); selector.Size() <= 0 && item.MemberId > 0 {
  253. //处理文档结尾信息
  254. docCreator, err := NewMember().Find(item.MemberId, "real_name", "account")
  255. release := "<div class=\"wiki-bottom\">"
  256. release += i18n.Tr(item.Lang, "doc.ft_author")
  257. if err == nil && docCreator != nil {
  258. if docCreator.RealName != "" {
  259. release += docCreator.RealName
  260. } else {
  261. release += docCreator.Account
  262. }
  263. }
  264. release += " &nbsp;" + i18n.Tr(item.Lang, "doc.ft_create_time") + item.CreateTime.Local().Format("2006-01-02 15:04") + "<br>"
  265. if item.ModifyAt > 0 {
  266. docModify, err := NewMember().Find(item.ModifyAt, "real_name", "account")
  267. if err == nil {
  268. if docModify.RealName != "" {
  269. release += i18n.Tr(item.Lang, "doc.ft_last_editor") + docModify.RealName
  270. } else {
  271. release += i18n.Tr(item.Lang, "doc.ft_last_editor") + docModify.Account
  272. }
  273. }
  274. }
  275. release += " &nbsp;" + i18n.Tr(item.Lang, "doc.ft_update_time") + item.ModifyTime.Local().Format("2006-01-02 15:04") + "<br>"
  276. release += "</div>"
  277. if selector := docQuery.Find("div.markdown-article").First(); selector.Size() > 0 {
  278. selector.AppendHtml(release)
  279. } else if selector := docQuery.Find("div.whole-article-wrap").First(); selector.Size() > 0 {
  280. selector.AppendHtml(release)
  281. }
  282. }
  283. cdnimg, _ := web.AppConfig.String("cdnimg")
  284. docQuery.Find("img").Each(func(i int, selection *goquery.Selection) {
  285. if src, ok := selection.Attr("src"); ok {
  286. src = strings.TrimSpace(strings.ToLower(src))
  287. //过滤掉没有链接的图片标签
  288. if src == "" || strings.HasPrefix(src, "data:text/html") {
  289. selection.Remove()
  290. return
  291. }
  292. //设置图片为CDN地址
  293. if cdnimg != "" && strings.HasPrefix(src, "/uploads/") {
  294. selection.SetAttr("src", utils.JoinURI(cdnimg, src))
  295. }
  296. }
  297. selection.RemoveAttr("onerror").RemoveAttr("onload")
  298. })
  299. //过滤A标签的非法连接
  300. docQuery.Find("a").Each(func(i int, selection *goquery.Selection) {
  301. if val, exists := selection.Attr("href"); exists {
  302. if val == "" {
  303. selection.SetAttr("href", "#")
  304. return
  305. }
  306. val = strings.Replace(strings.ToLower(val), " ", "", -1)
  307. //移除危险脚本链接
  308. if strings.HasPrefix(val, "data:text/html") ||
  309. strings.HasPrefix(val, "vbscript:") ||
  310. strings.HasPrefix(val, "&#106;avascript:") ||
  311. strings.HasPrefix(val, "javascript:") {
  312. selection.SetAttr("href", "#")
  313. }
  314. }
  315. //移除所有 onerror 属性
  316. selection.RemoveAttr("onerror").RemoveAttr("onload").RemoveAttr("onclick")
  317. })
  318. docQuery.Find("script").Remove()
  319. docQuery.Find("link").Remove()
  320. docQuery.Find("vbscript").Remove()
  321. if html, err := docQuery.Html(); err == nil {
  322. item.Release = strings.TrimSuffix(strings.TrimPrefix(strings.TrimSpace(html), "<html><head></head><body>"), "</body></html>")
  323. }
  324. }
  325. return item
  326. }
  327. // 增加阅读次数
  328. func (item *Document) IncrViewCount(id int) {
  329. o := orm.NewOrm()
  330. o.QueryTable(item.TableNameWithPrefix()).Filter("document_id", id).Update(orm.Params{
  331. "view_count": orm.ColValue(orm.ColAdd, 1),
  332. })
  333. }