markingsystem.go 4.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118
  1. package mark_system
  2. import (
  3. "github.com/allanpk716/ChineseSubFinder/internal/logic/sub_parser/ass"
  4. "github.com/allanpk716/ChineseSubFinder/internal/logic/sub_parser/srt"
  5. "github.com/allanpk716/ChineseSubFinder/internal/pkg/log_helper"
  6. "github.com/allanpk716/ChineseSubFinder/internal/pkg/sub_helper"
  7. "github.com/allanpk716/ChineseSubFinder/internal/pkg/sub_parser_hub"
  8. "github.com/allanpk716/ChineseSubFinder/internal/types/subparser"
  9. "github.com/sirupsen/logrus"
  10. )
  11. // MarkingSystem 评价系统,解决字幕排序优先级问题
  12. type MarkingSystem struct {
  13. log *logrus.Logger
  14. subSiteSequence []string // 网站的优先级,从高到低
  15. SubTypePriority int // 字幕格式的优先级
  16. subParserHub *sub_parser_hub.SubParserHub
  17. }
  18. func NewMarkingSystem(subSiteSequence []string, subTypePriority int) *MarkingSystem {
  19. mk := MarkingSystem{subSiteSequence: subSiteSequence,
  20. log: log_helper.GetLogger(),
  21. SubTypePriority: subTypePriority,
  22. subParserHub: sub_parser_hub.NewSubParserHub(ass.NewParser(), srt.NewParser())}
  23. return &mk
  24. }
  25. // SelectOneSubFile 选择最优的一个字幕文件
  26. func (m MarkingSystem) SelectOneSubFile(organizeSubFiles []string) *subparser.FileInfo {
  27. var finalSubFile *subparser.FileInfo
  28. subInfoDict := m.parseSubFileInfo(organizeSubFiles)
  29. // 优先级别暂定 subSiteSequence: zimuku -> subhd -> xunlei -> shooter
  30. // 这里需要循环四轮:
  31. // 第一轮,双语、字幕类型自定义,优先
  32. // 第二轮,单语言(中文)、字幕类型自定义,优先
  33. // 第三轮,双语、字幕类型0,优先
  34. // 第四轮,单语言(中文)、字幕类型0,优先
  35. for i := 0; i < 4; i++ {
  36. for _, subSite := range m.subSiteSequence {
  37. infos, ok := subInfoDict[subSite]
  38. if ok == false {
  39. continue
  40. }
  41. if i == 0 {
  42. finalSubFile = sub_helper.SelectChineseBestBilingualSubtitle(infos, m.SubTypePriority)
  43. } else if i == 1 {
  44. finalSubFile = sub_helper.SelectChineseBestSubtitle(infos, m.SubTypePriority)
  45. } else if i == 2 {
  46. finalSubFile = sub_helper.SelectChineseBestBilingualSubtitle(infos, 0)
  47. } else if i == 3 {
  48. finalSubFile = sub_helper.SelectChineseBestSubtitle(infos, 0)
  49. }
  50. if finalSubFile != nil {
  51. return finalSubFile
  52. }
  53. }
  54. }
  55. return nil
  56. }
  57. // SelectEachSiteTop1SubFile 每个网站最优的文件
  58. func (m MarkingSystem) SelectEachSiteTop1SubFile(organizeSubFiles []string) ([]string, []subparser.FileInfo) {
  59. // 每个文件都带有出处 [subhd]
  60. var finalSubFile *subparser.FileInfo
  61. var outSiteName = make([]string, 0)
  62. var outSubParserFileInfos = make([]subparser.FileInfo, 0)
  63. subInfoDict := m.parseSubFileInfo(organizeSubFiles)
  64. // 这里需要循环四轮:
  65. // 第一轮,双语、字幕类型自定义,优先
  66. // 第二轮,单语言(中文)、字幕类型自定义,优先
  67. // 第三轮,双语、字幕类型0,优先
  68. // 第四轮,单语言(中文)、字幕类型0,优先
  69. for siteName, infos := range subInfoDict {
  70. // 每个网站保存一个
  71. for i := 0; i < 4; i++ {
  72. if i == 0 {
  73. finalSubFile = sub_helper.SelectChineseBestBilingualSubtitle(infos, m.SubTypePriority)
  74. } else if i == 1 {
  75. finalSubFile = sub_helper.SelectChineseBestSubtitle(infos, m.SubTypePriority)
  76. } else if i == 2 {
  77. finalSubFile = sub_helper.SelectChineseBestBilingualSubtitle(infos, 0)
  78. } else if i == 3 {
  79. finalSubFile = sub_helper.SelectChineseBestSubtitle(infos, 0)
  80. }
  81. if finalSubFile != nil {
  82. outSiteName = append(outSiteName, siteName)
  83. outSubParserFileInfos = append(outSubParserFileInfos, *finalSubFile)
  84. break
  85. }
  86. }
  87. }
  88. return outSiteName, outSubParserFileInfos
  89. }
  90. // parseSubFileInfo 从文件解析字幕信息
  91. func (m MarkingSystem) parseSubFileInfo(organizeSubFiles []string) map[string][]subparser.FileInfo {
  92. // 一个网站可能就算取了 Top1 字幕,也可能是返回一个压缩包,然后解压完就是多个字幕,所以
  93. var subInfoDict = make(map[string][]subparser.FileInfo)
  94. // 拿到现有的字幕列表,开始抉择
  95. // 先判断当前字幕是什么语言(如果是简体,还需要考虑,判断这个字幕是简体还是繁体)
  96. for _, oneSubFileFullPath := range organizeSubFiles {
  97. subFileInfo, err := m.subParserHub.DetermineFileTypeFromFile(oneSubFileFullPath)
  98. if err != nil {
  99. m.log.Error("DetermineFileTypeFromFile", oneSubFileFullPath, err)
  100. continue
  101. }
  102. _, ok := subInfoDict[subFileInfo.FromWhereSite]
  103. if ok == false {
  104. // 新建
  105. subInfoDict[subFileInfo.FromWhereSite] = make([]subparser.FileInfo, 0)
  106. }
  107. // 添加
  108. subInfoDict[subFileInfo.FromWhereSite] = append(subInfoDict[subFileInfo.FromWhereSite], *subFileInfo)
  109. }
  110. return subInfoDict
  111. }