downloader.go 7.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231
  1. package main
  2. import (
  3. "github.com/allanpk716/ChineseSubFinder/common"
  4. "github.com/allanpk716/ChineseSubFinder/mark_system"
  5. "github.com/allanpk716/ChineseSubFinder/model"
  6. "github.com/allanpk716/ChineseSubFinder/sub_supplier"
  7. "github.com/allanpk716/ChineseSubFinder/sub_supplier/shooter"
  8. "github.com/allanpk716/ChineseSubFinder/sub_supplier/subhd"
  9. "github.com/allanpk716/ChineseSubFinder/sub_supplier/xunlei"
  10. "github.com/allanpk716/ChineseSubFinder/sub_supplier/zimuku"
  11. "github.com/go-rod/rod/lib/utils"
  12. "github.com/sirupsen/logrus"
  13. "io/ioutil"
  14. "os"
  15. "path"
  16. "path/filepath"
  17. "strings"
  18. )
  19. type Downloader struct {
  20. reqParam common.ReqParam
  21. log *logrus.Logger
  22. topic int // 最多能够下载 Top 几的字幕,每一个网站
  23. wantedExtList []string // 人工确认的需要监控的视频后缀名
  24. defExtList []string // 内置支持的视频后缀名列表
  25. mk *mark_system.MarkingSystem // MarkingSystem
  26. }
  27. func NewDownloader(_reqParam ...common.ReqParam) *Downloader {
  28. var downloader Downloader
  29. downloader.log = model.GetLogger()
  30. downloader.topic = common.DownloadSubsPerSite
  31. if len(_reqParam) > 0 {
  32. downloader.reqParam = _reqParam[0]
  33. if downloader.reqParam.Topic > 0 && downloader.reqParam.Topic != downloader.topic {
  34. downloader.topic = downloader.reqParam.Topic
  35. }
  36. }
  37. downloader.defExtList = make([]string, 0)
  38. downloader.defExtList = append(downloader.defExtList, common.VideoExtMp4)
  39. downloader.defExtList = append(downloader.defExtList, common.VideoExtMkv)
  40. downloader.defExtList = append(downloader.defExtList, common.VideoExtRmvb)
  41. downloader.defExtList = append(downloader.defExtList, common.VideoExtIso)
  42. var sitesSequence = make([]string, 0)
  43. // TODO 这里写固定了抉择字幕的顺序
  44. sitesSequence = append(sitesSequence, common.SubSiteZiMuKu)
  45. sitesSequence = append(sitesSequence, common.SubSiteSubHd)
  46. sitesSequence = append(sitesSequence, common.SubSiteXunLei)
  47. sitesSequence = append(sitesSequence, common.SubSiteShooter)
  48. downloader.mk = mark_system.NewMarkingSystem(sitesSequence)
  49. if len(_reqParam) > 0 {
  50. // 如果用户设置了关注的视频后缀名列表,则用ta的
  51. if len(downloader.reqParam.UserExtList) > 0 {
  52. downloader.wantedExtList = downloader.reqParam.UserExtList
  53. } else {
  54. // 不然就是内置默认的
  55. downloader.wantedExtList = downloader.defExtList
  56. }
  57. } else {
  58. // 不然就是内置默认的
  59. downloader.wantedExtList = downloader.defExtList
  60. }
  61. return &downloader
  62. }
  63. func (d Downloader) GetNowSupportExtList() []string {
  64. return d.wantedExtList
  65. }
  66. func (d Downloader) GetDefSupportExtList() []string {
  67. return d.defExtList
  68. }
  69. func (d Downloader) DownloadSub(dir string) error {
  70. defer func() {
  71. // 抉择完毕,需要清理缓存目录
  72. err := model.ClearTmpFolder()
  73. if err != nil {
  74. d.log.Error(err)
  75. }
  76. }()
  77. nowVideoList, err := d.searchMatchedVideoFile(dir)
  78. if err != nil {
  79. return err
  80. }
  81. // 构建每个字幕站点下载者的实例
  82. subSupplierHub := sub_supplier.NewSubSupplierHub(shooter.NewSupplier(d.reqParam),
  83. subhd.NewSupplier(d.reqParam),
  84. xunlei.NewSupplier(d.reqParam),
  85. zimuku.NewSupplier(d.reqParam),
  86. )
  87. // TODO 后续再改为每个视频以上的流程都是一个 channel 来做,并且需要控制在一个并发量之下(很可能没必要,毕竟要在弱鸡机器上挂机用的)
  88. // 一个视频文件同时多个站点查询,阻塞完毕后,在进行下一个
  89. for i, oneVideoFullPath := range nowVideoList {
  90. // 字幕都下载缓存好了,需要抉择存哪一个,优先选择中文双语的,然后到中文
  91. organizeSubFiles, err := subSupplierHub.DownloadSub(oneVideoFullPath, i)
  92. if err != nil {
  93. d.log.Errorln("subSupplierHub.DownloadSub", oneVideoFullPath ,err)
  94. continue
  95. }
  96. // 得到目标视频文件的根目录
  97. videoRootPath := filepath.Dir(oneVideoFullPath)
  98. // -------------------------------------------------
  99. // 调试缓存,把下载好的字幕写到对应的视频目录下,方便调试
  100. if d.reqParam.DebugMode == true {
  101. err = d.copySubFile2DesFolder(videoRootPath, organizeSubFiles)
  102. if err != nil {
  103. d.log.Errorln("copySubFile2DesFolder", err)
  104. }
  105. }
  106. // -------------------------------------------------
  107. if d.reqParam.SaveMultiSub == false {
  108. // 选择最优的一个字幕
  109. var finalSubFile *common.SubParserFileInfo
  110. finalSubFile = d.mk.SelectOneSubFile(organizeSubFiles)
  111. if finalSubFile == nil {
  112. d.log.Warnln("Found", len(organizeSubFiles), " subtitles but not one fit:", oneVideoFullPath)
  113. continue
  114. }
  115. // 找到了,写入文件
  116. err = d.writeSubFile2VideoPath(oneVideoFullPath, *finalSubFile, "")
  117. if err != nil {
  118. d.log.Errorln("SaveMultiSub:", d.reqParam.SaveMultiSub ,"writeSubFile2VideoPath:", err)
  119. continue
  120. }
  121. } else {
  122. // 每个网站 Top1 的字幕
  123. siteNames, finalSubFiles := d.mk.SelectEachSiteTop1SubFile(organizeSubFiles)
  124. if len(siteNames) < 0 {
  125. d.log.Warnln("SelectEachSiteTop1SubFile found none sub file")
  126. continue
  127. }
  128. for i, file := range finalSubFiles {
  129. err = d.writeSubFile2VideoPath(oneVideoFullPath, file, siteNames[i])
  130. if err != nil {
  131. d.log.Errorln("SaveMultiSub:", d.reqParam.SaveMultiSub ,"writeSubFile2VideoPath:", err)
  132. continue
  133. }
  134. }
  135. }
  136. // -----------------------------------------------------
  137. }
  138. return nil
  139. }
  140. // 在前面需要进行语言的筛选、排序,这里仅仅是存储
  141. func (d Downloader) writeSubFile2VideoPath(videoFileFullPath string, finalSubFile common.SubParserFileInfo, extraSubPreName string) error {
  142. videoRootPath := filepath.Dir(videoFileFullPath)
  143. embyLanExtName := model.Lang2EmbyName(finalSubFile.Lang)
  144. // 构建视频文件加 emby 的字幕预研要求名称
  145. videoFileNameWithOutExt := strings.ReplaceAll(filepath.Base(videoFileFullPath),
  146. filepath.Ext(videoFileFullPath), "")
  147. if extraSubPreName != "" {
  148. extraSubPreName = "[" + extraSubPreName +"]"
  149. }
  150. subNewName := videoFileNameWithOutExt + embyLanExtName + extraSubPreName + finalSubFile.Ext
  151. desSubFullPath := path.Join(videoRootPath, subNewName)
  152. // 最后写入字幕
  153. err := utils.OutputFile(desSubFullPath, finalSubFile.Data)
  154. if err != nil {
  155. return err
  156. }
  157. d.log.Infoln("OrgSubName:", finalSubFile.Name)
  158. d.log.Infoln("SubDownAt:", desSubFullPath)
  159. return nil
  160. }
  161. // searchMatchedVideoFile 搜索符合后缀名的视频文件
  162. func (d Downloader) searchMatchedVideoFile(dir string) ([]string, error) {
  163. var fileFullPathList = make([]string, 0)
  164. pathSep := string(os.PathSeparator)
  165. files, err := ioutil.ReadDir(dir)
  166. if err != nil {
  167. return nil, err
  168. }
  169. for _, curFile := range files {
  170. fullPath := dir + pathSep + curFile.Name()
  171. if curFile.IsDir() {
  172. // 内层的错误就无视了
  173. oneList, _ := d.searchMatchedVideoFile(fullPath)
  174. if oneList != nil {
  175. fileFullPathList = append(fileFullPathList, oneList...)
  176. }
  177. } else {
  178. // 这里就是文件了
  179. if d.isWantedVideoExtDef(curFile.Name()) == true {
  180. fileFullPathList = append(fileFullPathList, fullPath)
  181. }
  182. }
  183. }
  184. return fileFullPathList, nil
  185. }
  186. // isWantedVideoExtDef 后缀名是否符合规则
  187. func (d Downloader) isWantedVideoExtDef(fileName string) bool {
  188. fileName = strings.ToLower(filepath.Ext(fileName))
  189. for _, s := range d.wantedExtList {
  190. if s == fileName {
  191. return true
  192. }
  193. }
  194. return false
  195. }
  196. func (d Downloader) copySubFile2DesFolder(desFolder string, subFiles []string) error {
  197. // 需要进行字幕文件的缓存
  198. // 把缓存的文件夹新建出来
  199. desFolderFullPath := path.Join(desFolder, common.SubTmpFolderName)
  200. err := os.MkdirAll(desFolderFullPath, os.ModePerm)
  201. if err != nil {
  202. return err
  203. }
  204. // 复制下载在 tmp 文件夹中的字幕文件到视频文件夹下面
  205. for _, subFile := range subFiles {
  206. newFn := path.Join(desFolderFullPath, filepath.Base(subFile))
  207. _, err = model.CopyFile(newFn, subFile)
  208. if err != nil {
  209. return err
  210. }
  211. }
  212. return nil
  213. }