downloader.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489
  1. package internal
  2. import (
  3. "github.com/allanpk716/ChineseSubFinder/internal/common"
  4. embyHelper "github.com/allanpk716/ChineseSubFinder/internal/logic/emby_helper"
  5. markSystem "github.com/allanpk716/ChineseSubFinder/internal/logic/mark_system"
  6. seriesHelper "github.com/allanpk716/ChineseSubFinder/internal/logic/series_helper"
  7. subSupplier "github.com/allanpk716/ChineseSubFinder/internal/logic/sub_supplier"
  8. "github.com/allanpk716/ChineseSubFinder/internal/logic/sub_supplier/shooter"
  9. "github.com/allanpk716/ChineseSubFinder/internal/logic/sub_supplier/subhd"
  10. "github.com/allanpk716/ChineseSubFinder/internal/logic/sub_supplier/xunlei"
  11. "github.com/allanpk716/ChineseSubFinder/internal/logic/sub_supplier/zimuku"
  12. "github.com/allanpk716/ChineseSubFinder/internal/pkg"
  13. "github.com/allanpk716/ChineseSubFinder/internal/pkg/decode"
  14. "github.com/allanpk716/ChineseSubFinder/internal/pkg/language"
  15. "github.com/allanpk716/ChineseSubFinder/internal/pkg/log_helper"
  16. "github.com/allanpk716/ChineseSubFinder/internal/pkg/sub_helper"
  17. "github.com/allanpk716/ChineseSubFinder/internal/types"
  18. "github.com/allanpk716/ChineseSubFinder/internal/types/emby"
  19. "github.com/allanpk716/ChineseSubFinder/internal/types/series"
  20. "github.com/allanpk716/ChineseSubFinder/internal/types/subparser"
  21. "github.com/go-rod/rod/lib/utils"
  22. "github.com/panjf2000/ants/v2"
  23. "github.com/sirupsen/logrus"
  24. "golang.org/x/net/context"
  25. "os"
  26. "path"
  27. "path/filepath"
  28. "strings"
  29. "sync"
  30. )
  31. // Downloader 实例化一次用一次,不要反复的使用,很多临时标志位需要清理。
  32. type Downloader struct {
  33. reqParam types.ReqParam
  34. log *logrus.Logger
  35. topic int // 最多能够下载 Top 几的字幕,每一个网站
  36. mk *markSystem.MarkingSystem // MarkingSystem
  37. embyHelper *embyHelper.EmbyHelper
  38. movieFileFullPathList []string // 多个需要搜索字幕的电影文件全路径
  39. seriesSubNeedDlMap map[string][]emby.EmbyMixInfo // 多个需要搜索字幕的连续剧目录
  40. }
  41. func NewDownloader(_reqParam ...types.ReqParam) *Downloader {
  42. var downloader Downloader
  43. downloader.log = log_helper.GetLogger()
  44. downloader.topic = common.DownloadSubsPerSite
  45. if len(_reqParam) > 0 {
  46. downloader.reqParam = _reqParam[0]
  47. if downloader.reqParam.Topic > 0 && downloader.reqParam.Topic != downloader.topic {
  48. downloader.topic = downloader.reqParam.Topic
  49. }
  50. // 并发线程的范围控制
  51. if downloader.reqParam.Threads <= 0 {
  52. downloader.reqParam.Threads = 2
  53. } else if downloader.reqParam.Threads >= 10 {
  54. downloader.reqParam.Threads = 10
  55. }
  56. // 初始化 Emby API 接口
  57. if downloader.reqParam.EmbyConfig.Url != "" && downloader.reqParam.EmbyConfig.ApiKey != "" {
  58. downloader.embyHelper = embyHelper.NewEmbyHelper(downloader.reqParam.EmbyConfig)
  59. }
  60. } else {
  61. downloader.reqParam = *types.NewReqParam()
  62. }
  63. var sitesSequence = make([]string, 0)
  64. // TODO 这里写固定了抉择字幕的顺序
  65. sitesSequence = append(sitesSequence, common.SubSiteZiMuKu)
  66. sitesSequence = append(sitesSequence, common.SubSiteSubHd)
  67. sitesSequence = append(sitesSequence, common.SubSiteXunLei)
  68. sitesSequence = append(sitesSequence, common.SubSiteShooter)
  69. downloader.mk = markSystem.NewMarkingSystem(sitesSequence, downloader.reqParam.SubTypePriority)
  70. downloader.movieFileFullPathList = make([]string, 0)
  71. downloader.seriesSubNeedDlMap = make(map[string][]emby.EmbyMixInfo)
  72. return &downloader
  73. }
  74. // GetUpdateVideoListFromEmby 这里首先会进行近期影片的获取,然后对这些影片进行刷新,然后在获取字幕列表,最终得到需要字幕获取的 video 列表
  75. func (d *Downloader) GetUpdateVideoListFromEmby(movieRootDir, seriesRootDir string) error {
  76. if d.embyHelper == nil {
  77. return nil
  78. }
  79. var err error
  80. var movieList []emby.EmbyMixInfo
  81. movieList, d.seriesSubNeedDlMap, err = d.embyHelper.GetRecentlyAddVideoList(movieRootDir, seriesRootDir)
  82. if err != nil {
  83. return err
  84. }
  85. // 获取全路径
  86. for _, info := range movieList {
  87. d.movieFileFullPathList = append(d.movieFileFullPathList, info.VideoFileFullPath)
  88. }
  89. return nil
  90. }
  91. func (d Downloader) RefreshEmbySubList() error {
  92. if d.embyHelper == nil {
  93. return nil
  94. }
  95. bRefresh := false
  96. defer func() {
  97. if bRefresh == true {
  98. d.log.Infoln("Refresh Emby Sub List")
  99. }
  100. }()
  101. bRefresh, err := d.embyHelper.RefreshEmbySubList()
  102. if err != nil {
  103. return err
  104. }
  105. return nil
  106. }
  107. func (d Downloader) DownloadSub4Movie(dir string) error {
  108. defer func() {
  109. // 所有的电影字幕下载完成,抉择完成,需要清理缓存目录
  110. err := pkg.ClearRootTmpFolder()
  111. if err != nil {
  112. d.log.Error("ClearRootTmpFolder", err)
  113. }
  114. d.log.Infoln("Download Movie Sub End...")
  115. }()
  116. var err error
  117. d.log.Infoln("Download Movie Sub Started...")
  118. // 是否是通过 emby_helper api 获取的列表
  119. if d.embyHelper == nil {
  120. // 没有填写 emby_helper api 的信息,那么就走常规的全文件扫描流程
  121. d.movieFileFullPathList, err = pkg.SearchMatchedVideoFile(dir)
  122. if err != nil {
  123. return err
  124. }
  125. } else {
  126. // 进过 emby_helper api 的信息读取
  127. d.log.Infoln("Movie Sub Dl From Emby API...")
  128. if len(d.movieFileFullPathList) < 1 {
  129. d.log.Infoln("Movie Sub Dl From Emby API no movie need Dl sub")
  130. return nil
  131. }
  132. }
  133. // 并发控制
  134. movieDlFunc := func(i interface{}) error {
  135. inData := i.(InputData)
  136. // -----------------------------------------------------
  137. // 构建每个字幕站点下载者的实例
  138. var subSupplierHub = subSupplier.NewSubSupplierHub(
  139. subhd.NewSupplier(d.reqParam),
  140. zimuku.NewSupplier(d.reqParam),
  141. xunlei.NewSupplier(d.reqParam),
  142. shooter.NewSupplier(d.reqParam),
  143. )
  144. // 字幕都下载缓存好了,需要抉择存哪一个,优先选择中文双语的,然后到中文
  145. organizeSubFiles, err := subSupplierHub.DownloadSub4Movie(inData.OneVideoFullPath, inData.Index)
  146. if err != nil {
  147. d.log.Errorln("subSupplierHub.DownloadSub4Movie", inData.OneVideoFullPath, err)
  148. return err
  149. }
  150. if organizeSubFiles == nil || len(organizeSubFiles) < 1 {
  151. d.log.Infoln("no sub found", filepath.Base(inData.OneVideoFullPath))
  152. return nil
  153. }
  154. d.oneVideoSelectBestSub(inData.OneVideoFullPath, organizeSubFiles)
  155. // -----------------------------------------------------
  156. return nil
  157. }
  158. p, err := ants.NewPoolWithFunc(d.reqParam.Threads, func(inData interface{}) {
  159. data := inData.(InputData)
  160. defer data.Wg.Done()
  161. ctx, cancel := context.WithTimeout(context.Background(), common.OneVideoProcessTimeOut)
  162. defer cancel()
  163. done := make(chan error, 1)
  164. panicChan := make(chan interface{}, 1)
  165. go func() {
  166. defer func() {
  167. if p := recover(); p != nil {
  168. panicChan <- p
  169. }
  170. }()
  171. done <- movieDlFunc(inData)
  172. }()
  173. select {
  174. case _ = <-done:
  175. return
  176. case p := <-panicChan:
  177. d.log.Errorln("DownloadSub4Movie.NewPoolWithFunc got panic", p)
  178. case <-ctx.Done():
  179. d.log.Errorln("DownloadSub4Movie.NewPoolWithFunc got time out", ctx.Err())
  180. return
  181. }
  182. })
  183. if err != nil {
  184. return err
  185. }
  186. defer p.Release()
  187. wg := sync.WaitGroup{}
  188. // 一个视频文件同时多个站点查询,阻塞完毕后,在进行下一个
  189. for i, oneVideoFullPath := range d.movieFileFullPathList {
  190. wg.Add(1)
  191. err = p.Invoke(InputData{OneVideoFullPath: oneVideoFullPath, Index: i, Wg: &wg})
  192. if err != nil {
  193. d.log.Errorln("DownloadSub4Movie ants.Invoke", err)
  194. }
  195. }
  196. wg.Wait()
  197. return nil
  198. }
  199. func (d Downloader) DownloadSub4Series(dir string) error {
  200. var err error
  201. defer func() {
  202. // 所有的连续剧字幕下载完成,抉择完成,需要清理缓存目录
  203. err := pkg.ClearRootTmpFolder()
  204. if err != nil {
  205. d.log.Error("ClearRootTmpFolder", err)
  206. }
  207. d.log.Infoln("Download Series Sub End...")
  208. }()
  209. d.log.Infoln("Download Series Sub Started...")
  210. // 并发控制
  211. seriesDlFunc := func(i interface{}) error {
  212. inData := i.(InputData)
  213. // 构建每个字幕站点下载者的实例
  214. var subSupplierHub *subSupplier.SubSupplierHub
  215. subSupplierHub = subSupplier.NewSubSupplierHub(
  216. zimuku.NewSupplier(d.reqParam),
  217. subhd.NewSupplier(d.reqParam),
  218. xunlei.NewSupplier(d.reqParam),
  219. shooter.NewSupplier(d.reqParam),
  220. )
  221. // 这里拿到了这一部连续剧的所有的剧集信息,以及所有下载到的字幕信息
  222. var seriesInfo *series.SeriesInfo
  223. var organizeSubFiles map[string][]string
  224. // 是否是通过 emby_helper api 获取的列表
  225. if d.embyHelper == nil {
  226. seriesInfo, organizeSubFiles, err = subSupplierHub.DownloadSub4Series(inData.OneVideoFullPath, inData.Index)
  227. if err != nil {
  228. d.log.Errorln("subSupplierHub.DownloadSub4Series", inData.OneVideoFullPath, err)
  229. return err
  230. }
  231. } else {
  232. // 先进性 emby_helper api 的操作,读取需要更新字幕的项目
  233. seriesInfo, organizeSubFiles, err = subSupplierHub.DownloadSub4SeriesFromEmby(
  234. path.Join(dir, inData.OneVideoFullPath),
  235. d.seriesSubNeedDlMap[inData.OneVideoFullPath], inData.Index)
  236. if err != nil {
  237. d.log.Errorln("subSupplierHub.DownloadSub4Series", inData.OneVideoFullPath, err)
  238. return err
  239. }
  240. }
  241. if organizeSubFiles == nil || len(organizeSubFiles) < 1 {
  242. d.log.Infoln("no sub found", filepath.Base(inData.OneVideoFullPath))
  243. return nil
  244. }
  245. // 只针对需要下载字幕的视频进行字幕的选择保存
  246. for epsKey, episodeInfo := range seriesInfo.NeedDlEpsKeyList {
  247. // 匹配对应的 Eps 去处理
  248. d.oneVideoSelectBestSub(episodeInfo.FileFullPath, organizeSubFiles[epsKey])
  249. }
  250. // 这里会拿到一份季度字幕的列表比如,Key 是 S1E0 S2E0 S3E0,value 是新的存储位置
  251. fullSeasonSubDict := d.saveFullSeasonSub(seriesInfo, organizeSubFiles)
  252. // TODO 季度的字幕包,应该优先于零散的字幕吧,暂定就这样了,注意是全部都替换
  253. // 需要与有下载需求的季交叉
  254. for _, episodeInfo := range seriesInfo.EpList {
  255. _, ok := seriesInfo.NeedDlSeasonDict[episodeInfo.Season]
  256. if ok == false {
  257. continue
  258. }
  259. // 匹配对应的 Eps 去处理
  260. seasonEpsKey := pkg.GetEpisodeKeyName(episodeInfo.Season, episodeInfo.Episode)
  261. d.oneVideoSelectBestSub(episodeInfo.FileFullPath, fullSeasonSubDict[seasonEpsKey])
  262. }
  263. // 是否清理全季的缓存字幕文件夹
  264. if d.reqParam.SaveOneSeasonSub == false {
  265. err = sub_helper.DeleteOneSeasonSubCacheFolder(seriesInfo.DirPath)
  266. if err != nil {
  267. return err
  268. }
  269. }
  270. return nil
  271. }
  272. p, err := ants.NewPoolWithFunc(d.reqParam.Threads, func(inData interface{}) {
  273. data := inData.(InputData)
  274. defer data.Wg.Done()
  275. ctx, cancel := context.WithTimeout(context.Background(), common.OneVideoProcessTimeOut)
  276. defer cancel()
  277. done := make(chan error, 1)
  278. panicChan := make(chan interface{}, 1)
  279. go func() {
  280. defer func() {
  281. if p := recover(); p != nil {
  282. panicChan <- p
  283. }
  284. }()
  285. done <- seriesDlFunc(inData)
  286. }()
  287. select {
  288. case _ = <-done:
  289. return
  290. case p := <-panicChan:
  291. d.log.Errorln("DownloadSub4Series.NewPoolWithFunc got panic", p)
  292. case <-ctx.Done():
  293. d.log.Errorln("DownloadSub4Series.NewPoolWithFunc got time out", ctx.Err())
  294. return
  295. }
  296. })
  297. if err != nil {
  298. return err
  299. }
  300. defer p.Release()
  301. // 是否是通过 emby_helper api 获取的列表
  302. var seriesDirList = make([]string, 0)
  303. if d.embyHelper == nil {
  304. // 遍历连续剧总目录下的第一层目录
  305. seriesDirList, err = seriesHelper.GetSeriesList(dir)
  306. if err != nil {
  307. return err
  308. }
  309. } else {
  310. // 这里给出的是连续剧的文件夹名称
  311. for s, _ := range d.seriesSubNeedDlMap {
  312. seriesDirList = append(seriesDirList, s)
  313. }
  314. }
  315. wg := sync.WaitGroup{}
  316. for i, oneSeriesPath := range seriesDirList {
  317. wg.Add(1)
  318. err = p.Invoke(InputData{OneVideoFullPath: oneSeriesPath, Index: i, Wg: &wg})
  319. if err != nil {
  320. d.log.Errorln("DownloadSub4Series ants.Invoke", err)
  321. }
  322. }
  323. wg.Wait()
  324. return nil
  325. }
  326. // oneVideoSelectBestSub 一个视频,选择最佳的一个字幕(也可以保存所有网站第一个最佳字幕)
  327. func (d Downloader) oneVideoSelectBestSub(oneVideoFullPath string, organizeSubFiles []string) {
  328. var err error
  329. // 得到目标视频文件的根目录
  330. videoRootPath := filepath.Dir(oneVideoFullPath)
  331. // -------------------------------------------------
  332. // 调试缓存,把下载好的字幕写到对应的视频目录下,方便调试
  333. if d.reqParam.DebugMode == true {
  334. err = d.copySubFile2DesFolder(videoRootPath, organizeSubFiles)
  335. if err != nil {
  336. d.log.Errorln("copySubFile2DesFolder", err)
  337. }
  338. }
  339. // -------------------------------------------------
  340. if d.reqParam.SaveMultiSub == false {
  341. // 选择最优的一个字幕
  342. var finalSubFile *subparser.FileInfo
  343. finalSubFile = d.mk.SelectOneSubFile(organizeSubFiles)
  344. if finalSubFile == nil {
  345. d.log.Warnln("Found", len(organizeSubFiles), " subtitles but not one fit:", oneVideoFullPath)
  346. return
  347. }
  348. // 找到了,写入文件
  349. err = d.writeSubFile2VideoPath(oneVideoFullPath, *finalSubFile, "")
  350. if err != nil {
  351. d.log.Errorln("SaveMultiSub:", d.reqParam.SaveMultiSub, "writeSubFile2VideoPath:", err)
  352. return
  353. }
  354. } else {
  355. // 每个网站 Top1 的字幕
  356. siteNames, finalSubFiles := d.mk.SelectEachSiteTop1SubFile(organizeSubFiles)
  357. if len(siteNames) < 0 {
  358. d.log.Warnln("SelectEachSiteTop1SubFile found none sub file")
  359. return
  360. }
  361. for i, file := range finalSubFiles {
  362. err = d.writeSubFile2VideoPath(oneVideoFullPath, file, siteNames[i])
  363. if err != nil {
  364. d.log.Errorln("SaveMultiSub:", d.reqParam.SaveMultiSub, "writeSubFile2VideoPath:", err)
  365. return
  366. }
  367. }
  368. }
  369. }
  370. // saveFullSeasonSub 这里就需要单独存储到连续剧每一季的文件夹的特殊文件夹中
  371. func (d Downloader) saveFullSeasonSub(seriesInfo *series.SeriesInfo, organizeSubFiles map[string][]string) map[string][]string {
  372. var fullSeasonSubDict = make(map[string][]string)
  373. for _, season := range seriesInfo.SeasonDict {
  374. seasonKey := pkg.GetEpisodeKeyName(season, 0)
  375. subs, ok := organizeSubFiles[seasonKey]
  376. if ok == false {
  377. continue
  378. }
  379. for _, sub := range subs {
  380. subFileName := filepath.Base(sub)
  381. newSeasonSubRootPath := path.Join(seriesInfo.DirPath, "Sub_"+seasonKey)
  382. _ = os.MkdirAll(newSeasonSubRootPath, os.ModePerm)
  383. newSubFullPath := path.Join(newSeasonSubRootPath, subFileName)
  384. err := pkg.CopyFile(sub, newSubFullPath)
  385. if err != nil {
  386. d.log.Errorln("saveFullSeasonSub", subFileName, err)
  387. continue
  388. }
  389. // 从字幕的文件名推断是 哪一季 的 那一集
  390. _, gusSeason, gusEpisode, err := decode.GetSeasonAndEpisodeFromSubFileName(subFileName)
  391. if err != nil {
  392. return nil
  393. }
  394. // 把整季的字幕缓存位置也提供出去,如果之前没有下载到的,这里返回出来的可以补上
  395. seasonEpsKey := pkg.GetEpisodeKeyName(gusSeason, gusEpisode)
  396. _, ok := fullSeasonSubDict[seasonEpsKey]
  397. if ok == false {
  398. // 初始化
  399. fullSeasonSubDict[seasonEpsKey] = make([]string, 0)
  400. }
  401. fullSeasonSubDict[seasonEpsKey] = append(fullSeasonSubDict[seasonEpsKey], sub)
  402. }
  403. }
  404. return fullSeasonSubDict
  405. }
  406. // 在前面需要进行语言的筛选、排序,这里仅仅是存储
  407. func (d Downloader) writeSubFile2VideoPath(videoFileFullPath string, finalSubFile subparser.FileInfo, extraSubPreName string) error {
  408. videoRootPath := filepath.Dir(videoFileFullPath)
  409. embyLanExtName := language.Lang2EmbyName(finalSubFile.Lang)
  410. // 构建视频文件加 emby_helper 的字幕预研要求名称
  411. videoFileNameWithOutExt := strings.ReplaceAll(filepath.Base(videoFileFullPath),
  412. filepath.Ext(videoFileFullPath), "")
  413. if extraSubPreName != "" {
  414. extraSubPreName = "[" + extraSubPreName + "]"
  415. }
  416. subNewName := videoFileNameWithOutExt + embyLanExtName + extraSubPreName + finalSubFile.Ext
  417. desSubFullPath := path.Join(videoRootPath, subNewName)
  418. // 最后写入字幕
  419. err := utils.OutputFile(desSubFullPath, finalSubFile.Data)
  420. if err != nil {
  421. return err
  422. }
  423. d.log.Infoln("OrgSubName:", finalSubFile.Name)
  424. d.log.Infoln("SubDownAt:", desSubFullPath)
  425. return nil
  426. }
  427. // copySubFile2DesFolder 拷贝字幕文件到目标文件夹
  428. func (d Downloader) copySubFile2DesFolder(desFolder string, subFiles []string) error {
  429. // 需要进行字幕文件的缓存
  430. // 把缓存的文件夹新建出来
  431. desFolderFullPath := path.Join(desFolder, common.SubTmpFolderName)
  432. err := os.MkdirAll(desFolderFullPath, os.ModePerm)
  433. if err != nil {
  434. return err
  435. }
  436. // 复制下载在 tmp 文件夹中的字幕文件到视频文件夹下面
  437. for _, subFile := range subFiles {
  438. newFn := path.Join(desFolderFullPath, filepath.Base(subFile))
  439. err = pkg.CopyFile(subFile, newFn)
  440. if err != nil {
  441. return err
  442. }
  443. }
  444. return nil
  445. }
  // InputData is the work item handed to a pool worker by DownloadSub4Movie and
  // DownloadSub4Series.
  type InputData struct {
  	// OneVideoFullPath is the full path of a movie file or, for series, the
  	// series directory entry to process.
  	OneVideoFullPath string
  	// Index is the position of the item in the list being processed.
  	Index int
  	// Wg is the wait group the worker calls Done on when it finishes the item.
  	Wg *sync.WaitGroup
  }