decode.go 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391
  1. package decode
  2. import (
  3. "errors"
  4. "github.com/allanpk716/ChineseSubFinder/internal/common"
  5. "github.com/allanpk716/ChineseSubFinder/internal/pkg/log_helper"
  6. "github.com/allanpk716/ChineseSubFinder/internal/types"
  7. "github.com/beevik/etree"
  8. PTN "github.com/middelink/go-parse-torrent-name"
  9. "os"
  10. "path/filepath"
  11. "regexp"
  12. "strconv"
  13. "strings"
  14. "time"
  15. )
  16. func getImdbAndYearMovieXml(movieFilePath string) (types.VideoIMDBInfo, error) {
  17. videoInfo := types.VideoIMDBInfo{}
  18. doc := etree.NewDocument()
  19. doc.ReadSettings.Permissive = true
  20. if err := doc.ReadFromFile(movieFilePath); err != nil {
  21. return videoInfo, err
  22. }
  23. for _, t := range doc.FindElements("//IMDB") {
  24. videoInfo.ImdbId = t.Text()
  25. break
  26. }
  27. for _, t := range doc.FindElements("//ProductionYear") {
  28. videoInfo.Year = t.Text()
  29. break
  30. }
  31. if videoInfo.ImdbId != "" {
  32. return videoInfo, nil
  33. }
  34. return videoInfo, common.CanNotFindIMDBID
  35. }
  36. func getImdbAndYearNfo(nfoFilePath string, rootKey string) (types.VideoIMDBInfo, error) {
  37. imdbInfo := types.VideoIMDBInfo{}
  38. doc := etree.NewDocument()
  39. doc.ReadSettings.Permissive = true
  40. // 这里会遇到一个梗,下面的关键词,可能是小写、大写、首字母大写
  41. // 读取文件转换为全部的小写,然后在解析 xml ? etree 在转换为小写后,某些类型的文件的内容会崩溃···
  42. // 所以这里很傻的方式解决
  43. err := doc.ReadFromFile(nfoFilePath)
  44. if err != nil {
  45. return imdbInfo, err
  46. }
  47. for _, t := range doc.FindElements("./" + rootKey + "/title") {
  48. imdbInfo.Title = t.Text()
  49. break
  50. }
  51. //---------------------------------------------------------------------
  52. for _, t := range doc.FindElements("./" + rootKey + "/imdbid") {
  53. imdbInfo.ImdbId = t.Text()
  54. break
  55. }
  56. for _, t := range doc.FindElements("./" + rootKey + "/imdb_id") {
  57. imdbInfo.ImdbId = t.Text()
  58. break
  59. }
  60. for _, t := range doc.FindElements("//uniqueid[@type='imdb']") {
  61. imdbInfo.ImdbId = t.Text()
  62. break
  63. }
  64. for _, t := range doc.FindElements("//uniqueid[@type='Imdb']") {
  65. imdbInfo.ImdbId = t.Text()
  66. break
  67. }
  68. for _, t := range doc.FindElements("//uniqueid[@type='IMDB']") {
  69. imdbInfo.ImdbId = t.Text()
  70. break
  71. }
  72. //---------------------------------------------------------------------
  73. for _, t := range doc.FindElements("./" + rootKey + "/year") {
  74. imdbInfo.Year = t.Text()
  75. break
  76. }
  77. //---------------------------------------------------------------------
  78. for _, t := range doc.FindElements("./" + rootKey + "/releasedate") {
  79. imdbInfo.ReleaseDate = t.Text()
  80. break
  81. }
  82. //---------------------------------------------------------------------
  83. for _, t := range doc.FindElements("./" + rootKey + "/premiered") {
  84. imdbInfo.ReleaseDate = t.Text()
  85. break
  86. }
  87. if imdbInfo.ImdbId != "" {
  88. return imdbInfo, nil
  89. }
  90. return imdbInfo, common.CanNotFindIMDBID
  91. }
  92. // GetImdbInfo4Movie 从电影视频文件获取 IMDB info
  93. func GetImdbInfo4Movie(movieFileFullPath string) (types.VideoIMDBInfo, error) {
  94. imdbInfo := types.VideoIMDBInfo{}
  95. // movie 当前的目录
  96. dirPth := filepath.Dir(movieFileFullPath)
  97. // 与 movie 文件名一致的 nfo 文件名称
  98. movieNfoFileName := filepath.Base(movieFileFullPath)
  99. movieNfoFileName = strings.ReplaceAll(movieNfoFileName, filepath.Ext(movieFileFullPath), suffixNameNfo)
  100. // movie.xml
  101. movieXmlFPath := ""
  102. // movieName.nfo 文件
  103. movieNameNfoFPath := ""
  104. // 通用的 *.nfo
  105. nfoFilePath := ""
  106. dir, err := os.ReadDir(dirPth)
  107. if err != nil {
  108. return imdbInfo, err
  109. }
  110. for _, fi := range dir {
  111. if fi.IsDir() == true {
  112. continue
  113. }
  114. upperName := strings.ToLower(fi.Name())
  115. if upperName == MetadataMovieXml {
  116. // 找 movie.xml
  117. movieXmlFPath = filepath.Join(dirPth, fi.Name())
  118. break
  119. } else if upperName == movieNfoFileName {
  120. // movieName.nfo 文件
  121. movieNameNfoFPath = filepath.Join(dirPth, fi.Name())
  122. break
  123. } else {
  124. // 找 *.nfo,很可能是 movie.nfo
  125. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  126. if ok {
  127. nfoFilePath = filepath.Join(dirPth, fi.Name())
  128. }
  129. }
  130. }
  131. // 根据找到的开始解析
  132. if movieNameNfoFPath == "" && movieXmlFPath == "" && nfoFilePath == "" {
  133. return imdbInfo, common.NoMetadataFile
  134. }
  135. // 优先分析 movieName.nfo 文件
  136. if movieNameNfoFPath != "" {
  137. imdbInfo, err = getImdbAndYearNfo(movieNameNfoFPath, "movie")
  138. if err != nil {
  139. return types.VideoIMDBInfo{}, err
  140. }
  141. return imdbInfo, nil
  142. }
  143. if movieXmlFPath != "" {
  144. imdbInfo, err = getImdbAndYearMovieXml(movieXmlFPath)
  145. if err != nil {
  146. log_helper.GetLogger().Errorln("getImdbAndYearMovieXml error, move on:", err)
  147. } else {
  148. return imdbInfo, nil
  149. }
  150. }
  151. if nfoFilePath != "" {
  152. imdbInfo, err = getImdbAndYearNfo(nfoFilePath, "movie")
  153. if err != nil {
  154. return imdbInfo, err
  155. } else {
  156. return imdbInfo, nil
  157. }
  158. }
  159. return imdbInfo, common.CanNotFindIMDBID
  160. }
  161. // GetImdbInfo4SeriesDir 从一个连续剧的根目录获取 IMDB info
  162. func GetImdbInfo4SeriesDir(seriesDir string) (types.VideoIMDBInfo, error) {
  163. imdbInfo := types.VideoIMDBInfo{}
  164. dir, err := os.ReadDir(seriesDir)
  165. if err != nil {
  166. return imdbInfo, err
  167. }
  168. nfoFilePath := ""
  169. for _, fi := range dir {
  170. if fi.IsDir() == true {
  171. continue
  172. }
  173. upperName := strings.ToUpper(fi.Name())
  174. if upperName == strings.ToUpper(MetadateTVNfo) {
  175. // 连续剧的 nfo 文件
  176. nfoFilePath = filepath.Join(seriesDir, fi.Name())
  177. break
  178. } else {
  179. // 找 *.nfo
  180. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  181. if ok {
  182. nfoFilePath = filepath.Join(seriesDir, fi.Name())
  183. }
  184. }
  185. }
  186. // 根据找到的开始解析
  187. if nfoFilePath == "" {
  188. return imdbInfo, common.NoMetadataFile
  189. }
  190. imdbInfo, err = getImdbAndYearNfo(nfoFilePath, "tvshow")
  191. if err != nil {
  192. return types.VideoIMDBInfo{}, err
  193. }
  194. return imdbInfo, nil
  195. }
  196. // GetSeriesImdbInfoFromEpisode 从一集获取这个 Series 的 IMDB info
  197. func GetSeriesImdbInfoFromEpisode(oneEpFPath string) (types.VideoIMDBInfo, error) {
  198. var err error
  199. // 当前季的路径
  200. EPdir := filepath.Dir(oneEpFPath)
  201. // 先判断是否存在 tvshow.nfo
  202. nfoFilePath := ""
  203. dir, err := os.ReadDir(EPdir)
  204. for _, fi := range dir {
  205. if fi.IsDir() == true {
  206. continue
  207. }
  208. upperName := strings.ToUpper(fi.Name())
  209. if upperName == strings.ToUpper(MetadateTVNfo) {
  210. // 连续剧的 nfo 文件
  211. nfoFilePath = filepath.Join(EPdir, fi.Name())
  212. break
  213. }
  214. }
  215. if nfoFilePath == "" {
  216. // 没有找到,那么就向上一级再次找
  217. seasonDir := filepath.Base(EPdir)
  218. seriesDir := EPdir[:len(EPdir)-len(seasonDir)]
  219. return GetImdbInfo4SeriesDir(seriesDir)
  220. } else {
  221. var imdbInfo types.VideoIMDBInfo
  222. imdbInfo, err = getImdbAndYearNfo(nfoFilePath, "tvshow")
  223. if err != nil {
  224. return types.VideoIMDBInfo{}, err
  225. }
  226. return imdbInfo, nil
  227. }
  228. }
  229. // GetImdbInfo4OneSeriesEpisode 获取这一集的 IMDB info
  230. func GetImdbInfo4OneSeriesEpisode(oneEpFPath string) (types.VideoIMDBInfo, error) {
  231. // 从这一集的视频文件全路径去推算对应的 nfo 文件是否存在
  232. EPdir := filepath.Dir(oneEpFPath)
  233. // 与 EP 文件名一致的 nfo 文件名称
  234. EpNfoFileName := filepath.Base(oneEpFPath)
  235. EpNfoFileName = strings.ReplaceAll(EpNfoFileName, filepath.Ext(oneEpFPath), suffixNameNfo)
  236. // 全路径
  237. EpNfoFPath := filepath.Join(EPdir, EpNfoFileName)
  238. //
  239. imdbInfo := types.VideoIMDBInfo{}
  240. doc := etree.NewDocument()
  241. doc.ReadSettings.Permissive = true
  242. // 这里会遇到一个梗,下面的关键词,可能是小写、大写、首字母大写
  243. // 读取文件转换为全部的小写,然后在解析 xml ? etree 在转换为小写后,某些类型的文件的内容会崩溃···
  244. // 所以这里很傻的方式解决
  245. err := doc.ReadFromFile(EpNfoFPath)
  246. if err != nil {
  247. return imdbInfo, err
  248. }
  249. for _, t := range doc.FindElements("./episodedetails/aired") {
  250. imdbInfo.ReleaseDate = t.Text()
  251. break
  252. }
  253. for _, t := range doc.FindElements("./episodedetails/premiered") {
  254. imdbInfo.ReleaseDate = t.Text()
  255. break
  256. }
  257. if imdbInfo.ReleaseDate != "" {
  258. return imdbInfo, nil
  259. }
  260. return imdbInfo, common.CanNotFindEpAiredTime
  261. }
  262. // GetVideoInfoFromFileName 从文件名推断文件信息
  263. func GetVideoInfoFromFileName(fileName string) (*PTN.TorrentInfo, error) {
  264. parse, err := PTN.Parse(fileName)
  265. if err != nil {
  266. return nil, err
  267. }
  268. compile, err := regexp.Compile(regFixTitle2)
  269. if err != nil {
  270. return nil, err
  271. }
  272. match := compile.ReplaceAllString(parse.Title, "")
  273. match = strings.TrimRight(match, "")
  274. parse.Title = match
  275. return parse, nil
  276. }
  277. //GetVideoInfoFromFileFullPath 从全文件路径推断文件信息
  278. func GetVideoInfoFromFileFullPath(videoFileFullPath string) (*PTN.TorrentInfo, time.Time, error) {
  279. parse, err := PTN.Parse(filepath.Base(videoFileFullPath))
  280. if err != nil {
  281. return nil, time.Time{}, err
  282. }
  283. compile, err := regexp.Compile(regFixTitle2)
  284. if err != nil {
  285. return nil, time.Time{}, err
  286. }
  287. match := compile.ReplaceAllString(parse.Title, "")
  288. match = strings.TrimRight(match, "")
  289. parse.Title = match
  290. fInfo, err := os.Stat(videoFileFullPath)
  291. if err != nil {
  292. return nil, time.Time{}, err
  293. }
  294. return parse, fInfo.ModTime(), nil
  295. }
  296. // GetSeasonAndEpisodeFromSubFileName 从文件名推断 季 和 集 的信息 Season Episode
  297. func GetSeasonAndEpisodeFromSubFileName(videoFileName string) (bool, int, int, error) {
  298. upperName := strings.ToUpper(videoFileName)
  299. // 先进行单个 Episode 的匹配
  300. // Killing.Eve.S02E01.Do.You.Know.How
  301. var re = regexp.MustCompile(`(?m)\.S(\d+)E(\d+)\.`)
  302. matched := re.FindAllStringSubmatch(upperName, -1)
  303. if matched == nil || len(matched) < 1 {
  304. // Killing.Eve.S02.Do.You.Know.How
  305. // 看看是不是季度字幕打包
  306. re = regexp.MustCompile(`(?m)\.S(\d+)\.`)
  307. matched = re.FindAllStringSubmatch(upperName, -1)
  308. if matched == nil || len(matched) < 1 {
  309. return false, 0, 0, nil
  310. }
  311. season, err := GetNumber2int(matched[0][1])
  312. if err != nil {
  313. return false, 0, 0, err
  314. }
  315. return true, season, 0, nil
  316. } else {
  317. // 一集的字幕
  318. season, err := GetNumber2int(matched[0][1])
  319. if err != nil {
  320. return false, 0, 0, err
  321. }
  322. episode, err := GetNumber2int(matched[0][2])
  323. if err != nil {
  324. return false, 0, 0, err
  325. }
  326. return false, season, episode, nil
  327. }
  328. }
  329. func GetNumber2Float(input string) (float32, error) {
  330. compile := regexp.MustCompile(regGetNumber)
  331. params := compile.FindStringSubmatch(input)
  332. if params == nil || len(params) == 0 {
  333. return 0, errors.New("get number not match")
  334. }
  335. fNum, err := strconv.ParseFloat(params[0], 32)
  336. if err != nil {
  337. return 0, errors.New("get number ParseFloat error")
  338. }
  339. return float32(fNum), nil
  340. }
  341. func GetNumber2int(input string) (int, error) {
  342. compile := regexp.MustCompile(regGetNumber)
  343. params := compile.FindStringSubmatch(input)
  344. if params == nil || len(params) == 0 {
  345. return 0, errors.New("get number not match")
  346. }
  347. fNum, err := strconv.Atoi(params[0])
  348. if err != nil {
  349. return 0, errors.New("get number ParseFloat error")
  350. }
  351. return fNum, nil
  352. }
const (
	// MetadataMovieXml is the file name of the movie.xml metadata file; it is
	// compared against lower-cased directory entry names.
	MetadataMovieXml = "movie.xml"
	// suffixNameXml is the ".xml" file extension.
	suffixNameXml = ".xml"
	// suffixNameNfo is the ".nfo" file extension used for metadata files.
	suffixNameNfo = ".nfo"
	// MetadateTVNfo is the file name of the series-level nfo metadata file; it
	// is compared case-insensitively against directory entry names.
	MetadateTVNfo = "tvshow.nfo"
	// regFixTitle matches any character that is NOT a CJK ideograph in
	// U+4E00-U+9FA5, an ASCII letter, a digit or whitespace, i.e. it can be
	// used to strip special characters.
	regFixTitle = "[^\u4e00-\u9fa5a-zA-Z0-9\\s]"
	// regFixTitle2 strips special characters by listing them explicitly in one
	// character class (ASCII and Chinese punctuation).
	regFixTitle2 = "[~!@#$%^&*()\\+\\-=|{}';'\\[\\].<>/?~!@#¥%……&*()——+|{}【】';”“’。、?]"
	// regGetNumber matches a number: an optional minus sign, one or more
	// digits and an optional fractional part.
	regGetNumber = "(?:\\-)?\\d{1,}(?:\\.\\d{1,})?"
)