decode.go 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348
  1. package decode
  2. import (
  3. "errors"
  4. "github.com/allanpk716/ChineseSubFinder/internal/common"
  5. "github.com/allanpk716/ChineseSubFinder/internal/pkg/log_helper"
  6. "github.com/allanpk716/ChineseSubFinder/internal/types"
  7. "github.com/beevik/etree"
  8. PTN "github.com/middelink/go-parse-torrent-name"
  9. "io/ioutil"
  10. "os"
  11. "path/filepath"
  12. "regexp"
  13. "strconv"
  14. "strings"
  15. "time"
  16. )
  17. func getImdbAndYearMovieXml(movieFilePath string) (types.VideoIMDBInfo, error) {
  18. videoInfo := types.VideoIMDBInfo{}
  19. doc := etree.NewDocument()
  20. if err := doc.ReadFromFile(movieFilePath); err != nil {
  21. return videoInfo, err
  22. }
  23. for _, t := range doc.FindElements("//IMDB") {
  24. videoInfo.ImdbId = t.Text()
  25. break
  26. }
  27. for _, t := range doc.FindElements("//ProductionYear") {
  28. videoInfo.Year = t.Text()
  29. break
  30. }
  31. if videoInfo.ImdbId != "" {
  32. return videoInfo, nil
  33. }
  34. return videoInfo, common.CanNotFindIMDBID
  35. }
  36. func getImdbAndYearNfo(nfoFilePath string, rootKey string) (types.VideoIMDBInfo, error) {
  37. imdbInfo := types.VideoIMDBInfo{}
  38. doc := etree.NewDocument()
  39. // 这里会遇到一个梗,下面的关键词,可能是小写、大写、首字母大写
  40. // 读取文件转换为全部的小写,然后在解析 xml ? etree 在转换为小写后,某些类型的文件的内容会崩溃···
  41. // 所以这里很傻的方式解决
  42. err := doc.ReadFromFile(nfoFilePath)
  43. if err != nil {
  44. return imdbInfo, err
  45. }
  46. for _, t := range doc.FindElements("./" + rootKey + "/title") {
  47. imdbInfo.Title = t.Text()
  48. break
  49. }
  50. //---------------------------------------------------------------------
  51. for _, t := range doc.FindElements("./" + rootKey + "/imdbid") {
  52. imdbInfo.ImdbId = t.Text()
  53. break
  54. }
  55. for _, t := range doc.FindElements("./" + rootKey + "/imdb_id") {
  56. imdbInfo.ImdbId = t.Text()
  57. break
  58. }
  59. for _, t := range doc.FindElements("//uniqueid[@type='imdb']") {
  60. imdbInfo.ImdbId = t.Text()
  61. break
  62. }
  63. for _, t := range doc.FindElements("//uniqueid[@type='Imdb']") {
  64. imdbInfo.ImdbId = t.Text()
  65. break
  66. }
  67. for _, t := range doc.FindElements("//uniqueid[@type='IMDB']") {
  68. imdbInfo.ImdbId = t.Text()
  69. break
  70. }
  71. //---------------------------------------------------------------------
  72. for _, t := range doc.FindElements("./" + rootKey + "/year") {
  73. imdbInfo.Year = t.Text()
  74. break
  75. }
  76. //---------------------------------------------------------------------
  77. for _, t := range doc.FindElements("./" + rootKey + "/releasedate") {
  78. imdbInfo.ReleaseDate = t.Text()
  79. break
  80. }
  81. //---------------------------------------------------------------------
  82. for _, t := range doc.FindElements("./" + rootKey + "/premiered") {
  83. imdbInfo.ReleaseDate = t.Text()
  84. break
  85. }
  86. if imdbInfo.ImdbId != "" {
  87. return imdbInfo, nil
  88. }
  89. return imdbInfo, common.CanNotFindIMDBID
  90. }
  91. func GetImdbInfo4Movie(movieFileFullPath string) (types.VideoIMDBInfo, error) {
  92. imdbInfo := types.VideoIMDBInfo{}
  93. // movie 当前的目录
  94. dirPth := filepath.Dir(movieFileFullPath)
  95. // 与 movie 文件名一致的 nfo 文件名称
  96. movieNfoFileName := filepath.Base(movieFileFullPath)
  97. movieNfoFileName = strings.ReplaceAll(movieNfoFileName, filepath.Ext(movieFileFullPath), suffixNameNfo)
  98. // movie.xml
  99. movieXmlFPath := ""
  100. // movieName.nfo 文件
  101. movieNameNfoFPath := ""
  102. // 通用的 *.nfo
  103. nfoFilePath := ""
  104. dir, err := ioutil.ReadDir(dirPth)
  105. if err != nil {
  106. return imdbInfo, err
  107. }
  108. for _, fi := range dir {
  109. if fi.IsDir() == true {
  110. continue
  111. }
  112. upperName := strings.ToLower(fi.Name())
  113. if upperName == MetadataMovieXml {
  114. // 找 movie.xml
  115. movieXmlFPath = filepath.Join(dirPth, fi.Name())
  116. break
  117. } else if upperName == movieNfoFileName {
  118. // movieName.nfo 文件
  119. movieNameNfoFPath = filepath.Join(dirPth, fi.Name())
  120. break
  121. } else {
  122. // 找 *.nfo,很可能是 movie.nfo
  123. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  124. if ok {
  125. nfoFilePath = filepath.Join(dirPth, fi.Name())
  126. }
  127. }
  128. }
  129. // 根据找到的开始解析
  130. if movieNameNfoFPath == "" && movieXmlFPath == "" && nfoFilePath == "" {
  131. return imdbInfo, common.NoMetadataFile
  132. }
  133. // 优先分析 movieName.nfo 文件
  134. if movieNameNfoFPath != "" {
  135. imdbInfo, err = getImdbAndYearNfo(movieNameNfoFPath, "movie")
  136. if err != nil {
  137. return types.VideoIMDBInfo{}, err
  138. }
  139. return imdbInfo, nil
  140. }
  141. if movieXmlFPath != "" {
  142. imdbInfo, err = getImdbAndYearMovieXml(movieXmlFPath)
  143. if err != nil {
  144. log_helper.GetLogger().Errorln("getImdbAndYearMovieXml error, move on:", err)
  145. } else {
  146. return imdbInfo, nil
  147. }
  148. }
  149. if nfoFilePath != "" {
  150. imdbInfo, err = getImdbAndYearNfo(nfoFilePath, "movie")
  151. if err != nil {
  152. return imdbInfo, err
  153. } else {
  154. return imdbInfo, nil
  155. }
  156. }
  157. return imdbInfo, common.CanNotFindIMDBID
  158. }
  159. func GetImdbInfo4SeriesDir(seriesDir string) (types.VideoIMDBInfo, error) {
  160. imdbInfo := types.VideoIMDBInfo{}
  161. dir, err := ioutil.ReadDir(seriesDir)
  162. if err != nil {
  163. return imdbInfo, err
  164. }
  165. nfoFilePath := ""
  166. for _, fi := range dir {
  167. if fi.IsDir() == true {
  168. continue
  169. }
  170. upperName := strings.ToUpper(fi.Name())
  171. if upperName == strings.ToUpper(MetadateTVNfo) {
  172. // 连续剧的 nfo 文件
  173. nfoFilePath = filepath.Join(seriesDir, fi.Name())
  174. break
  175. } else {
  176. // 找 *.nfo
  177. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  178. if ok {
  179. nfoFilePath = filepath.Join(seriesDir, fi.Name())
  180. }
  181. }
  182. }
  183. // 根据找到的开始解析
  184. if nfoFilePath == "" {
  185. return imdbInfo, common.NoMetadataFile
  186. }
  187. imdbInfo, err = getImdbAndYearNfo(nfoFilePath, "tvshow")
  188. if err != nil {
  189. return types.VideoIMDBInfo{}, err
  190. }
  191. return imdbInfo, nil
  192. }
  193. func GetImdbInfo4OneSeriesEpisode(oneEpFPath string) (types.VideoIMDBInfo, error) {
  194. // 从这一集的视频文件全路径去推算对应的 nfo 文件是否存在
  195. EPdir := filepath.Dir(oneEpFPath)
  196. // 与 EP 文件名一致的 nfo 文件名称
  197. EpNfoFileName := filepath.Base(oneEpFPath)
  198. EpNfoFileName = strings.ReplaceAll(EpNfoFileName, filepath.Ext(oneEpFPath), suffixNameNfo)
  199. // 全路径
  200. EpNfoFPath := filepath.Join(EPdir, EpNfoFileName)
  201. //
  202. imdbInfo := types.VideoIMDBInfo{}
  203. doc := etree.NewDocument()
  204. // 这里会遇到一个梗,下面的关键词,可能是小写、大写、首字母大写
  205. // 读取文件转换为全部的小写,然后在解析 xml ? etree 在转换为小写后,某些类型的文件的内容会崩溃···
  206. // 所以这里很傻的方式解决
  207. err := doc.ReadFromFile(EpNfoFPath)
  208. if err != nil {
  209. return imdbInfo, err
  210. }
  211. for _, t := range doc.FindElements("./episodedetails/aired") {
  212. imdbInfo.ReleaseDate = t.Text()
  213. break
  214. }
  215. for _, t := range doc.FindElements("./episodedetails/premiered") {
  216. imdbInfo.ReleaseDate = t.Text()
  217. break
  218. }
  219. if imdbInfo.ReleaseDate != "" {
  220. return imdbInfo, nil
  221. }
  222. return imdbInfo, common.CanNotFindEpAiredTime
  223. }
  224. // GetVideoInfoFromFileName 从文件名推断文件信息
  225. func GetVideoInfoFromFileName(fileName string) (*PTN.TorrentInfo, error) {
  226. parse, err := PTN.Parse(fileName)
  227. if err != nil {
  228. return nil, err
  229. }
  230. compile, err := regexp.Compile(regFixTitle2)
  231. if err != nil {
  232. return nil, err
  233. }
  234. match := compile.ReplaceAllString(parse.Title, "")
  235. match = strings.TrimRight(match, "")
  236. parse.Title = match
  237. return parse, nil
  238. }
  239. //GetVideoInfoFromFileFullPath 从全文件路径推断文件信息
  240. func GetVideoInfoFromFileFullPath(videoFileFullPath string) (*PTN.TorrentInfo, time.Time, error) {
  241. parse, err := PTN.Parse(filepath.Base(videoFileFullPath))
  242. if err != nil {
  243. return nil, time.Time{}, err
  244. }
  245. compile, err := regexp.Compile(regFixTitle2)
  246. if err != nil {
  247. return nil, time.Time{}, err
  248. }
  249. match := compile.ReplaceAllString(parse.Title, "")
  250. match = strings.TrimRight(match, "")
  251. parse.Title = match
  252. fInfo, err := os.Stat(videoFileFullPath)
  253. if err != nil {
  254. return nil, time.Time{}, err
  255. }
  256. return parse, fInfo.ModTime(), nil
  257. }
  // Patterns used by GetSeasonAndEpisodeFromSubFileName. They are applied to the
  // upper-cased file name and compiled once instead of on every call.
  var (
  	// ".S02E01." - a single episode.
  	subFileSeasonEpisodeRe = regexp.MustCompile(`\.S(\d+)E(\d+)\.`)
  	// ".S02." - a whole-season pack.
  	subFileSeasonPackRe = regexp.MustCompile(`\.S(\d+)\.`)
  )

  // GetSeasonAndEpisodeFromSubFileName infers season and episode numbers from a
  // file name. Matching is case-insensitive and only the first occurrence of a
  // pattern is used.
  //
  // Return values, in order:
  //   - whether the name denotes a whole-season pack (".S02." without episode);
  //   - the season number;
  //   - the episode number (0 for a season pack);
  //   - an error if a matched number does not fit into an int.
  //
  // Examples:
  //
  //	Killing.Eve.S02E01.Do.You.Know.How -> false, 2, 1, nil
  //	Killing.Eve.S02.Do.You.Know.How    -> true, 2, 0, nil
  //	anything else                      -> false, 0, 0, nil
  func GetSeasonAndEpisodeFromSubFileName(videoFileName string) (bool, int, int, error) {
  	upperName := strings.ToUpper(videoFileName)

  	// Try the single-episode form first. The capture groups consist of ASCII
  	// digits only, so strconv.Atoi can convert them directly.
  	if m := subFileSeasonEpisodeRe.FindStringSubmatch(upperName); m != nil {
  		season, err := strconv.Atoi(m[1])
  		if err != nil {
  			return false, 0, 0, err
  		}
  		episode, err := strconv.Atoi(m[2])
  		if err != nil {
  			return false, 0, 0, err
  		}
  		return false, season, episode, nil
  	}

  	// Otherwise check whether this is a whole-season subtitle pack.
  	if m := subFileSeasonPackRe.FindStringSubmatch(upperName); m != nil {
  		season, err := strconv.Atoi(m[1])
  		if err != nil {
  			return false, 0, 0, err
  		}
  		return true, season, 0, nil
  	}

  	return false, 0, 0, nil
  }
  291. func GetNumber2Float(input string) (float32, error) {
  292. compile := regexp.MustCompile(regGetNumber)
  293. params := compile.FindStringSubmatch(input)
  294. if len(params) == 0 {
  295. return 0, errors.New("get number not match")
  296. }
  297. fNum, err := strconv.ParseFloat(params[0], 32)
  298. if err != nil {
  299. return 0, errors.New("get number ParseFloat error")
  300. }
  301. return float32(fNum), nil
  302. }
  303. func GetNumber2int(input string) (int, error) {
  304. compile := regexp.MustCompile(regGetNumber)
  305. params := compile.FindStringSubmatch(input)
  306. if len(params) == 0 {
  307. return 0, errors.New("get number not match")
  308. }
  309. fNum, err := strconv.Atoi(params[0])
  310. if err != nil {
  311. return 0, errors.New("get number ParseFloat error")
  312. }
  313. return fNum, nil
  314. }
  // Well-known metadata file names, written in lower case.
  const (
  	// MetadataMovieXml is the name of the XML metadata file of a movie.
  	MetadataMovieXml = "movie.xml"
  	// MetadateTVNfo is the name of the series-level nfo file.
  	MetadateTVNfo = "tvshow.nfo"
  )

  // File name suffixes of metadata files.
  const (
  	suffixNameXml = ".xml"
  	suffixNameNfo = ".nfo"
  )

  // Regular expression sources.
  const (
  	// regFixTitle matches every character that is neither in the range
  	// U+4E00..U+9FA5 (Chinese characters), an ASCII letter, a digit nor
  	// whitespace; it is meant for stripping special characters.
  	regFixTitle = "[^\u4e00-\u9fa5a-zA-Z0-9\\s]"
  	// regFixTitle2 strips special characters by listing them all explicitly.
  	regFixTitle2 = "[~!@#$%^&*()\\+\\-=|{}';'\\[\\].<>/?~!@#¥%……&*()——+|{}【】';”“’。、?]"
  	// regGetNumber matches a number: optional leading minus sign, one or more
  	// digits and an optional fractional part.
  	regGetNumber = "(?:\\-)?\\d{1,}(?:\\.\\d{1,})?"
  )