decode.go 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349
  1. package decode
  2. import (
  3. "errors"
  4. "github.com/allanpk716/ChineseSubFinder/internal/common"
  5. "github.com/allanpk716/ChineseSubFinder/internal/pkg/log_helper"
  6. "github.com/allanpk716/ChineseSubFinder/internal/types"
  7. "github.com/beevik/etree"
  8. PTN "github.com/middelink/go-parse-torrent-name"
  9. "io/ioutil"
  10. "os"
  11. "path"
  12. "path/filepath"
  13. "regexp"
  14. "strconv"
  15. "strings"
  16. "time"
  17. )
  18. func getImdbAndYearMovieXml(movieFilePath string) (types.VideoIMDBInfo, error) {
  19. videoInfo := types.VideoIMDBInfo{}
  20. doc := etree.NewDocument()
  21. if err := doc.ReadFromFile(movieFilePath); err != nil {
  22. return videoInfo, err
  23. }
  24. for _, t := range doc.FindElements("//IMDB") {
  25. videoInfo.ImdbId = t.Text()
  26. break
  27. }
  28. for _, t := range doc.FindElements("//ProductionYear") {
  29. videoInfo.Year = t.Text()
  30. break
  31. }
  32. if videoInfo.ImdbId != "" {
  33. return videoInfo, nil
  34. }
  35. return videoInfo, common.CanNotFindIMDBID
  36. }
  37. func getImdbAndYearNfo(nfoFilePath string, rootKey string) (types.VideoIMDBInfo, error) {
  38. imdbInfo := types.VideoIMDBInfo{}
  39. doc := etree.NewDocument()
  40. // 这里会遇到一个梗,下面的关键词,可能是小写、大写、首字母大写
  41. // 读取文件转换为全部的小写,然后在解析 xml ? etree 在转换为小写后,某些类型的文件的内容会崩溃···
  42. // 所以这里很傻的方式解决
  43. err := doc.ReadFromFile(nfoFilePath)
  44. if err != nil {
  45. return imdbInfo, err
  46. }
  47. for _, t := range doc.FindElements("./" + rootKey + "/title") {
  48. imdbInfo.Title = t.Text()
  49. break
  50. }
  51. //---------------------------------------------------------------------
  52. for _, t := range doc.FindElements("./" + rootKey + "/imdbid") {
  53. imdbInfo.ImdbId = t.Text()
  54. break
  55. }
  56. for _, t := range doc.FindElements("./" + rootKey + "/imdb_id") {
  57. imdbInfo.ImdbId = t.Text()
  58. break
  59. }
  60. for _, t := range doc.FindElements("//uniqueid[@type='imdb']") {
  61. imdbInfo.ImdbId = t.Text()
  62. break
  63. }
  64. for _, t := range doc.FindElements("//uniqueid[@type='Imdb']") {
  65. imdbInfo.ImdbId = t.Text()
  66. break
  67. }
  68. for _, t := range doc.FindElements("//uniqueid[@type='IMDB']") {
  69. imdbInfo.ImdbId = t.Text()
  70. break
  71. }
  72. //---------------------------------------------------------------------
  73. for _, t := range doc.FindElements("./" + rootKey + "/year") {
  74. imdbInfo.Year = t.Text()
  75. break
  76. }
  77. //---------------------------------------------------------------------
  78. for _, t := range doc.FindElements("./" + rootKey + "/releasedate") {
  79. imdbInfo.ReleaseDate = t.Text()
  80. break
  81. }
  82. //---------------------------------------------------------------------
  83. for _, t := range doc.FindElements("./" + rootKey + "/premiered") {
  84. imdbInfo.ReleaseDate = t.Text()
  85. break
  86. }
  87. if imdbInfo.ImdbId != "" {
  88. return imdbInfo, nil
  89. }
  90. return imdbInfo, common.CanNotFindIMDBID
  91. }
  92. func GetImdbInfo4Movie(movieFileFullPath string) (types.VideoIMDBInfo, error) {
  93. imdbInfo := types.VideoIMDBInfo{}
  94. // movie 当前的目录
  95. dirPth := filepath.Dir(movieFileFullPath)
  96. // 与 movie 文件名一致的 nfo 文件名称
  97. movieNfoFileName := filepath.Base(movieFileFullPath)
  98. movieNfoFileName = strings.ReplaceAll(movieNfoFileName, filepath.Ext(movieFileFullPath), suffixNameNfo)
  99. // movie.xml
  100. movieXmlFPath := ""
  101. // movieName.nfo 文件
  102. movieNameNfoFPath := ""
  103. // 通用的 *.nfo
  104. nfoFilePath := ""
  105. dir, err := ioutil.ReadDir(dirPth)
  106. if err != nil {
  107. return imdbInfo, err
  108. }
  109. for _, fi := range dir {
  110. if fi.IsDir() == true {
  111. continue
  112. }
  113. upperName := strings.ToLower(fi.Name())
  114. if upperName == MetadataMovieXml {
  115. // 找 movie.xml
  116. movieXmlFPath = path.Join(dirPth, fi.Name())
  117. break
  118. } else if upperName == movieNfoFileName {
  119. // movieName.nfo 文件
  120. movieNameNfoFPath = path.Join(dirPth, fi.Name())
  121. break
  122. } else {
  123. // 找 *.nfo,很可能是 movie.nfo
  124. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  125. if ok {
  126. nfoFilePath = path.Join(dirPth, fi.Name())
  127. }
  128. }
  129. }
  130. // 根据找到的开始解析
  131. if movieNameNfoFPath == "" && movieXmlFPath == "" && nfoFilePath == "" {
  132. return imdbInfo, common.NoMetadataFile
  133. }
  134. // 优先分析 movieName.nfo 文件
  135. if movieNameNfoFPath != "" {
  136. imdbInfo, err = getImdbAndYearNfo(movieNameNfoFPath, "movie")
  137. if err != nil {
  138. return types.VideoIMDBInfo{}, err
  139. }
  140. return imdbInfo, nil
  141. }
  142. if movieXmlFPath != "" {
  143. imdbInfo, err = getImdbAndYearMovieXml(movieXmlFPath)
  144. if err != nil {
  145. log_helper.GetLogger().Errorln("getImdbAndYearMovieXml error, move on:", err)
  146. } else {
  147. return imdbInfo, nil
  148. }
  149. }
  150. if nfoFilePath != "" {
  151. imdbInfo, err = getImdbAndYearNfo(nfoFilePath, "movie")
  152. if err != nil {
  153. return imdbInfo, err
  154. } else {
  155. return imdbInfo, nil
  156. }
  157. }
  158. return imdbInfo, common.CanNotFindIMDBID
  159. }
  160. func GetImdbInfo4SeriesDir(seriesDir string) (types.VideoIMDBInfo, error) {
  161. imdbInfo := types.VideoIMDBInfo{}
  162. dir, err := ioutil.ReadDir(seriesDir)
  163. if err != nil {
  164. return imdbInfo, err
  165. }
  166. nfoFilePath := ""
  167. for _, fi := range dir {
  168. if fi.IsDir() == true {
  169. continue
  170. }
  171. upperName := strings.ToUpper(fi.Name())
  172. if upperName == strings.ToUpper(MetadateTVNfo) {
  173. // 连续剧的 nfo 文件
  174. nfoFilePath = path.Join(seriesDir, fi.Name())
  175. break
  176. } else {
  177. // 找 *.nfo
  178. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  179. if ok {
  180. nfoFilePath = path.Join(seriesDir, fi.Name())
  181. }
  182. }
  183. }
  184. // 根据找到的开始解析
  185. if nfoFilePath == "" {
  186. return imdbInfo, common.NoMetadataFile
  187. }
  188. imdbInfo, err = getImdbAndYearNfo(nfoFilePath, "tvshow")
  189. if err != nil {
  190. return types.VideoIMDBInfo{}, err
  191. }
  192. return imdbInfo, nil
  193. }
  194. func GetImdbInfo4OneSeriesEpisode(oneEpFPath string) (types.VideoIMDBInfo, error) {
  195. // 从这一集的视频文件全路径去推算对应的 nfo 文件是否存在
  196. EPdir := filepath.Dir(oneEpFPath)
  197. // 与 EP 文件名一致的 nfo 文件名称
  198. EpNfoFileName := filepath.Base(oneEpFPath)
  199. EpNfoFileName = strings.ReplaceAll(EpNfoFileName, filepath.Ext(oneEpFPath), suffixNameNfo)
  200. // 全路径
  201. EpNfoFPath := path.Join(EPdir, EpNfoFileName)
  202. //
  203. imdbInfo := types.VideoIMDBInfo{}
  204. doc := etree.NewDocument()
  205. // 这里会遇到一个梗,下面的关键词,可能是小写、大写、首字母大写
  206. // 读取文件转换为全部的小写,然后在解析 xml ? etree 在转换为小写后,某些类型的文件的内容会崩溃···
  207. // 所以这里很傻的方式解决
  208. err := doc.ReadFromFile(EpNfoFPath)
  209. if err != nil {
  210. return imdbInfo, err
  211. }
  212. for _, t := range doc.FindElements("./episodedetails/aired") {
  213. imdbInfo.ReleaseDate = t.Text()
  214. break
  215. }
  216. for _, t := range doc.FindElements("./episodedetails/premiered") {
  217. imdbInfo.ReleaseDate = t.Text()
  218. break
  219. }
  220. if imdbInfo.ReleaseDate != "" {
  221. return imdbInfo, nil
  222. }
  223. return imdbInfo, common.CanNotFindEpAiredTime
  224. }
  225. // GetVideoInfoFromFileName 从文件名推断文件信息
  226. func GetVideoInfoFromFileName(fileName string) (*PTN.TorrentInfo, error) {
  227. parse, err := PTN.Parse(fileName)
  228. if err != nil {
  229. return nil, err
  230. }
  231. compile, err := regexp.Compile(regFixTitle2)
  232. if err != nil {
  233. return nil, err
  234. }
  235. match := compile.ReplaceAllString(parse.Title, "")
  236. match = strings.TrimRight(match, "")
  237. parse.Title = match
  238. return parse, nil
  239. }
  240. //GetVideoInfoFromFileFullPath 从全文件路径推断文件信息
  241. func GetVideoInfoFromFileFullPath(videoFileFullPath string) (*PTN.TorrentInfo, time.Time, error) {
  242. parse, err := PTN.Parse(filepath.Base(videoFileFullPath))
  243. if err != nil {
  244. return nil, time.Time{}, err
  245. }
  246. compile, err := regexp.Compile(regFixTitle2)
  247. if err != nil {
  248. return nil, time.Time{}, err
  249. }
  250. match := compile.ReplaceAllString(parse.Title, "")
  251. match = strings.TrimRight(match, "")
  252. parse.Title = match
  253. fInfo, err := os.Stat(videoFileFullPath)
  254. if err != nil {
  255. return nil, time.Time{}, err
  256. }
  257. return parse, fInfo.ModTime(), nil
  258. }
  259. // GetSeasonAndEpisodeFromSubFileName 从文件名推断 季 和 集 的信息 Season Episode
  260. func GetSeasonAndEpisodeFromSubFileName(videoFileName string) (bool, int, int, error) {
  261. upperName := strings.ToUpper(videoFileName)
  262. // 先进行单个 Episode 的匹配
  263. // Killing.Eve.S02E01.Do.You.Know.How
  264. var re = regexp.MustCompile(`(?m)\.S(\d+)E(\d+)\.`)
  265. matched := re.FindAllStringSubmatch(upperName, -1)
  266. if len(matched) < 1 {
  267. // Killing.Eve.S02.Do.You.Know.How
  268. // 看看是不是季度字幕打包
  269. re = regexp.MustCompile(`(?m)\.S(\d+)\.`)
  270. matched = re.FindAllStringSubmatch(upperName, -1)
  271. if len(matched) < 1 {
  272. return false, 0, 0, nil
  273. }
  274. season, err := GetNumber2int(matched[0][1])
  275. if err != nil {
  276. return false, 0, 0, err
  277. }
  278. return true, season, 0, nil
  279. } else {
  280. // 一集的字幕
  281. season, err := GetNumber2int(matched[0][1])
  282. if err != nil {
  283. return false, 0, 0, err
  284. }
  285. episode, err := GetNumber2int(matched[0][2])
  286. if err != nil {
  287. return false, 0, 0, err
  288. }
  289. return false, season, episode, nil
  290. }
  291. }
  292. func GetNumber2Float(input string) (float32, error) {
  293. compile := regexp.MustCompile(regGetNumber)
  294. params := compile.FindStringSubmatch(input)
  295. if len(params) == 0 {
  296. return 0, errors.New("get number not match")
  297. }
  298. fNum, err := strconv.ParseFloat(params[0], 32)
  299. if err != nil {
  300. return 0, errors.New("get number ParseFloat error")
  301. }
  302. return float32(fNum), nil
  303. }
  304. func GetNumber2int(input string) (int, error) {
  305. compile := regexp.MustCompile(regGetNumber)
  306. params := compile.FindStringSubmatch(input)
  307. if len(params) == 0 {
  308. return 0, errors.New("get number not match")
  309. }
  310. fNum, err := strconv.Atoi(params[0])
  311. if err != nil {
  312. return 0, errors.New("get number ParseFloat error")
  313. }
  314. return fNum, nil
  315. }
  316. const (
  317. MetadataMovieXml = "movie.xml"
  318. suffixNameXml = ".xml"
  319. suffixNameNfo = ".nfo"
  320. MetadateTVNfo = "tvshow.nfo"
  321. // 去除特殊字符,仅仅之有中文
  322. regFixTitle = "[^\u4e00-\u9fa5a-zA-Z0-9\\s]"
  323. // 去除特殊字符,把特殊字符都写进去
  324. regFixTitle2 = "[~!@#$%^&*()\\+\\-=|{}';'\\[\\].<>/?~!@#¥%……&*()——+|{}【】';”“’。、?]"
  325. // 获取数字
  326. regGetNumber = "(?:\\-)?\\d{1,}(?:\\.\\d{1,})?"
  327. )