decode.go 9.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344
  1. package model
  2. import (
  3. "errors"
  4. "github.com/allanpk716/ChineseSubFinder/common"
  5. "github.com/beevik/etree"
  6. PTN "github.com/middelink/go-parse-torrent-name"
  7. "io/ioutil"
  8. "os"
  9. "path"
  10. "path/filepath"
  11. "regexp"
  12. "strconv"
  13. "strings"
  14. "time"
  15. )
  16. func getImdbAndYearMovieXml(movieFilePath string) (common.VideoIMDBInfo, error) {
  17. videoInfo := common.VideoIMDBInfo{}
  18. doc := etree.NewDocument()
  19. if err := doc.ReadFromFile(movieFilePath); err != nil {
  20. return videoInfo, err
  21. }
  22. for _, t := range doc.FindElements("//IMDB") {
  23. videoInfo.ImdbId = t.Text()
  24. break
  25. }
  26. for _, t := range doc.FindElements("//ProductionYear") {
  27. videoInfo.Year = t.Text()
  28. break
  29. }
  30. if videoInfo.ImdbId != "" {
  31. return videoInfo, nil
  32. }
  33. return videoInfo, common.CanNotFindIMDBID
  34. }
  35. func getImdbAndYearNfo(nfoFilePath string, rootKey string) (common.VideoIMDBInfo, error) {
  36. imdbInfo := common.VideoIMDBInfo{}
  37. doc := etree.NewDocument()
  38. // 这里会遇到一个梗,下面的关键词,可能是小写、大写、首字母大写
  39. // 读取文件转换为全部的小写,然后在解析 xml ? etree 在转换为小写后,某些类型的文件的内容会崩溃···
  40. // 所以这里很傻的方式解决
  41. err := doc.ReadFromFile(nfoFilePath)
  42. if err != nil {
  43. return imdbInfo, err
  44. }
  45. for _, t := range doc.FindElements("./" + rootKey +"/title") {
  46. imdbInfo.Title = t.Text()
  47. break
  48. }
  49. //---------------------------------------------------------------------
  50. for _, t := range doc.FindElements("./" + rootKey +"/imdb_id") {
  51. imdbInfo.ImdbId = t.Text()
  52. break
  53. }
  54. for _, t := range doc.FindElements("//uniqueid[@type='imdb']") {
  55. imdbInfo.ImdbId = t.Text()
  56. break
  57. }
  58. for _, t := range doc.FindElements("//uniqueid[@type='Imdb']") {
  59. imdbInfo.ImdbId = t.Text()
  60. break
  61. }
  62. for _, t := range doc.FindElements("//uniqueid[@type='IMDB']") {
  63. imdbInfo.ImdbId = t.Text()
  64. break
  65. }
  66. //---------------------------------------------------------------------
  67. for _, t := range doc.FindElements("./" + rootKey +"/year") {
  68. imdbInfo.Year = t.Text()
  69. break
  70. }
  71. //---------------------------------------------------------------------
  72. for _, t := range doc.FindElements("./" + rootKey + "/releasedate") {
  73. imdbInfo.ReleaseDate = t.Text()
  74. break
  75. }
  76. //---------------------------------------------------------------------
  77. for _, t := range doc.FindElements("./" + rootKey + "/premiered") {
  78. imdbInfo.ReleaseDate = t.Text()
  79. break
  80. }
  81. if imdbInfo.ImdbId != "" {
  82. return imdbInfo, nil
  83. }
  84. return imdbInfo, common.CanNotFindIMDBID
  85. }
  86. func GetImdbInfo4Movie(movieFileFullPath string) (common.VideoIMDBInfo, error) {
  87. imdbInfo := common.VideoIMDBInfo{}
  88. // movie 当前的目录
  89. dirPth := filepath.Dir(movieFileFullPath)
  90. // 与 movie 文件名一致的 nfo 文件名称
  91. movieNfoFileName := filepath.Base(movieFileFullPath)
  92. movieNfoFileName = strings.ReplaceAll(movieNfoFileName, filepath.Ext(movieFileFullPath), suffixNameNfo)
  93. // movie.xml
  94. movieXmlFPath := ""
  95. // movieName.nfo 文件
  96. movieNameNfoFPath := ""
  97. // 通用的 *.nfo
  98. nfoFilePath := ""
  99. dir, err := ioutil.ReadDir(dirPth)
  100. if err != nil {
  101. return imdbInfo, err
  102. }
  103. for _, fi := range dir {
  104. if fi.IsDir() == true {
  105. continue
  106. }
  107. upperName := strings.ToLower(fi.Name())
  108. if upperName == MetadataMovieXml {
  109. // 找 movie.xml
  110. movieXmlFPath = path.Join(dirPth, fi.Name())
  111. break
  112. } else if upperName == movieNfoFileName {
  113. // movieName.nfo 文件
  114. movieNameNfoFPath = path.Join(dirPth, fi.Name())
  115. break
  116. } else {
  117. // 找 *.nfo,很可能是 movie.nfo
  118. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  119. if ok {
  120. nfoFilePath = path.Join(dirPth, fi.Name())
  121. }
  122. }
  123. }
  124. // 根据找到的开始解析
  125. if movieNameNfoFPath == "" && movieXmlFPath == "" && nfoFilePath == "" {
  126. return imdbInfo, common.NoMetadataFile
  127. }
  128. // 优先分析 movieName.nfo 文件
  129. if movieNameNfoFPath != "" {
  130. imdbInfo, err = getImdbAndYearNfo(movieNameNfoFPath, "movie")
  131. if err != nil {
  132. return common.VideoIMDBInfo{}, err
  133. }
  134. return imdbInfo, nil
  135. }
  136. if movieXmlFPath != "" {
  137. imdbInfo, err = getImdbAndYearMovieXml(movieXmlFPath)
  138. if err != nil {
  139. GetLogger().Errorln("getImdbAndYearMovieXml error, move on:", err)
  140. } else {
  141. return imdbInfo, nil
  142. }
  143. }
  144. if nfoFilePath != "" {
  145. imdbInfo, err = getImdbAndYearNfo(nfoFilePath, "movie")
  146. if err != nil {
  147. return imdbInfo, err
  148. } else {
  149. return imdbInfo, nil
  150. }
  151. }
  152. return imdbInfo, common.CanNotFindIMDBID
  153. }
  154. func GetImdbInfo4SeriesDir(seriesDir string) (common.VideoIMDBInfo, error) {
  155. imdbInfo := common.VideoIMDBInfo{}
  156. dir, err := ioutil.ReadDir(seriesDir)
  157. if err != nil {
  158. return imdbInfo, err
  159. }
  160. nfoFilePath := ""
  161. for _, fi := range dir {
  162. if fi.IsDir() == true {
  163. continue
  164. }
  165. upperName := strings.ToUpper(fi.Name())
  166. if upperName == strings.ToUpper(MetadateTVNfo) {
  167. // 连续剧的 nfo 文件
  168. nfoFilePath = path.Join(seriesDir, fi.Name())
  169. break
  170. } else {
  171. // 找 *.nfo
  172. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  173. if ok {
  174. nfoFilePath = path.Join(seriesDir, fi.Name())
  175. }
  176. }
  177. }
  178. // 根据找到的开始解析
  179. if nfoFilePath == "" {
  180. return imdbInfo, common.NoMetadataFile
  181. }
  182. imdbInfo, err = getImdbAndYearNfo(nfoFilePath, "tvshow")
  183. if err != nil {
  184. return common.VideoIMDBInfo{}, err
  185. }
  186. return imdbInfo, nil
  187. }
  188. func GetImdbInfo4OneSeriesEpisode(oneEpFPath string) (common.VideoIMDBInfo, error) {
  189. // 从这一集的视频文件全路径去推算对应的 nfo 文件是否存在
  190. EPdir := filepath.Dir(oneEpFPath)
  191. // 与 EP 文件名一致的 nfo 文件名称
  192. EpNfoFileName := filepath.Base(oneEpFPath)
  193. EpNfoFileName = strings.ReplaceAll(EpNfoFileName, filepath.Ext(oneEpFPath), suffixNameNfo)
  194. // 全路径
  195. EpNfoFPath := path.Join(EPdir, EpNfoFileName)
  196. //
  197. imdbInfo := common.VideoIMDBInfo{}
  198. doc := etree.NewDocument()
  199. // 这里会遇到一个梗,下面的关键词,可能是小写、大写、首字母大写
  200. // 读取文件转换为全部的小写,然后在解析 xml ? etree 在转换为小写后,某些类型的文件的内容会崩溃···
  201. // 所以这里很傻的方式解决
  202. err := doc.ReadFromFile(EpNfoFPath)
  203. if err != nil {
  204. return imdbInfo, err
  205. }
  206. for _, t := range doc.FindElements("./episodedetails/aired") {
  207. imdbInfo.ReleaseDate = t.Text()
  208. break
  209. }
  210. for _, t := range doc.FindElements("./episodedetails/premiered") {
  211. imdbInfo.ReleaseDate = t.Text()
  212. break
  213. }
  214. if imdbInfo.ReleaseDate != "" {
  215. return imdbInfo, nil
  216. }
  217. return imdbInfo, common.CanNotFindEpAiredTime
  218. }
  219. // GetVideoInfoFromFileName 从文件名推断文件信息
  220. func GetVideoInfoFromFileName(fileName string) (*PTN.TorrentInfo, error) {
  221. parse, err := PTN.Parse(fileName)
  222. if err != nil {
  223. return nil, err
  224. }
  225. compile, err := regexp.Compile(regFixTitle2)
  226. if err != nil {
  227. return nil, err
  228. }
  229. match := compile.ReplaceAllString(parse.Title, "")
  230. match = strings.TrimRight(match, "")
  231. parse.Title = match
  232. return parse, nil
  233. }
  234. //GetVideoInfoFromFileFullPath 从全文件路径推断文件信息
  235. func GetVideoInfoFromFileFullPath(videoFileFullPath string) (*PTN.TorrentInfo, time.Time, error) {
  236. parse, err := PTN.Parse(filepath.Base(videoFileFullPath))
  237. if err != nil {
  238. return nil, time.Time{}, err
  239. }
  240. compile, err := regexp.Compile(regFixTitle2)
  241. if err != nil {
  242. return nil, time.Time{}, err
  243. }
  244. match := compile.ReplaceAllString(parse.Title, "")
  245. match = strings.TrimRight(match, "")
  246. parse.Title = match
  247. fInfo, err := os.Stat(videoFileFullPath)
  248. if err != nil {
  249. return nil, time.Time{}, err
  250. }
  251. return parse, fInfo.ModTime(), nil
  252. }
  253. // GetSeasonAndEpisodeFromSubFileName 从文件名推断 季 和 集 的信息 Season Episode
  254. func GetSeasonAndEpisodeFromSubFileName(videoFileName string) (bool, int, int, error) {
  255. upperName := strings.ToUpper(videoFileName)
  256. // 先进行单个 Episode 的匹配
  257. // Killing.Eve.S02E01.Do.You.Know.How
  258. var re = regexp.MustCompile(`(?m)\.S(\d+)E(\d+)\.`)
  259. matched := re.FindAllStringSubmatch(upperName, -1)
  260. if len(matched) < 1 {
  261. // Killing.Eve.S02.Do.You.Know.How
  262. // 看看是不是季度字幕打包
  263. re = regexp.MustCompile(`(?m)\.S(\d+)\.`)
  264. matched = re.FindAllStringSubmatch(upperName, -1)
  265. if len(matched) < 1 {
  266. return false, 0, 0, nil
  267. }
  268. season, err := GetNumber2int(matched[0][1])
  269. if err != nil {
  270. return false,0, 0, err
  271. }
  272. return true, season, 0, nil
  273. } else {
  274. // 一集的字幕
  275. season, err := GetNumber2int(matched[0][1])
  276. if err != nil {
  277. return false,0, 0, err
  278. }
  279. episode, err := GetNumber2int(matched[0][2])
  280. if err != nil {
  281. return false, 0, 0, err
  282. }
  283. return false, season, episode, nil
  284. }
  285. }
  286. func GetNumber2Float(input string) (float32, error) {
  287. compile := regexp.MustCompile(regGetNumber)
  288. params := compile.FindStringSubmatch(input)
  289. if len(params) == 0 {
  290. return 0, errors.New("get number not match")
  291. }
  292. fNum, err := strconv.ParseFloat(params[0],32)
  293. if err != nil {
  294. return 0, errors.New("get number ParseFloat error")
  295. }
  296. return float32(fNum), nil
  297. }
  298. func GetNumber2int(input string) (int, error) {
  299. compile := regexp.MustCompile(regGetNumber)
  300. params := compile.FindStringSubmatch(input)
  301. if len(params) == 0 {
  302. return 0, errors.New("get number not match")
  303. }
  304. fNum, err := strconv.Atoi(params[0])
  305. if err != nil {
  306. return 0, errors.New("get number ParseFloat error")
  307. }
  308. return fNum, nil
  309. }
  const (
  	// MetadataMovieXml is the file name of the movie XML metadata file.
  	MetadataMovieXml = "movie.xml"
  	// File name suffixes of the supported metadata files.
  	suffixNameXml = ".xml"
  	suffixNameNfo = ".nfo"
  	// MetadateTVNfo is the file name of the series-level nfo file.
  	MetadateTVNfo = "tvshow.nfo"
  	// regFixTitle matches every character that is not a CJK ideograph in
  	// U+4E00..U+9FA5, an ASCII letter, a digit or whitespace.
  	regFixTitle = "[^\u4e00-\u9fa5a-zA-Z0-9\\s]"
  	// regFixTitle2 matches the special characters listed explicitly in the
  	// class. The hyphen is escaped on purpose: written as "+-=" it forms the
  	// range U+002B..U+003D, which also matches the digits 0-9. "," and ":"
  	// (also inside that range) are listed explicitly so they are still matched.
  	regFixTitle2 = "[`~!@#$%^&*()+,\\-:=|{}';'\\[\\].<>/?~!@#¥%……&*()——+|{}【】';”“’。、?]"
  	// regGetNumber matches an optionally negative number with an optional
  	// fractional part, e.g. "12", "-3" or "4.5".
  	regGetNumber = "(?:\\-)?\\d{1,}(?:\\.\\d{1,})?"
  )