decode.go 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342
  1. package model
  2. import (
  3. "errors"
  4. "github.com/allanpk716/ChineseSubFinder/common"
  5. "github.com/beevik/etree"
  6. PTN "github.com/middelink/go-parse-torrent-name"
  7. "io/ioutil"
  8. "os"
  9. "path"
  10. "path/filepath"
  11. "regexp"
  12. "strconv"
  13. "strings"
  14. "time"
  15. )
  16. func getImdbAndYearMovieXml(movieFilePath string) (common.VideoIMDBInfo, error) {
  17. videoInfo := common.VideoIMDBInfo{}
  18. doc := etree.NewDocument()
  19. if err := doc.ReadFromFile(movieFilePath); err != nil {
  20. return videoInfo, err
  21. }
  22. for _, t := range doc.FindElements("//IMDB") {
  23. videoInfo.ImdbId = t.Text()
  24. break
  25. }
  26. for _, t := range doc.FindElements("//ProductionYear") {
  27. videoInfo.Year = t.Text()
  28. break
  29. }
  30. if videoInfo.ImdbId != "" {
  31. return videoInfo, nil
  32. }
  33. return videoInfo, common.CanNotFindIMDBID
  34. }
  35. func getImdbAndYearNfo(nfoFilePath string) (common.VideoIMDBInfo, error) {
  36. imdbInfo := common.VideoIMDBInfo{}
  37. doc := etree.NewDocument()
  38. // 这里会遇到一个梗,下面的关键词,可能是小写、大写、首字母大写
  39. // 读取文件转换为全部的小写,然后在解析 xml ? etree 在转换为小写后,某些类型的文件的内容会崩溃···
  40. // 所以这里很傻的方式解决
  41. err := doc.ReadFromFile(nfoFilePath)
  42. if err != nil {
  43. return imdbInfo, err
  44. }
  45. for _, t := range doc.FindElements("//uniqueid[@type='imdb']") {
  46. imdbInfo.ImdbId = t.Text()
  47. break
  48. }
  49. for _, t := range doc.FindElements("//uniqueid[@type='Imdb']") {
  50. imdbInfo.ImdbId = t.Text()
  51. break
  52. }
  53. for _, t := range doc.FindElements("//uniqueid[@type='IMDB']") {
  54. imdbInfo.ImdbId = t.Text()
  55. break
  56. }
  57. for _, t := range doc.FindElements("./movie/year") {
  58. imdbInfo.Year = t.Text()
  59. break
  60. }
  61. for _, t := range doc.FindElements("./movie/releasedate") {
  62. imdbInfo.ReleaseDate = t.Text()
  63. break
  64. }
  65. for _, t := range doc.FindElements("./movie/premiered") {
  66. imdbInfo.ReleaseDate = t.Text()
  67. break
  68. }
  69. if imdbInfo.ImdbId != "" {
  70. return imdbInfo, nil
  71. }
  72. return imdbInfo, common.CanNotFindIMDBID
  73. }
  74. func GetImdbInfo4Movie(movieFileFullPath string) (common.VideoIMDBInfo, error) {
  75. imdbInfo := common.VideoIMDBInfo{}
  76. // movie 当前的目录
  77. dirPth := filepath.Dir(movieFileFullPath)
  78. // 与 movie 文件名一致的 nfo 文件名称
  79. movieNfoFileName := filepath.Base(movieFileFullPath)
  80. movieNfoFileName = strings.ReplaceAll(movieNfoFileName, filepath.Ext(movieFileFullPath), "")
  81. // movie.xml
  82. movieXmlFPath := ""
  83. // movieName.nfo 文件
  84. movieNameNfoFPath := ""
  85. // 通用的 *.nfo
  86. nfoFilePath := ""
  87. dir, err := ioutil.ReadDir(dirPth)
  88. if err != nil {
  89. return imdbInfo, err
  90. }
  91. for _, fi := range dir {
  92. if fi.IsDir() == true {
  93. continue
  94. }
  95. upperName := strings.ToLower(fi.Name())
  96. if upperName == MetadataMovieXml {
  97. // 找 movie.xml
  98. movieXmlFPath = path.Join(dirPth, fi.Name())
  99. break
  100. } else if upperName == movieNfoFileName {
  101. // movieName.nfo 文件
  102. movieNameNfoFPath = path.Join(dirPth, fi.Name())
  103. break
  104. } else {
  105. // 找 *.nfo,很可能是 movie.nfo
  106. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  107. if ok {
  108. nfoFilePath = path.Join(dirPth, fi.Name())
  109. }
  110. }
  111. }
  112. // 根据找到的开始解析
  113. if movieNameNfoFPath == "" && movieXmlFPath == "" && nfoFilePath == "" {
  114. return imdbInfo, common.NoMetadataFile
  115. }
  116. // 优先分析 movieName.nfo 文件
  117. if movieNameNfoFPath != "" {
  118. imdbInfo, err = getImdbAndYearNfo(movieNameNfoFPath)
  119. if err != nil {
  120. return common.VideoIMDBInfo{}, err
  121. }
  122. return imdbInfo, nil
  123. }
  124. if movieXmlFPath != "" {
  125. imdbInfo, err = getImdbAndYearMovieXml(movieXmlFPath)
  126. if err != nil {
  127. GetLogger().Errorln("getImdbAndYearMovieXml error, move on:", err)
  128. } else {
  129. return imdbInfo, nil
  130. }
  131. }
  132. if nfoFilePath != "" {
  133. imdbInfo, err = getImdbAndYearNfo(nfoFilePath)
  134. if err != nil {
  135. return imdbInfo, err
  136. } else {
  137. return imdbInfo, nil
  138. }
  139. }
  140. return imdbInfo, common.CanNotFindIMDBID
  141. }
  142. func GetImdbInfo4SeriesDir(seriesDir string) (common.VideoIMDBInfo, error) {
  143. imdbInfo := common.VideoIMDBInfo{}
  144. dir, err := ioutil.ReadDir(seriesDir)
  145. if err != nil {
  146. return imdbInfo, err
  147. }
  148. nfoFilePath := ""
  149. for _, fi := range dir {
  150. if fi.IsDir() == true {
  151. continue
  152. }
  153. upperName := strings.ToUpper(fi.Name())
  154. if upperName == strings.ToUpper(MetadateTVNfo) {
  155. // 连续剧的 nfo 文件
  156. nfoFilePath = path.Join(seriesDir, fi.Name())
  157. break
  158. } else {
  159. // 找 *.nfo
  160. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  161. if ok {
  162. nfoFilePath = path.Join(seriesDir, fi.Name())
  163. }
  164. }
  165. }
  166. // 根据找到的开始解析
  167. if nfoFilePath == "" {
  168. return imdbInfo, common.NoMetadataFile
  169. }
  170. imdbInfo, err = getImdbAndYearNfo(nfoFilePath)
  171. if err != nil {
  172. return common.VideoIMDBInfo{}, err
  173. }
  174. return imdbInfo, nil
  175. }
  176. // TODO 需要拆分出三个方向,一个是电影,输入电影文件全路径,一个是连续剧,输入的是连续剧的目录,最后一个是连续剧的一集文件的全路径
  177. func GetImdbInfo(dirPth string) (common.VideoIMDBInfo, error) {
  178. imdbInfo := common.VideoIMDBInfo{}
  179. dir, err := ioutil.ReadDir(dirPth)
  180. if err != nil {
  181. return imdbInfo, err
  182. }
  183. pathSep := string(os.PathSeparator)
  184. // 优先找 movie.xml 这个是 raddarr 下载的电影会存下来的,可以在 Metadata 设置 Emby
  185. var movieFilePath = ""
  186. // 这个是使用 tinyMediaManager 削刮器按 Kodi 来存储的
  187. var nfoFilePath = ""
  188. for _, fi := range dir {
  189. if fi.IsDir() == true {
  190. continue
  191. }
  192. upperName := strings.ToUpper(fi.Name())
  193. // 找 movie.xml
  194. if upperName == strings.ToUpper(MetadataMovieXml) {
  195. movieFilePath = dirPth + pathSep + fi.Name()
  196. break
  197. } else if upperName == strings.ToUpper(MetadateTVNfo) {
  198. // 连续剧的 nfo 文件
  199. nfoFilePath = dirPth + pathSep + fi.Name()
  200. break
  201. } else {
  202. // 找 *.nfo
  203. ok := strings.HasSuffix(fi.Name(), suffixNameNfo)
  204. if ok {
  205. nfoFilePath = dirPth + pathSep + fi.Name()
  206. }
  207. }
  208. }
  209. // 根据找到的开始解析
  210. if movieFilePath == "" && nfoFilePath == "" {
  211. return imdbInfo, common.NoMetadataFile
  212. }
  213. if movieFilePath != "" {
  214. imdbInfo, err = getImdbAndYearMovieXml(movieFilePath)
  215. if err != nil {
  216. GetLogger().Errorln("getImdbAndYearMovieXml error, move on:", err)
  217. } else {
  218. return imdbInfo, nil
  219. }
  220. }
  221. if nfoFilePath != "" {
  222. imdbInfo, err = getImdbAndYearNfo(nfoFilePath)
  223. if err != nil {
  224. return imdbInfo, err
  225. } else {
  226. return imdbInfo, nil
  227. }
  228. }
  229. return imdbInfo, common.CanNotFindIMDBID
  230. }
  231. //GetVideoInfoFromFileFullPath 从全文件路径推断文件信息
  232. func GetVideoInfoFromFileFullPath(videoFileFullPath string) (*PTN.TorrentInfo, time.Time, error) {
  233. parse, err := PTN.Parse(filepath.Base(videoFileFullPath))
  234. if err != nil {
  235. return nil, time.Time{}, err
  236. }
  237. compile, err := regexp.Compile(regFixTitle2)
  238. if err != nil {
  239. return nil, time.Time{}, err
  240. }
  241. match := compile.ReplaceAllString(parse.Title, "")
  242. match = strings.TrimRight(match, "")
  243. parse.Title = match
  244. fInfo, err := os.Stat(videoFileFullPath)
  245. if err != nil {
  246. return nil, time.Time{}, err
  247. }
  248. return parse, fInfo.ModTime(), nil
  249. }
  250. // GetSeasonAndEpisodeFromSubFileName 从文件名推断 季 和 集 的信息 Season Episode
  251. func GetSeasonAndEpisodeFromSubFileName(videoFileName string) (bool, int, int, error) {
  252. upperName := strings.ToUpper(videoFileName)
  253. // 先进行单个 Episode 的匹配
  254. // Killing.Eve.S02E01.Do.You.Know.How
  255. var re = regexp.MustCompile(`(?m)\.S(\d+)E(\d+)\.`)
  256. matched := re.FindAllStringSubmatch(upperName, -1)
  257. if len(matched) < 1 {
  258. // Killing.Eve.S02.Do.You.Know.How
  259. // 看看是不是季度字幕打包
  260. re = regexp.MustCompile(`(?m)\.S(\d+)\.`)
  261. matched = re.FindAllStringSubmatch(upperName, -1)
  262. if len(matched) < 1 {
  263. return false, 0, 0, nil
  264. }
  265. season, err := GetNumber2int(matched[0][1])
  266. if err != nil {
  267. return false,0, 0, err
  268. }
  269. return true, season, 0, nil
  270. } else {
  271. // 一集的字幕
  272. season, err := GetNumber2int(matched[0][1])
  273. if err != nil {
  274. return false,0, 0, err
  275. }
  276. episode, err := GetNumber2int(matched[0][2])
  277. if err != nil {
  278. return false, 0, 0, err
  279. }
  280. return false, season, episode, nil
  281. }
  282. }
  283. func GetNumber2Float(input string) (float32, error) {
  284. compile := regexp.MustCompile(regGetNumber)
  285. params := compile.FindStringSubmatch(input)
  286. if len(params) == 0 {
  287. return 0, errors.New("get number not match")
  288. }
  289. fNum, err := strconv.ParseFloat(params[0],32)
  290. if err != nil {
  291. return 0, errors.New("get number ParseFloat error")
  292. }
  293. return float32(fNum), nil
  294. }
  295. func GetNumber2int(input string) (int, error) {
  296. compile := regexp.MustCompile(regGetNumber)
  297. params := compile.FindStringSubmatch(input)
  298. if len(params) == 0 {
  299. return 0, errors.New("get number not match")
  300. }
  301. fNum, err := strconv.Atoi(params[0])
  302. if err != nil {
  303. return 0, errors.New("get number ParseFloat error")
  304. }
  305. return fNum, nil
  306. }
  307. const (
  308. MetadataMovieXml = "movie.xml"
  309. suffixNameXml = ".xml"
  310. suffixNameNfo = ".nfo"
  311. MetadateTVNfo = "tvshow.nfo"
  312. // 去除特殊字符,仅仅之有中文
  313. regFixTitle = "[^\u4e00-\u9fa5a-zA-Z0-9\\s]"
  314. // 去除特殊字符,把特殊字符都写进去
  315. regFixTitle2 = "[`~!@#$%^&*()+-=|{}';'\\[\\].<>/?~!@#¥%……&*()——+|{}【】';”“’。、?]"
  316. // 获取数字
  317. regGetNumber = "(?:\\-)?\\d{1,}(?:\\.\\d{1,})?"
  318. )