sub_helper.go 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603
  1. package sub_helper
  2. import (
  3. "errors"
  4. "github.com/allanpk716/ChineseSubFinder/internal/common"
  5. "github.com/allanpk716/ChineseSubFinder/internal/pkg/archive_helper"
  6. "github.com/allanpk716/ChineseSubFinder/internal/pkg/decode"
  7. "github.com/allanpk716/ChineseSubFinder/internal/pkg/language"
  8. "github.com/allanpk716/ChineseSubFinder/internal/pkg/log_helper"
  9. "github.com/allanpk716/ChineseSubFinder/internal/pkg/my_folder"
  10. "github.com/allanpk716/ChineseSubFinder/internal/pkg/my_util"
  11. "github.com/allanpk716/ChineseSubFinder/internal/pkg/regex_things"
  12. "github.com/allanpk716/ChineseSubFinder/internal/pkg/sub_parser_hub"
  13. "github.com/allanpk716/ChineseSubFinder/internal/pkg/vad"
  14. "github.com/allanpk716/ChineseSubFinder/internal/types/subparser"
  15. "github.com/allanpk716/ChineseSubFinder/internal/types/supplier"
  16. "math"
  17. "os"
  18. "path/filepath"
  19. "strconv"
  20. "strings"
  21. "time"
  22. )
  23. // OrganizeDlSubFiles 需要从汇总来是网站字幕中,解压对应的压缩包中的字幕出来
  24. func OrganizeDlSubFiles(tmpFolderName string, subInfos []supplier.SubInfo) (map[string][]string, error) {
  25. // 缓存列表,整理后的字幕列表
  26. // SxEx - []string 字幕的路径
  27. var siteSubInfoDict = make(map[string][]string)
  28. tmpFolderFullPath, err := my_folder.GetTmpFolderByName(tmpFolderName)
  29. if err != nil {
  30. return nil, err
  31. }
  32. // 把后缀名给改好
  33. ChangeVideoExt2SubExt(subInfos)
  34. // 第三方的解压库,首先不支持 io.Reader 的操作,也就是得缓存到本地硬盘再读取解压
  35. // 且使用 walk 会无法解压 rar,得指定具体的实例,太麻烦了,直接用通用的接口得了,就是得都缓存下来再判断
  36. // 基于以上两点,写了一堆啰嗦的逻辑···
  37. for i := range subInfos {
  38. // 先存下来,保存是时候需要前缀,前缀就是从那个网站下载来的
  39. nowFileSaveFullPath := filepath.Join(tmpFolderFullPath, GetFrontNameAndOrgName(&subInfos[i]))
  40. err = my_util.WriteFile(nowFileSaveFullPath, subInfos[i].Data)
  41. if err != nil {
  42. log_helper.GetLogger().Errorln("getFrontNameAndOrgName - WriteFile", subInfos[i].FromWhere, subInfos[i].Name, subInfos[i].TopN, err)
  43. continue
  44. }
  45. nowExt := strings.ToLower(subInfos[i].Ext)
  46. epsKey := my_util.GetEpisodeKeyName(subInfos[i].Season, subInfos[i].Episode)
  47. _, ok := siteSubInfoDict[epsKey]
  48. if ok == false {
  49. // 不存在则实例化
  50. siteSubInfoDict[epsKey] = make([]string, 0)
  51. }
  52. if nowExt != ".zip" && nowExt != ".tar" && nowExt != ".rar" && nowExt != ".7z" {
  53. // 是否是受支持的字幕类型
  54. if sub_parser_hub.IsSubExtWanted(nowExt) == false {
  55. log_helper.GetLogger().Debugln("OrganizeDlSubFiles -> IsSubExtWanted == false", "Name:", subInfos[i].Name, "FileUrl:", subInfos[i].FileUrl)
  56. continue
  57. }
  58. // 加入缓存列表
  59. siteSubInfoDict[epsKey] = append(siteSubInfoDict[epsKey], nowFileSaveFullPath)
  60. } else {
  61. // 那么就是需要解压的文件了
  62. // 解压,给一个单独的文件夹
  63. unzipTmpFolder := filepath.Join(tmpFolderFullPath, subInfos[i].FromWhere)
  64. err = os.MkdirAll(unzipTmpFolder, os.ModePerm)
  65. if err != nil {
  66. return nil, err
  67. }
  68. err = archive_helper.UnArchiveFile(nowFileSaveFullPath, unzipTmpFolder)
  69. // 解压完成后,遍历受支持的字幕列表,加入缓存列表
  70. if err != nil {
  71. log_helper.GetLogger().Errorln("archiver.UnArchive", subInfos[i].FromWhere, subInfos[i].Name, subInfos[i].TopN, err)
  72. continue
  73. }
  74. // 搜索这个目录下的所有符合字幕格式的文件
  75. subFileFullPaths, err := SearchMatchedSubFileByDir(unzipTmpFolder)
  76. if err != nil {
  77. log_helper.GetLogger().Errorln("searchMatchedSubFile", subInfos[i].FromWhere, subInfos[i].Name, subInfos[i].TopN, err)
  78. continue
  79. }
  80. // 这里需要给这些下载到的文件进行改名,加是从那个网站来的前缀,后续好查找
  81. for _, fileFullPath := range subFileFullPaths {
  82. newSubName := AddFrontName(subInfos[i], filepath.Base(fileFullPath))
  83. newSubNameFullPath := filepath.Join(tmpFolderFullPath, newSubName)
  84. // 改名
  85. err = os.Rename(fileFullPath, newSubNameFullPath)
  86. if err != nil {
  87. log_helper.GetLogger().Errorln("os.Rename", subInfos[i].FromWhere, subInfos[i].Name, subInfos[i].TopN, err)
  88. continue
  89. }
  90. // 加入缓存列表
  91. siteSubInfoDict[epsKey] = append(siteSubInfoDict[epsKey], newSubNameFullPath)
  92. }
  93. }
  94. }
  95. return siteSubInfoDict, nil
  96. }
  97. // ChangeVideoExt2SubExt 检测 Name,如果是视频的后缀名就改为字幕的后缀名
  98. func ChangeVideoExt2SubExt(subInfos []supplier.SubInfo) {
  99. for x, info := range subInfos {
  100. tmpSubFileName := info.Name
  101. // 如果后缀名是下载字幕目标的后缀名 或者 是压缩包格式的,则跳过
  102. if strings.Contains(tmpSubFileName, info.Ext) == true || archive_helper.IsWantedArchiveExtName(tmpSubFileName) == true {
  103. } else {
  104. subInfos[x].Name = tmpSubFileName + info.Ext
  105. }
  106. }
  107. }
  108. // SelectChineseBestBilingualSubtitle 找到合适的双语中文字幕,简体->繁体,以及 字幕类型的优先级选择
  109. func SelectChineseBestBilingualSubtitle(subs []subparser.FileInfo, subTypePriority int) *subparser.FileInfo {
  110. // 先傻一点实现优先双语的,之前的写法有 bug
  111. for _, info := range subs {
  112. // 找到了中文字幕
  113. if language.HasChineseLang(info.Lang) == true {
  114. // 字幕的优先级 0 - 原样, 1 - srt , 2 - ass/ssa
  115. if subTypePriority == 1 {
  116. // 1 - srt
  117. if strings.ToLower(info.Ext) == common.SubExtSRT {
  118. // 优先双语
  119. if language.IsBilingualSubtitle(info.Lang) == true {
  120. return &info
  121. }
  122. }
  123. } else if subTypePriority == 2 {
  124. // 2 - ass/ssa
  125. if strings.ToLower(info.Ext) == common.SubExtASS || strings.ToLower(info.Ext) == common.SubExtSSA {
  126. // 优先双语
  127. if language.IsBilingualSubtitle(info.Lang) == true {
  128. return &info
  129. }
  130. }
  131. } else {
  132. // 优先双语
  133. if language.IsBilingualSubtitle(info.Lang) == true {
  134. return &info
  135. }
  136. }
  137. }
  138. }
  139. return nil
  140. }
  141. // SelectChineseBestSubtitle 找到合适的中文字幕,简体->繁体,以及 字幕类型的优先级选择
  142. func SelectChineseBestSubtitle(subs []subparser.FileInfo, subTypePriority int) *subparser.FileInfo {
  143. // 先傻一点实现优先双语的,之前的写法有 bug
  144. for _, info := range subs {
  145. // 找到了中文字幕
  146. if language.HasChineseLang(info.Lang) == true {
  147. // 字幕的优先级 0 - 原样, 1 - srt , 2 - ass/ssa
  148. if subTypePriority == 1 {
  149. // 1 - srt
  150. if strings.ToLower(info.Ext) == common.SubExtSRT {
  151. return &info
  152. }
  153. } else if subTypePriority == 2 {
  154. // 2 - ass/ssa
  155. if strings.ToLower(info.Ext) == common.SubExtASS || strings.ToLower(info.Ext) == common.SubExtSSA {
  156. return &info
  157. }
  158. } else {
  159. return &info
  160. }
  161. }
  162. }
  163. return nil
  164. }
  165. // GetFrontNameAndOrgName 返回的名称包含,那个网站下载的,这个网站中排名第几,文件名
  166. func GetFrontNameAndOrgName(info *supplier.SubInfo) string {
  167. infoName := ""
  168. fileName, err := decode.GetVideoInfoFromFileName(info.Name)
  169. if err != nil {
  170. log_helper.GetLogger().Warnln("", err)
  171. infoName = info.Name
  172. } else {
  173. infoName = fileName.Title + "_S" + strconv.Itoa(fileName.Season) + "E" + strconv.Itoa(fileName.Episode) + filepath.Ext(info.Name)
  174. }
  175. info.Name = infoName
  176. return "[" + info.FromWhere + "]_" + strconv.FormatInt(info.TopN, 10) + "_" + infoName
  177. }
  178. // AddFrontName 添加文件的前缀
  179. func AddFrontName(info supplier.SubInfo, orgName string) string {
  180. return "[" + info.FromWhere + "]_" + strconv.FormatInt(info.TopN, 10) + "_" + orgName
  181. }
  182. // SearchMatchedSubFileByDir 搜索符合后缀名的视频文件,排除 Sub_SxE0 这样的文件夹中的文件
  183. func SearchMatchedSubFileByDir(dir string) ([]string, error) {
  184. // 这里有个梗,会出现 __MACOSX 这类文件夹,那么里面会有一样的文件,需要用文件大小排除一下,至少大于 1 kb 吧
  185. var fileFullPathList = make([]string, 0)
  186. pathSep := string(os.PathSeparator)
  187. files, err := os.ReadDir(dir)
  188. if err != nil {
  189. return nil, err
  190. }
  191. for _, curFile := range files {
  192. fullPath := dir + pathSep + curFile.Name()
  193. if my_util.IsDir(fullPath) == true {
  194. // 需要排除 Sub_S1E0、Sub_S2E0 这样的整季的字幕文件夹,这里仅仅是缓存,不会被加载的
  195. matched := regex_things.RegOneSeasonSubFolderNameMatch.FindAllStringSubmatch(curFile.Name(), -1)
  196. if matched != nil && len(matched) > 0 {
  197. continue
  198. }
  199. // 内层的错误就无视了
  200. oneList, _ := SearchMatchedSubFileByDir(fullPath)
  201. if oneList != nil {
  202. fileFullPathList = append(fileFullPathList, oneList...)
  203. }
  204. } else {
  205. // 这里就是文件了
  206. info, err := curFile.Info()
  207. if err != nil {
  208. return nil, err
  209. }
  210. if info.Size() < 1000 {
  211. continue
  212. }
  213. if info.Size() == 4096 && strings.HasPrefix(curFile.Name(), "._") == true {
  214. log_helper.GetLogger().Debugln("SearchMatchedSubFileByDir file.Size() == 4096 && Prefix Name == ._*", fullPath)
  215. continue
  216. }
  217. if sub_parser_hub.IsSubExtWanted(filepath.Ext(curFile.Name())) == true {
  218. fileFullPathList = append(fileFullPathList, fullPath)
  219. }
  220. }
  221. }
  222. return fileFullPathList, nil
  223. }
  224. // SearchMatchedSubFileByOneVideo 搜索这个视频当前目录下匹配的字幕
  225. func SearchMatchedSubFileByOneVideo(oneVideoFullPath string) ([]string, error) {
  226. dir := filepath.Dir(oneVideoFullPath)
  227. fileName := filepath.Base(oneVideoFullPath)
  228. fileName = strings.ToLower(fileName)
  229. fileName = strings.ReplaceAll(fileName, filepath.Ext(fileName), "")
  230. pathSep := string(os.PathSeparator)
  231. files, err := os.ReadDir(dir)
  232. if err != nil {
  233. return nil, err
  234. }
  235. var matchedSubs = make([]string, 0)
  236. for _, curFile := range files {
  237. if curFile.IsDir() {
  238. continue
  239. }
  240. // 这里就是文件了
  241. info, err := curFile.Info()
  242. if err != nil {
  243. return nil, err
  244. }
  245. if info.Size() < 1000 {
  246. continue
  247. }
  248. // 判断的时候用小写的,后续重命名的时候用原有的名称
  249. nowFileName := strings.ToLower(curFile.Name())
  250. // 后缀名得对
  251. if sub_parser_hub.IsSubExtWanted(filepath.Ext(nowFileName)) == false {
  252. continue
  253. }
  254. // 字幕文件名应该包含 视频文件名(无后缀)
  255. if strings.Contains(nowFileName, fileName) == false {
  256. continue
  257. }
  258. oldPath := dir + pathSep + curFile.Name()
  259. matchedSubs = append(matchedSubs, oldPath)
  260. }
  261. return matchedSubs, nil
  262. }
  263. // SearchVideoMatchSubFileAndRemoveExtMark 找到找个视频目录下相匹配的字幕,同时去除这些字幕中 .default 或者 .forced 的标记。注意这两个标记不应该同时出现,否则无法正确去除
  264. func SearchVideoMatchSubFileAndRemoveExtMark(oneVideoFullPath string) error {
  265. dir := filepath.Dir(oneVideoFullPath)
  266. fileName := filepath.Base(oneVideoFullPath)
  267. fileName = strings.ToLower(fileName)
  268. fileName = strings.ReplaceAll(fileName, filepath.Ext(fileName), "")
  269. pathSep := string(os.PathSeparator)
  270. files, err := os.ReadDir(dir)
  271. if err != nil {
  272. return err
  273. }
  274. for _, curFile := range files {
  275. if curFile.IsDir() {
  276. continue
  277. } else {
  278. // 这里就是文件了
  279. info, err := curFile.Info()
  280. if err != nil {
  281. return err
  282. }
  283. if info.Size() < 1000 {
  284. continue
  285. }
  286. // 判断的时候用小写的,后续重命名的时候用原有的名称
  287. nowFileName := strings.ToLower(curFile.Name())
  288. // 后缀名得对
  289. if sub_parser_hub.IsSubExtWanted(filepath.Ext(nowFileName)) == false {
  290. continue
  291. }
  292. // 字幕文件名应该包含 视频文件名(无后缀)
  293. if strings.Contains(nowFileName, fileName) == false {
  294. continue
  295. }
  296. // 得包含 .default. 找个关键词
  297. if strings.Contains(nowFileName, subparser.Sub_Ext_Mark_Default+".") == true {
  298. oldPath := dir + pathSep + curFile.Name()
  299. newPath := dir + pathSep + strings.ReplaceAll(curFile.Name(), subparser.Sub_Ext_Mark_Default+".", ".")
  300. err = os.Rename(oldPath, newPath)
  301. if err != nil {
  302. return err
  303. }
  304. } else if strings.Contains(nowFileName, subparser.Sub_Ext_Mark_Forced+".") == true {
  305. // 得包含 .forced. 找个关键词
  306. oldPath := dir + pathSep + curFile.Name()
  307. newPath := dir + pathSep + strings.ReplaceAll(curFile.Name(), subparser.Sub_Ext_Mark_Forced+".", ".")
  308. err = os.Rename(oldPath, newPath)
  309. if err != nil {
  310. return err
  311. }
  312. } else {
  313. continue
  314. }
  315. }
  316. }
  317. return nil
  318. }
  319. // DeleteOneSeasonSubCacheFolder 删除一个连续剧中的所有一季字幕的缓存文件夹
  320. func DeleteOneSeasonSubCacheFolder(seriesDir string) error {
  321. debugFolderByName, err := my_folder.GetDebugFolderByName([]string{filepath.Base(seriesDir)})
  322. if err != nil {
  323. return err
  324. }
  325. files, err := os.ReadDir(debugFolderByName)
  326. if err != nil {
  327. return err
  328. }
  329. pathSep := string(os.PathSeparator)
  330. for _, curFile := range files {
  331. if curFile.IsDir() == true {
  332. matched := regex_things.RegOneSeasonSubFolderNameMatch.FindAllStringSubmatch(curFile.Name(), -1)
  333. if matched == nil || len(matched) < 1 {
  334. continue
  335. }
  336. fullPath := debugFolderByName + pathSep + curFile.Name()
  337. err = os.RemoveAll(fullPath)
  338. if err != nil {
  339. return err
  340. }
  341. }
  342. }
  343. return nil
  344. }
  345. /*
  346. 只针对英文字幕进行合并分散的 DialoguesFilter
  347. 会遇到这样的字幕,如下0
  348. 2line-The Card Counter (2021) WEBDL-1080p.chinese(inside).ass
  349. 它的对白一句话分了两个 dialogue 去做。这样做后续字幕时间轴校正就会遇到问题,因为只有一半,匹配占比会很低
  350. (每一个 Dialogue 的首字母需要分析,大写和小写的占比是多少,统计一下,正常的,和上述特殊的)
  351. 那么,就需要额外的逻辑去对 DialoguesFilterEx 进行额外的推断
  352. 暂时考虑的方案是,英文对白每一句的开头应该是英文大写字幕,如果是小写字幕,就应该与上语句合并,且每一句的字符长度有大于一定才触发
  353. */
  354. func MergeMultiDialogue4EngSubtitle(inSubParser *subparser.FileInfo) {
  355. merger := NewDialogueMerger()
  356. for _, dialogueEx := range inSubParser.DialoguesFilterEx {
  357. merger.Add(dialogueEx)
  358. }
  359. inSubParser.DialoguesFilterEx = merger.Get()
  360. }
  361. // GetVADInfoFeatureFromSub 跟下面的 GetVADInfoFeatureFromSubNeedOffsetTimeWillInsert 函数功能一致
  362. func GetVADInfoFeatureFromSub(fileInfo *subparser.FileInfo, frontAndEndPer float64, subUnitMaxCount int, insert bool) ([]SubUnit, error) {
  363. return GetVADInfoFeatureFromSubNeedOffsetTimeWillInsert(fileInfo, frontAndEndPer, subUnitMaxCount, 0, insert)
  364. }
  365. /*
  366. GetVADInfoFeatureFromSubNeedOffsetTimeWillInsert 只不过这里可以加一个每一句话固定的偏移时间
  367. 这里的字幕要求是完整的一个字幕
  368. 1. 抽取字幕的时间片段的时候,暂定,前 15% 和后 15% 要避开,前奏、主题曲、结尾曲
  369. 2. 将整个字幕,抽取连续 5 句对话为一个单元,提取时间片段信息
  370. 3. 这里抽取的是特征,也就有额外的逻辑去找这个特征(本程序内会描述为“钥匙”)
  371. */
  372. func GetVADInfoFeatureFromSubNeedOffsetTimeWillInsert(fileInfo *subparser.FileInfo, SkipFrontAndEndPer float64, subUnitMaxCount int, offsetTime float64, insert bool) ([]SubUnit, error) {
  373. if subUnitMaxCount < 0 {
  374. subUnitMaxCount = 0
  375. }
  376. nowDialogue := fileInfo.Dialogues
  377. srcSubUnitList := make([]SubUnit, 0)
  378. srcSubDialogueList := make([]subparser.OneDialogue, 0)
  379. srcOneSubUnit := NewSubUnit()
  380. // 最后一个对话的结束时间
  381. lastDialogueExTimeEnd, err := my_util.ParseTime(nowDialogue[len(nowDialogue)-1].EndTime)
  382. if err != nil {
  383. return nil, err
  384. }
  385. // 相当于总时长
  386. fullDuration := my_util.Time2SecondNumber(lastDialogueExTimeEnd)
  387. // 最低的起始时间,因为可能需要裁剪范围
  388. startRangeTimeMin := fullDuration * SkipFrontAndEndPer
  389. endRangeTimeMax := fullDuration * (1.0 - SkipFrontAndEndPer)
  390. println(startRangeTimeMin)
  391. println(endRangeTimeMax)
  392. for i := 0; i < len(nowDialogue); i++ {
  393. oneDialogueExTimeStart, err := my_util.ParseTime(nowDialogue[i].StartTime)
  394. if err != nil {
  395. return nil, err
  396. }
  397. oneDialogueExTimeEnd, err := my_util.ParseTime(nowDialogue[i].EndTime)
  398. if err != nil {
  399. return nil, err
  400. }
  401. oneStart := my_util.Time2SecondNumber(oneDialogueExTimeStart)
  402. if SkipFrontAndEndPer > 0 {
  403. if fullDuration*SkipFrontAndEndPer > oneStart || fullDuration*(1.0-SkipFrontAndEndPer) < oneStart {
  404. continue
  405. }
  406. }
  407. if nowDialogue[i].Lines == nil || len(nowDialogue[i].Lines) == 0 {
  408. continue
  409. }
  410. // 如果当前的这一句话,为空,或者进过正则表达式剔除特殊字符后为空,则跳过
  411. if my_util.ReplaceSpecString(nowDialogue[i].Lines[0], "") == "" {
  412. continue
  413. }
  414. // 如果当前的这一句话,为空,或者进过正则表达式剔除特殊字符后为空,则跳过
  415. if my_util.ReplaceSpecString(fileInfo.GetDialogueExContent(i), "") == "" {
  416. continue
  417. }
  418. // 低于 5句对白,则添加
  419. if srcOneSubUnit.GetDialogueCount() < subUnitMaxCount {
  420. // 算上偏移
  421. offsetTimeDuration := time.Duration(offsetTime * math.Pow10(9))
  422. oneDialogueExTimeStart = oneDialogueExTimeStart.Add(offsetTimeDuration)
  423. oneDialogueExTimeEnd = oneDialogueExTimeEnd.Add(offsetTimeDuration)
  424. // 如果没有偏移就是 0
  425. if insert == true {
  426. srcOneSubUnit.AddAndInsert(oneDialogueExTimeStart, oneDialogueExTimeEnd)
  427. } else {
  428. srcOneSubUnit.Add(oneDialogueExTimeStart, oneDialogueExTimeEnd)
  429. }
  430. // 这一个单元的 Dialogue 需要合并起来,才能判断是否符合“钥匙”的要求
  431. srcSubDialogueList = append(srcSubDialogueList, nowDialogue[i])
  432. } else {
  433. // 用完清空
  434. srcSubDialogueList = make([]subparser.OneDialogue, 0)
  435. // 将拼凑起来的对话组成一个单元进行存储起来
  436. srcSubUnitList = append(srcSubUnitList, *srcOneSubUnit)
  437. // 然后重置
  438. srcOneSubUnit = NewSubUnit()
  439. }
  440. }
  441. if srcOneSubUnit.GetDialogueCount() > 0 {
  442. srcSubUnitList = append(srcSubUnitList, *srcOneSubUnit)
  443. }
  444. return srcSubUnitList, nil
  445. }
  446. /*
  447. GetVADInfoFeatureFromSubNew 将 Sub 文件转换为 VAD List 信息
  448. */
  449. func GetVADInfoFeatureFromSubNew(fileInfo *subparser.FileInfo, SkipFrontAndEndPer float64) (*SubUnit, error) {
  450. outSubUnits := NewSubUnit()
  451. if len(fileInfo.Dialogues) <= 0 {
  452. return nil, errors.New("GetVADInfoFeatureFromSubNew fileInfo Dialogue Length is 0")
  453. }
  454. /*
  455. 先拼凑出完整的一个 VAD List
  456. 因为 VAD 的窗口是 10ms,那么需要多每一句话按 10 ms 的单位进行取整
  457. 每一句话开始、结束的时间,需要向下取整
  458. */
  459. subStartTimeFloor := my_util.MakeFloor10msMultipleFromFloat(my_util.Time2SecondNumber(fileInfo.GetStartTime()))
  460. subEndTimeFloor := my_util.MakeFloor10msMultipleFromFloat(my_util.Time2SecondNumber(fileInfo.GetEndTime()))
  461. // 如果想要从 0 时间点开始算,那么 subStartTimeFloor 这个值就需要重置到0
  462. subStartTimeFloor = 0
  463. subFullSecondTimeFloor := subEndTimeFloor - subStartTimeFloor
  464. // 根据这个时长就能够得到一个完整的 VAD List,然后再通过每一句对白进行 VAD 值的调整即可,这样就能够保证
  465. // 相同的一个字幕因为使用 ffmpeg 导出 srt 和 ass 后的,可能存在总体时间轴不一致的问题
  466. // 123.450 - > 12345
  467. vadLen := int(subFullSecondTimeFloor*100) + 2
  468. subVADs := make([]vad.VADInfo, vadLen)
  469. subStartTimeFloor10ms := subStartTimeFloor * 100
  470. for i := 0; i < vadLen; i++ {
  471. subVADs[i] = *vad.NewVADInfoBase(false, time.Duration((subStartTimeFloor10ms+float64(i))*math.Pow10(7)))
  472. }
  473. // 计算出需要截取的片段,起始和结束
  474. skipLen := int(float64(vadLen) * SkipFrontAndEndPer)
  475. skipStartIndex := skipLen
  476. skipEndIndex := vadLen - skipLen
  477. // 现在需要从 fileInfo 的每一句对白也就对应一段连续的 VAD active = true 来进行改写,记得向下取整
  478. lastDialogueIndex := 0
  479. for _, dialogue := range fileInfo.Dialogues {
  480. if dialogue.Lines == nil || len(dialogue.Lines) == 0 {
  481. continue
  482. }
  483. // 如果当前的这一句话,为空,或者进过正则表达式剔除特殊字符后为空,则跳过
  484. if my_util.ReplaceSpecString(dialogue.Lines[0], "") == "" {
  485. continue
  486. }
  487. // 字幕的开始时间
  488. oneDialogueStartTime, err := my_util.ParseTime(dialogue.StartTime)
  489. if err != nil {
  490. return nil, err
  491. }
  492. // 字幕的结束时间
  493. oneDialogueEndTime, err := my_util.ParseTime(dialogue.EndTime)
  494. if err != nil {
  495. return nil, err
  496. }
  497. // 字幕的时长,对时间进行向下取整
  498. oneDialogueStartTimeFloor := my_util.MakeCeil10msMultipleFromFloat(my_util.Time2SecondNumber(oneDialogueStartTime))
  499. oneDialogueEndTimeFloor := my_util.MakeFloor10msMultipleFromFloat(my_util.Time2SecondNumber(oneDialogueEndTime))
  500. // 得到一句对白的时长
  501. changeVADStartIndex := int(oneDialogueStartTimeFloor * 100)
  502. changeVADEndIndex := int(oneDialogueEndTimeFloor * 100)
  503. // 不能超过 最后一句话的时常
  504. if changeVADStartIndex > int(subEndTimeFloor*100) {
  505. continue
  506. }
  507. // 也不能比起始的第一句话时间轴更低
  508. if changeVADStartIndex < int(subStartTimeFloor10ms) {
  509. continue
  510. }
  511. // 当前这句话的开始和结束信息
  512. changerStartIndex := changeVADStartIndex - int(subStartTimeFloor10ms)
  513. if changerStartIndex < 0 {
  514. continue
  515. }
  516. changerEndIndex := changeVADEndIndex - int(subStartTimeFloor10ms)
  517. if changerEndIndex < 0 {
  518. continue
  519. }
  520. // 如果上一个对白的最后一个 OffsetIndex 连接着当前这一句的索引的 VAD 信息 active 是 true 就设置为 false
  521. if lastDialogueIndex == changerStartIndex {
  522. for i := 1; i <= 2; i++ {
  523. if lastDialogueIndex-i >= 0 && subVADs[lastDialogueIndex-i].Active == true {
  524. subVADs[lastDialogueIndex-i].Active = false
  525. }
  526. }
  527. }
  528. // 开始根据当前这句话进行 VAD 信息的设置
  529. // 调整之前做好的整体 VAD 的信息,符合 VAD active = true
  530. if changerEndIndex >= vadLen {
  531. changerEndIndex = vadLen - 1
  532. }
  533. for i := changerStartIndex; i <= changerEndIndex; i++ {
  534. subVADs[i].Active = true
  535. }
  536. lastDialogueIndex = changerEndIndex
  537. }
  538. // 截取出来当前这一段
  539. tmpVADList := subVADs[skipStartIndex:skipEndIndex]
  540. outSubUnits.VADList = tmpVADList
  541. tmpStartTime := time.Time{}
  542. tmpStartTime = tmpStartTime.Add(tmpVADList[0].Time)
  543. tmpEndTime := time.Time{}
  544. tmpEndTime = tmpEndTime.Add(tmpVADList[len(tmpVADList)-1].Time)
  545. outSubUnits.SetBaseTime(tmpStartTime)
  546. outSubUnits.SetOffsetStartTime(tmpStartTime)
  547. outSubUnits.SetOffsetEndTime(tmpEndTime)
  548. return outSubUnits, nil
  549. }