// test_statistics_subs_score.go (12 KB)
  1. package TestCode
  2. import (
  3. "context"
  4. "fmt"
  5. "os"
  6. "path/filepath"
  7. "sync"
  8. common2 "github.com/ChineseSubFinder/ChineseSubFinder/pkg/types/common"
  9. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/task_control"
  10. "github.com/sirupsen/logrus"
  11. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/ffmpeg_helper"
  12. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/types/subparser"
  13. "github.com/huandu/go-clone"
  14. "github.com/xuri/excelize/v2"
  15. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/log_helper"
  16. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/logic/sub_parser/ass"
  17. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/logic/sub_parser/srt"
  18. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/logic/sub_timeline_fixer"
  19. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/settings"
  20. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/sub_parser_hub"
  21. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/vad"
  22. )
  23. func statistics_subs_score_one(baseAudioFileFPath, baseSubFileFPath, srcSubFileFPath string) {
  24. audioVADInfos, err := vad.GetVADInfoFromAudio(vad.AudioInfo{
  25. FileFullPath: baseAudioFileFPath,
  26. SampleRate: 16000,
  27. BitDepth: 16,
  28. }, true)
  29. if err != nil {
  30. return
  31. }
  32. subParserHub := sub_parser_hub.NewSubParserHub(
  33. log_helper.GetLogger4Tester(),
  34. ass.NewParser(log_helper.GetLogger4Tester()),
  35. srt.NewParser(log_helper.GetLogger4Tester()),
  36. )
  37. bFind, infoBase, err := subParserHub.DetermineFileTypeFromFile(baseSubFileFPath)
  38. if err != nil {
  39. return
  40. }
  41. if bFind == false {
  42. return
  43. }
  44. bFind, srcBase, err := subParserHub.DetermineFileTypeFromFile(srcSubFileFPath)
  45. if err != nil {
  46. return
  47. }
  48. if bFind == false {
  49. return
  50. }
  51. s := sub_timeline_fixer.NewSubTimelineFixerHelperEx(log_helper.GetLogger4Tester(), *settings.NewTimelineFixerSettings())
  52. // path X:\电影\21座桥 (2019)\21座桥 (2019) 720p AAC.chinese(简,subhd).ass
  53. // 音频处理
  54. cloneSrcBase := clone.Clone(srcBase).(*subparser.FileInfo)
  55. bok, _, pipeResultAudio, err := s.ProcessByAudioVAD(audioVADInfos, cloneSrcBase)
  56. if err != nil {
  57. return
  58. }
  59. if bok == false {
  60. return
  61. }
  62. // 字幕处理
  63. cloneSrcBase = clone.Clone(srcBase).(*subparser.FileInfo)
  64. bok, _, pipeResultSub, err := s.ProcessBySubFileInfo(infoBase, cloneSrcBase)
  65. if err != nil {
  66. return
  67. }
  68. if bok == false {
  69. return
  70. }
  71. println(fmt.Sprintf("Audio Score: %f Offset:%f\n", pipeResultAudio.Score, pipeResultAudio.GetOffsetTime()))
  72. println(fmt.Sprintf("Sub Score: %f Offset:%f\n", pipeResultSub.Score, pipeResultSub.GetOffsetTime()))
  73. }
  74. func statistics_subs_score(baseAudioFileFPath, baseSubFileFPath, subSearchRootPath string) {
  75. f := excelize.NewFile()
  76. // Create a new sheet.
  77. sheetName := filepath.Base(subSearchRootPath)
  78. newSheet := f.NewSheet(sheetName)
  79. err := f.SetCellValue(sheetName, fmt.Sprintf("A%d", 1), "SubFPath")
  80. if err != nil {
  81. return
  82. }
  83. err = f.SetCellValue(sheetName, fmt.Sprintf("B%d", 1), "AudioScore")
  84. if err != nil {
  85. return
  86. }
  87. err = f.SetCellValue(sheetName, fmt.Sprintf("C%d", 1), "AudioOffset")
  88. if err != nil {
  89. return
  90. }
  91. err = f.SetCellValue(sheetName, fmt.Sprintf("D%d", 1), "SubScore")
  92. if err != nil {
  93. return
  94. }
  95. err = f.SetCellValue(sheetName, fmt.Sprintf("E%d", 1), "SubOffset")
  96. if err != nil {
  97. return
  98. }
  99. audioVADInfos, err := vad.GetVADInfoFromAudio(vad.AudioInfo{
  100. FileFullPath: baseAudioFileFPath,
  101. SampleRate: 16000,
  102. BitDepth: 16,
  103. }, true)
  104. if err != nil {
  105. return
  106. }
  107. subParserHub := sub_parser_hub.NewSubParserHub(
  108. log_helper.GetLogger4Tester(),
  109. ass.NewParser(log_helper.GetLogger4Tester()),
  110. srt.NewParser(log_helper.GetLogger4Tester()),
  111. )
  112. bFind, infoBase, err := subParserHub.DetermineFileTypeFromFile(baseSubFileFPath)
  113. if err != nil {
  114. return
  115. }
  116. if bFind == false {
  117. return
  118. }
  119. subCounter := 1
  120. err = filepath.Walk(subSearchRootPath,
  121. func(path string, info os.FileInfo, err error) error {
  122. if err != nil {
  123. return err
  124. }
  125. if info.IsDir() == true {
  126. return nil
  127. }
  128. if sub_parser_hub.IsSubExtWanted(info.Name()) == false {
  129. return nil
  130. }
  131. bFind, srcBase, err := subParserHub.DetermineFileTypeFromFile(path)
  132. if err != nil {
  133. return nil
  134. }
  135. if bFind == false {
  136. return nil
  137. }
  138. s := sub_timeline_fixer.NewSubTimelineFixerHelperEx(log_helper.GetLogger4Tester(), *settings.NewTimelineFixerSettings())
  139. // path X:\电影\21座桥 (2019)\21座桥 (2019) 720p AAC.chinese(简,subhd).ass
  140. // 音频处理
  141. cloneSrcBase := clone.Clone(srcBase).(*subparser.FileInfo)
  142. bok, _, pipeResultAudio, err := s.ProcessByAudioVAD(audioVADInfos, cloneSrcBase)
  143. if err != nil {
  144. return nil
  145. }
  146. if bok == false {
  147. return nil
  148. }
  149. // 字幕处理
  150. cloneSrcBase = clone.Clone(srcBase).(*subparser.FileInfo)
  151. bok, _, pipeResultSub, err := s.ProcessBySubFileInfo(infoBase, cloneSrcBase)
  152. if err != nil {
  153. return nil
  154. }
  155. if bok == false {
  156. return nil
  157. }
  158. subCounter++
  159. err = f.SetCellValue(sheetName, fmt.Sprintf("A%d", subCounter+1), info.Name())
  160. if err != nil {
  161. return nil
  162. }
  163. err = f.SetCellValue(sheetName, fmt.Sprintf("B%d", subCounter+1), pipeResultAudio.Score)
  164. if err != nil {
  165. return nil
  166. }
  167. err = f.SetCellValue(sheetName, fmt.Sprintf("C%d", subCounter+1), pipeResultAudio.GetOffsetTime())
  168. if err != nil {
  169. return nil
  170. }
  171. err = f.SetCellValue(sheetName, fmt.Sprintf("D%d", subCounter+1), pipeResultSub.Score)
  172. if err != nil {
  173. return nil
  174. }
  175. err = f.SetCellValue(sheetName, fmt.Sprintf("E%d", subCounter+1), pipeResultSub.GetOffsetTime())
  176. if err != nil {
  177. return nil
  178. }
  179. fmt.Println(subCounter, path, info.Size())
  180. return nil
  181. })
  182. if err != nil {
  183. fmt.Println("Walk", err)
  184. return
  185. }
  186. f.SetActiveSheet(newSheet)
  187. err = f.SaveAs(fmt.Sprintf("%s.xlsx", filepath.Dir(baseSubFileFPath)))
  188. if err != nil {
  189. fmt.Println("SaveAs", err)
  190. return
  191. }
  192. }
  193. func statistics_subs_score_is_match(
  194. logger *logrus.Logger,
  195. s *sub_timeline_fixer.SubTimelineFixerHelperEx,
  196. ffmpegInfo *ffmpeg_helper.FFMPEGInfo,
  197. audioVADInfos []vad.VADInfo, infoBase *subparser.FileInfo,
  198. subSearchRootPath, excelFileName string) {
  199. var err error
  200. f := excelize.NewFile()
  201. // Create a new sheet.
  202. sheetName := filepath.Base(subSearchRootPath)
  203. newSheet := f.NewSheet(sheetName)
  204. err = f.SetCellValue(sheetName, fmt.Sprintf("A%d", 1), "SubFPath")
  205. if err != nil {
  206. logger.Errorln("SetCellValue A Header", err)
  207. return
  208. }
  209. err = f.SetCellValue(sheetName, fmt.Sprintf("B%d", 1), "AudioScore")
  210. if err != nil {
  211. logger.Errorln("SetCellValue B Header", err)
  212. return
  213. }
  214. err = f.SetCellValue(sheetName, fmt.Sprintf("C%d", 1), "AudioOffset")
  215. if err != nil {
  216. logger.Errorln("SetCellValue C Header", err)
  217. return
  218. }
  219. err = f.SetCellValue(sheetName, fmt.Sprintf("D%d", 1), "SubScore")
  220. if err != nil {
  221. logger.Errorln("SetCellValue D Header", err)
  222. return
  223. }
  224. err = f.SetCellValue(sheetName, fmt.Sprintf("E%d", 1), "SubOffset")
  225. if err != nil {
  226. logger.Errorln("SetCellValue E Header", err)
  227. return
  228. }
  229. err = f.SetCellValue(sheetName, fmt.Sprintf("F%d", 1), "IsMatch")
  230. if err != nil {
  231. logger.Errorln("SetCellValue F Header", err)
  232. return
  233. }
  234. err = f.SetCellValue(sheetName, fmt.Sprintf("G%d", 1), "VideoDuration")
  235. if err != nil {
  236. logger.Errorln("SetCellValue G Header", err)
  237. return
  238. }
  239. err = f.SetCellValue(sheetName, fmt.Sprintf("H%d", 1), "TargetSubEndTime")
  240. if err != nil {
  241. logger.Errorln("SetCellValue H Header", err)
  242. return
  243. }
  244. // --------------------------------------------------
  245. // 并发控制
  246. var taskControl *task_control.TaskControl
  247. taskControl, err = task_control.NewTaskControl(6, logger)
  248. if err != nil {
  249. logger.Errorln("NewTaskControl", err)
  250. return
  251. }
  252. taskControl.SetCtxProcessFunc("ScanSubPlayedPool", dealOne, common2.ScanPlayedSubTimeOut)
  253. // --------------------------------------------------
  254. subCounter = 1
  255. err = filepath.Walk(subSearchRootPath,
  256. func(path string, info os.FileInfo, err error) error {
  257. if err != nil {
  258. return err
  259. }
  260. if info.IsDir() == true {
  261. return nil
  262. }
  263. if sub_parser_hub.IsSubExtWanted(info.Name()) == false {
  264. return nil
  265. }
  266. // 并发控制
  267. err = taskControl.Invoke(&task_control.TaskData{
  268. Index: 0,
  269. Count: 0,
  270. DataEx: ExcelInputData{
  271. Logger: logger,
  272. F: f,
  273. S: s,
  274. FfmpegInfo: ffmpegInfo,
  275. AudioVADInfos: audioVADInfos,
  276. InfoBase: infoBase,
  277. NowTargetSubFPath: path,
  278. SubFileName: info.Name(),
  279. SheetName: sheetName,
  280. },
  281. })
  282. if err != nil {
  283. logger.Errorln("Invoke", err)
  284. }
  285. return nil
  286. })
  287. if err != nil {
  288. logger.Errorln("Walk", err)
  289. return
  290. }
  291. taskControl.Hold()
  292. f.SetActiveSheet(newSheet)
  293. err = f.SaveAs(fmt.Sprintf("%s.xlsx", excelFileName))
  294. if err != nil {
  295. logger.Errorln("SaveAs", err)
  296. return
  297. }
  298. logger.Infoln("Done")
  299. }
  300. func dealOne(ctx context.Context, inData interface{}) error {
  301. taskData := inData.(*task_control.TaskData)
  302. excelInputData := taskData.DataEx.(ExcelInputData)
  303. bok, matchResult, err := excelInputData.S.IsMatchBySubFile(
  304. excelInputData.FfmpegInfo,
  305. excelInputData.AudioVADInfos,
  306. excelInputData.InfoBase,
  307. excelInputData.NowTargetSubFPath,
  308. sub_timeline_fixer.CompareConfig{
  309. MinScore: 40000,
  310. OffsetRange: 2,
  311. DialoguesDifferencePercentage: 0.25,
  312. })
  313. if err != nil {
  314. return nil
  315. }
  316. if bok == false && matchResult == nil {
  317. return nil
  318. }
  319. counterLock.Lock()
  320. defer counterLock.Unlock()
  321. subCounter++
  322. err = excelInputData.F.SetCellValue(excelInputData.SheetName, fmt.Sprintf("A%d", subCounter+1), excelInputData.SubFileName)
  323. if err != nil {
  324. excelInputData.Logger.Errorln("SetCellValue A", excelInputData.SubFileName, subCounter+1, err)
  325. return nil
  326. }
  327. err = excelInputData.F.SetCellValue(excelInputData.SheetName, fmt.Sprintf("B%d", subCounter+1), matchResult.AudioCompareScore)
  328. if err != nil {
  329. excelInputData.Logger.Errorln("SetCellValue B", excelInputData.SubFileName, subCounter+1, err)
  330. return nil
  331. }
  332. err = excelInputData.F.SetCellValue(excelInputData.SheetName, fmt.Sprintf("C%d", subCounter+1), matchResult.AudioCompareOffsetTime)
  333. if err != nil {
  334. excelInputData.Logger.Errorln("SetCellValue C", excelInputData.SubFileName, subCounter+1, err)
  335. return nil
  336. }
  337. err = excelInputData.F.SetCellValue(excelInputData.SheetName, fmt.Sprintf("D%d", subCounter+1), matchResult.SubCompareScore)
  338. if err != nil {
  339. excelInputData.Logger.Errorln("SetCellValue D", excelInputData.SubFileName, subCounter+1, err)
  340. return nil
  341. }
  342. err = excelInputData.F.SetCellValue(excelInputData.SheetName, fmt.Sprintf("E%d", subCounter+1), matchResult.SubCompareOffsetTime)
  343. if err != nil {
  344. excelInputData.Logger.Errorln("SetCellValue E", excelInputData.SubFileName, subCounter+1, err)
  345. return nil
  346. }
  347. iTrue := 0
  348. if bok == true {
  349. iTrue = 1
  350. }
  351. err = excelInputData.F.SetCellValue(excelInputData.SheetName, fmt.Sprintf("F%d", subCounter+1), iTrue)
  352. if err != nil {
  353. excelInputData.Logger.Errorln("SetCellValue F", excelInputData.SubFileName, subCounter+1, err)
  354. return nil
  355. }
  356. err = excelInputData.F.SetCellValue(excelInputData.SheetName, fmt.Sprintf("G%d", subCounter+1), matchResult.VideoDuration)
  357. if err != nil {
  358. excelInputData.Logger.Errorln("SetCellValue G", excelInputData.SubFileName, subCounter+1, err)
  359. return nil
  360. }
  361. err = excelInputData.F.SetCellValue(excelInputData.SheetName, fmt.Sprintf("H%d", subCounter+1), matchResult.TargetSubEndTime)
  362. if err != nil {
  363. excelInputData.Logger.Errorln("SetCellValue H", excelInputData.SubFileName, subCounter+1, err)
  364. return nil
  365. }
  366. excelInputData.Logger.Infoln(subCounter, excelInputData.NowTargetSubFPath)
  367. return nil
  368. }
  369. var counterLock sync.Mutex
  370. var subCounter int
  371. type ExcelInputData struct {
  372. Logger *logrus.Logger
  373. F *excelize.File
  374. S *sub_timeline_fixer.SubTimelineFixerHelperEx
  375. FfmpegInfo *ffmpeg_helper.FFMPEGInfo
  376. AudioVADInfos []vad.VADInfo
  377. InfoBase *subparser.FileInfo
  378. NowTargetSubFPath string
  379. SubFileName string
  380. SheetName string
  381. }
  382. type ExcelMathResult struct {
  383. Index int
  384. Name string
  385. MatchResult *sub_timeline_fixer.MatchResult
  386. }