ffmpeg_helper.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403
  1. package ffmpeg_helper
  2. import (
  3. "bytes"
  4. "errors"
  5. "fmt"
  6. "github.com/allanpk716/ChineseSubFinder/internal/common"
  7. "github.com/allanpk716/ChineseSubFinder/internal/logic/sub_parser/ass"
  8. "github.com/allanpk716/ChineseSubFinder/internal/logic/sub_parser/srt"
  9. "github.com/allanpk716/ChineseSubFinder/internal/pkg/language"
  10. "github.com/allanpk716/ChineseSubFinder/internal/pkg/log_helper"
  11. "github.com/allanpk716/ChineseSubFinder/internal/pkg/my_util"
  12. "github.com/allanpk716/ChineseSubFinder/internal/pkg/sub_parser_hub"
  13. "github.com/tidwall/gjson"
  14. "os"
  15. "os/exec"
  16. "path/filepath"
  17. "strings"
  18. )
  19. type FFMPEGHelper struct {
  20. subParserHub *sub_parser_hub.SubParserHub // 字幕内容的解析器
  21. }
  22. func NewFFMPEGHelper() *FFMPEGHelper {
  23. return &FFMPEGHelper{
  24. subParserHub: sub_parser_hub.NewSubParserHub(ass.NewParser(), srt.NewParser()),
  25. }
  26. }
  27. // GetFFMPEGInfo 获取 视频的 FFMPEG 信息,包含音频和字幕
  28. // 优先会导出 中、英、日、韩 类型的,字幕如果没有语言类型,则也导出,然后需要额外的字幕语言的判断去辅助标记(读取文件内容)
  29. func (f *FFMPEGHelper) GetFFMPEGInfo(videoFileFullPath string) (bool, *FFMPEGInfo, error) {
  30. const args = "-v error -show_format -show_streams -print_format json"
  31. cmdArgs := strings.Fields(args)
  32. cmdArgs = append(cmdArgs, videoFileFullPath)
  33. cmd := exec.Command("ffprobe", cmdArgs...)
  34. buf := bytes.NewBufferString("")
  35. //指定输出位置
  36. cmd.Stderr = buf
  37. cmd.Stdout = buf
  38. err := cmd.Start()
  39. if err != nil {
  40. return false, nil, err
  41. }
  42. err = cmd.Wait()
  43. if err != nil {
  44. return false, nil, err
  45. }
  46. // 解析得到的字符串反馈
  47. bok, ffMPEGInfo := f.parseJsonString2GetFFProbeInfo(videoFileFullPath, buf.String())
  48. if bok == false {
  49. return false, nil, nil
  50. }
  51. // 在函数调用完毕后,判断是否需要清理
  52. defer func() {
  53. if bok == false && ffMPEGInfo != nil {
  54. err := os.RemoveAll(ffMPEGInfo.GetCacheFolderFPath())
  55. if err != nil {
  56. log_helper.GetLogger().Errorln("GetFFMPEGInfo - RemoveAll", err.Error())
  57. return
  58. }
  59. }
  60. }()
  61. // 判断这个视频是否已经导出过内置的字幕和音频文件了
  62. if ffMPEGInfo.IsExported() == false {
  63. // 说明缓存不存在,需要导出,这里需要注意,如果导出失败了,这个文件夹要清理掉
  64. if my_util.IsDir(ffMPEGInfo.GetCacheFolderFPath()) == true {
  65. // 如果存在则,先清空一个这个文件夹
  66. err = my_util.ClearFolder(ffMPEGInfo.GetCacheFolderFPath())
  67. if err != nil {
  68. bok = false
  69. return bok, nil, err
  70. }
  71. } else {
  72. // 如果不存在则,创建文件夹
  73. err = os.MkdirAll(ffMPEGInfo.GetCacheFolderFPath(), os.ModePerm)
  74. if err != nil {
  75. bok = false
  76. return bok, nil, err
  77. }
  78. }
  79. // 开始导出
  80. // 构建导出的命令参数
  81. subArgs, audioArgs := f.getAudioAndSubExportArgs(videoFileFullPath, ffMPEGInfo)
  82. // 执行导出
  83. execErrorString, err := f.exportAudioAndSubtitles(subArgs, audioArgs)
  84. if err != nil {
  85. log_helper.GetLogger().Errorln("exportAudioAndSubtitles", execErrorString)
  86. bok = false
  87. return bok, nil, err
  88. }
  89. }
  90. // 查找当前这个视频外置字幕列表
  91. err = ffMPEGInfo.GetExternalSubInfos(f.subParserHub)
  92. if err != nil {
  93. return false, nil, err
  94. }
  95. return bok, ffMPEGInfo, nil
  96. }
  97. func (f *FFMPEGHelper) GetAudioInfo(audioFileFullPath string) (bool, float64, error) {
  98. const args = "-v error -show_format -show_streams -print_format json -f s16le -ac 1 -ar 16000"
  99. cmdArgs := strings.Fields(args)
  100. cmdArgs = append(cmdArgs, audioFileFullPath)
  101. cmd := exec.Command("ffprobe", cmdArgs...)
  102. buf := bytes.NewBufferString("")
  103. //指定输出位置
  104. cmd.Stderr = buf
  105. cmd.Stdout = buf
  106. err := cmd.Start()
  107. if err != nil {
  108. return false, 0, err
  109. }
  110. err = cmd.Wait()
  111. if err != nil {
  112. return false, 0, err
  113. }
  114. bok, duration := f.parseJsonString2GetAudioInfo(buf.String())
  115. if bok == false {
  116. return false, 0, errors.New("ffprobe get " + audioFileFullPath + " duration error")
  117. }
  118. return true, duration, nil
  119. }
  120. // ExportAudioArgsByTimeRange 根据输入的时间轴导出音频分段信息 "0:1:27" "28.2"
  121. func (f *FFMPEGHelper) ExportAudioArgsByTimeRange(audioFullPath string, startTimeString, timeLength string) (string, string, error) {
  122. outStartTimeString := strings.ReplaceAll(startTimeString, ":", "-")
  123. outStartTimeString = strings.ReplaceAll(outStartTimeString, ".", "#")
  124. outTimeLength := strings.ReplaceAll(timeLength, ".", "#")
  125. frontName := strings.ReplaceAll(filepath.Base(audioFullPath), filepath.Ext(audioFullPath), "")
  126. outAudioName := frontName + "_" + outStartTimeString + "_" + outTimeLength + filepath.Ext(audioFullPath)
  127. var outAudioFullPath = filepath.Join(filepath.Dir(audioFullPath), outAudioName)
  128. if my_util.IsFile(outAudioFullPath) == true {
  129. err := os.Remove(outAudioFullPath)
  130. if err != nil {
  131. return "", "", err
  132. }
  133. }
  134. args := f.getAudioExportArgsByTimeRange(audioFullPath, startTimeString, timeLength, outAudioFullPath)
  135. execFFMPEG, err := f.execFFMPEG(args)
  136. if err != nil {
  137. return "", execFFMPEG, err
  138. }
  139. return outAudioFullPath, "", nil
  140. }
  141. // parseJsonString2GetFFProbeInfo 使用 ffprobe 获取视频的 stream 信息,从中解析出字幕和音频的索引
  142. func (f *FFMPEGHelper) parseJsonString2GetFFProbeInfo(videoFileFullPath, inputFFProbeString string) (bool, *FFMPEGInfo) {
  143. streamsValue := gjson.Get(inputFFProbeString, "streams.#")
  144. if streamsValue.Exists() == false {
  145. return false, nil
  146. }
  147. ffmpegInfo := NewFFMPEGInfo(videoFileFullPath)
  148. for i := 0; i < int(streamsValue.Num); i++ {
  149. oneIndex := gjson.Get(inputFFProbeString, fmt.Sprintf("streams.%d.index", i))
  150. oneCodecName := gjson.Get(inputFFProbeString, fmt.Sprintf("streams.%d.codec_name", i))
  151. oneCodecType := gjson.Get(inputFFProbeString, fmt.Sprintf("streams.%d.codec_type", i))
  152. oneTimeBase := gjson.Get(inputFFProbeString, fmt.Sprintf("streams.%d.time_base", i))
  153. oneStartTime := gjson.Get(inputFFProbeString, fmt.Sprintf("streams.%d.start_time", i))
  154. oneLanguage := gjson.Get(inputFFProbeString, fmt.Sprintf("streams.%d.tags.language", i))
  155. // 任意一个字段不存在则跳过
  156. if oneIndex.Exists() == false {
  157. continue
  158. }
  159. if oneCodecName.Exists() == false {
  160. continue
  161. }
  162. if oneCodecType.Exists() == false {
  163. continue
  164. }
  165. if oneTimeBase.Exists() == false {
  166. continue
  167. }
  168. if oneStartTime.Exists() == false {
  169. continue
  170. }
  171. // 这里需要区分是字幕还是音频
  172. if oneCodecType.String() == codecTypeSub {
  173. // 字幕
  174. // 这里非必须解析到 language 字段,把所有的都导出来,然后通过额外字幕语言判断即可
  175. oneDurationTS := gjson.Get(inputFFProbeString, fmt.Sprintf("streams.%d.duration_ts", i))
  176. oneDuration := gjson.Get(inputFFProbeString, fmt.Sprintf("streams.%d.duration", i))
  177. // 必须存在的
  178. if oneDurationTS.Exists() == false {
  179. continue
  180. }
  181. if oneDuration.Exists() == false {
  182. continue
  183. }
  184. // 非必须存在的
  185. nowLanguageString := ""
  186. if oneLanguage.Exists() == true {
  187. nowLanguageString = oneLanguage.String()
  188. // 只导出 中、英、日、韩
  189. if language.IsSupportISOString(nowLanguageString) == false {
  190. continue
  191. }
  192. }
  193. subInfo := NewSubtitleInfo(int(oneIndex.Num), oneCodecName.String(), oneCodecType.String(),
  194. oneTimeBase.String(), oneStartTime.String(),
  195. int(oneDurationTS.Num), oneDuration.String(), nowLanguageString)
  196. ffmpegInfo.SubtitleInfoList = append(ffmpegInfo.SubtitleInfoList, *subInfo)
  197. } else if oneCodecType.String() == codecTypeAudio {
  198. // 音频
  199. // 这里必要要能够解析到 language 字段
  200. if oneLanguage.Exists() == false {
  201. continue
  202. }
  203. // 只导出 中、英、日、韩
  204. if language.IsSupportISOString(oneLanguage.String()) == false {
  205. continue
  206. }
  207. audioInfo := NewAudioInfo(int(oneIndex.Num), oneCodecName.String(), oneCodecType.String(),
  208. oneTimeBase.String(), oneStartTime.String(), oneLanguage.String())
  209. ffmpegInfo.AudioInfoList = append(ffmpegInfo.AudioInfoList, *audioInfo)
  210. } else {
  211. continue
  212. }
  213. }
  214. return true, ffmpegInfo
  215. }
  216. // parseJsonString2GetAudioInfo 获取 pcm 音频的长度
  217. func (f *FFMPEGHelper) parseJsonString2GetAudioInfo(inputFFProbeString string) (bool, float64) {
  218. durationValue := gjson.Get(inputFFProbeString, "format.duration")
  219. if durationValue.Exists() == false {
  220. return false, 0
  221. }
  222. return true, durationValue.Float()
  223. }
  224. // exportAudioAndSubtitles 导出音频和字幕文件
  225. func (f *FFMPEGHelper) exportAudioAndSubtitles(subArgs, audioArgs []string) (string, error) {
  226. // 这里导出依赖的是 ffmpeg 这个程序,需要的是构建导出的语句
  227. execErrorString, err := f.execFFMPEG(subArgs)
  228. if err != nil {
  229. return execErrorString, err
  230. }
  231. execErrorString, err = f.execFFMPEG(audioArgs)
  232. if err != nil {
  233. return execErrorString, err
  234. }
  235. return "", nil
  236. }
  237. // execFFMPEG 执行 ffmpeg 命令
  238. func (f *FFMPEGHelper) execFFMPEG(cmds []string) (string, error) {
  239. cmd := exec.Command("ffmpeg", cmds...)
  240. buf := bytes.NewBufferString("")
  241. //指定输出位置
  242. cmd.Stderr = buf
  243. cmd.Stdout = buf
  244. err := cmd.Start()
  245. if err != nil {
  246. return buf.String(), err
  247. }
  248. err = cmd.Wait()
  249. if err != nil {
  250. return buf.String(), err
  251. }
  252. return "", nil
  253. }
  254. // getAudioAndSubExportArgs 构建从原始视频导出字幕、音频的 ffmpeg 的参数
  255. func (f *FFMPEGHelper) getAudioAndSubExportArgs(videoFileFullPath string, ffmpegInfo *FFMPEGInfo) ([]string, []string) {
  256. /*
  257. 导出多个字幕
  258. ffmpeg.exe -i xx.mp4 -vn -an -map 0:7 subs-7.srt -map 0:6 subs-6.srt
  259. 导出音频,从 1m 27s 开始,导出向后的 28 s,转换为 mp3 格式
  260. ffmpeg.exe -i xx.mp4 -vn -map 0:1 -ss 00:1:27 -f mp3 -t 28 audio.mp3
  261. 导出音频,转换为 mp3 格式
  262. ffmpeg.exe -i xx.mp4 -vn -map 0:1 -f mp3 audio.mp3
  263. 导出音频,转换为 16000k 16bit 单通道 采样率的 test.pcm
  264. ffmpeg.exe -i xx.mp4 -vn -map 0:1 -ss 00:1:27 -t 28 -acodec pcm_s16le -f s16le -ac 1 -ar 16000 test.pcm
  265. 截取字幕的时间片段
  266. ffmpeg.exe -i "subs-3.srt" -ss 00:1:27 -t 28 subs-3-cut-from-org.srt
  267. */
  268. var subArgs = make([]string, 0)
  269. var audioArgs = make([]string, 0)
  270. // 基础的输入视频参数
  271. subArgs = append(subArgs, "-i")
  272. audioArgs = append(audioArgs, "-i")
  273. subArgs = append(subArgs, videoFileFullPath)
  274. audioArgs = append(audioArgs, videoFileFullPath)
  275. // 字幕导出的参数构建
  276. subArgs = append(subArgs, "-vn") // 不输出视频流
  277. subArgs = append(subArgs, "-an") // 不输出音频流
  278. for _, subtitleInfo := range ffmpegInfo.SubtitleInfoList {
  279. f.addSubMapArg(&subArgs, subtitleInfo.Index,
  280. filepath.Join(ffmpegInfo.GetCacheFolderFPath(), subtitleInfo.GetName()+common.SubExtSRT))
  281. f.addSubMapArg(&subArgs, subtitleInfo.Index,
  282. filepath.Join(ffmpegInfo.GetCacheFolderFPath(), subtitleInfo.GetName()+common.SubExtASS))
  283. }
  284. // 音频导出的参数构建
  285. audioArgs = append(audioArgs, "-vn")
  286. for _, audioInfo := range ffmpegInfo.AudioInfoList {
  287. f.addAudioMapArg(&audioArgs, audioInfo.Index,
  288. filepath.Join(ffmpegInfo.GetCacheFolderFPath(), audioInfo.GetName()+extPCM))
  289. }
  290. return audioArgs, subArgs
  291. }
  292. // getAudioAndSubExportArgsByTimeRange 导出某个时间范围内的音频和字幕文件文件 startTimeString 00:1:27 timeLeng 向后多少秒
  293. func (f *FFMPEGHelper) getAudioExportArgsByTimeRange(audioFullPath string, startTimeString, timeLeng, outAudioFullPath string) []string {
  294. /*
  295. ffmpeg.exe -ar 16000 -ac 1 -f s16le -i aa.pcm -ss 00:1:27 -t 28 -acodec pcm_s16le -f s16le -ac 1 -ar 16000 bb.pcm
  296. ffmpeg.exe -i aa.srt -ss 00:1:27 -t 28 bb.srt
  297. */
  298. var audioArgs = make([]string, 0)
  299. // 指定读取的音频文件编码格式
  300. audioArgs = append(audioArgs, "-ar")
  301. audioArgs = append(audioArgs, "16000")
  302. audioArgs = append(audioArgs, "-ac")
  303. audioArgs = append(audioArgs, "1")
  304. audioArgs = append(audioArgs, "-f")
  305. audioArgs = append(audioArgs, "s16le")
  306. audioArgs = append(audioArgs, "-i")
  307. audioArgs = append(audioArgs, audioFullPath)
  308. audioArgs = append(audioArgs, "-ss")
  309. audioArgs = append(audioArgs, startTimeString)
  310. audioArgs = append(audioArgs, "-t")
  311. audioArgs = append(audioArgs, timeLeng)
  312. // 指定导出的音频文件编码格式
  313. audioArgs = append(audioArgs, "-acodec")
  314. audioArgs = append(audioArgs, "pcm_s16le")
  315. audioArgs = append(audioArgs, "-f")
  316. audioArgs = append(audioArgs, "s16le")
  317. audioArgs = append(audioArgs, "-ac")
  318. audioArgs = append(audioArgs, "1")
  319. audioArgs = append(audioArgs, "-ar")
  320. audioArgs = append(audioArgs, "16000")
  321. audioArgs = append(audioArgs, outAudioFullPath)
  322. return audioArgs
  323. }
  324. // addSubMapArg 构建字幕的导出参数
  325. func (f *FFMPEGHelper) addSubMapArg(subArgs *[]string, index int, subSaveFullPath string) {
  326. *subArgs = append(*subArgs, "-map")
  327. *subArgs = append(*subArgs, fmt.Sprintf("0:%d", index))
  328. *subArgs = append(*subArgs, subSaveFullPath)
  329. }
  330. // addAudioMapArg 构建音频的导出参数
  331. func (f *FFMPEGHelper) addAudioMapArg(subArgs *[]string, index int, audioSaveFullPath string) {
  332. // -acodec pcm_s16le -f s16le -ac 1 -ar 16000
  333. *subArgs = append(*subArgs, "-map")
  334. *subArgs = append(*subArgs, fmt.Sprintf("0:%d", index))
  335. *subArgs = append(*subArgs, "-acodec")
  336. *subArgs = append(*subArgs, "pcm_s16le")
  337. *subArgs = append(*subArgs, "-f")
  338. *subArgs = append(*subArgs, "s16le")
  339. *subArgs = append(*subArgs, "-ac")
  340. *subArgs = append(*subArgs, "1")
  341. *subArgs = append(*subArgs, "-ar")
  342. *subArgs = append(*subArgs, "16000")
  343. *subArgs = append(*subArgs, audioSaveFullPath)
  344. }
  345. const (
  346. codecTypeSub = "subtitle"
  347. codecTypeAudio = "audio"
  348. extMP3 = ".mp3"
  349. extPCM = ".pcm"
  350. )