fileinfo.go 9.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307
  1. package subparser
  2. import (
  3. "crypto/sha256"
  4. "fmt"
  5. "math"
  6. "sort"
  7. "strings"
  8. "time"
  9. "github.com/ChineseSubFinder/ChineseSubFinder/pkg"
  10. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/types/common"
  11. "github.com/ChineseSubFinder/ChineseSubFinder/pkg/types/language"
  12. )
  13. type FileInfo struct {
  14. PrefixDialogueString string // 在 Dialogue: 这个关键词之前的字符串,ass 中的字体以及其他信息的描述
  15. Content string // 字幕的内容
  16. FromWhereSite string // 从那个网站下载的
  17. Name string // 字幕的名称,注意,这里需要额外的赋值,不会自动检测
  18. Ext string // 字幕的后缀名
  19. Lang language.MyLanguage // 识别出来的语言
  20. FileFullPath string // 字幕文件的全路径
  21. Data []byte // 字幕的二进制文件内容
  22. Dialogues []OneDialogue // 整个字幕文件的所有对话,如果是做时间轴匹配,就使用原始的
  23. DialoguesFilter []OneDialogue // 整个字幕文件的所有对话,过滤掉特殊字符的对白
  24. DialoguesFilterEx []OneDialogueEx // 整个字幕文件的所有对话,过滤掉特殊字符的对白,这里会把一句话中支持的 中、英、韩、日 四国语言给分离出来
  25. CHLines []string // 抽取出所有的中文对话
  26. OtherLines []string // 抽取出所有的第二语言对话,可能是英文、韩文、日文
  27. }
  28. // SaveTranslated 保存字幕文件,注意,这里是用于翻译后的字幕文件
  29. func (f *FileInfo) SaveTranslated(desSubFileFPath string) error {
  30. allString := ""
  31. allString += f.PrefixDialogueString + "\n"
  32. for _, oneDialogue := range f.Dialogues {
  33. if len(oneDialogue.Lines) < 1 {
  34. continue
  35. }
  36. oneDialogueString := "Dialogue: 0," + oneDialogue.StartTime + "," + oneDialogue.EndTime + ",Default,,0,0,0,," + oneDialogue.Lines[0]
  37. allString += oneDialogueString + "\n"
  38. }
  39. return pkg.WriteFile(desSubFileFPath, []byte(allString))
  40. }
  41. // GetSourceTranslateString 获取翻以前的字符串,会移除 \N 这样的信息,替换为空格
  42. func (f *FileInfo) GetSourceTranslateString() string {
  43. sourceString := ""
  44. // 去除每一句中的 \N
  45. for index, oneDialogue := range f.Dialogues {
  46. f.Dialogues[index].Lines[0] = strings.ReplaceAll(oneDialogue.Lines[0], `\N`, " ")
  47. sourceString += f.Dialogues[index].Lines[0] + "\n"
  48. }
  49. return sourceString
  50. }
  51. func (f *FileInfo) SetTranslatedStrings(translatedString string) error {
  52. // 分行
  53. lines := strings.Split(translatedString, "\n")
  54. linesWithOutEmpty := make([]string, 0)
  55. // 移除空行
  56. for _, line := range lines {
  57. if len(line) < 1 {
  58. continue
  59. }
  60. linesWithOutEmpty = append(linesWithOutEmpty, line)
  61. }
  62. // 比较两个数组是否长度一致
  63. if len(f.Dialogues) != len(linesWithOutEmpty) {
  64. return fmt.Errorf("dialogue line not the same,org:%d,translated:%d", len(f.Dialogues), len(linesWithOutEmpty))
  65. }
  66. // 对每一句话进行赋值
  67. for index := range f.Dialogues {
  68. f.Dialogues[index].Lines = []string{linesWithOutEmpty[index]}
  69. }
  70. return nil
  71. }
  72. // SortDialogues 排序对话,时间递减
  73. func (f *FileInfo) SortDialogues() {
  74. sort.Sort(OneDialogueByStartTime(f.Dialogues))
  75. sort.Sort(OneDialogueByStartTime(f.DialoguesFilter))
  76. sort.Sort(OneDialogueByStartTimeEx(f.DialoguesFilterEx))
  77. }
  78. // GetTimeFormat 获取时间轴的格式化格式
  79. func (f FileInfo) GetTimeFormat() string {
  80. if f.Ext == common.SubExtASS || f.Ext == common.SubExtSSA {
  81. return common.TimeFormatPoint2
  82. } else {
  83. return common.TimeFormatPoint3
  84. }
  85. }
  86. // GetDialogueExContent 获取当前字幕文件语言对应索引的对白内容
  87. // 凡是带有 Eng 的返回 Eng,其他的就与对应语言相关
  88. func (f FileInfo) GetDialogueExContent(index int) string {
  89. switch f.Lang {
  90. case language.ChineseSimple, language.ChineseTraditional,
  91. language.ChineseSimpleJapanese, language.ChineseSimpleKorean,
  92. language.ChineseTraditionalJapanese, language.ChineseTraditionalKorean:
  93. // 带有中文的,但是又不是中英的
  94. return f.DialoguesFilterEx[index].ChLine
  95. case language.English, language.ChineseSimpleEnglish, language.ChineseTraditionalEnglish:
  96. return f.DialoguesFilterEx[index].EnLine
  97. case language.Japanese:
  98. return f.DialoguesFilterEx[index].JpLine
  99. case language.Korean:
  100. return f.DialoguesFilterEx[index].KrLine
  101. default:
  102. return f.DialoguesFilterEx[index].EnLine
  103. }
  104. }
  105. // ChangeDialoguesTimeByFramerateRatio 根据帧数比率调整时间轴 对应 ffsubsync -- SubtitleScaler
  106. func (f *FileInfo) ChangeDialoguesTimeByFramerateRatio(framerateRatio float64) error {
  107. timeFormat := f.GetTimeFormat()
  108. f.changeOneDialoguesFramerateRatio(f.Dialogues, framerateRatio, timeFormat)
  109. f.changeOneDialoguesFramerateRatio(f.DialoguesFilter, framerateRatio, timeFormat)
  110. f.changeOneDialogueExsFramerateRatio(f.DialoguesFilterEx, framerateRatio, timeFormat)
  111. return nil
  112. }
  113. func (f *FileInfo) changeOneDialoguesFramerateRatio(oneDialogues []OneDialogue, framerateRatio float64, timeFormat string) {
  114. for i := 0; i < len(oneDialogues); i++ {
  115. timeStart := oneDialogues[i].GetStartTime()
  116. timeEnd := oneDialogues[i].GetEndTime()
  117. timeStartNumber := pkg.Time2SecondNumber(timeStart)
  118. timeEndNumber := pkg.Time2SecondNumber(timeEnd)
  119. scaleTimeStart := pkg.TimeNumber2Time(timeStartNumber * framerateRatio)
  120. scaleTimeEnd := pkg.TimeNumber2Time(timeEndNumber * framerateRatio)
  121. oneDialogues[i].StartTime = pkg.Time2SubTimeString(scaleTimeStart, timeFormat)
  122. oneDialogues[i].EndTime = pkg.Time2SubTimeString(scaleTimeEnd, timeFormat)
  123. }
  124. }
  125. func (f *FileInfo) changeOneDialogueExsFramerateRatio(oneDialogues []OneDialogueEx, framerateRatio float64, timeFormat string) {
  126. for i := 0; i < len(oneDialogues); i++ {
  127. timeStart := oneDialogues[i].GetStartTime()
  128. timeEnd := oneDialogues[i].GetEndTime()
  129. timeStartNumber := pkg.Time2SecondNumber(timeStart)
  130. timeEndNumber := pkg.Time2SecondNumber(timeEnd)
  131. scaleTimeStart := pkg.TimeNumber2Time(timeStartNumber * framerateRatio)
  132. scaleTimeEnd := pkg.TimeNumber2Time(timeEndNumber * framerateRatio)
  133. oneDialogues[i].StartTime = pkg.Time2SubTimeString(scaleTimeStart, timeFormat)
  134. oneDialogues[i].EndTime = pkg.Time2SubTimeString(scaleTimeEnd, timeFormat)
  135. }
  136. }
  137. // GetStartTime 获取的是从 Dialogues 得到的
  138. func (f FileInfo) GetStartTime() time.Time {
  139. startTime := math.MaxFloat64
  140. for i := 0; i < len(f.Dialogues); i++ {
  141. // 找到最小的开始时间
  142. tmpNowStartTimeNumber := pkg.Time2SecondNumber(f.Dialogues[i].GetStartTime())
  143. startTime = math.Min(startTime, tmpNowStartTimeNumber)
  144. }
  145. return pkg.TimeNumber2Time(startTime)
  146. }
  147. // GetEndTime 获取的是从 Dialogues 得到的
  148. func (f FileInfo) GetEndTime() time.Time {
  149. endTime := -math.MaxFloat64
  150. for i := 0; i < len(f.Dialogues); i++ {
  151. // 找到最大的结束时间
  152. tmpNowEndTimeNumber := pkg.Time2SecondNumber(f.Dialogues[i].GetEndTime())
  153. endTime = math.Max(endTime, tmpNowEndTimeNumber)
  154. }
  155. return pkg.TimeNumber2Time(endTime)
  156. }
  157. // GetNumFrames 获取这个字幕的时间 Frame 数量
  158. func (f FileInfo) GetNumFrames() int {
  159. return int(math.Abs((pkg.Time2SecondNumber(f.GetEndTime()) - pkg.Time2SecondNumber(f.GetStartTime())) * 100))
  160. }
  161. func (f FileInfo) GetFileSha256() string {
  162. return fmt.Sprintf("%x", sha256.Sum256(f.Data))
  163. }
  164. // OneDialogue 一句对话
  165. type OneDialogue struct {
  166. Index int // 对白的索引
  167. StartTime string // 开始时间
  168. EndTime string // 结束时间
  169. StyleName string // StyleName
  170. Lines []string // 台词
  171. }
  172. func NewOneDialogue() OneDialogue {
  173. return OneDialogue{
  174. Lines: make([]string, 0),
  175. }
  176. }
  177. func (o OneDialogue) GetStartTime() time.Time {
  178. srcTimeStartNow, err := pkg.ParseTime(o.StartTime)
  179. if err != nil {
  180. return time.Time{}
  181. }
  182. return srcTimeStartNow
  183. }
  184. func (o OneDialogue) GetEndTime() time.Time {
  185. srcTimeEndNow, err := pkg.ParseTime(o.EndTime)
  186. if err != nil {
  187. return time.Time{}
  188. }
  189. return srcTimeEndNow
  190. }
  191. type OneDialogueByStartTime []OneDialogue
  192. func (d OneDialogueByStartTime) Len() int {
  193. return len(d)
  194. }
  195. func (d OneDialogueByStartTime) Swap(i, j int) {
  196. d[i], d[j] = d[j], d[i]
  197. }
  198. func (d OneDialogueByStartTime) Less(i, j int) bool {
  199. subStartTimeI, err := pkg.ParseTime(d[i].StartTime)
  200. if err != nil {
  201. return false
  202. }
  203. subStartTimeJ, err := pkg.ParseTime(d[j].StartTime)
  204. if err != nil {
  205. return false
  206. }
  207. return pkg.Time2SecondNumber(subStartTimeI) < pkg.Time2SecondNumber(subStartTimeJ)
  208. }
  209. // OneDialogueEx 一句对话,这里会把一句话中支持的 中、英、韩、日 四国语言给分离出来
  210. type OneDialogueEx struct {
  211. StartTime string // 开始时间
  212. EndTime string // 结束时间
  213. ChLine string
  214. EnLine string
  215. KrLine string
  216. JpLine string
  217. }
  218. func (o OneDialogueEx) GetStartTime() time.Time {
  219. srcTimeStartNow, err := pkg.ParseTime(o.StartTime)
  220. if err != nil {
  221. return time.Time{}
  222. }
  223. return srcTimeStartNow
  224. }
  225. func (o OneDialogueEx) GetEndTime() time.Time {
  226. srcTimeEndNow, err := pkg.ParseTime(o.EndTime)
  227. if err != nil {
  228. return time.Time{}
  229. }
  230. return srcTimeEndNow
  231. }
  232. type OneDialogueByStartTimeEx []OneDialogueEx
  233. func (d OneDialogueByStartTimeEx) Len() int {
  234. return len(d)
  235. }
  236. func (d OneDialogueByStartTimeEx) Swap(i, j int) {
  237. d[i], d[j] = d[j], d[i]
  238. }
  239. func (d OneDialogueByStartTimeEx) Less(i, j int) bool {
  240. subStartTimeI, err := pkg.ParseTime(d[i].StartTime)
  241. if err != nil {
  242. return false
  243. }
  244. subStartTimeJ, err := pkg.ParseTime(d[j].StartTime)
  245. if err != nil {
  246. return false
  247. }
  248. return pkg.Time2SecondNumber(subStartTimeI) < pkg.Time2SecondNumber(subStartTimeJ)
  249. }
  250. const (
  251. Sub_Ext_Mark_Default = ".default" // 指定这个字幕是默认的
  252. Sub_Ext_Mark_Forced = ".forced" // 指定这个字幕是强制的
  253. )