mirror of
https://github.com/navidrome/navidrome.git
synced 2025-04-03 20:47:35 +03:00
* draft commit * time to fight pipeline * round 2 changes * remove unnecessary line * fight taglib. again * make taglib work again??? * add id3 tags * taglib 1.12 vs 1.13 * use int instead for windows * store as json now * add migration, more tests * support repeated line, multiline * fix ms and support .m, .mm, .mmm * address some concerns, make cpp a bit safer * separate responses from model * remove [:] * Add trace log * Try to unblock pipeline * Fix merge errors * Fix SIGSEGV error (proper handling of empty frames) * Add fallback artist/title to structured lyrics * Rename conflicting named vars * Fix tests * Do we still need ffmpeg in the pipeline? * Revert "Do we still need ffmpeg in the pipeline?" Yes we do. This reverts commit87df7f6df7
. * Does this passes now, with a newer ffmpeg version? * Revert "Does this passes now, with a newer ffmpeg version?" No, it does not :( This reverts commit372eb4b0ae
. * My OCD made me do it :P --------- Co-authored-by: Deluan Quintão <deluan@navidrome.org>
201 lines
4.7 KiB
Go
201 lines
4.7 KiB
Go
package model
|
|
|
|
import (
|
|
"regexp"
|
|
"strconv"
|
|
"strings"
|
|
|
|
"github.com/navidrome/navidrome/log"
|
|
"github.com/navidrome/navidrome/utils"
|
|
)
|
|
|
|
type Line struct {
|
|
Start *int64 `structs:"start,omitempty" json:"start,omitempty"`
|
|
Value string `structs:"value" json:"value"`
|
|
}
|
|
|
|
type Lyrics struct {
|
|
DisplayArtist string `structs:"displayArtist,omitempty" json:"displayArtist,omitempty"`
|
|
DisplayTitle string `structs:"displayTitle,omitempty" json:"displayTitle,omitempty"`
|
|
Lang string `structs:"lang" json:"lang"`
|
|
Line []Line `structs:"line" json:"line"`
|
|
Offset *int64 `structs:"offset,omitempty" json:"offset,omitempty"`
|
|
Synced bool `structs:"synced" json:"synced"`
|
|
}
|
|
|
|
// support the standard [mm:ss.mm], as well as [hh:*] and [*.mmm]
|
|
const timeRegexString = `\[([0-9]{1,2}:)?([0-9]{1,2}):([0-9]{1,2})(.[0-9]{1,3})?\]`
|
|
|
|
var (
|
|
// Should either be at the beginning of file, or beginning of line
|
|
syncRegex = regexp.MustCompile(`(^|\n)\s*` + timeRegexString)
|
|
timeRegex = regexp.MustCompile(timeRegexString)
|
|
lrcIdRegex = regexp.MustCompile(`\[(ar|ti|offset):([^]]+)]`)
|
|
)
|
|
|
|
func ToLyrics(language, text string) (*Lyrics, error) {
|
|
text = utils.SanitizeText(text)
|
|
|
|
lines := strings.Split(text, "\n")
|
|
|
|
artist := ""
|
|
title := ""
|
|
var offset *int64 = nil
|
|
structuredLines := []Line{}
|
|
|
|
synced := syncRegex.MatchString(text)
|
|
priorLine := ""
|
|
validLine := false
|
|
var timestamps []int64
|
|
|
|
for _, line := range lines {
|
|
line := strings.TrimSpace(line)
|
|
if line == "" {
|
|
if validLine {
|
|
priorLine += "\n"
|
|
}
|
|
continue
|
|
}
|
|
var text string
|
|
var time *int64 = nil
|
|
|
|
if synced {
|
|
idTag := lrcIdRegex.FindStringSubmatch(line)
|
|
if idTag != nil {
|
|
switch idTag[1] {
|
|
case "ar":
|
|
artist = utils.SanitizeText(strings.TrimSpace(idTag[2]))
|
|
case "offset":
|
|
{
|
|
off, err := strconv.ParseInt(strings.TrimSpace(idTag[2]), 10, 64)
|
|
if err != nil {
|
|
log.Warn("Error parsing offset", "offset", idTag[2], "error", err)
|
|
} else {
|
|
offset = &off
|
|
}
|
|
}
|
|
case "ti":
|
|
title = utils.SanitizeText(strings.TrimSpace(idTag[2]))
|
|
}
|
|
|
|
continue
|
|
}
|
|
|
|
times := timeRegex.FindAllStringSubmatchIndex(line, -1)
|
|
// The second condition is for when there is a timestamp in the middle of
|
|
// a line (after any text)
|
|
if times == nil || times[0][0] != 0 {
|
|
if validLine {
|
|
priorLine += "\n" + line
|
|
}
|
|
continue
|
|
}
|
|
|
|
if validLine {
|
|
for idx := range timestamps {
|
|
structuredLines = append(structuredLines, Line{
|
|
Start: ×tamps[idx],
|
|
Value: strings.TrimSpace(priorLine),
|
|
})
|
|
}
|
|
timestamps = []int64{}
|
|
}
|
|
|
|
end := 0
|
|
|
|
// [fullStart, fullEnd, hourStart, hourEnd, minStart, minEnd, secStart, secEnd, msStart, msEnd]
|
|
for _, match := range times {
|
|
var hours, millis int64
|
|
var err error
|
|
|
|
// for multiple matches, we need to check that later matches are not
|
|
// in the middle of the string
|
|
if end != 0 {
|
|
middle := strings.TrimSpace(line[end:match[0]])
|
|
if middle != "" {
|
|
break
|
|
}
|
|
}
|
|
|
|
end = match[1]
|
|
|
|
hourStart := match[2]
|
|
if hourStart != -1 {
|
|
// subtract 1 because group has : at the end
|
|
hourEnd := match[3] - 1
|
|
hours, err = strconv.ParseInt(line[hourStart:hourEnd], 10, 64)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
}
|
|
|
|
minutes, err := strconv.ParseInt(line[match[4]:match[5]], 10, 64)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
sec, err := strconv.ParseInt(line[match[6]:match[7]], 10, 64)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
msStart := match[8]
|
|
if msStart != -1 {
|
|
msEnd := match[9]
|
|
// +1 offset since this capture group contains .
|
|
millis, err = strconv.ParseInt(line[msStart+1:msEnd], 10, 64)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
length := msEnd - msStart
|
|
|
|
if length == 3 {
|
|
millis *= 10
|
|
} else if length == 2 {
|
|
millis *= 100
|
|
}
|
|
}
|
|
|
|
timeInMillis := (((((hours * 60) + minutes) * 60) + sec) * 1000) + millis
|
|
timestamps = append(timestamps, timeInMillis)
|
|
}
|
|
|
|
if end >= len(line) {
|
|
priorLine = ""
|
|
} else {
|
|
priorLine = strings.TrimSpace(line[end:])
|
|
}
|
|
|
|
validLine = true
|
|
} else {
|
|
text = line
|
|
structuredLines = append(structuredLines, Line{
|
|
Start: time,
|
|
Value: text,
|
|
})
|
|
}
|
|
}
|
|
|
|
if validLine {
|
|
for idx := range timestamps {
|
|
structuredLines = append(structuredLines, Line{
|
|
Start: ×tamps[idx],
|
|
Value: strings.TrimSpace(priorLine),
|
|
})
|
|
}
|
|
}
|
|
|
|
lyrics := Lyrics{
|
|
DisplayArtist: artist,
|
|
DisplayTitle: title,
|
|
Lang: language,
|
|
Line: structuredLines,
|
|
Offset: offset,
|
|
Synced: synced,
|
|
}
|
|
|
|
return &lyrics, nil
|
|
}
|
|
|
|
type LyricList []Lyrics
|