yt-dlp-telegram-bot/convert.go
2026-03-02 13:11:38 +08:00

300 lines
7.8 KiB
Go

package main
import (
"context"
"encoding/json"
"fmt"
"math/rand"
"net"
"os"
"path"
"path/filepath"
"regexp"
"strconv"
"strings"
"time"
ffmpeg_go "github.com/u2takey/ffmpeg-go"
"golang.org/x/exp/slices"
)
const probeTimeout = 10 * time.Second
const maxFFmpegProbeBytes = 20 * 1024 * 1024
var compatibleVideoCodecs = []string{"h264", "vp9", "hevc"}
var compatibleAudioCodecs = []string{"aac", "opus", "mp3"}
type ffmpegProbeDataStreamsStream struct {
CodecName string `json:"codec_name"`
CodecType string `json:"codec_type"`
Width int `json:"width"`
Height int `json:"height"`
}
type ffmpegProbeDataFormat struct {
FormatName string `json:"format_name"`
Duration string `json:"duration"`
}
type ffmpegProbeData struct {
Streams []ffmpegProbeDataStreamsStream `json:"streams"`
Format ffmpegProbeDataFormat `json:"format"`
}
type Converter struct {
Format string
VideoCodecs string
VideoConvertNeeded bool
SingleVideoStreamNeeded bool
VideoWidth int
VideoHeight int
AudioCodecs string
AudioConvertNeeded bool
SingleAudioStreamNeeded bool
Duration float64
UpdateProgressPercentCallback UpdateProgressPercentCallbackFunc
}
func (c *Converter) ProbeFile(filePath string) error {
fmt.Println(" probing file...")
i, err := ffmpeg_go.ProbeWithTimeout(filePath, probeTimeout, nil)
if err != nil {
return fmt.Errorf("error probing file: %w", err)
}
pd := ffmpegProbeData{}
err = json.Unmarshal([]byte(i), &pd)
if err != nil {
return fmt.Errorf("error decoding probe result: %w", err)
}
c.Duration, err = strconv.ParseFloat(pd.Format.Duration, 64)
if err != nil {
fmt.Println(" error parsing duration:", err)
}
compatibleVideoCodecsCopy := compatibleVideoCodecs
if c.Format == "mp3" {
compatibleVideoCodecsCopy = []string{}
}
compatibleAudioCodecsCopy := compatibleAudioCodecs
if c.Format == "mp3" {
compatibleAudioCodecsCopy = []string{"mp3"}
}
gotVideoStream := false
gotAudioStream := false
for _, stream := range pd.Streams {
if stream.CodecType == "video" && len(compatibleVideoCodecsCopy) > 0 {
if c.VideoCodecs != "" {
c.VideoCodecs += ", "
}
c.VideoCodecs += stream.CodecName
// Store video dimensions for aspect ratio preservation
if stream.Width > 0 && stream.Height > 0 {
c.VideoWidth = stream.Width
c.VideoHeight = stream.Height
}
if gotVideoStream {
fmt.Println(" got additional video stream")
c.SingleVideoStreamNeeded = true
} else if !c.VideoConvertNeeded {
if !slices.Contains(compatibleVideoCodecs, stream.CodecName) {
fmt.Println(" found incompatible video codec:", stream.CodecName)
c.VideoConvertNeeded = true
} else {
fmt.Println(" found video codec:", stream.CodecName)
}
gotVideoStream = true
}
} else if stream.CodecType == "audio" {
if c.AudioCodecs != "" {
c.AudioCodecs += ", "
}
c.AudioCodecs += stream.CodecName
if gotAudioStream {
fmt.Println(" got additional audio stream")
c.SingleAudioStreamNeeded = true
} else if !c.AudioConvertNeeded {
if !slices.Contains(compatibleAudioCodecsCopy, stream.CodecName) {
fmt.Println(" found not compatible audio codec:", stream.CodecName)
c.AudioConvertNeeded = true
} else {
fmt.Println(" found audio codec:", stream.CodecName)
}
gotAudioStream = true
}
}
}
if len(compatibleVideoCodecsCopy) > 0 && !gotVideoStream {
return fmt.Errorf("no video stream found in file")
}
return nil
}
func (c *Converter) ffmpegProgressSock() (sockFilename string, sock net.Listener, err error) {
sockFilename = path.Join(os.TempDir(), fmt.Sprintf("yt-dlp-telegram-bot-%d.sock", rand.Int()))
sock, err = net.Listen("unix", sockFilename)
if err != nil {
fmt.Println(" ffmpeg progress socket create error:", err)
return
}
go func() {
re := regexp.MustCompile(`out_time_ms=(\d+)\n`)
fd, err := sock.Accept()
if err != nil {
fmt.Println(" ffmpeg progress socket accept error:", err)
return
}
defer fd.Close()
buf := make([]byte, 64)
data := ""
for {
_, err := fd.Read(buf)
if err != nil {
return
}
data += string(buf)
a := re.FindAllStringSubmatch(data, -1)
if len(a) > 0 && len(a[len(a)-1]) > 0 {
data = ""
l, _ := strconv.Atoi(a[len(a)-1][len(a[len(a)-1])-1])
c.UpdateProgressPercentCallback(processStr, int(100*float64(l)/c.Duration/1000000))
}
if strings.Contains(data, "progress=end") {
c.UpdateProgressPercentCallback(processStr, 100)
}
}
}()
return
}
func (c *Converter) GetActionsNeeded() string {
var convertNeeded []string
if c.VideoConvertNeeded || c.SingleVideoStreamNeeded {
convertNeeded = append(convertNeeded, "video")
}
if c.AudioConvertNeeded || c.SingleAudioStreamNeeded {
convertNeeded = append(convertNeeded, "audio")
}
return strings.Join(convertNeeded, ", ")
}
func (c *Converter) ConvertIfNeeded(ctx context.Context, inputPath, outputDir string) (outputPath string, outputFormat string, err error) {
fmt.Print(" converting ", c.GetActionsNeeded(), "...\n")
videoNeeded := true
outputFormat = "mp4"
if c.Format == "mp3" {
videoNeeded = false
outputFormat = "mp3"
}
// Determine output path
ext := filepath.Ext(inputPath)
base := strings.TrimSuffix(filepath.Base(inputPath), ext)
outputPath = filepath.Join(outputDir, base+"_converted."+outputFormat)
// Check if conversion is needed
if !c.VideoConvertNeeded && !c.AudioConvertNeeded && !c.SingleVideoStreamNeeded && !c.SingleAudioStreamNeeded {
if outputFormat == "mp4" && ext == ".mkv" {
// Just remux from mkv to mp4, no encoding needed
fmt.Println(" remuxing mkv to mp4...")
} else {
fmt.Println(" no conversion needed, using original file")
return inputPath, outputFormat, nil
}
}
args := ffmpeg_go.KwArgs{
"format": outputFormat,
}
if videoNeeded {
args = ffmpeg_go.MergeKwArgs([]ffmpeg_go.KwArgs{args, {"movflags": "frag_keyframe+empty_moov+faststart"}})
if c.VideoConvertNeeded {
args = ffmpeg_go.MergeKwArgs([]ffmpeg_go.KwArgs{args, {"c:v": "libx264", "crf": 30, "preset": "veryfast"}})
} else {
args = ffmpeg_go.MergeKwArgs([]ffmpeg_go.KwArgs{args, {"c:v": "copy"}})
}
} else {
args = ffmpeg_go.MergeKwArgs([]ffmpeg_go.KwArgs{args, {"vn": ""}})
}
if c.AudioConvertNeeded {
if c.Format == "mp3" {
args = ffmpeg_go.MergeKwArgs([]ffmpeg_go.KwArgs{args, {"c:a": "mp3", "b:a": "320k"}})
} else {
args = ffmpeg_go.MergeKwArgs([]ffmpeg_go.KwArgs{args, {"c:a": "mp3", "q:a": 0}})
}
} else {
args = ffmpeg_go.MergeKwArgs([]ffmpeg_go.KwArgs{args, {"c:a": "copy"}})
}
if videoNeeded {
if c.SingleVideoStreamNeeded || c.SingleAudioStreamNeeded {
args = ffmpeg_go.MergeKwArgs([]ffmpeg_go.KwArgs{args, {"map": "0:v:0,0:a:0"}})
}
} else {
if c.SingleAudioStreamNeeded {
args = ffmpeg_go.MergeKwArgs([]ffmpeg_go.KwArgs{args, {"map": "0:a:0"}})
}
}
ff := ffmpeg_go.Input(inputPath).Output(outputPath, args)
var progressSock net.Listener
if c.UpdateProgressPercentCallback != nil {
if c.Duration > 0 {
var progressSockFilename string
progressSockFilename, progressSock, err = c.ffmpegProgressSock()
if err == nil {
ff = ff.GlobalArgs("-progress", "unix:"+progressSockFilename)
}
} else {
c.UpdateProgressPercentCallback(processStr, -1)
}
}
// Run ffmpeg
cmd := ff.Compile()
// Creating a new cmd with a timeout context
cmdCtx := NewCommand(ctx, cmd.Args[0], cmd.Args[1:]...)
if err := cmdCtx.Run(); err != nil {
if progressSock != nil {
progressSock.Close()
}
return "", "", fmt.Errorf("error converting: %w", err)
}
if progressSock != nil {
progressSock.Close()
}
return outputPath, outputFormat, nil
}
func (c *Converter) NeedConvert() bool {
return c.VideoConvertNeeded || c.AudioConvertNeeded || c.SingleVideoStreamNeeded || c.SingleAudioStreamNeeded
}