466 lines
11 KiB
Go
466 lines
11 KiB
Go
|
package ytdlp
|
||
|
|
||
|
import (
|
||
|
"bytes"
|
||
|
"context"
|
||
|
"encoding/json"
|
||
|
"fmt"
|
||
|
"os/exec"
|
||
|
"path"
|
||
|
"strings"
|
||
|
|
||
|
"github.com/royalcat/ctxprogress"
|
||
|
"golang.org/x/sync/errgroup"
|
||
|
)
|
||
|
|
||
|
// DownloadStatus is the state of a download as carried by the "status" field
// of a progress update.
type DownloadStatus string

// Known DownloadStatus values.
const (
	StatusDownloading = DownloadStatus("downloading")
	StatusFinished    = DownloadStatus("finished")
	StatusErrored     = DownloadStatus("error")
)
|
||
|
|
||
|
// Progress for the Running call
|
||
|
type DownloadProgress struct {
|
||
|
Status DownloadStatus `json:"status"`
|
||
|
Filename string `json:"filename"`
|
||
|
TmpFilename string `json:"tmpfilename"`
|
||
|
DownloadedBytes int64 `json:"downloaded_bytes"`
|
||
|
TotalBytes int64 `json:"total_bytes"`
|
||
|
TotalBytesEstimate float64 `json:"total_bytes_estimate"`
|
||
|
Elapsed float64 `json:"elapsed"`
|
||
|
ETA float64 `json:"eta"`
|
||
|
Speed float64 `json:"speed"`
|
||
|
FragmentIndex int64 `json:"fragment_index"`
|
||
|
FragmentCount int64 `json:"fragment_count"`
|
||
|
}
|
||
|
|
||
|
// Current implements ctxprogress.Progress.
|
||
|
func (d DownloadProgress) Progress() (int, int) {
|
||
|
if d.TotalBytes != -1 && d.TotalBytes != 0 && d.DownloadedBytes != -1 {
|
||
|
return int(d.DownloadedBytes), int(d.TotalBytes)
|
||
|
}
|
||
|
|
||
|
if d.TotalBytesEstimate != -1 && d.TotalBytesEstimate != 0 && d.DownloadedBytes != -1 {
|
||
|
return int(d.DownloadedBytes), int(d.TotalBytesEstimate)
|
||
|
}
|
||
|
|
||
|
return int(d.FragmentIndex), int(d.FragmentCount)
|
||
|
}
|
||
|
|
||
|
// rawProgressTemplate is the readable, multi-line form of the progress
// template handed to yt-dlp. It renders each progress update as a JSON object
// whose keys match the json tags of DownloadProgress. The "%" placed right
// before the object is the marker Download strips to recognise progress
// lines. Fields with a "|-1" (or "|0") suffix fall back to that value.
const rawProgressTemplate = `download:
	%{
		"status":"%(progress.status)s",
		"eta":%(progress.eta|-1)s,
		"speed":%(progress.speed|0)s,
		"downloaded_bytes":%(progress.downloaded_bytes|-1)s,
		"total_bytes": %(progress.total_bytes|-1)s,
		"total_bytes_estimate": %(progress.total_bytes_estimate|-1)s,
		"fragment_index":%(progress.fragment_index|-1)s,
		"fragment_count":%(progress.fragment_count|-1)s
	}`

// progressTemplate is rawProgressTemplate with every newline, tab and space
// removed, which is the form passed as the --progress-template argument.
var progressTemplate = func() string {
	stripWhitespace := strings.NewReplacer("\n", "", "\t", "", " ", "")
	return stripWhitespace.Replace(rawProgressTemplate)
}()
|
||
|
|
||
|
func (c *Client) Download(ctx context.Context, url string, dir string) error {
|
||
|
args := []string{
|
||
|
"--no-simulate", "-j",
|
||
|
"--progress", "--newline", "--progress-template", progressTemplate,
|
||
|
"-o", path.Join(dir, "%(title)s.%(ext)s"),
|
||
|
url,
|
||
|
}
|
||
|
|
||
|
group, ctx := errgroup.WithContext(ctx)
|
||
|
|
||
|
w, lines, err := lineReader(group)
|
||
|
if err != nil {
|
||
|
return err
|
||
|
}
|
||
|
var stderr bytes.Buffer
|
||
|
cmd := exec.CommandContext(ctx, c.binary, args...)
|
||
|
|
||
|
cmd.Stdout = w
|
||
|
cmd.Stderr = &stderr
|
||
|
|
||
|
group.Go(func() error {
|
||
|
err := cmd.Run()
|
||
|
defer w.Close()
|
||
|
if err != nil {
|
||
|
return err
|
||
|
}
|
||
|
return nil
|
||
|
})
|
||
|
|
||
|
for line := range lines {
|
||
|
if line, ok := strings.CutPrefix(line, "%"); ok {
|
||
|
p := DownloadProgress{}
|
||
|
err = json.Unmarshal([]byte(line), &p)
|
||
|
if err != nil {
|
||
|
//TODO: handle error
|
||
|
continue
|
||
|
}
|
||
|
|
||
|
ctxprogress.Set(ctx, p)
|
||
|
}
|
||
|
}
|
||
|
|
||
|
err = group.Wait()
|
||
|
if err != nil {
|
||
|
if _, ok := err.(*exec.ExitError); ok {
|
||
|
return fmt.Errorf("yt-dlp error: %s", stderr.Bytes())
|
||
|
}
|
||
|
return err
|
||
|
}
|
||
|
|
||
|
return nil
|
||
|
}
|
||
|
|
||
|
// // Used to deserialize the yt-dlp -J output
|
||
|
// type DownloadInfo struct {
|
||
|
// URL string `json:"url"`
|
||
|
// Title string `json:"title"`
|
||
|
// Thumbnail string `json:"thumbnail"`
|
||
|
// Resolution string `json:"resolution"`
|
||
|
// Size int32 `json:"filesize_approx"`
|
||
|
// VCodec string `json:"vcodec"`
|
||
|
// ACodec string `json:"acodec"`
|
||
|
// Extension string `json:"ext"`
|
||
|
// OriginalURL string `json:"original_url"`
|
||
|
// CreatedAt time.Time `json:"created_at"`
|
||
|
// }
|
||
|
|
||
|
// // Process descriptor
|
||
|
// type Process struct {
|
||
|
// Id string
|
||
|
// Url string
|
||
|
// Params []string
|
||
|
// OutputDir string
|
||
|
// Info DownloadInfo
|
||
|
// Progress DownloadProgress
|
||
|
// proc *os.Process
|
||
|
// Logger *slog.Logger
|
||
|
// }
|
||
|
|
||
|
// func NewProcess(dir string) (*Process, error) {
|
||
|
|
||
|
// }
|
||
|
|
||
|
// // Start spawns/forks a new yt-dlp process and parses its stdout.
|
||
|
// // The process is spawned to output a custom progress text that
|
||
|
// // Resembles a JSON Object in order to Unmarshal it later.
|
||
|
// // This approach is anyhow not perfect: quotes are not escaped properly.
|
||
|
// // Each process is not identified by its PID but by a UUIDv4
|
||
|
// func (p *Process) Start() {
|
||
|
// // escape bash variable escaping and command piping, you'll never know
|
||
|
// // what they might come with...
|
||
|
// p.Params = slices.DeleteFunc(p.Params, func(e string) bool {
|
||
|
// match, _ := regexp.MatchString(`(\$\{)|(\&\&)`, e)
|
||
|
// return match
|
||
|
// })
|
||
|
|
||
|
// p.Params = slices.DeleteFunc(p.Params, func(e string) bool {
|
||
|
// return e == ""
|
||
|
// })
|
||
|
|
||
|
// if p.Output.Path != "" {
|
||
|
// out.Path = p.Output.Path
|
||
|
// }
|
||
|
|
||
|
// if p.Output.Filename != "" {
|
||
|
// out.Filename = p.Output.Filename
|
||
|
// }
|
||
|
|
||
|
// buildFilename(&p.Output)
|
||
|
|
||
|
// go p.GetFileName(&out)
|
||
|
|
||
|
// params := []string{
|
||
|
// strings.Split(p.Url, "?list")[0], //no playlist
|
||
|
// "--newline",
|
||
|
// "--no-colors",
|
||
|
// "--no-playlist",
|
||
|
// "--progress-template",
|
||
|
// strings.NewReplacer("\n", "", "\t", "", " ", "").Replace(template),
|
||
|
// }
|
||
|
|
||
|
// // if user asked to manually override the output path...
|
||
|
// if !(slices.Contains(params, "-P") || slices.Contains(params, "--paths")) {
|
||
|
// params = append(params, "-o")
|
||
|
// params = append(params, fmt.Sprintf("%s/%s", out.Path, out.Filename))
|
||
|
// }
|
||
|
|
||
|
// params = append(params, p.Params...)
|
||
|
|
||
|
// // ----------------- main block ----------------- //
|
||
|
// cmd := exec.Command(config.Instance().DownloaderPath, params...)
|
||
|
// cmd.SysProcAttr = &syscall.SysProcAttr{Setpgid: true}
|
||
|
|
||
|
// r, err := cmd.StdoutPipe()
|
||
|
// if err != nil {
|
||
|
// p.Logger.Error(
|
||
|
// "failed to connect to stdout",
|
||
|
// slog.String("err", err.Error()),
|
||
|
// )
|
||
|
// panic(err)
|
||
|
// }
|
||
|
|
||
|
// err = cmd.Start()
|
||
|
// if err != nil {
|
||
|
// p.Logger.Error(
|
||
|
// "failed to start yt-dlp process",
|
||
|
// slog.String("err", err.Error()),
|
||
|
// )
|
||
|
// panic(err)
|
||
|
// }
|
||
|
|
||
|
// p.proc = cmd.Process
|
||
|
|
||
|
// // --------------- progress block --------------- //
|
||
|
// var (
|
||
|
// sourceChan = make(chan []byte)
|
||
|
// doneChan = make(chan struct{})
|
||
|
// )
|
||
|
|
||
|
// // spawn a goroutine that does the dirty job of parsing the stdout
|
||
|
// // filling the channel with as many stdout line as yt-dlp produces (producer)
|
||
|
// go func() {
|
||
|
// scan := bufio.NewScanner(r)
|
||
|
|
||
|
// defer func() {
|
||
|
// r.Close()
|
||
|
// p.Complete()
|
||
|
// doneChan <- struct{}{}
|
||
|
// close(sourceChan)
|
||
|
// close(doneChan)
|
||
|
// }()
|
||
|
|
||
|
// for scan.Scan() {
|
||
|
// sourceChan <- scan.Bytes()
|
||
|
// }
|
||
|
// }()
|
||
|
|
||
|
// // Slows down the unmarshal operation to every 500ms
|
||
|
// go func() {
|
||
|
// rx.Sample(time.Millisecond*500, sourceChan, doneChan, func(event []byte) {
|
||
|
// var progress ProgressTemplate
|
||
|
|
||
|
// if err := json.Unmarshal(event, &progress); err != nil {
|
||
|
// return
|
||
|
// }
|
||
|
|
||
|
// p.Progress = DownloadProgress{
|
||
|
// Status: StatusDownloading,
|
||
|
// Percentage: progress.Percentage,
|
||
|
// Speed: progress.Speed,
|
||
|
// ETA: progress.Eta,
|
||
|
// }
|
||
|
|
||
|
// p.Logger.Info("progress",
|
||
|
// slog.String("id", p.getShortId()),
|
||
|
// slog.String("url", p.Url),
|
||
|
// slog.String("percentage", progress.Percentage),
|
||
|
// )
|
||
|
// })
|
||
|
// }()
|
||
|
|
||
|
// // ------------- end progress block ------------- //
|
||
|
// cmd.Wait()
|
||
|
// }
|
||
|
|
||
|
// // Keep process in the memoryDB but marks it as complete
|
||
|
// // Convention: All completed processes have progress -1
|
||
|
// // and speed 0 bps.
|
||
|
// func (p *Process) Complete() {
|
||
|
// p.Progress = DownloadProgress{
|
||
|
// Status: StatusCompleted,
|
||
|
// Percentage: "-1",
|
||
|
// Speed: 0,
|
||
|
// ETA: 0,
|
||
|
// }
|
||
|
|
||
|
// p.Logger.Info("finished",
|
||
|
// slog.String("id", p.getShortId()),
|
||
|
// slog.String("url", p.Url),
|
||
|
// )
|
||
|
// }
|
||
|
|
||
|
// // Kill a process and remove it from the memory
|
||
|
// func (p *Process) Kill() error {
|
||
|
// // yt-dlp uses multiple child processes; the parent process
|
||
|
// // has been spawned with setPgid = true. To properly kill
|
||
|
// // all subprocesses a SIGTERM needs to be sent to the correct
|
||
|
// // process group
|
||
|
// if p.proc != nil {
|
||
|
// pgid, err := syscall.Getpgid(p.proc.Pid)
|
||
|
// if err != nil {
|
||
|
// return err
|
||
|
// }
|
||
|
// err = syscall.Kill(-pgid, syscall.SIGTERM)
|
||
|
|
||
|
// p.Logger.Info("killed process", slog.String("id", p.Id))
|
||
|
// return err
|
||
|
// }
|
||
|
|
||
|
// return nil
|
||
|
// }
|
||
|
|
||
|
// // Returns the available format for this URL
|
||
|
// func (p *Process) GetFormatsSync() (DownloadFormats, error) {
|
||
|
// cmd := exec.Command(config.Instance().DownloaderPath, p.Url, "-J")
|
||
|
|
||
|
// stdout, err := cmd.Output()
|
||
|
// if err != nil {
|
||
|
// p.Logger.Error(
|
||
|
// "failed to retrieve metadata",
|
||
|
// slog.String("err", err.Error()),
|
||
|
// )
|
||
|
// return DownloadFormats{}, err
|
||
|
// }
|
||
|
|
||
|
// info := DownloadFormats{URL: p.Url}
|
||
|
// best := Format{}
|
||
|
|
||
|
// var (
|
||
|
// wg sync.WaitGroup
|
||
|
// decodingError error
|
||
|
// )
|
||
|
|
||
|
// wg.Add(2)
|
||
|
|
||
|
// log.Println(
|
||
|
// cli.BgRed, "Metadata", cli.Reset,
|
||
|
// cli.BgBlue, "Formats", cli.Reset,
|
||
|
// p.Url,
|
||
|
// )
|
||
|
|
||
|
// p.Logger.Info(
|
||
|
// "retrieving metadata",
|
||
|
// slog.String("caller", "getFormats"),
|
||
|
// slog.String("url", p.Url),
|
||
|
// )
|
||
|
|
||
|
// go func() {
|
||
|
// decodingError = json.Unmarshal(stdout, &info)
|
||
|
// wg.Done()
|
||
|
// }()
|
||
|
|
||
|
// go func() {
|
||
|
// decodingError = json.Unmarshal(stdout, &best)
|
||
|
// wg.Done()
|
||
|
// }()
|
||
|
|
||
|
// wg.Wait()
|
||
|
|
||
|
// if decodingError != nil {
|
||
|
// return DownloadFormats{}, err
|
||
|
// }
|
||
|
|
||
|
// info.Best = best
|
||
|
|
||
|
// return info, nil
|
||
|
// }
|
||
|
|
||
|
// func (p *Process) GetFileName(o *DownloadOutput) error {
|
||
|
// cmd := exec.Command(
|
||
|
// config.Instance().DownloaderPath,
|
||
|
// "--print", "filename",
|
||
|
// "-o", fmt.Sprintf("%s/%s", o.Path, o.Filename),
|
||
|
// p.Url,
|
||
|
// )
|
||
|
// cmd.SysProcAttr = &syscall.SysProcAttr{Setpgid: true}
|
||
|
|
||
|
// out, err := cmd.Output()
|
||
|
// if err != nil {
|
||
|
// return err
|
||
|
// }
|
||
|
|
||
|
// p.Output.SavedFilePath = strings.Trim(string(out), "\n")
|
||
|
// return nil
|
||
|
// }
|
||
|
|
||
|
// func (p *Process) SetPending() {
|
||
|
// // Since video's title isn't available yet, fill in with the URL.
|
||
|
// p.Info = DownloadInfo{
|
||
|
// URL: p.Url,
|
||
|
// Title: p.Url,
|
||
|
// CreatedAt: time.Now(),
|
||
|
// }
|
||
|
// p.Progress.Status = StatusPending
|
||
|
// }
|
||
|
|
||
|
// func (p *Process) SetMetadata() error {
|
||
|
// cmd := exec.Command(config.Instance().DownloaderPath, p.Url, "-J")
|
||
|
// cmd.SysProcAttr = &syscall.SysProcAttr{Setpgid: true}
|
||
|
|
||
|
// stdout, err := cmd.StdoutPipe()
|
||
|
// if err != nil {
|
||
|
// p.Logger.Error("failed to connect to stdout",
|
||
|
// slog.String("id", p.getShortId()),
|
||
|
// slog.String("url", p.Url),
|
||
|
// slog.String("err", err.Error()),
|
||
|
// )
|
||
|
// return err
|
||
|
// }
|
||
|
|
||
|
// stderr, err := cmd.StderrPipe()
|
||
|
// if err != nil {
|
||
|
// p.Logger.Error("failed to connect to stderr",
|
||
|
// slog.String("id", p.getShortId()),
|
||
|
// slog.String("url", p.Url),
|
||
|
// slog.String("err", err.Error()),
|
||
|
// )
|
||
|
// return err
|
||
|
// }
|
||
|
|
||
|
// info := DownloadInfo{
|
||
|
// URL: p.Url,
|
||
|
// CreatedAt: time.Now(),
|
||
|
// }
|
||
|
|
||
|
// if err := cmd.Start(); err != nil {
|
||
|
// return err
|
||
|
// }
|
||
|
|
||
|
// var bufferedStderr bytes.Buffer
|
||
|
|
||
|
// go func() {
|
||
|
// io.Copy(&bufferedStderr, stderr)
|
||
|
// }()
|
||
|
|
||
|
// p.Logger.Info("retrieving metadata",
|
||
|
// slog.String("id", p.getShortId()),
|
||
|
// slog.String("url", p.Url),
|
||
|
// )
|
||
|
|
||
|
// if err := json.NewDecoder(stdout).Decode(&info); err != nil {
|
||
|
// return err
|
||
|
// }
|
||
|
|
||
|
// p.Info = info
|
||
|
// p.Progress.Status = StatusPending
|
||
|
|
||
|
// if err := cmd.Wait(); err != nil {
|
||
|
// return errors.New(bufferedStderr.String())
|
||
|
// }
|
||
|
|
||
|
// return nil
|
||
|
// }
|
||
|
|
||
|
// func (p *Process) getShortId() string {
|
||
|
// return strings.Split(p.Id, "-")[0]
|
||
|
// }
|
||
|
|
||
|
// func buildFilename(o *DownloadOutput) {
|
||
|
// if o.Filename != "" && strings.Contains(o.Filename, ".%(ext)s") {
|
||
|
// o.Filename += ".%(ext)s"
|
||
|
// }
|
||
|
|
||
|
// o.Filename = strings.Replace(
|
||
|
// o.Filename,
|
||
|
// ".%(ext)s.%(ext)s",
|
||
|
// ".%(ext)s",
|
||
|
// 1,
|
||
|
// )
|
||
|
// }
|