539 lines
14 KiB
Go
539 lines
14 KiB
Go
package podcasts
|
|
|
|
import (
|
|
"errors"
|
|
"fmt"
|
|
"io"
|
|
"log"
|
|
"net/http"
|
|
"net/url"
|
|
"os"
|
|
"path"
|
|
"path/filepath"
|
|
"strconv"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/jinzhu/gorm"
|
|
"github.com/mmcdole/gofeed"
|
|
|
|
"go.senan.xyz/gonic/db"
|
|
"go.senan.xyz/gonic/fileutil"
|
|
"go.senan.xyz/gonic/mime"
|
|
"go.senan.xyz/gonic/scanner/tags"
|
|
)
|
|
|
|
// ErrNoAudioInFeedItem is returned by AddEpisode when a feed item has neither
// an audio enclosure nor audio media content.
var ErrNoAudioInFeedItem = errors.New("no audio in feed item")
|
|
|
|
// downloadAllWaitInterval is how long DownloadPodcastAll pauses after starting
// one episode download before moving on to the next.
const downloadAllWaitInterval = 3 * time.Second

// fetchUserAgent is the User-Agent header sent when fetching episode audio and
// podcast cover images.
const fetchUserAgent = `Mozilla/5.0 (Macintosh; Intel Mac OS X 10_7_5) AppleWebKit/537.11 (KHTML, like Gecko) Chrome/23.0.1271.64 Safari/537.11`
|
|
|
|
type Podcasts struct {
|
|
db *db.DB
|
|
baseDir string
|
|
tagger tags.Reader
|
|
}
|
|
|
|
func New(db *db.DB, base string, tagger tags.Reader) *Podcasts {
|
|
return &Podcasts{
|
|
db: db,
|
|
baseDir: base,
|
|
tagger: tagger,
|
|
}
|
|
}
|
|
|
|
func (p *Podcasts) GetPodcastOrAll(id int, includeEpisodes bool) ([]*db.Podcast, error) {
|
|
var err error
|
|
podcasts := []*db.Podcast{}
|
|
if id != 0 {
|
|
err = p.db.Where("id=?", id).Find(&podcasts).Error
|
|
} else {
|
|
err = p.db.Find(&podcasts).Error
|
|
}
|
|
if err != nil {
|
|
return nil, fmt.Errorf("finding podcasts: %w", err)
|
|
}
|
|
if !includeEpisodes {
|
|
return podcasts, nil
|
|
}
|
|
for _, c := range podcasts {
|
|
episodes, err := p.GetPodcastEpisodes(c.ID)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("finding podcast episodes: %w", err)
|
|
}
|
|
c.Episodes = episodes
|
|
}
|
|
return podcasts, nil
|
|
}
|
|
|
|
func (p *Podcasts) GetPodcastEpisodes(podcastID int) ([]*db.PodcastEpisode, error) {
|
|
episodes := []*db.PodcastEpisode{}
|
|
err := p.db.
|
|
Where("podcast_id=?", podcastID).
|
|
Order("publish_date DESC").
|
|
Find(&episodes).
|
|
Error
|
|
if err != nil {
|
|
return nil, fmt.Errorf("find episodes by podcast id: %w", err)
|
|
}
|
|
return episodes, nil
|
|
}
|
|
|
|
func (p *Podcasts) GetNewestPodcastEpisodes(count int) ([]*db.PodcastEpisode, error) {
|
|
episodes := []*db.PodcastEpisode{}
|
|
err := p.db.
|
|
Order("publish_date DESC").
|
|
Limit(count).
|
|
Find(&episodes).
|
|
Error
|
|
if err != nil {
|
|
return nil, fmt.Errorf("find newest podcast episodes: %w", err)
|
|
}
|
|
return episodes, nil
|
|
}
|
|
|
|
func (p *Podcasts) AddNewPodcast(rssURL string, feed *gofeed.Feed) (*db.Podcast, error) {
|
|
rootDir, err := fileutil.Unique(filepath.Join(p.baseDir, fileutil.Safe(feed.Title)), "")
|
|
if err != nil {
|
|
return nil, fmt.Errorf("find unique podcast dir: %w", err)
|
|
}
|
|
podcast := db.Podcast{
|
|
Description: feed.Description,
|
|
ImageURL: feed.Image.URL,
|
|
Title: feed.Title,
|
|
URL: rssURL,
|
|
RootDir: rootDir,
|
|
}
|
|
if err := os.Mkdir(podcast.RootDir, 0o755); err != nil && !os.IsExist(err) {
|
|
return nil, err
|
|
}
|
|
if err := p.db.Save(&podcast).Error; err != nil {
|
|
return &podcast, err
|
|
}
|
|
if err := p.AddNewEpisodes(&podcast, feed.Items); err != nil {
|
|
return nil, err
|
|
}
|
|
go func() {
|
|
if err := p.downloadPodcastCover(&podcast); err != nil {
|
|
log.Printf("error downloading podcast cover: %v", err)
|
|
}
|
|
}()
|
|
return &podcast, nil
|
|
}
|
|
|
|
func (p *Podcasts) SetAutoDownload(podcastID int, setting db.PodcastAutoDownload) error {
|
|
podcast := db.Podcast{}
|
|
err := p.db.
|
|
Where("id=?", podcastID).
|
|
First(&podcast).
|
|
Error
|
|
if err != nil {
|
|
return err
|
|
}
|
|
podcast.AutoDownload = setting
|
|
if err := p.db.Save(&podcast).Error; err != nil {
|
|
return fmt.Errorf("save setting: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func getEntriesAfterDate(feed []*gofeed.Item, after time.Time) []*gofeed.Item {
|
|
items := []*gofeed.Item{}
|
|
for _, item := range feed {
|
|
if item.PublishedParsed.Before(after) || item.PublishedParsed.Equal(after) {
|
|
continue
|
|
}
|
|
items = append(items, item)
|
|
}
|
|
return items
|
|
}
|
|
|
|
func (p *Podcasts) AddNewEpisodes(podcast *db.Podcast, items []*gofeed.Item) error {
|
|
podcastEpisode := db.PodcastEpisode{}
|
|
err := p.db.
|
|
Where("podcast_id=?", podcast.ID).
|
|
Order("publish_date DESC").
|
|
First(&podcastEpisode).Error
|
|
itemFound := true
|
|
if errors.Is(err, gorm.ErrRecordNotFound) {
|
|
itemFound = false
|
|
} else if err != nil {
|
|
return err
|
|
}
|
|
if !itemFound {
|
|
for _, item := range items {
|
|
if _, err := p.AddEpisode(podcast.ID, item); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
for _, item := range getEntriesAfterDate(items, *podcastEpisode.PublishDate) {
|
|
episode, err := p.AddEpisode(podcast.ID, item)
|
|
if errors.Is(err, ErrNoAudioInFeedItem) {
|
|
log.Printf("failed to find audio in feed (%s, %s) item, skipping", podcast.Title, item.Title)
|
|
continue
|
|
}
|
|
if err != nil {
|
|
return err
|
|
}
|
|
if podcast.AutoDownload == db.PodcastAutoDownloadLatest &&
|
|
(episode.Status != db.PodcastEpisodeStatusCompleted && episode.Status != db.PodcastEpisodeStatusDownloading) {
|
|
if err := p.DownloadEpisode(episode.ID); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// getSecondsFromString converts a feed duration string to whole seconds.
//
// Accepted forms are a plain integer number of seconds ("90"), "MM:SS" and
// "HH:MM:SS". Whitespace around the value and around each component is
// ignored. Any other shape yields 0.
//
// Parsing of the colon-separated forms is best-effort: a component that is
// not a valid integer counts as 0 rather than invalidating the whole value.
func getSecondsFromString(time string) int {
	time = strings.TrimSpace(time)
	if duration, err := strconv.Atoi(time); err == nil {
		return duration
	}

	parts := strings.Split(time, ":")
	if len(parts) != 2 && len(parts) != 3 {
		return 0
	}

	// Fold left to right in base 60: ((h*60)+m)*60+s.
	total := 0
	for _, part := range parts {
		value, err := strconv.Atoi(strings.TrimSpace(part))
		if err != nil {
			// Atoi returns a saturated value on range errors; make sure a
			// bad component contributes nothing at all.
			value = 0
		}
		total = total*60 + value
	}
	return total
}
|
|
|
|
func (p *Podcasts) AddEpisode(podcastID int, item *gofeed.Item) (*db.PodcastEpisode, error) {
|
|
duration := 0
|
|
// if it has the media extension use it
|
|
for _, content := range item.Extensions["media"]["content"] {
|
|
durationExt := content.Attrs["duration"]
|
|
duration = getSecondsFromString(durationExt)
|
|
if duration != 0 {
|
|
break
|
|
}
|
|
}
|
|
// if the itunes extension is available, use AddEpisode
|
|
if duration == 0 && item.ITunesExt != nil {
|
|
duration = getSecondsFromString(item.ITunesExt.Duration)
|
|
}
|
|
|
|
if episode, ok := p.findEnclosureAudio(podcastID, duration, item); ok {
|
|
if err := p.db.Save(episode).Error; err != nil {
|
|
return nil, err
|
|
}
|
|
return episode, nil
|
|
}
|
|
if episode, ok := p.findMediaAudio(podcastID, duration, item); ok {
|
|
if err := p.db.Save(episode).Error; err != nil {
|
|
return nil, err
|
|
}
|
|
return episode, nil
|
|
}
|
|
return nil, ErrNoAudioInFeedItem
|
|
}
|
|
|
|
func isAudio(rawItemURL string) (bool, error) {
|
|
itemURL, err := url.Parse(rawItemURL)
|
|
if err != nil {
|
|
return false, err
|
|
}
|
|
|
|
return mime.TypeByAudioExtension(path.Ext(itemURL.Path)) != "", nil
|
|
}
|
|
|
|
func itemToEpisode(podcastID, size, duration int, audio string,
|
|
item *gofeed.Item,
|
|
) *db.PodcastEpisode {
|
|
return &db.PodcastEpisode{
|
|
PodcastID: podcastID,
|
|
Description: item.Description,
|
|
Title: item.Title,
|
|
Length: duration,
|
|
Size: size,
|
|
PublishDate: item.PublishedParsed,
|
|
AudioURL: audio,
|
|
Status: db.PodcastEpisodeStatusSkipped,
|
|
}
|
|
}
|
|
|
|
func (p *Podcasts) findEnclosureAudio(podcastID, duration int, item *gofeed.Item) (*db.PodcastEpisode, bool) {
|
|
for _, enc := range item.Enclosures {
|
|
if t, err := isAudio(enc.URL); !t || err != nil {
|
|
continue
|
|
}
|
|
size, _ := strconv.Atoi(enc.Length)
|
|
return itemToEpisode(podcastID, size, duration, enc.URL, item), true
|
|
}
|
|
return nil, false
|
|
}
|
|
|
|
func (p *Podcasts) findMediaAudio(podcastID, duration int, item *gofeed.Item) (*db.PodcastEpisode, bool) {
|
|
extensions, ok := item.Extensions["media"]["content"]
|
|
if !ok {
|
|
return nil, false
|
|
}
|
|
for _, ext := range extensions {
|
|
if t, err := isAudio(ext.Attrs["url"]); !t || err != nil {
|
|
continue
|
|
}
|
|
return itemToEpisode(podcastID, 0, duration, ext.Attrs["url"], item), true
|
|
}
|
|
return nil, false
|
|
}
|
|
|
|
func (p *Podcasts) RefreshPodcasts() error {
|
|
podcasts := []*db.Podcast{}
|
|
if err := p.db.Find(&podcasts).Error; err != nil {
|
|
return fmt.Errorf("find podcasts: %w", err)
|
|
}
|
|
if err := p.refreshPodcasts(podcasts); err != nil {
|
|
return fmt.Errorf("refresh podcasts: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (p *Podcasts) refreshPodcasts(podcasts []*db.Podcast) error {
|
|
var errs []error
|
|
for _, podcast := range podcasts {
|
|
fp := gofeed.NewParser()
|
|
feed, err := fp.ParseURL(podcast.URL)
|
|
if err != nil {
|
|
errs = append(errs, fmt.Errorf("refreshing podcast with url %q: %w", podcast.URL, err))
|
|
continue
|
|
}
|
|
if err = p.AddNewEpisodes(podcast, feed.Items); err != nil {
|
|
errs = append(errs, fmt.Errorf("adding episodes: %w", err))
|
|
continue
|
|
}
|
|
}
|
|
return errors.Join(errs...)
|
|
}
|
|
|
|
func (p *Podcasts) DownloadPodcastAll(podcastID int) error {
|
|
podcastEpisodes := []db.PodcastEpisode{}
|
|
err := p.db.
|
|
Where("podcast_id=?", podcastID).
|
|
Find(&podcastEpisodes).
|
|
Error
|
|
if err != nil {
|
|
return fmt.Errorf("get episodes by podcast id: %w", err)
|
|
}
|
|
go func() {
|
|
for _, episode := range podcastEpisodes {
|
|
if episode.Status == db.PodcastEpisodeStatusDownloading || episode.Status == db.PodcastEpisodeStatusCompleted {
|
|
log.Println("skipping episode is in progress or already downloaded")
|
|
continue
|
|
}
|
|
if err := p.DownloadEpisode(episode.ID); err != nil {
|
|
log.Printf("error downloading episode: %v", err)
|
|
continue
|
|
}
|
|
log.Printf("finished downloading episode: %q", episode.Title)
|
|
time.Sleep(downloadAllWaitInterval)
|
|
}
|
|
}()
|
|
return nil
|
|
}
|
|
|
|
func (p *Podcasts) DownloadEpisode(episodeID int) error {
|
|
podcastEpisode := db.PodcastEpisode{}
|
|
podcast := db.Podcast{}
|
|
err := p.db.
|
|
Preload("Podcast").
|
|
Where("id=?", episodeID).
|
|
First(&podcastEpisode).
|
|
Error
|
|
if err != nil {
|
|
return fmt.Errorf("get podcast episode by id: %w", err)
|
|
}
|
|
err = p.db.
|
|
Where("id=?", podcastEpisode.PodcastID).
|
|
First(&podcast).
|
|
Error
|
|
if err != nil {
|
|
return fmt.Errorf("get podcast by id: %w", err)
|
|
}
|
|
if podcastEpisode.Status == db.PodcastEpisodeStatusDownloading || podcastEpisode.Status == db.PodcastEpisodeStatusCompleted {
|
|
log.Printf("already downloading podcast episode with id %d", episodeID)
|
|
return nil
|
|
}
|
|
podcastEpisode.Status = db.PodcastEpisodeStatusDownloading
|
|
p.db.Save(&podcastEpisode)
|
|
client := &http.Client{}
|
|
req, err := http.NewRequest("GET", podcastEpisode.AudioURL, nil)
|
|
if err != nil {
|
|
return fmt.Errorf("create http request: %w", err)
|
|
}
|
|
req.Header.Add("User-Agent", fetchUserAgent)
|
|
// nolint: bodyclose
|
|
resp, err := client.Do(req)
|
|
if err != nil {
|
|
return fmt.Errorf("fetch podcast audio: %w", err)
|
|
}
|
|
filename, ok := getContentDispositionFilename(resp.Header.Get("content-disposition"))
|
|
if !ok {
|
|
audioURL, err := url.Parse(podcastEpisode.AudioURL)
|
|
if err != nil {
|
|
return fmt.Errorf("parse podcast audio url: %w", err)
|
|
}
|
|
filename = path.Base(audioURL.Path)
|
|
}
|
|
path, err := fileutil.Unique(podcast.RootDir, fileutil.Safe(filename))
|
|
if err != nil {
|
|
return fmt.Errorf("find unique path: %w", err)
|
|
}
|
|
_, filename = filepath.Split(path)
|
|
audioFile, err := os.Create(filepath.Join(podcast.RootDir, filename))
|
|
if err != nil {
|
|
return fmt.Errorf("create audio file: %w", err)
|
|
}
|
|
podcastEpisode.Filename = filename
|
|
p.db.Save(&podcastEpisode)
|
|
go func() {
|
|
if err := p.doPodcastDownload(&podcastEpisode, audioFile, resp.Body); err != nil {
|
|
log.Printf("error downloading podcast: %v", err)
|
|
}
|
|
}()
|
|
return nil
|
|
}
|
|
|
|
// getContentDispositionFilename extracts the "filename" parameter from a
// Content-Disposition header value. The second result is false when the
// header cannot be parsed or carries no such parameter.
func getContentDispositionFilename(header string) (string, bool) {
	// A parse failure leaves params nil, and looking up a key in a nil map
	// simply reports "not found", so the error itself is not needed.
	_, params, _ := mime.ParseMediaType(header)
	if name, found := params["filename"]; found {
		return name, true
	}
	return "", false
}
|
|
|
|
func (p *Podcasts) downloadPodcastCover(podcast *db.Podcast) error {
|
|
imageURL, err := url.Parse(podcast.ImageURL)
|
|
if err != nil {
|
|
return fmt.Errorf("parse image url: %w", err)
|
|
}
|
|
ext := path.Ext(imageURL.Path)
|
|
client := &http.Client{}
|
|
req, err := http.NewRequest("GET", podcast.ImageURL, nil)
|
|
if err != nil {
|
|
return fmt.Errorf("create http request: %w", err)
|
|
}
|
|
req.Header.Add("User-Agent", fetchUserAgent)
|
|
// nolint: bodyclose
|
|
resp, err := client.Do(req)
|
|
if err != nil {
|
|
return fmt.Errorf("fetch image url: %w", err)
|
|
}
|
|
if ext == "" {
|
|
contentHeader := resp.Header.Get("content-disposition")
|
|
filename, _ := getContentDispositionFilename(contentHeader)
|
|
ext = filepath.Ext(filename)
|
|
}
|
|
cover := "cover" + ext
|
|
coverFile, err := os.Create(filepath.Join(podcast.RootDir, cover))
|
|
if err != nil {
|
|
return fmt.Errorf("creating podcast cover: %w", err)
|
|
}
|
|
defer coverFile.Close()
|
|
if _, err := io.Copy(coverFile, resp.Body); err != nil {
|
|
return fmt.Errorf("writing podcast cover: %w", err)
|
|
}
|
|
podcast.Image = fmt.Sprintf("cover%s", ext)
|
|
if err := p.db.Save(podcast).Error; err != nil {
|
|
return fmt.Errorf("save podcast: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (p *Podcasts) doPodcastDownload(podcastEpisode *db.PodcastEpisode, file *os.File, src io.Reader) error {
|
|
if _, err := io.Copy(file, src); err != nil {
|
|
return fmt.Errorf("writing podcast episode: %w", err)
|
|
}
|
|
defer file.Close()
|
|
stat, _ := file.Stat()
|
|
podcastTags, err := p.tagger.Read(podcastEpisode.AbsPath())
|
|
if err != nil {
|
|
log.Printf("error parsing podcast audio: %e", err)
|
|
podcastEpisode.Status = db.PodcastEpisodeStatusError
|
|
p.db.Save(podcastEpisode)
|
|
return nil
|
|
}
|
|
podcastEpisode.Bitrate = podcastTags.Bitrate()
|
|
podcastEpisode.Status = db.PodcastEpisodeStatusCompleted
|
|
podcastEpisode.Length = podcastTags.Length()
|
|
podcastEpisode.Size = int(stat.Size())
|
|
return p.db.Save(podcastEpisode).Error
|
|
}
|
|
|
|
func (p *Podcasts) DeletePodcast(podcastID int) error {
|
|
podcast := db.Podcast{}
|
|
err := p.db.
|
|
Where("id=?", podcastID).
|
|
First(&podcast).
|
|
Error
|
|
if err != nil {
|
|
return err
|
|
}
|
|
if podcast.RootDir == "" {
|
|
return fmt.Errorf("podcast has no root dir")
|
|
}
|
|
|
|
if err := os.RemoveAll(podcast.RootDir); err != nil {
|
|
return fmt.Errorf("delete podcast directory: %w", err)
|
|
}
|
|
err = p.db.
|
|
Where("id=?", podcastID).
|
|
Delete(db.Podcast{}).
|
|
Error
|
|
if err != nil {
|
|
return fmt.Errorf("delete podcast row: %w", err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (p *Podcasts) DeletePodcastEpisode(podcastEpisodeID int) error {
|
|
episode := db.PodcastEpisode{}
|
|
err := p.db.Preload("Podcast").First(&episode, podcastEpisodeID).Error
|
|
if err != nil {
|
|
return err
|
|
}
|
|
episode.Status = db.PodcastEpisodeStatusDeleted
|
|
p.db.Save(&episode)
|
|
if err := os.Remove(episode.AbsPath()); err != nil {
|
|
return err
|
|
}
|
|
return err
|
|
}
|
|
|
|
func (p *Podcasts) PurgeOldPodcasts(maxAge time.Duration) error {
|
|
expDate := time.Now().Add(-maxAge)
|
|
var episodes []*db.PodcastEpisode
|
|
err := p.db.
|
|
Where("status = ?", db.PodcastEpisodeStatusCompleted).
|
|
Where("created_at < ?", expDate).
|
|
Where("updated_at < ?", expDate).
|
|
Where("modified_at < ?", expDate).
|
|
Preload("Podcast").
|
|
Find(&episodes).
|
|
Error
|
|
if err != nil && !errors.Is(err, gorm.ErrRecordNotFound) {
|
|
return fmt.Errorf("find podcasts: %w", err)
|
|
}
|
|
for _, episode := range episodes {
|
|
episode.Status = db.PodcastEpisodeStatusDeleted
|
|
if err := p.db.Save(episode).Error; err != nil {
|
|
return fmt.Errorf("save new podcast status: %w", err)
|
|
}
|
|
if episode.Podcast == nil {
|
|
return fmt.Errorf("episode %d has no podcast", episode.ID)
|
|
}
|
|
if err := os.Remove(episode.AbsPath()); err != nil {
|
|
return fmt.Errorf("remove podcast path: %w", err)
|
|
}
|
|
}
|
|
return nil
|
|
}
|