// SPDX-FileCopyrightText: Copyright The Miniflux Authors. All rights reserved. // SPDX-License-Identifier: Apache-2.0 package mediaproxy // import "miniflux.app/v2/internal/mediaproxy" import ( "strings" "miniflux.app/v2/internal/config" "miniflux.app/v2/internal/reader/sanitizer" "miniflux.app/v2/internal/urllib" "github.com/PuerkitoBio/goquery" "github.com/gorilla/mux" ) type urlProxyRewriter func(router *mux.Router, url string) string func RewriteDocumentWithRelativeProxyURL(router *mux.Router, htmlDocument string, feedSiteURL ...string) string { proxifyFunction := func(router *mux.Router, mediaURL string) string { return ProxifyRelativeURL(router, mediaURL, feedSiteURL...) } return genericProxyRewriter(router, proxifyFunction, htmlDocument) } func RewriteDocumentWithAbsoluteProxyURL(router *mux.Router, host, htmlDocument string, feedSiteURL ...string) string { proxifyFunction := func(router *mux.Router, url string) string { return ProxifyAbsoluteURL(router, host, url, feedSiteURL...) } return genericProxyRewriter(router, proxifyFunction, htmlDocument) } func genericProxyRewriter(router *mux.Router, proxifyFunction urlProxyRewriter, htmlDocument string) string { proxyOption := config.Opts.MediaProxyMode() if proxyOption == "none" { return htmlDocument } doc, err := goquery.NewDocumentFromReader(strings.NewReader(htmlDocument)) if err != nil { return htmlDocument } for _, mediaType := range config.Opts.MediaProxyResourceTypes() { switch mediaType { case "image": doc.Find("img, picture source").Each(func(i int, img *goquery.Selection) { if srcAttrValue, ok := img.Attr("src"); ok { if shouldProxy(srcAttrValue, proxyOption) { img.SetAttr("src", proxifyFunction(router, srcAttrValue)) } } if srcsetAttrValue, ok := img.Attr("srcset"); ok { proxifySourceSet(img, router, proxifyFunction, proxyOption, srcsetAttrValue) } }) doc.Find("video").Each(func(i int, video *goquery.Selection) { if posterAttrValue, ok := video.Attr("poster"); ok { if shouldProxy(posterAttrValue, proxyOption) { video.SetAttr("poster", proxifyFunction(router, posterAttrValue)) } } }) case "audio": doc.Find("audio, audio source").Each(func(i int, audio *goquery.Selection) { if srcAttrValue, ok := audio.Attr("src"); ok { if shouldProxy(srcAttrValue, proxyOption) { audio.SetAttr("src", proxifyFunction(router, srcAttrValue)) } } }) case "video": doc.Find("video, video source").Each(func(i int, video *goquery.Selection) { if srcAttrValue, ok := video.Attr("src"); ok { if shouldProxy(srcAttrValue, proxyOption) { video.SetAttr("src", proxifyFunction(router, srcAttrValue)) } } if posterAttrValue, ok := video.Attr("poster"); ok { if shouldProxy(posterAttrValue, proxyOption) { video.SetAttr("poster", proxifyFunction(router, posterAttrValue)) } } }) } } output, err := doc.Find("body").First().Html() if err != nil { return htmlDocument } return output } func proxifySourceSet(element *goquery.Selection, router *mux.Router, proxifyFunction urlProxyRewriter, proxyOption, srcsetAttrValue string) { imageCandidates := sanitizer.ParseSrcSetAttribute(srcsetAttrValue) for _, imageCandidate := range imageCandidates { if shouldProxy(imageCandidate.ImageURL, proxyOption) { imageCandidate.ImageURL = proxifyFunction(router, imageCandidate.ImageURL) } } element.SetAttr("srcset", imageCandidates.String()) } func shouldProxy(attrValue, proxyOption string) bool { return !strings.HasPrefix(attrValue, "data:") && (proxyOption == "all" || !urllib.IsHTTPS(attrValue)) }