2018-04-28 19:51:07 +02:00
|
|
|
// Copyright 2018 Frédéric Guillot. All rights reserved.
|
2017-11-20 06:10:04 +01:00
|
|
|
// Use of this source code is governed by the Apache 2.0
|
|
|
|
// license that can be found in the LICENSE file.
|
|
|
|
|
2018-08-25 06:51:50 +02:00
|
|
|
package client // import "miniflux.app/http/client"
|
2017-11-20 06:10:04 +01:00
|
|
|
|
|
|
|
import (
|
2017-12-19 05:52:46 +01:00
|
|
|
"bytes"
|
2018-02-09 03:16:54 +01:00
|
|
|
"crypto/x509"
|
2017-12-19 05:52:46 +01:00
|
|
|
"encoding/json"
|
2017-11-20 06:10:04 +01:00
|
|
|
"fmt"
|
2017-12-19 05:52:46 +01:00
|
|
|
"io"
|
2018-04-30 08:11:10 +02:00
|
|
|
"io/ioutil"
|
2018-02-09 03:16:54 +01:00
|
|
|
"net"
|
2017-11-20 06:10:04 +01:00
|
|
|
"net/http"
|
|
|
|
"net/url"
|
2017-12-19 05:52:46 +01:00
|
|
|
"strings"
|
2017-11-20 06:10:04 +01:00
|
|
|
"time"
|
2017-11-21 02:12:37 +01:00
|
|
|
|
2019-06-02 16:13:35 +02:00
|
|
|
"miniflux.app/config"
|
2018-08-25 06:51:50 +02:00
|
|
|
"miniflux.app/errors"
|
|
|
|
"miniflux.app/logger"
|
|
|
|
"miniflux.app/timer"
|
2019-12-27 00:26:23 +01:00
|
|
|
url_helper "miniflux.app/url"
|
2018-08-25 06:51:50 +02:00
|
|
|
"miniflux.app/version"
|
2017-11-20 06:10:04 +01:00
|
|
|
)
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
const (
|
|
|
|
defaultHTTPClientTimeout = 20
|
|
|
|
defaultHTTPClientMaxBodySize = 15 * 1024 * 1024
|
|
|
|
)
|
|
|
|
|
2018-02-09 03:16:54 +01:00
|
|
|
var (
|
2018-09-20 03:19:24 +02:00
|
|
|
// DefaultUserAgent sets the User-Agent header used for any requests by miniflux.
|
|
|
|
DefaultUserAgent = "Mozilla/5.0 (compatible; Miniflux/" + version.Version + "; +https://miniflux.app)"
|
|
|
|
|
2018-02-09 03:16:54 +01:00
|
|
|
errInvalidCertificate = "Invalid SSL certificate (original error: %q)"
|
|
|
|
errTemporaryNetworkOperation = "This website is temporarily unreachable (original error: %q)"
|
|
|
|
errPermanentNetworkOperation = "This website is permanently unreachable (original error: %q)"
|
|
|
|
errRequestTimeout = "Website unreachable, the request timed out after %d seconds"
|
|
|
|
)
|
2017-11-20 06:10:04 +01:00
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
// Client builds and executes HTTP requests.
|
2017-11-21 02:12:37 +01:00
|
|
|
type Client struct {
|
2020-09-27 23:29:48 +02:00
|
|
|
inputURL string
|
|
|
|
|
|
|
|
requestURL string
|
|
|
|
requestEtagHeader string
|
|
|
|
requestLastModifiedHeader string
|
|
|
|
requestAuthorizationHeader string
|
|
|
|
requestUsername string
|
|
|
|
requestPassword string
|
|
|
|
requestUserAgent string
|
|
|
|
|
2020-11-07 02:39:10 +01:00
|
|
|
useProxy bool
|
|
|
|
doNotFollowRedirects bool
|
2020-09-27 23:29:48 +02:00
|
|
|
|
|
|
|
ClientTimeout int
|
|
|
|
ClientMaxBodySize int64
|
|
|
|
ClientProxyURL string
|
|
|
|
}
|
|
|
|
|
|
|
|
// New initializes a new HTTP client.
|
|
|
|
func New(url string) *Client {
|
|
|
|
return &Client{
|
|
|
|
inputURL: url,
|
|
|
|
requestUserAgent: DefaultUserAgent,
|
|
|
|
ClientTimeout: defaultHTTPClientTimeout,
|
|
|
|
ClientMaxBodySize: defaultHTTPClientMaxBodySize,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// NewClientWithConfig initializes a new HTTP client with application config options.
|
|
|
|
func NewClientWithConfig(url string, opts *config.Options) *Client {
|
2020-11-27 17:37:55 +01:00
|
|
|
userAgent := opts.UserAgent()
|
|
|
|
if userAgent == "" {
|
|
|
|
userAgent = DefaultUserAgent
|
|
|
|
}
|
2020-09-27 23:29:48 +02:00
|
|
|
return &Client{
|
|
|
|
inputURL: url,
|
2020-11-27 17:37:55 +01:00
|
|
|
requestUserAgent: userAgent,
|
2020-09-27 23:29:48 +02:00
|
|
|
ClientTimeout: opts.HTTPClientTimeout(),
|
|
|
|
ClientMaxBodySize: opts.HTTPClientMaxBodySize(),
|
|
|
|
ClientProxyURL: opts.HTTPClientProxy(),
|
|
|
|
}
|
2017-11-20 06:10:04 +01:00
|
|
|
}
|
|
|
|
|
2019-12-27 00:26:23 +01:00
|
|
|
func (c *Client) String() string {
|
2020-09-27 23:29:48 +02:00
|
|
|
etagHeader := c.requestEtagHeader
|
|
|
|
if c.requestEtagHeader == "" {
|
2020-06-06 06:50:59 +02:00
|
|
|
etagHeader = "None"
|
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
lastModifiedHeader := c.requestLastModifiedHeader
|
|
|
|
if c.requestLastModifiedHeader == "" {
|
2020-06-06 06:50:59 +02:00
|
|
|
lastModifiedHeader = "None"
|
|
|
|
}
|
|
|
|
|
2019-12-27 00:26:23 +01:00
|
|
|
return fmt.Sprintf(
|
2020-09-27 23:29:48 +02:00
|
|
|
`InputURL=%q RequestURL=%q ETag=%s LastModified=%s Auth=%v UserAgent=%q`,
|
2019-12-27 00:26:23 +01:00
|
|
|
c.inputURL,
|
|
|
|
c.requestURL,
|
2020-06-06 06:50:59 +02:00
|
|
|
etagHeader,
|
|
|
|
lastModifiedHeader,
|
2020-09-27 23:29:48 +02:00
|
|
|
c.requestAuthorizationHeader != "" || (c.requestUsername != "" && c.requestPassword != ""),
|
|
|
|
c.requestUserAgent,
|
2019-12-27 00:26:23 +01:00
|
|
|
)
|
|
|
|
}
|
|
|
|
|
2018-04-28 19:51:07 +02:00
|
|
|
// WithCredentials defines the username/password for HTTP Basic authentication.
|
|
|
|
func (c *Client) WithCredentials(username, password string) *Client {
|
2018-06-20 07:58:29 +02:00
|
|
|
if username != "" && password != "" {
|
2020-09-27 23:29:48 +02:00
|
|
|
c.requestUsername = username
|
|
|
|
c.requestPassword = password
|
2018-06-20 07:58:29 +02:00
|
|
|
}
|
2018-04-28 19:51:07 +02:00
|
|
|
return c
|
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
// WithAuthorization defines the authorization HTTP header value.
|
2018-04-28 19:51:07 +02:00
|
|
|
func (c *Client) WithAuthorization(authorization string) *Client {
|
2020-09-27 23:29:48 +02:00
|
|
|
c.requestAuthorizationHeader = authorization
|
2018-04-28 19:51:07 +02:00
|
|
|
return c
|
|
|
|
}
|
|
|
|
|
|
|
|
// WithCacheHeaders defines caching headers.
|
|
|
|
func (c *Client) WithCacheHeaders(etagHeader, lastModifiedHeader string) *Client {
|
2020-09-27 23:29:48 +02:00
|
|
|
c.requestLastModifiedHeader = etagHeader
|
|
|
|
c.requestLastModifiedHeader = lastModifiedHeader
|
2018-04-28 19:51:07 +02:00
|
|
|
return c
|
|
|
|
}
|
|
|
|
|
2020-11-07 02:39:10 +01:00
|
|
|
// WithProxy enables proxy for the current HTTP request.
|
2020-09-10 08:28:54 +02:00
|
|
|
func (c *Client) WithProxy() *Client {
|
2020-09-27 23:29:48 +02:00
|
|
|
c.useProxy = true
|
2020-09-10 08:28:54 +02:00
|
|
|
return c
|
|
|
|
}
|
|
|
|
|
2020-11-07 02:39:10 +01:00
|
|
|
// WithoutRedirects disables HTTP redirects.
|
|
|
|
func (c *Client) WithoutRedirects() *Client {
|
|
|
|
c.doNotFollowRedirects = true
|
|
|
|
return c
|
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
// WithUserAgent defines the User-Agent header to use for HTTP requests.
|
2018-09-20 03:19:24 +02:00
|
|
|
func (c *Client) WithUserAgent(userAgent string) *Client {
|
|
|
|
if userAgent != "" {
|
2020-09-27 23:29:48 +02:00
|
|
|
c.requestUserAgent = userAgent
|
2018-09-20 03:19:24 +02:00
|
|
|
}
|
|
|
|
return c
|
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
// Get performs a GET HTTP request.
|
2017-12-03 04:32:14 +01:00
|
|
|
func (c *Client) Get() (*Response, error) {
|
2017-12-19 05:52:46 +01:00
|
|
|
request, err := c.buildRequest(http.MethodGet, nil)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return c.executeRequest(request)
|
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
// PostForm performs a POST HTTP request with form encoded values.
|
2017-12-19 05:52:46 +01:00
|
|
|
func (c *Client) PostForm(values url.Values) (*Response, error) {
|
|
|
|
request, err := c.buildRequest(http.MethodPost, strings.NewReader(values.Encode()))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
request.Header.Add("Content-Type", "application/x-www-form-urlencoded")
|
|
|
|
return c.executeRequest(request)
|
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
// PostJSON performs a POST HTTP request with a JSON payload.
|
2017-12-19 05:52:46 +01:00
|
|
|
func (c *Client) PostJSON(data interface{}) (*Response, error) {
|
|
|
|
b, err := json.Marshal(data)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
request, err := c.buildRequest(http.MethodPost, bytes.NewReader(b))
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
request.Header.Add("Content-Type", "application/json")
|
|
|
|
return c.executeRequest(request)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (c *Client) executeRequest(request *http.Request) (*Response, error) {
|
2019-12-27 00:26:23 +01:00
|
|
|
defer timer.ExecutionTime(time.Now(), fmt.Sprintf("[HttpClient] inputURL=%s", c.inputURL))
|
|
|
|
|
|
|
|
logger.Debug("[HttpClient:Before] Method=%s %s",
|
|
|
|
request.Method,
|
|
|
|
c.String(),
|
|
|
|
)
|
2017-12-19 05:52:46 +01:00
|
|
|
|
2017-12-03 04:32:14 +01:00
|
|
|
client := c.buildClient()
|
2017-12-19 05:52:46 +01:00
|
|
|
resp, err := client.Do(request)
|
2018-06-20 05:13:13 +02:00
|
|
|
if resp != nil {
|
|
|
|
defer resp.Body.Close()
|
|
|
|
}
|
|
|
|
|
2017-11-20 06:10:04 +01:00
|
|
|
if err != nil {
|
2018-02-09 03:16:54 +01:00
|
|
|
if uerr, ok := err.(*url.Error); ok {
|
|
|
|
switch uerr.Err.(type) {
|
|
|
|
case x509.CertificateInvalidError, x509.HostnameError:
|
|
|
|
err = errors.NewLocalizedError(errInvalidCertificate, uerr.Err)
|
|
|
|
case *net.OpError:
|
|
|
|
if uerr.Err.(*net.OpError).Temporary() {
|
|
|
|
err = errors.NewLocalizedError(errTemporaryNetworkOperation, uerr.Err)
|
|
|
|
} else {
|
|
|
|
err = errors.NewLocalizedError(errPermanentNetworkOperation, uerr.Err)
|
|
|
|
}
|
|
|
|
case net.Error:
|
|
|
|
nerr := uerr.Err.(net.Error)
|
|
|
|
if nerr.Timeout() {
|
2020-09-27 23:29:48 +02:00
|
|
|
err = errors.NewLocalizedError(errRequestTimeout, c.ClientTimeout)
|
2018-02-09 03:16:54 +01:00
|
|
|
} else if nerr.Temporary() {
|
|
|
|
err = errors.NewLocalizedError(errTemporaryNetworkOperation, nerr)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2017-11-20 06:10:04 +01:00
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
if resp.ContentLength > c.ClientMaxBodySize {
|
2018-01-03 03:30:26 +01:00
|
|
|
return nil, fmt.Errorf("client: response too large (%d bytes)", resp.ContentLength)
|
|
|
|
}
|
|
|
|
|
2018-04-30 08:11:10 +02:00
|
|
|
buf, err := ioutil.ReadAll(resp.Body)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("client: error while reading body %v", err)
|
|
|
|
}
|
|
|
|
|
2017-11-21 02:12:37 +01:00
|
|
|
response := &Response{
|
2018-04-30 08:11:10 +02:00
|
|
|
Body: bytes.NewReader(buf),
|
2018-01-05 03:32:36 +01:00
|
|
|
StatusCode: resp.StatusCode,
|
|
|
|
EffectiveURL: resp.Request.URL.String(),
|
|
|
|
LastModified: resp.Header.Get("Last-Modified"),
|
|
|
|
ETag: resp.Header.Get("ETag"),
|
2019-12-27 00:26:23 +01:00
|
|
|
Expires: resp.Header.Get("Expires"),
|
2018-01-05 03:32:36 +01:00
|
|
|
ContentType: resp.Header.Get("Content-Type"),
|
|
|
|
ContentLength: resp.ContentLength,
|
2017-11-20 06:10:04 +01:00
|
|
|
}
|
|
|
|
|
2019-12-27 00:26:23 +01:00
|
|
|
logger.Debug("[HttpClient:After] Method=%s %s; Response => %s",
|
2017-12-19 05:52:46 +01:00
|
|
|
request.Method,
|
2019-12-27 00:26:23 +01:00
|
|
|
c.String(),
|
|
|
|
response,
|
2017-11-20 06:10:04 +01:00
|
|
|
)
|
|
|
|
|
2018-04-10 05:18:54 +02:00
|
|
|
// Ignore caching headers for feeds that do not want any cache.
|
|
|
|
if resp.Header.Get("Expires") == "0" {
|
|
|
|
logger.Debug("[HttpClient] Ignore caching headers for %q", response.EffectiveURL)
|
|
|
|
response.ETag = ""
|
|
|
|
response.LastModified = ""
|
|
|
|
}
|
|
|
|
|
2017-11-20 06:10:04 +01:00
|
|
|
return response, err
|
|
|
|
}
|
|
|
|
|
2017-12-19 05:52:46 +01:00
|
|
|
func (c *Client) buildRequest(method string, body io.Reader) (*http.Request, error) {
|
2019-12-27 00:26:23 +01:00
|
|
|
c.requestURL = url_helper.RequestURI(c.inputURL)
|
|
|
|
request, err := http.NewRequest(method, c.requestURL, body)
|
2017-12-19 05:52:46 +01:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
2017-12-03 04:32:14 +01:00
|
|
|
}
|
|
|
|
|
2018-02-25 20:49:08 +01:00
|
|
|
request.Header = c.buildHeaders()
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
if c.requestUsername != "" && c.requestPassword != "" {
|
|
|
|
request.SetBasicAuth(c.requestUsername, c.requestPassword)
|
2017-12-03 04:32:14 +01:00
|
|
|
}
|
|
|
|
|
2017-12-19 05:52:46 +01:00
|
|
|
return request, nil
|
2017-12-03 04:32:14 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
func (c *Client) buildClient() http.Client {
|
2020-11-07 02:39:10 +01:00
|
|
|
client := http.Client{
|
|
|
|
Timeout: time.Duration(c.ClientTimeout) * time.Second,
|
|
|
|
}
|
|
|
|
|
2020-09-27 22:08:55 +02:00
|
|
|
transport := &http.Transport{
|
2020-10-31 03:03:41 +01:00
|
|
|
Proxy: http.ProxyFromEnvironment,
|
2020-09-27 22:08:55 +02:00
|
|
|
DialContext: (&net.Dialer{
|
|
|
|
// Default is 30s.
|
|
|
|
Timeout: 10 * time.Second,
|
|
|
|
|
|
|
|
// Default is 30s.
|
|
|
|
KeepAlive: 15 * time.Second,
|
|
|
|
}).DialContext,
|
|
|
|
|
|
|
|
// Default is 100.
|
|
|
|
MaxIdleConns: 50,
|
|
|
|
|
|
|
|
// Default is 90s.
|
|
|
|
IdleConnTimeout: 10 * time.Second,
|
|
|
|
}
|
|
|
|
|
2020-11-07 02:39:10 +01:00
|
|
|
if c.doNotFollowRedirects {
|
|
|
|
client.CheckRedirect = func(req *http.Request, via []*http.Request) error {
|
|
|
|
return http.ErrUseLastResponse
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
if c.useProxy && c.ClientProxyURL != "" {
|
|
|
|
proxyURL, err := url.Parse(c.ClientProxyURL)
|
2020-09-10 08:28:54 +02:00
|
|
|
if err != nil {
|
|
|
|
logger.Error("[HttpClient] Proxy URL error: %v", err)
|
|
|
|
} else {
|
|
|
|
logger.Debug("[HttpClient] Use proxy: %s", proxyURL)
|
|
|
|
transport.Proxy = http.ProxyURL(proxyURL)
|
2017-11-20 06:10:04 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-09-10 08:28:54 +02:00
|
|
|
client.Transport = transport
|
|
|
|
|
2017-11-21 04:44:28 +01:00
|
|
|
return client
|
2017-11-20 06:10:04 +01:00
|
|
|
}
|
|
|
|
|
2017-12-03 04:32:14 +01:00
|
|
|
func (c *Client) buildHeaders() http.Header {
|
2017-11-20 06:10:04 +01:00
|
|
|
headers := make(http.Header)
|
2020-09-27 23:29:48 +02:00
|
|
|
headers.Add("User-Agent", c.requestUserAgent)
|
2017-12-28 04:44:23 +01:00
|
|
|
headers.Add("Accept", "*/*")
|
2017-11-20 06:10:04 +01:00
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
if c.requestEtagHeader != "" {
|
|
|
|
headers.Add("If-None-Match", c.requestEtagHeader)
|
2017-11-20 06:10:04 +01:00
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
if c.requestLastModifiedHeader != "" {
|
|
|
|
headers.Add("If-Modified-Since", c.requestLastModifiedHeader)
|
2017-11-20 06:10:04 +01:00
|
|
|
}
|
|
|
|
|
2020-09-27 23:29:48 +02:00
|
|
|
if c.requestAuthorizationHeader != "" {
|
|
|
|
headers.Add("Authorization", c.requestAuthorizationHeader)
|
2017-12-19 05:52:46 +01:00
|
|
|
}
|
|
|
|
|
2018-06-20 05:21:24 +02:00
|
|
|
headers.Add("Connection", "close")
|
2017-11-20 06:10:04 +01:00
|
|
|
return headers
|
|
|
|
}
|