2017-11-20 06:10:04 +01:00
|
|
|
// Copyright 2017 Frédéric Guillot. All rights reserved.
|
|
|
|
// Use of this source code is governed by the Apache 2.0
|
|
|
|
// license that can be found in the LICENSE file.
|
|
|
|
|
2018-08-25 06:51:50 +02:00
|
|
|
package date // import "miniflux.app/reader/date"
|
2017-11-20 06:10:04 +01:00
|
|
|
|
|
|
|
import (
|
2017-12-23 02:59:28 +01:00
|
|
|
"errors"
|
2017-11-20 06:10:04 +01:00
|
|
|
"fmt"
|
2018-05-09 05:41:24 +02:00
|
|
|
"strconv"
|
2017-11-20 06:10:04 +01:00
|
|
|
"strings"
|
|
|
|
"time"
|
|
|
|
)
|
|
|
|
|
|
|
|
// DateFormats taken from github.com/mjibson/goread
|
|
|
|
var dateFormats = []string{
|
|
|
|
time.RFC822, // RSS
|
|
|
|
time.RFC822Z, // RSS
|
|
|
|
time.RFC3339, // Atom
|
|
|
|
time.UnixDate,
|
|
|
|
time.RubyDate,
|
|
|
|
time.RFC850,
|
|
|
|
time.RFC1123Z,
|
|
|
|
time.RFC1123,
|
|
|
|
time.ANSIC,
|
2020-11-18 02:01:59 +01:00
|
|
|
"Mon, 02 Jan 2006 15:04:05 MST -07:00",
|
2020-11-17 06:31:39 +01:00
|
|
|
"Mon, January 2, 2006, 3:04 PM MST",
|
2017-11-20 06:10:04 +01:00
|
|
|
"Mon, January 2 2006 15:04:05 -0700",
|
|
|
|
"Mon, January 02, 2006, 15:04:05 MST",
|
|
|
|
"Mon, January 02, 2006 15:04:05 MST",
|
|
|
|
"Mon, Jan 2, 2006 15:04 MST",
|
|
|
|
"Mon, Jan 2 2006 15:04 MST",
|
2019-10-20 18:52:18 +02:00
|
|
|
"Mon, Jan 2 2006 15:04:05 MST",
|
2017-11-20 06:10:04 +01:00
|
|
|
"Mon, Jan 2, 2006 15:04:05 MST",
|
|
|
|
"Mon, Jan 2 2006 15:04:05 -700",
|
|
|
|
"Mon, Jan 2 2006 15:04:05 -0700",
|
|
|
|
"Mon Jan 2 15:04 2006",
|
|
|
|
"Mon Jan 2 15:04:05 2006 MST",
|
|
|
|
"Mon Jan 02, 2006 3:04 pm",
|
|
|
|
"Mon, Jan 02,2006 15:04:05 MST",
|
|
|
|
"Mon Jan 02 2006 15:04:05 -0700",
|
2020-11-18 02:01:59 +01:00
|
|
|
"Mon, 02/01/2006",
|
2020-11-17 06:31:39 +01:00
|
|
|
"Monday, 2. January 2006 - 15:04",
|
|
|
|
"Monday 02 January 2006",
|
2017-11-20 06:10:04 +01:00
|
|
|
"Monday, January 2, 2006 15:04:05 MST",
|
|
|
|
"Monday, January 2, 2006 03:04 PM",
|
|
|
|
"Monday, January 2, 2006",
|
|
|
|
"Monday, January 02, 2006",
|
|
|
|
"Monday, 2 January 2006 15:04:05 MST",
|
|
|
|
"Monday, 2 January 2006 15:04:05 -0700",
|
|
|
|
"Monday, 2 Jan 2006 15:04:05 MST",
|
|
|
|
"Monday, 2 Jan 2006 15:04:05 -0700",
|
|
|
|
"Monday, 02 January 2006 15:04:05 MST",
|
|
|
|
"Monday, 02 January 2006 15:04:05 -0700",
|
|
|
|
"Monday, 02 January 2006 15:04:05",
|
2017-12-23 02:59:28 +01:00
|
|
|
"Monday, January 02, 2006 - 3:04pm",
|
|
|
|
"Monday, January 2, 2006 - 3:04pm",
|
2020-04-26 05:03:39 +02:00
|
|
|
"Mon, 01/02/2006 - 15:04",
|
2017-11-20 06:10:04 +01:00
|
|
|
"Mon, 2 January 2006 15:04 MST",
|
|
|
|
"Mon, 2 January 2006, 15:04 -0700",
|
|
|
|
"Mon, 2 January 2006, 15:04:05 MST",
|
|
|
|
"Mon, 2 January 2006 15:04:05 MST",
|
|
|
|
"Mon, 2 January 2006 15:04:05 -0700",
|
|
|
|
"Mon, 2 January 2006",
|
|
|
|
"Mon, 2 Jan 2006 3:04:05 PM -0700",
|
|
|
|
"Mon, 2 Jan 2006 15:4:5 MST",
|
|
|
|
"Mon, 2 Jan 2006 15:4:5 -0700 GMT",
|
|
|
|
"Mon, 2, Jan 2006 15:4",
|
|
|
|
"Mon, 2 Jan 2006 15:04 MST",
|
|
|
|
"Mon, 2 Jan 2006, 15:04 -0700",
|
|
|
|
"Mon, 2 Jan 2006 15:04 -0700",
|
|
|
|
"Mon, 2 Jan 2006 15:04:05 UT",
|
|
|
|
"Mon, 2 Jan 2006 15:04:05MST",
|
|
|
|
"Mon, 2 Jan 2006 15:04:05 MST",
|
|
|
|
"Mon 2 Jan 2006 15:04:05 MST",
|
|
|
|
"mon,2 Jan 2006 15:04:05 MST",
|
|
|
|
"Mon, 2 Jan 2006 15:04:05 -0700 MST",
|
|
|
|
"Mon, 2 Jan 2006 15:04:05-0700",
|
|
|
|
"Mon, 2 Jan 2006 15:04:05 -0700",
|
|
|
|
"Mon, 2 Jan 2006 15:04:05",
|
|
|
|
"Mon, 2 Jan 2006 15:04",
|
2018-04-10 06:27:15 +02:00
|
|
|
"Mon, 02 Jan 2006, 15:04",
|
|
|
|
"Mon, 2 Jan 2006, 15:04",
|
2017-11-20 06:10:04 +01:00
|
|
|
"Mon,2 Jan 2006",
|
|
|
|
"Mon, 2 Jan 2006",
|
|
|
|
"Mon, 2 Jan 15:04:05 MST",
|
|
|
|
"Mon, 2 Jan 06 15:04:05 MST",
|
|
|
|
"Mon, 2 Jan 06 15:04:05 -0700",
|
|
|
|
"Mon, 2006-01-02 15:04",
|
|
|
|
"Mon,02 January 2006 14:04:05 MST",
|
|
|
|
"Mon, 02 January 2006",
|
|
|
|
"Mon, 02 Jan 2006 3:04:05 PM MST",
|
|
|
|
"Mon, 02 Jan 2006 15 -0700",
|
|
|
|
"Mon,02 Jan 2006 15:04 MST",
|
|
|
|
"Mon, 02 Jan 2006 15:04 MST",
|
|
|
|
"Mon, 02 Jan 2006 15:04 -0700",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 Z",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 UT",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 MST-07:00",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 MST -0700",
|
|
|
|
"Mon, 02 Jan 2006, 15:04:05 MST",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05MST",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 MST",
|
|
|
|
"Mon , 02 Jan 2006 15:04:05 MST",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 GMT-0700",
|
|
|
|
"Mon,02 Jan 2006 15:04:05 -0700",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 -0700",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 -07:00",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 --0700",
|
|
|
|
"Mon 02 Jan 2006 15:04:05 -0700",
|
2019-10-20 18:52:18 +02:00
|
|
|
"Mon 02 Jan 2006, 15:04:05 MST",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 MST",
|
2017-11-20 06:10:04 +01:00
|
|
|
"Mon, 02 Jan 2006 15:04:05 -07",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05 00",
|
|
|
|
"Mon, 02 Jan 2006 15:04:05",
|
|
|
|
"Mon, 02 Jan 2006",
|
|
|
|
"Mon, 02 Jan 06 15:04:05 MST",
|
2017-12-23 02:59:28 +01:00
|
|
|
"Mon, 02 Jan 2006 3:04 PM MST",
|
2020-11-17 06:31:39 +01:00
|
|
|
"Mon Jan 02 2006 15:04:05 MST",
|
|
|
|
"Mon, 01 02 2006 15:04:05 -0700",
|
|
|
|
"Mon, 2th Jan 2006 15:05:05 MST",
|
|
|
|
"Jan. 2, 2006, 3:04 a.m.",
|
|
|
|
"fri, 02 jan 2006 15:04:05 -0700",
|
2020-04-26 05:03:39 +02:00
|
|
|
"January 02 2006 03:04:05 PM",
|
2017-11-20 06:10:04 +01:00
|
|
|
"January 2, 2006 3:04 PM",
|
|
|
|
"January 2, 2006, 3:04 p.m.",
|
|
|
|
"January 2, 2006 15:04:05 MST",
|
|
|
|
"January 2, 2006 15:04:05",
|
|
|
|
"January 2, 2006 03:04 PM",
|
|
|
|
"January 2, 2006",
|
|
|
|
"January 02, 2006 15:04:05 MST",
|
|
|
|
"January 02, 2006 15:04",
|
|
|
|
"January 02, 2006 03:04 PM",
|
|
|
|
"January 02, 2006",
|
|
|
|
"Jan 2, 2006 3:04:05 PM MST",
|
|
|
|
"Jan 2, 2006 3:04:05 PM",
|
|
|
|
"Jan 2, 2006 15:04:05 MST",
|
|
|
|
"Jan 2, 2006",
|
|
|
|
"Jan 02 2006 03:04:05PM",
|
|
|
|
"Jan 02, 2006",
|
|
|
|
"6/1/2 15:04",
|
|
|
|
"6-1-2 15:04",
|
|
|
|
"2 January 2006 15:04:05 MST",
|
|
|
|
"2 January 2006 15:04:05 -0700",
|
|
|
|
"2 January 2006",
|
|
|
|
"2 Jan 2006 15:04:05 Z",
|
|
|
|
"2 Jan 2006 15:04:05 MST",
|
|
|
|
"2 Jan 2006 15:04:05 -0700",
|
|
|
|
"2 Jan 2006",
|
2017-12-23 02:59:28 +01:00
|
|
|
"2 Jan 2006 15:04 MST",
|
2017-11-20 06:10:04 +01:00
|
|
|
"2.1.2006 15:04:05",
|
|
|
|
"2/1/2006",
|
|
|
|
"2-1-2006",
|
|
|
|
"2006 January 02",
|
|
|
|
"2006-1-2T15:04:05Z",
|
|
|
|
"2006-1-2 15:04:05",
|
|
|
|
"2006-1-2",
|
2020-11-17 06:31:39 +01:00
|
|
|
"2006-01-02T15:04:05-07:00Z",
|
2017-11-20 06:10:04 +01:00
|
|
|
"2006-1-02T15:04:05Z",
|
|
|
|
"2006-01-02T15:04Z",
|
|
|
|
"2006-01-02T15:04-07:00",
|
|
|
|
"2006-01-02T15:04:05Z",
|
|
|
|
"2006-01-02T15:04:05-07:00:00",
|
|
|
|
"2006-01-02T15:04:05:-0700",
|
|
|
|
"2006-01-02T15:04:05-0700",
|
|
|
|
"2006-01-02T15:04:05-07:00",
|
|
|
|
"2006-01-02T15:04:05 -0700",
|
|
|
|
"2006-01-02T15:04:05:00",
|
|
|
|
"2006-01-02T15:04:05",
|
2020-09-15 06:23:26 +02:00
|
|
|
"2006-01-02T15:04",
|
2017-11-20 06:10:04 +01:00
|
|
|
"2006-01-02 at 15:04:05",
|
|
|
|
"2006-01-02 15:04:05Z",
|
|
|
|
"2006-01-02 15:04:05 MST",
|
|
|
|
"2006-01-02 15:04:05-0700",
|
|
|
|
"2006-01-02 15:04:05-07:00",
|
|
|
|
"2006-01-02 15:04:05 -0700",
|
|
|
|
"2006-01-02 15:04",
|
|
|
|
"2006-01-02 00:00:00.0 15:04:05.0 -0700",
|
|
|
|
"2006/01/02",
|
|
|
|
"2006-01-02",
|
|
|
|
"15:04 02.01.2006 -0700",
|
|
|
|
"1/2/2006 3:04 PM MST",
|
|
|
|
"1/2/2006 3:04:05 PM MST",
|
|
|
|
"1/2/2006 3:04:05 PM",
|
|
|
|
"1/2/2006 15:04:05 MST",
|
|
|
|
"1/2/2006",
|
|
|
|
"06/1/2 15:04",
|
|
|
|
"06-1-2 15:04",
|
|
|
|
"02 Monday, Jan 2006 15:04",
|
|
|
|
"02 Jan 2006 15:04 MST",
|
|
|
|
"02 Jan 2006 15:04:05 UT",
|
|
|
|
"02 Jan 2006 15:04:05 MST",
|
|
|
|
"02 Jan 2006 15:04:05 -0700",
|
|
|
|
"02 Jan 2006 15:04:05",
|
|
|
|
"02 Jan 2006",
|
|
|
|
"02/01/2006 15:04 MST",
|
|
|
|
"02-01-2006 15:04:05 MST",
|
|
|
|
"02.01.2006 15:04:05",
|
|
|
|
"02/01/2006 15:04:05",
|
|
|
|
"02.01.2006 15:04",
|
|
|
|
"02/01/2006 - 15:04",
|
|
|
|
"02.01.2006 -0700",
|
|
|
|
"02/01/2006",
|
|
|
|
"02-01-2006",
|
|
|
|
"01/02/2006 3:04 PM",
|
|
|
|
"01/02/2006 15:04:05 MST",
|
|
|
|
"01/02/2006 - 15:04",
|
|
|
|
"01/02/2006",
|
|
|
|
"01-02-2006",
|
2020-11-17 06:31:39 +01:00
|
|
|
"Jan. 2006",
|
2020-11-18 02:01:59 +01:00
|
|
|
"Jan. 2, 2006, 03:04 p.m.",
|
|
|
|
"2006-01-02 15:04:05 -07:00",
|
|
|
|
"2 January, 2006",
|
2017-11-20 06:10:04 +01:00
|
|
|
}
|
|
|
|
|
2020-11-17 06:31:39 +01:00
|
|
|
var invalidTimezoneReplacer = strings.NewReplacer(
|
|
|
|
"Europe/Brussels", "CET",
|
|
|
|
"GMT+0000 (Coordinated Universal Time)", "GMT",
|
2020-11-18 02:01:59 +01:00
|
|
|
"GMT-", "GMT -",
|
2020-11-17 06:31:39 +01:00
|
|
|
)
|
|
|
|
|
|
|
|
var invalidLocalizedDateReplacer = strings.NewReplacer(
|
|
|
|
"Mo,", "Mon,",
|
|
|
|
"Di,", "Tue,",
|
|
|
|
"Mi,", "Wed,",
|
|
|
|
"Do,", "Thu,",
|
|
|
|
"Fr,", "Fri,",
|
|
|
|
"Sa,", "Sat,",
|
|
|
|
"So,", "Sun,",
|
|
|
|
"Mär ", "Mar ",
|
|
|
|
"Mai ", "May ",
|
|
|
|
"Okt ", "Oct ",
|
|
|
|
"Dez ", "Dec ",
|
|
|
|
"lun,", "Mon,",
|
|
|
|
"mar,", "Tue,",
|
|
|
|
"mer,", "Wed,",
|
|
|
|
"jeu,", "Thu,",
|
|
|
|
"ven,", "Fri,",
|
|
|
|
"sam,", "Sat,",
|
|
|
|
"dim,", "Sun,",
|
|
|
|
"lun.", "Mon",
|
|
|
|
"mar.", "Tue",
|
|
|
|
"mer.", "Wed",
|
|
|
|
"jeu.", "Thu",
|
|
|
|
"ven.", "Fri",
|
|
|
|
"sam.", "Sat",
|
|
|
|
"dim.", "Sun",
|
|
|
|
"Lundi,", "Monday,",
|
|
|
|
"Mardi,", "Tuesday,",
|
|
|
|
"Mercredi,", "Wednesday,",
|
|
|
|
"Jeudi,", "Thursday,",
|
|
|
|
"Vendredi,", "Friday,",
|
|
|
|
"Samedi,", "Saturday,",
|
|
|
|
"Dimanche,", "Sunday,",
|
|
|
|
"jan.", "January ",
|
|
|
|
"feb.", "February ",
|
|
|
|
"mars.", "March ",
|
|
|
|
"avril.", "April ",
|
|
|
|
"mai.", "May ",
|
|
|
|
"juin.", "June ",
|
2020-11-18 02:01:59 +01:00
|
|
|
"juil.", "July",
|
|
|
|
"août.", "August",
|
|
|
|
"sept.", "September",
|
|
|
|
"oct.", "October",
|
|
|
|
"nov.", "November",
|
|
|
|
"dec.", "December",
|
2020-12-03 05:59:14 +01:00
|
|
|
"déc.", "December",
|
2020-11-18 02:01:59 +01:00
|
|
|
"janvier ", "January ",
|
|
|
|
"février ", "February ",
|
|
|
|
"mars ", "March ",
|
|
|
|
"avril ", "April ",
|
|
|
|
"mai ", "May ",
|
|
|
|
"juin ", "June ",
|
|
|
|
"juillet ", "July",
|
|
|
|
"août ", "August",
|
|
|
|
"septembre ", "September",
|
|
|
|
"octobre ", "October",
|
|
|
|
"november ", "November",
|
|
|
|
"décembre ", "December",
|
2020-11-17 06:31:39 +01:00
|
|
|
"Janvier", "January",
|
|
|
|
"Février", "February",
|
|
|
|
"Mars", "March",
|
|
|
|
"Avril", "April",
|
|
|
|
"Mai", "May",
|
|
|
|
"Juin", "June",
|
|
|
|
"Juillet", "July",
|
|
|
|
"Août", "August",
|
|
|
|
"Septembre", "September",
|
|
|
|
"Octobre", "October",
|
|
|
|
"Novembre", "November",
|
|
|
|
"Décembre", "December",
|
2020-11-18 02:01:59 +01:00
|
|
|
"avr ", "Apr ",
|
|
|
|
"mai ", "May ",
|
|
|
|
"jui ", "Jun ",
|
|
|
|
"juin ", "June ",
|
2020-11-17 06:31:39 +01:00
|
|
|
)
|
|
|
|
|
2017-11-20 06:10:04 +01:00
|
|
|
// Parse parses a given date string using a large
|
|
|
|
// list of commonly found feed date formats.
|
2020-11-17 06:31:39 +01:00
|
|
|
func Parse(rawInput string) (t time.Time, err error) {
|
|
|
|
timestamp, err := strconv.ParseInt(rawInput, 10, 64)
|
2018-05-09 05:41:24 +02:00
|
|
|
if err == nil {
|
|
|
|
return time.Unix(timestamp, 0), nil
|
|
|
|
}
|
|
|
|
|
2020-11-17 06:31:39 +01:00
|
|
|
processedInput := invalidLocalizedDateReplacer.Replace(rawInput)
|
|
|
|
processedInput = invalidTimezoneReplacer.Replace(processedInput)
|
|
|
|
processedInput = strings.TrimSpace(processedInput)
|
|
|
|
if processedInput == "" {
|
|
|
|
return t, errors.New(`date parser: empty value`)
|
2017-11-20 06:10:04 +01:00
|
|
|
}
|
|
|
|
|
2018-12-27 05:24:38 +01:00
|
|
|
for _, layout := range dateFormats {
|
|
|
|
switch layout {
|
|
|
|
case time.RFC822, time.RFC850, time.RFC1123:
|
2020-11-17 06:31:39 +01:00
|
|
|
if t, err = parseLocalTimeDates(layout, processedInput); err == nil {
|
2018-12-27 05:24:38 +01:00
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-11-17 06:31:39 +01:00
|
|
|
if t, err = time.Parse(layout, processedInput); err == nil {
|
2017-11-20 06:10:04 +01:00
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-11-17 06:31:39 +01:00
|
|
|
err = fmt.Errorf(`date parser: failed to parse date "%s"`, rawInput)
|
2017-11-20 06:10:04 +01:00
|
|
|
return
|
|
|
|
}
|
2018-04-10 06:27:15 +02:00
|
|
|
|
2018-12-27 05:24:38 +01:00
|
|
|
// According to Golang documentation:
|
|
|
|
//
|
|
|
|
// RFC822, RFC850, and RFC1123 formats should be applied only to local times.
|
|
|
|
// Applying them to UTC times will use "UTC" as the time zone abbreviation,
|
|
|
|
// while strictly speaking those RFCs require the use of "GMT" in that case.
|
|
|
|
func parseLocalTimeDates(layout, ds string) (t time.Time, err error) {
|
|
|
|
loc := time.UTC
|
|
|
|
|
|
|
|
// Workaround for dates that don't use GMT.
|
2020-09-22 22:31:04 +02:00
|
|
|
if strings.HasSuffix(ds, "PST") || strings.HasSuffix(ds, "PDT") {
|
2018-12-27 05:24:38 +01:00
|
|
|
loc, _ = time.LoadLocation("America/Los_Angeles")
|
|
|
|
}
|
|
|
|
|
|
|
|
return time.ParseInLocation(layout, ds, loc)
|
|
|
|
}
|