186 lines
5.3 KiB
Go
186 lines
5.3 KiB
Go
|
package iso8601
|
||
|
|
||
|
import (
|
||
|
"encoding/binary"
|
||
|
"errors"
|
||
|
"time"
|
||
|
"unsafe"
|
||
|
)
|
||
|
|
||
|
var (
|
||
|
errInvalidTimestamp = errors.New("invalid ISO8601 timestamp")
|
||
|
errMonthOutOfRange = errors.New("month out of range")
|
||
|
errDayOutOfRange = errors.New("day out of range")
|
||
|
errHourOutOfRange = errors.New("hour out of range")
|
||
|
errMinuteOutOfRange = errors.New("minute out of range")
|
||
|
errSecondOutOfRange = errors.New("second out of range")
|
||
|
)
|
||
|
|
||
|
// Parse parses an ISO8601 timestamp, e.g. "2021-03-25T21:36:12Z".
|
||
|
func Parse(input string) (time.Time, error) {
|
||
|
b := unsafeStringToBytes(input)
|
||
|
if len(b) >= 20 && len(b) <= 30 && b[len(b)-1] == 'Z' {
|
||
|
if len(b) == 21 || (len(b) > 21 && b[19] != '.') {
|
||
|
return time.Time{}, errInvalidTimestamp
|
||
|
}
|
||
|
|
||
|
t1 := binary.LittleEndian.Uint64(b)
|
||
|
t2 := binary.LittleEndian.Uint64(b[8:16])
|
||
|
t3 := uint64(b[16]) | uint64(b[17])<<8 | uint64(b[18])<<16 | uint64('Z')<<24
|
||
|
|
||
|
// Check for valid separators by masking input with " - - T : : Z".
|
||
|
// If separators are all valid, replace them with a '0' (0x30) byte and
|
||
|
// check all bytes are now numeric.
|
||
|
if !match(t1, mask1) || !match(t2, mask2) || !match(t3, mask3) {
|
||
|
return time.Time{}, errInvalidTimestamp
|
||
|
}
|
||
|
t1 ^= replace1
|
||
|
t2 ^= replace2
|
||
|
t3 ^= replace3
|
||
|
if (nonNumeric(t1) | nonNumeric(t2) | nonNumeric(t3)) != 0 {
|
||
|
return time.Time{}, errInvalidTimestamp
|
||
|
}
|
||
|
|
||
|
t1 -= zero
|
||
|
t2 -= zero
|
||
|
t3 -= zero
|
||
|
year := (t1&0xF)*1000 + (t1>>8&0xF)*100 + (t1>>16&0xF)*10 + (t1 >> 24 & 0xF)
|
||
|
month := (t1>>40&0xF)*10 + (t1 >> 48 & 0xF)
|
||
|
day := (t2&0xF)*10 + (t2 >> 8 & 0xF)
|
||
|
hour := (t2>>24&0xF)*10 + (t2 >> 32 & 0xF)
|
||
|
minute := (t2>>48&0xF)*10 + (t2 >> 56)
|
||
|
second := (t3>>8&0xF)*10 + (t3 >> 16)
|
||
|
|
||
|
nanos := int64(0)
|
||
|
if len(b) > 20 {
|
||
|
for _, c := range b[20 : len(b)-1] {
|
||
|
if c < '0' || c > '9' {
|
||
|
return time.Time{}, errInvalidTimestamp
|
||
|
}
|
||
|
nanos = (nanos * 10) + int64(c-'0')
|
||
|
}
|
||
|
nanos *= pow10[30-len(b)]
|
||
|
}
|
||
|
|
||
|
if err := validate(year, month, day, hour, minute, second); err != nil {
|
||
|
return time.Time{}, err
|
||
|
}
|
||
|
|
||
|
unixSeconds := int64(daysSinceEpoch(year, month, day))*86400 + int64(hour*3600+minute*60+second)
|
||
|
return time.Unix(unixSeconds, nanos).UTC(), nil
|
||
|
}
|
||
|
|
||
|
// Fallback to using time.Parse().
|
||
|
t, err := time.Parse(time.RFC3339Nano, input)
|
||
|
if err != nil {
|
||
|
// Override (and don't wrap) the error here. The error returned by
|
||
|
// time.Parse() is dynamic, and includes a reference to the input
|
||
|
// string. By overriding the error, we guarantee that the input string
|
||
|
// doesn't escape.
|
||
|
return time.Time{}, errInvalidTimestamp
|
||
|
}
|
||
|
return t, nil
|
||
|
}
|
||
|
|
||
|
var pow10 = []int64{1, 10, 100, 1000, 1e4, 1e5, 1e6, 1e7, 1e8}
|
||
|
|
||
|
const (
|
||
|
mask1 = 0x2d00002d00000000 // YYYY-MM-
|
||
|
mask2 = 0x00003a0000540000 // DDTHH:MM
|
||
|
mask3 = 0x000000005a00003a // :SSZ____
|
||
|
|
||
|
// Generate masks that replace the separators with a numeric byte.
|
||
|
// The input must have valid separators. XOR with the separator bytes
|
||
|
// to zero them out and then XOR with 0x30 to replace them with '0'.
|
||
|
replace1 = mask1 ^ 0x3000003000000000
|
||
|
replace2 = mask2 ^ 0x0000300000300000
|
||
|
replace3 = mask3 ^ 0x3030303030000030
|
||
|
|
||
|
lsb = ^uint64(0) / 255
|
||
|
msb = lsb * 0x80
|
||
|
|
||
|
zero = lsb * '0'
|
||
|
nine = lsb * '9'
|
||
|
)
|
||
|
|
||
|
func validate(year, month, day, hour, minute, second uint64) error {
|
||
|
if day == 0 || day > 31 {
|
||
|
return errDayOutOfRange
|
||
|
}
|
||
|
if month == 0 || month > 12 {
|
||
|
return errMonthOutOfRange
|
||
|
}
|
||
|
if hour >= 24 {
|
||
|
return errHourOutOfRange
|
||
|
}
|
||
|
if minute >= 60 {
|
||
|
return errMinuteOutOfRange
|
||
|
}
|
||
|
if second >= 60 {
|
||
|
return errSecondOutOfRange
|
||
|
}
|
||
|
if month == 2 && (day > 29 || (day == 29 && !isLeapYear(year))) {
|
||
|
return errDayOutOfRange
|
||
|
}
|
||
|
if day == 31 {
|
||
|
switch month {
|
||
|
case 4, 6, 9, 11:
|
||
|
return errDayOutOfRange
|
||
|
}
|
||
|
}
|
||
|
return nil
|
||
|
}
|
||
|
|
||
|
func match(u, mask uint64) bool {
|
||
|
return (u & mask) == mask
|
||
|
}
|
||
|
|
||
|
func nonNumeric(u uint64) uint64 {
|
||
|
// Derived from https://graphics.stanford.edu/~seander/bithacks.html#HasLessInWord.
|
||
|
// Subtract '0' (0x30) from each byte so that the MSB is set in each byte
|
||
|
// if there's a byte less than '0' (0x30). Add 0x46 (0x7F-'9') so that the
|
||
|
// MSB is set if there's a byte greater than '9' (0x39). To handle overflow
|
||
|
// when adding 0x46, include the MSB from the input bytes in the final mask.
|
||
|
// Remove all but the MSBs and then you're left with a mask where each
|
||
|
// non-numeric byte from the input has its MSB set in the output.
|
||
|
return ((u - zero) | (u + (^msb - nine)) | u) & msb
|
||
|
}
|
||
|
|
||
|
func daysSinceEpoch(year, month, day uint64) uint64 {
|
||
|
// Derived from https://blog.reverberate.org/2020/05/12/optimizing-date-algorithms.html.
|
||
|
monthAdjusted := month - 3
|
||
|
var carry uint64
|
||
|
if monthAdjusted > month {
|
||
|
carry = 1
|
||
|
}
|
||
|
var adjust uint64
|
||
|
if carry == 1 {
|
||
|
adjust = 12
|
||
|
}
|
||
|
yearAdjusted := year + 4800 - carry
|
||
|
monthDays := ((monthAdjusted+adjust)*62719 + 769) / 2048
|
||
|
leapDays := yearAdjusted/4 - yearAdjusted/100 + yearAdjusted/400
|
||
|
return yearAdjusted*365 + leapDays + monthDays + (day - 1) - 2472632
|
||
|
}
|
||
|
|
||
|
func isLeapYear(y uint64) bool {
|
||
|
return (y%4) == 0 && ((y%100) != 0 || (y%400) == 0)
|
||
|
}
|
||
|
|
||
|
func unsafeStringToBytes(s string) []byte {
|
||
|
return *(*[]byte)(unsafe.Pointer(&sliceHeader{
|
||
|
Data: *(*unsafe.Pointer)(unsafe.Pointer(&s)),
|
||
|
Len: len(s),
|
||
|
Cap: len(s),
|
||
|
}))
|
||
|
}
|
||
|
|
||
|
// sliceHeader is like reflect.SliceHeader but the Data field is a
|
||
|
// unsafe.Pointer instead of being a uintptr to avoid invalid
|
||
|
// conversions from uintptr to unsafe.Pointer.
|
||
|
type sliceHeader struct {
|
||
|
Data unsafe.Pointer
|
||
|
Len int
|
||
|
Cap int
|
||
|
}
|