Skip to content

Commit 78b9a4c

Browse files
committed
optimize parsing common timestamps
This commit adds a dedicated function for parsing the two most common timestamps used by sqlite3. ``` goos: darwin goarch: arm64 pkg: github.com/charlievieth/go-sqlite3 cpu: Apple M4 Pro │ base.10.txt │ new.10.txt │ │ sec/op │ sec/op vs base │ Suite/BenchmarkParseTime-14 11.347µ ± 0% 8.044µ ± 0% -29.11% (p=0.000 n=10) │ base.10.txt │ new.10.txt │ │ B/op │ B/op vs base │ Suite/BenchmarkParseTime-14 1.713Ki ± 0% 1.713Ki ± 0% ~ (p=1.000 n=10) ¹ ¹ all samples are equal │ base.10.txt │ new.10.txt │ │ allocs/op │ allocs/op vs base │ Suite/BenchmarkParseTime-14 64.00 ± 0% 64.00 ± 0% ~ (p=1.000 n=10) ¹ ¹ all samples are equal ``` timefmt benchmarks: ``` goos: darwin goarch: arm64 pkg: github.com/charlievieth/go-sqlite3/internal/timefmt cpu: Apple M4 Pro BenchmarkParse/Stdlib-14 11050214 103.5 ns/op 0 B/op 0 allocs/op BenchmarkParse/Timefmt-14 34134667 34.45 ns/op 0 B/op 0 allocs/op BenchmarkParse/Timefmt_T-14 33790362 33.97 ns/op 0 B/op 0 allocs/op PASS ok github.com/charlievieth/go-sqlite3/internal/timefmt 3.814s ```
1 parent 15edb4d commit 78b9a4c

File tree

4 files changed

+280
-8
lines changed

4 files changed

+280
-8
lines changed

internal/timefmt/timefmt.go

+168-1
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,10 @@
11
package timefmt
22

3-
import "time"
3+
import (
4+
"errors"
5+
"strconv"
6+
"time"
7+
)
48

59
const digits = "0123456789"
610

@@ -120,3 +124,166 @@ func Format(t time.Time) []byte {
120124

121125
return b
122126
}
127+
128+
func isLeap(year int) bool {
129+
return year%4 == 0 && (year%100 != 0 || year%400 == 0)
130+
}
131+
132+
// daysBefore[m] counts the number of days in a non-leap year
133+
// before month m begins. There is an entry for m=12, counting
134+
// the number of days before January of next year (365).
135+
var daysBefore = [...]int32{
136+
0,
137+
31,
138+
31 + 28,
139+
31 + 28 + 31,
140+
31 + 28 + 31 + 30,
141+
31 + 28 + 31 + 30 + 31,
142+
31 + 28 + 31 + 30 + 31 + 30,
143+
31 + 28 + 31 + 30 + 31 + 30 + 31,
144+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31,
145+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31 + 30,
146+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31 + 30 + 31,
147+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31 + 30 + 31 + 30,
148+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31 + 30 + 31 + 30 + 31,
149+
}
150+
151+
func daysIn(m time.Month, year int) int {
152+
if m == time.February && isLeap(year) {
153+
return 29
154+
}
155+
return int(daysBefore[m] - daysBefore[m-1])
156+
}
157+
158+
// isDigit reports whether s[i] is in range and is a decimal digit.
159+
func isDigit(s string, i int) bool {
160+
if len(s) <= i {
161+
return false
162+
}
163+
c := s[i]
164+
return '0' <= c && c <= '9'
165+
}
166+
167+
func commaOrPeriod(b byte) bool {
168+
return b == '.' || b == ','
169+
}
170+
171+
var errBad = errors.New("bad value for field") // placeholder not passed to user
172+
173+
func parseNanoseconds(value string, nbytes int) (ns int, rangeErrString string, err error) {
174+
if !commaOrPeriod(value[0]) {
175+
err = errBad
176+
return
177+
}
178+
if nbytes > 10 {
179+
value = value[:10]
180+
nbytes = 10
181+
}
182+
if ns, err = strconv.Atoi(value[1:nbytes]); err != nil {
183+
return
184+
}
185+
if ns < 0 {
186+
rangeErrString = "fractional second"
187+
return
188+
}
189+
// We need nanoseconds, which means scaling by the number
190+
// of missing digits in the format, maximum length 10.
191+
scaleDigits := 10 - nbytes
192+
for i := 0; i < scaleDigits; i++ {
193+
ns *= 10
194+
}
195+
return
196+
}
197+
198+
func parse(s string, local *time.Location) (time.Time, bool) {
199+
// parseUint parses s as an unsigned decimal integer and
200+
// verifies that it is within some range.
201+
// If it is invalid or out-of-range,
202+
// it sets ok to false and returns the min value.
203+
ok := true
204+
parseUint := func(s string, min, max int) (x int) {
205+
for _, c := range []byte(s) {
206+
if c < '0' || '9' < c {
207+
ok = false
208+
return min
209+
}
210+
x = x*10 + int(c) - '0'
211+
}
212+
if x < min || max < x {
213+
ok = false
214+
return min
215+
}
216+
return x
217+
}
218+
219+
// Parse the date and time.
220+
// "2006-01-02 15:04:05.999999999-07:00"
221+
if len(s) < len("2006-01-02 15:04:05") {
222+
return time.Time{}, false
223+
}
224+
year := parseUint(s[0:4], 0, 9999) // e.g., 2006
225+
month := parseUint(s[5:7], 1, 12) // e.g., 01
226+
day := parseUint(s[8:10], 1, daysIn(time.Month(month), year)) // e.g., 02
227+
hour := parseUint(s[11:13], 0, 23) // e.g., 15
228+
min := parseUint(s[14:16], 0, 59) // e.g., 04
229+
sec := parseUint(s[17:19], 0, 59) // e.g., 05
230+
231+
if !ok || !(s[4] == '-' && s[7] == '-' && (s[10] == ' ' || s[10] == 'T') && s[13] == ':' && s[16] == ':') {
232+
return time.Time{}, false
233+
}
234+
s = s[19:]
235+
236+
// Parse the fractional second.
237+
var nsec int
238+
if len(s) >= 2 && s[0] == '.' && isDigit(s, 1) {
239+
n := 2
240+
for ; n < len(s) && isDigit(s, n); n++ {
241+
}
242+
nsec, _, _ = parseNanoseconds(s, n)
243+
s = s[n:]
244+
}
245+
246+
// Parse the time zone.
247+
t := time.Date(year, time.Month(month), day, hour, min, sec, nsec, time.UTC)
248+
if len(s) != 1 || s[0] != 'Z' {
249+
if len(s) != len("-07:00") {
250+
return time.Time{}, false
251+
}
252+
hr := parseUint(s[1:3], 0, 23) // e.g., 07
253+
mm := parseUint(s[4:6], 0, 59) // e.g., 00
254+
if !ok || !((s[0] == '-' || s[0] == '+') && s[3] == ':') {
255+
return time.Time{}, false
256+
}
257+
zoneOffset := (hr*60 + mm) * 60
258+
if s[0] == '-' {
259+
zoneOffset *= -1
260+
}
261+
t = t.Add(-(time.Duration(zoneOffset) * time.Second))
262+
263+
// Use local zone with the given offset if possible.
264+
t2 := t.In(local)
265+
_, offset := t2.Zone()
266+
if offset == zoneOffset {
267+
t = t2
268+
} else {
269+
t = t.In(time.FixedZone("", zoneOffset))
270+
}
271+
}
272+
273+
return t, true
274+
}
275+
276+
// Parse is an specialized version of time.Parse that is optimized for
277+
// the below two timestamps:
278+
//
279+
// - "2006-01-02 15:04:05.999999999-07:00"
280+
// - "2006-01-02T15:04:05.999999999-07:00"
281+
func Parse(s string, local *time.Location) (time.Time, error) {
282+
if t, ok := parse(s, local); ok {
283+
return t, nil
284+
}
285+
if len(s) > 10 && s[10] == 'T' {
286+
return time.Parse("2006-01-02T15:04:05.999999999-07:00", s)
287+
}
288+
return time.Parse("2006-01-02 15:04:05.999999999-07:00", s)
289+
}

internal/timefmt/timefmt_test.go

+90
Original file line numberDiff line numberDiff line change
@@ -54,6 +54,61 @@ func TestFormatTimeAllocs(t *testing.T) {
5454
}
5555
}
5656

57+
func TestParse(t *testing.T) {
58+
rr := rand.New(rand.NewSource(time.Now().UnixNano()))
59+
locs := make([]*time.Location, 1000)
60+
for i := range locs {
61+
offset := rr.Intn(60 * 60 * 14) // 14 hours
62+
if rr.Int()&1 != 0 {
63+
offset = -offset
64+
}
65+
locs[i] = time.FixedZone(strconv.Itoa(offset), offset)
66+
}
67+
// Append some standard locations
68+
locs = append(locs, time.Local, time.UTC)
69+
70+
times := []time.Time{
71+
{},
72+
time.Now(),
73+
time.Date(0, 0, 0, 0, 0, 0, 0, time.UTC),
74+
time.Date(1, 1, 1, 1, 1, 1, 1, time.UTC),
75+
time.Date(20_000, 1, 1, 1, 1, 1, 1, time.UTC),
76+
time.Date(-1, 0, 0, 0, 0, 0, 0, time.UTC),
77+
time.Date(2028, 2, 29, 0, 0, 0, 0, time.UTC), // Leap day
78+
time.Date(2028, 2, 29, 1, 1, 1, 1, time.Local), // Leap day
79+
}
80+
for i := 0; i < 100; i++ {
81+
times = append(times, time.Now().Add(time.Duration(rr.Int63n(int64(time.Hour*24*365)))))
82+
}
83+
84+
passed := 0
85+
for _, loc := range locs {
86+
for _, tt := range times {
87+
tt = tt.In(loc)
88+
for _, format := range sqlite3.SQLiteTimestampFormats[:2] {
89+
s := tt.Format(format)
90+
want, err := time.ParseInLocation(format, s, loc)
91+
if err != nil {
92+
continue
93+
}
94+
got, err := timefmt.Parse(s, loc)
95+
if err != nil {
96+
t.Error(err)
97+
continue
98+
}
99+
if !got.Equal(want) {
100+
t.Errorf("timefmt.Parse(%q) = %s; want: %s", s, got, want)
101+
continue
102+
}
103+
passed++
104+
}
105+
}
106+
}
107+
if passed == 0 {
108+
t.Fatal("No tests passed")
109+
}
110+
}
111+
57112
func BenchmarkFormat(b *testing.B) {
58113
loc, err := time.LoadLocation("America/New_York")
59114
if err != nil {
@@ -64,3 +119,38 @@ func BenchmarkFormat(b *testing.B) {
64119
_ = timefmt.Format(ts)
65120
}
66121
}
122+
123+
func BenchmarkParse(b *testing.B) {
124+
layout := sqlite3.SQLiteTimestampFormats[0]
125+
loc, err := time.LoadLocation("America/New_York")
126+
if err != nil {
127+
b.Fatal(err)
128+
}
129+
ts := time.Date(2024, 1, 2, 15, 4, 5, 123456789, loc).Format(layout)
130+
131+
b.Run("Stdlib", func(b *testing.B) {
132+
for i := 0; i < b.N; i++ {
133+
_, err := time.Parse(layout, ts)
134+
if err != nil {
135+
b.Fatal(err)
136+
}
137+
}
138+
})
139+
b.Run("Timefmt", func(b *testing.B) {
140+
for i := 0; i < b.N; i++ {
141+
_, err := timefmt.Parse(ts, time.Local)
142+
if err != nil {
143+
b.Fatal(err)
144+
}
145+
}
146+
})
147+
b.Run("Timefmt_T", func(b *testing.B) {
148+
ts := time.Date(2024, 1, 2, 15, 4, 5, 123456789, loc).Format(sqlite3.SQLiteTimestampFormats[1])
149+
for i := 0; i < b.N; i++ {
150+
_, err := timefmt.Parse(ts, time.Local)
151+
if err != nil {
152+
b.Fatal(err)
153+
}
154+
}
155+
})
156+
}

sqlite3.go

+5-3
Original file line numberDiff line numberDiff line change
@@ -2756,9 +2756,11 @@ func (rc *SQLiteRows) nextSyncLocked(dest []driver.Value) error {
27562756
s = strings.TrimSuffix(s, "Z")
27572757
var err error
27582758
var t time.Time
2759-
for _, format := range SQLiteTimestampFormats {
2760-
if t, err = time.ParseInLocation(format, s, time.UTC); err == nil {
2761-
break
2759+
if t, err = timefmt.Parse(s, time.UTC); err != nil {
2760+
for _, format := range SQLiteTimestampFormats[2:] {
2761+
if t, err = time.ParseInLocation(format, s, time.UTC); err == nil {
2762+
break
2763+
}
27622764
}
27632765
}
27642766
if err != nil {

sqlite3_test.go

+17-4
Original file line numberDiff line numberDiff line change
@@ -3468,7 +3468,17 @@ func benchmarkParseTime(b *testing.B) {
34683468
b.Fatal(err)
34693469
}
34703470
defer db.Close()
3471-
if _, err := db.Exec(`CREATE TABLE time_bench (ts DATETIME NOT NULL);`); err != nil {
3471+
const createTableStmt = `
3472+
CREATE TABLE time_bench (
3473+
ts1 DATETIME NOT NULL,
3474+
ts2 DATETIME NOT NULL,
3475+
ts3 DATETIME NOT NULL,
3476+
ts4 DATETIME NOT NULL,
3477+
ts5 DATETIME NOT NULL,
3478+
ts6 DATETIME NOT NULL
3479+
);`
3480+
// if _, err := db.Exec(`CREATE TABLE time_bench (ts DATETIME NOT NULL);`); err != nil {
3481+
if _, err := db.Exec(createTableStmt); err != nil {
34723482
b.Fatal(err)
34733483
}
34743484
// t := time.Date(year, month, day, hour, min, sec, nsec, loc)
@@ -3478,12 +3488,15 @@ func benchmarkParseTime(b *testing.B) {
34783488
}
34793489
ts := time.Date(2024, 1, 2, 15, 4, 5, 123456789, loc)
34803490
for i := 0; i < 8; i++ {
3481-
_, err := db.Exec(`INSERT INTO time_bench VALUES(?)`, ts)
3491+
_, err := db.Exec(`INSERT INTO time_bench VALUES(?, ?, ?, ?, ?, ?)`,
3492+
ts, ts, ts, ts, ts, ts)
34823493
if err != nil {
34833494
b.Fatal(err)
34843495
}
34853496
}
3486-
stmt, err := db.Prepare(`SELECT ts FROM time_bench LIMIT 1;`)
3497+
3498+
// stmt, err := db.Prepare(`SELECT ts1, ts2, ts3, ts4, ts5, ts6 FROM time_bench LIMIT 1;`)
3499+
stmt, err := db.Prepare(`SELECT ts1, ts2, ts3, ts4, ts5, ts6 FROM time_bench;`)
34873500
if err != nil {
34883501
b.Fatal(err)
34893502
}
@@ -3495,7 +3508,7 @@ func benchmarkParseTime(b *testing.B) {
34953508
}
34963509
var t time.Time
34973510
for rows.Next() {
3498-
if err := rows.Scan(&t); err != nil {
3511+
if err := rows.Scan(&t, &t, &t, &t, &t, &t); err != nil {
34993512
b.Fatal(err)
35003513
}
35013514
}

0 commit comments

Comments
 (0)