Skip to content

Commit 2384c5b

Browse files
committed
optimize parsing common timestamps
This commit adds a dedicated function for parsing the two most common timestamps used by sqlite3. ``` goos: darwin goarch: arm64 pkg: github.com/charlievieth/go-sqlite3 cpu: Apple M4 Pro │ base.10.txt │ new.10.txt │ │ sec/op │ sec/op vs base │ Suite/BenchmarkParseTime-14 11.347µ ± 0% 8.044µ ± 0% -29.11% (p=0.000 n=10) │ base.10.txt │ new.10.txt │ │ B/op │ B/op vs base │ Suite/BenchmarkParseTime-14 1.713Ki ± 0% 1.713Ki ± 0% ~ (p=1.000 n=10) ¹ ¹ all samples are equal │ base.10.txt │ new.10.txt │ │ allocs/op │ allocs/op vs base │ Suite/BenchmarkParseTime-14 64.00 ± 0% 64.00 ± 0% ~ (p=1.000 n=10) ¹ ¹ all samples are equal ``` timefmt benchmarks: ``` goos: darwin goarch: arm64 pkg: github.com/charlievieth/go-sqlite3/internal/timefmt cpu: Apple M4 Pro BenchmarkParse/Stdlib-14 11050214 103.5 ns/op 0 B/op 0 allocs/op BenchmarkParse/Timefmt-14 34134667 34.45 ns/op 0 B/op 0 allocs/op BenchmarkParse/Timefmt_T-14 33790362 33.97 ns/op 0 B/op 0 allocs/op PASS ok github.com/charlievieth/go-sqlite3/internal/timefmt 3.814s ```
1 parent 15edb4d commit 2384c5b

File tree

4 files changed

+279
-8
lines changed

4 files changed

+279
-8
lines changed

internal/timefmt/timefmt.go

+167-1
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,10 @@
11
package timefmt
22

3-
import "time"
3+
import (
4+
"errors"
5+
"strconv"
6+
"time"
7+
)
48

59
const digits = "0123456789"
610

@@ -120,3 +124,165 @@ func Format(t time.Time) []byte {
120124

121125
return b
122126
}
127+
128+
func isLeap(year int) bool {
129+
return year%4 == 0 && (year%100 != 0 || year%400 == 0)
130+
}
131+
132+
// daysBefore[m] counts the number of days in a non-leap year
133+
// before month m begins. There is an entry for m=12, counting
134+
// the number of days before January of next year (365).
135+
var daysBefore = [...]int32{
136+
0,
137+
31,
138+
31 + 28,
139+
31 + 28 + 31,
140+
31 + 28 + 31 + 30,
141+
31 + 28 + 31 + 30 + 31,
142+
31 + 28 + 31 + 30 + 31 + 30,
143+
31 + 28 + 31 + 30 + 31 + 30 + 31,
144+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31,
145+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31 + 30,
146+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31 + 30 + 31,
147+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31 + 30 + 31 + 30,
148+
31 + 28 + 31 + 30 + 31 + 30 + 31 + 31 + 30 + 31 + 30 + 31,
149+
}
150+
151+
func daysIn(m time.Month, year int) int {
152+
if m == time.February && isLeap(year) {
153+
return 29
154+
}
155+
return int(daysBefore[m] - daysBefore[m-1])
156+
}
157+
158+
// isDigit reports whether s[i] is in range and is a decimal digit.
159+
func isDigit(s string, i int) bool {
160+
if len(s) <= i {
161+
return false
162+
}
163+
c := s[i]
164+
return '0' <= c && c <= '9'
165+
}
166+
167+
func commaOrPeriod(b byte) bool {
168+
return b == '.' || b == ','
169+
}
170+
171+
var errBad = errors.New("bad value for field") // placeholder not passed to user
172+
173+
func parseNanoseconds(value string, nbytes int) (ns int, rangeErrString string, err error) {
174+
if !commaOrPeriod(value[0]) {
175+
err = errBad
176+
return
177+
}
178+
if nbytes > 10 {
179+
value = value[:10]
180+
nbytes = 10
181+
}
182+
if ns, err = strconv.Atoi(value[1:nbytes]); err != nil {
183+
return
184+
}
185+
if ns < 0 {
186+
rangeErrString = "fractional second"
187+
return
188+
}
189+
// We need nanoseconds, which means scaling by the number
190+
// of missing digits in the format, maximum length 10.
191+
scaleDigits := 10 - nbytes
192+
for i := 0; i < scaleDigits; i++ {
193+
ns *= 10
194+
}
195+
return
196+
}
197+
198+
func parse(s string, local *time.Location) (time.Time, bool) {
199+
// parseUint parses s as an unsigned decimal integer and
200+
// verifies that it is within some range.
201+
// If it is invalid or out-of-range,
202+
// it sets ok to false and returns the min value.
203+
ok := true
204+
parseUint := func(s string, min, max int) (x int) {
205+
for _, c := range []byte(s) {
206+
if c < '0' || '9' < c {
207+
ok = false
208+
return min
209+
}
210+
x = x*10 + int(c) - '0'
211+
}
212+
if x < min || max < x {
213+
ok = false
214+
return min
215+
}
216+
return x
217+
}
218+
219+
// Parse the date and time.
220+
if len(s) < len("2006-01-02 15:04:05") {
221+
return time.Time{}, false
222+
}
223+
year := parseUint(s[0:4], 0, 9999) // e.g., 2006
224+
month := parseUint(s[5:7], 1, 12) // e.g., 01
225+
day := parseUint(s[8:10], 1, daysIn(time.Month(month), year)) // e.g., 02
226+
hour := parseUint(s[11:13], 0, 23) // e.g., 15
227+
min := parseUint(s[14:16], 0, 59) // e.g., 04
228+
sec := parseUint(s[17:19], 0, 59) // e.g., 05
229+
230+
if !ok || !(s[4] == '-' && s[7] == '-' && (s[10] == ' ' || s[10] == 'T') && s[13] == ':' && s[16] == ':') {
231+
return time.Time{}, false
232+
}
233+
s = s[19:]
234+
235+
// Parse the fractional second.
236+
var nsec int
237+
if len(s) >= 2 && s[0] == '.' && isDigit(s, 1) {
238+
n := 2
239+
for ; n < len(s) && isDigit(s, n); n++ {
240+
}
241+
nsec, _, _ = parseNanoseconds(s, n)
242+
s = s[n:]
243+
}
244+
245+
// Parse the time zone.
246+
t := time.Date(year, time.Month(month), day, hour, min, sec, nsec, time.UTC)
247+
if len(s) != 1 || s[0] != 'Z' {
248+
if len(s) != len("-07:00") {
249+
return time.Time{}, false
250+
}
251+
hr := parseUint(s[1:3], 0, 23) // e.g., 07
252+
mm := parseUint(s[4:6], 0, 59) // e.g., 00
253+
if !ok || !((s[0] == '-' || s[0] == '+') && s[3] == ':') {
254+
return time.Time{}, false
255+
}
256+
zoneOffset := (hr*60 + mm) * 60
257+
if s[0] == '-' {
258+
zoneOffset *= -1
259+
}
260+
t = t.Add(-(time.Duration(zoneOffset) * time.Second))
261+
262+
// Use local zone with the given offset if possible.
263+
t2 := t.In(local)
264+
_, offset := t2.Zone()
265+
if offset == zoneOffset {
266+
t = t2
267+
} else {
268+
t = t.In(time.FixedZone("", zoneOffset))
269+
}
270+
}
271+
272+
return t, true
273+
}
274+
275+
// Parse is an specialized version of time.Parse that is optimized for
276+
// the below two timestamps:
277+
//
278+
// - "2006-01-02 15:04:05.999999999-07:00"
279+
// - "2006-01-02T15:04:05.999999999-07:00"
280+
func Parse(s string, local *time.Location) (time.Time, error) {
281+
if t, ok := parse(s, local); ok {
282+
return t, nil
283+
}
284+
if len(s) > 10 && s[10] == 'T' {
285+
return time.Parse("2006-01-02T15:04:05.999999999-07:00", s)
286+
}
287+
return time.Parse("2006-01-02 15:04:05.999999999-07:00", s)
288+
}

internal/timefmt/timefmt_test.go

+90
Original file line numberDiff line numberDiff line change
@@ -54,6 +54,61 @@ func TestFormatTimeAllocs(t *testing.T) {
5454
}
5555
}
5656

57+
func TestParse(t *testing.T) {
58+
rr := rand.New(rand.NewSource(time.Now().UnixNano()))
59+
locs := make([]*time.Location, 1000)
60+
for i := range locs {
61+
offset := rr.Intn(60 * 60 * 14) // 14 hours
62+
if rr.Int()&1 != 0 {
63+
offset = -offset
64+
}
65+
locs[i] = time.FixedZone(strconv.Itoa(offset), offset)
66+
}
67+
// Append some standard locations
68+
locs = append(locs, time.Local, time.UTC)
69+
70+
times := []time.Time{
71+
{},
72+
time.Now(),
73+
time.Date(0, 0, 0, 0, 0, 0, 0, time.UTC),
74+
time.Date(1, 1, 1, 1, 1, 1, 1, time.UTC),
75+
time.Date(20_000, 1, 1, 1, 1, 1, 1, time.UTC),
76+
time.Date(-1, 0, 0, 0, 0, 0, 0, time.UTC),
77+
time.Date(2028, 2, 29, 0, 0, 0, 0, time.UTC), // Leap day
78+
time.Date(2028, 2, 29, 1, 1, 1, 1, time.Local), // Leap day
79+
}
80+
for i := 0; i < 100; i++ {
81+
times = append(times, time.Now().Add(time.Duration(rr.Int63n(int64(time.Hour*24*365)))))
82+
}
83+
84+
passed := 0
85+
for _, loc := range locs {
86+
for _, tt := range times {
87+
tt = tt.In(loc)
88+
for _, format := range sqlite3.SQLiteTimestampFormats[:2] {
89+
s := tt.Format(format)
90+
want, err := time.ParseInLocation(format, s, loc)
91+
if err != nil {
92+
continue
93+
}
94+
got, err := timefmt.Parse(s, loc)
95+
if err != nil {
96+
t.Error(err)
97+
continue
98+
}
99+
if !got.Equal(want) {
100+
t.Errorf("timefmt.Parse(%q) = %s; want: %s", s, got, want)
101+
continue
102+
}
103+
passed++
104+
}
105+
}
106+
}
107+
if passed == 0 {
108+
t.Fatal("No tests passed")
109+
}
110+
}
111+
57112
func BenchmarkFormat(b *testing.B) {
58113
loc, err := time.LoadLocation("America/New_York")
59114
if err != nil {
@@ -64,3 +119,38 @@ func BenchmarkFormat(b *testing.B) {
64119
_ = timefmt.Format(ts)
65120
}
66121
}
122+
123+
func BenchmarkParse(b *testing.B) {
124+
layout := sqlite3.SQLiteTimestampFormats[0]
125+
loc, err := time.LoadLocation("America/New_York")
126+
if err != nil {
127+
b.Fatal(err)
128+
}
129+
ts := time.Date(2024, 1, 2, 15, 4, 5, 123456789, loc).Format(layout)
130+
131+
b.Run("Stdlib", func(b *testing.B) {
132+
for i := 0; i < b.N; i++ {
133+
_, err := time.Parse(layout, ts)
134+
if err != nil {
135+
b.Fatal(err)
136+
}
137+
}
138+
})
139+
b.Run("Timefmt", func(b *testing.B) {
140+
for i := 0; i < b.N; i++ {
141+
_, err := timefmt.Parse(ts, time.Local)
142+
if err != nil {
143+
b.Fatal(err)
144+
}
145+
}
146+
})
147+
b.Run("Timefmt_T", func(b *testing.B) {
148+
ts := time.Date(2024, 1, 2, 15, 4, 5, 123456789, loc).Format(sqlite3.SQLiteTimestampFormats[1])
149+
for i := 0; i < b.N; i++ {
150+
_, err := timefmt.Parse(ts, time.Local)
151+
if err != nil {
152+
b.Fatal(err)
153+
}
154+
}
155+
})
156+
}

sqlite3.go

+5-3
Original file line numberDiff line numberDiff line change
@@ -2756,9 +2756,11 @@ func (rc *SQLiteRows) nextSyncLocked(dest []driver.Value) error {
27562756
s = strings.TrimSuffix(s, "Z")
27572757
var err error
27582758
var t time.Time
2759-
for _, format := range SQLiteTimestampFormats {
2760-
if t, err = time.ParseInLocation(format, s, time.UTC); err == nil {
2761-
break
2759+
if t, err = timefmt.Parse(s, time.UTC); err != nil {
2760+
for _, format := range SQLiteTimestampFormats[2:] {
2761+
if t, err = time.ParseInLocation(format, s, time.UTC); err == nil {
2762+
break
2763+
}
27622764
}
27632765
}
27642766
if err != nil {

sqlite3_test.go

+17-4
Original file line numberDiff line numberDiff line change
@@ -3468,7 +3468,17 @@ func benchmarkParseTime(b *testing.B) {
34683468
b.Fatal(err)
34693469
}
34703470
defer db.Close()
3471-
if _, err := db.Exec(`CREATE TABLE time_bench (ts DATETIME NOT NULL);`); err != nil {
3471+
const createTableStmt = `
3472+
CREATE TABLE time_bench (
3473+
ts1 DATETIME NOT NULL,
3474+
ts2 DATETIME NOT NULL,
3475+
ts3 DATETIME NOT NULL,
3476+
ts4 DATETIME NOT NULL,
3477+
ts5 DATETIME NOT NULL,
3478+
ts6 DATETIME NOT NULL
3479+
);`
3480+
// if _, err := db.Exec(`CREATE TABLE time_bench (ts DATETIME NOT NULL);`); err != nil {
3481+
if _, err := db.Exec(createTableStmt); err != nil {
34723482
b.Fatal(err)
34733483
}
34743484
// t := time.Date(year, month, day, hour, min, sec, nsec, loc)
@@ -3478,12 +3488,15 @@ func benchmarkParseTime(b *testing.B) {
34783488
}
34793489
ts := time.Date(2024, 1, 2, 15, 4, 5, 123456789, loc)
34803490
for i := 0; i < 8; i++ {
3481-
_, err := db.Exec(`INSERT INTO time_bench VALUES(?)`, ts)
3491+
_, err := db.Exec(`INSERT INTO time_bench VALUES(?, ?, ?, ?, ?, ?)`,
3492+
ts, ts, ts, ts, ts, ts)
34823493
if err != nil {
34833494
b.Fatal(err)
34843495
}
34853496
}
3486-
stmt, err := db.Prepare(`SELECT ts FROM time_bench LIMIT 1;`)
3497+
3498+
// stmt, err := db.Prepare(`SELECT ts1, ts2, ts3, ts4, ts5, ts6 FROM time_bench LIMIT 1;`)
3499+
stmt, err := db.Prepare(`SELECT ts1, ts2, ts3, ts4, ts5, ts6 FROM time_bench;`)
34873500
if err != nil {
34883501
b.Fatal(err)
34893502
}
@@ -3495,7 +3508,7 @@ func benchmarkParseTime(b *testing.B) {
34953508
}
34963509
var t time.Time
34973510
for rows.Next() {
3498-
if err := rows.Scan(&t); err != nil {
3511+
if err := rows.Scan(&t, &t, &t, &t, &t, &t); err != nil {
34993512
b.Fatal(err)
35003513
}
35013514
}

0 commit comments

Comments
 (0)