From 19459aea75d23da02d78fa0b57490dcd5338bb50 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 09:35:19 +0200 Subject: [PATCH 01/12] go fmt --- cmd/benchmark.go | 143 +++++++++++++++++++++--------------------- cmd/example.go | 14 +++-- cmd/timezone.go | 16 ++--- db.go | 158 +++++++++++++++++++++++------------------------ memory.go | 57 ++++++++--------- timezone.go | 140 +++++++++++++++++++++-------------------- 6 files changed, 270 insertions(+), 258 deletions(-) diff --git a/cmd/benchmark.go b/cmd/benchmark.go index 76356fa..799c645 100644 --- a/cmd/benchmark.go +++ b/cmd/benchmark.go @@ -1,88 +1,89 @@ package main + import ( - "time" "fmt" timezone "github.com/evanoberholster/timezoneLookup" + "time" ) func main() { - + tz, err := timezone.LoadTimezones(timezone.Config{ - DatabaseType:"boltdb", // memory or boltdb - DatabaseName:"timezone", // Name without suffix - Snappy: true, - Encoding: "msgpack", // json or msgpack - }) + DatabaseType: "boltdb", // memory or boltdb + DatabaseName: "timezone", // Name without suffix + Snappy: true, + Encoding: "msgpack", // json or msgpack + }) if err != nil { fmt.Println(err) } querys := []timezone.Coord{ - {Lat: 5.261417, Lon: -3.925778,}, // Abijan Airport - {Lat: -15.678889,Lon: 34.973889,}, // Blantyre Airport - {Lat: -12.65945, Lon: 18.25674,}, - {Lat: 41.8976, Lon:-87.6205}, - {Lat: 47.6897, Lon: -122.4023}, - {Lat: 42.7235, Lon:-73.6931}, - {Lat: 42.5807, Lon:-83.0223}, - {Lat: 36.8381, Lon:-84.8500}, - {Lat: 40.1674, Lon:-85.3583}, - {Lat: 37.9643, Lon:-86.7453}, - {Lat: 38.6043, Lon:-90.2417}, - {Lat: 41.1591, Lon:-104.8261}, - {Lat: 35.1991, Lon:-111.6348}, - {Lat: 43.1432, Lon:-115.6750}, - {Lat: 47.5886, Lon:-122.3382}, - {Lat: 58.3168, Lon:-134.4397}, - {Lat: 21.4381, Lon:-158.0493}, - {Lat: 42.7000, Lon:-80.0000}, - {Lat: 51.0036, Lon:-114.0161}, - {Lat:-16.4965, Lon:-68.1702}, - {Lat:-31.9369, Lon:115.8453}, - {Lat: 42.0000, Lon:-87.5000}, - {Lat: 41.8976, Lon:-87.6205}, - {Lat: 47.6897, Lon: -122.4023}, - {Lat: 42.7235, Lon:-73.6931}, - {Lat: 42.5807, Lon:-83.0223}, - {Lat: 36.8381, Lon:-84.8500}, - {Lat: 40.1674, Lon:-85.3583}, - {Lat: 37.9643, Lon:-86.7453}, - {Lat: 38.6043, Lon:-90.2417}, - {Lat: 41.1591, Lon:-104.8261}, - {Lat: 35.1991, Lon:-111.6348}, - {Lat: 43.1432, Lon:-115.6750}, - {Lat: 47.5886, Lon:-122.3382}, - {Lat: 58.3168, Lon:-134.4397}, - {Lat: 21.4381, Lon:-158.0493}, - {Lat: 42.7000, Lon:-80.0000}, - {Lat: 51.0036, Lon:-114.0161}, - {Lat:-16.4965, Lon:-68.1702}, - {Lat:-31.9369, Lon:115.8453}, - {Lat: 42.0000, Lon:-87.5000}, - {Lat: 41.8976, Lon:-87.6205}, - {Lat: 47.6897, Lon: -122.4023}, - {Lat: 42.7235, Lon:-73.6931}, - {Lat: 42.5807, Lon:-83.0223}, - {Lat: 36.8381, Lon:-84.8500}, - {Lat: 40.1674, Lon:-85.3583}, - {Lat: 37.9643, Lon:-86.7453}, - {Lat: 38.6043, Lon:-90.2417}, - {Lat: 41.1591, Lon:-104.8261}, - {Lat: 35.1991, Lon:-111.6348}, - {Lat: 43.1432, Lon:-115.6750}, - {Lat: 47.5886, Lon:-122.3382}, - {Lat: 58.3168, Lon:-134.4397}, - {Lat: 21.4381, Lon:-158.0493}, - {Lat: 42.7000, Lon:-80.0000}, - {Lat: 51.0036, Lon:-114.0161}, - {Lat:-16.4965, Lon:-68.1702}, - {Lat:-31.9369, Lon:115.8453}, - {Lat: 42.0000, Lon:-87.5000}, - } + {Lat: 5.261417, Lon: -3.925778}, // Abijan Airport + {Lat: -15.678889, Lon: 34.973889}, // Blantyre Airport + {Lat: -12.65945, Lon: 18.25674}, + {Lat: 41.8976, Lon: -87.6205}, + {Lat: 47.6897, Lon: -122.4023}, + {Lat: 42.7235, Lon: -73.6931}, + {Lat: 42.5807, Lon: -83.0223}, + {Lat: 36.8381, Lon: -84.8500}, + {Lat: 40.1674, Lon: -85.3583}, + {Lat: 37.9643, Lon: -86.7453}, + {Lat: 38.6043, Lon: -90.2417}, + {Lat: 41.1591, Lon: -104.8261}, + {Lat: 35.1991, Lon: -111.6348}, + {Lat: 43.1432, Lon: -115.6750}, + {Lat: 47.5886, Lon: -122.3382}, + {Lat: 58.3168, Lon: -134.4397}, + {Lat: 21.4381, Lon: -158.0493}, + {Lat: 42.7000, Lon: -80.0000}, + {Lat: 51.0036, Lon: -114.0161}, + {Lat: -16.4965, Lon: -68.1702}, + {Lat: -31.9369, Lon: 115.8453}, + {Lat: 42.0000, Lon: -87.5000}, + {Lat: 41.8976, Lon: -87.6205}, + {Lat: 47.6897, Lon: -122.4023}, + {Lat: 42.7235, Lon: -73.6931}, + {Lat: 42.5807, Lon: -83.0223}, + {Lat: 36.8381, Lon: -84.8500}, + {Lat: 40.1674, Lon: -85.3583}, + {Lat: 37.9643, Lon: -86.7453}, + {Lat: 38.6043, Lon: -90.2417}, + {Lat: 41.1591, Lon: -104.8261}, + {Lat: 35.1991, Lon: -111.6348}, + {Lat: 43.1432, Lon: -115.6750}, + {Lat: 47.5886, Lon: -122.3382}, + {Lat: 58.3168, Lon: -134.4397}, + {Lat: 21.4381, Lon: -158.0493}, + {Lat: 42.7000, Lon: -80.0000}, + {Lat: 51.0036, Lon: -114.0161}, + {Lat: -16.4965, Lon: -68.1702}, + {Lat: -31.9369, Lon: 115.8453}, + {Lat: 42.0000, Lon: -87.5000}, + {Lat: 41.8976, Lon: -87.6205}, + {Lat: 47.6897, Lon: -122.4023}, + {Lat: 42.7235, Lon: -73.6931}, + {Lat: 42.5807, Lon: -83.0223}, + {Lat: 36.8381, Lon: -84.8500}, + {Lat: 40.1674, Lon: -85.3583}, + {Lat: 37.9643, Lon: -86.7453}, + {Lat: 38.6043, Lon: -90.2417}, + {Lat: 41.1591, Lon: -104.8261}, + {Lat: 35.1991, Lon: -111.6348}, + {Lat: 43.1432, Lon: -115.6750}, + {Lat: 47.5886, Lon: -122.3382}, + {Lat: 58.3168, Lon: -134.4397}, + {Lat: 21.4381, Lon: -158.0493}, + {Lat: 42.7000, Lon: -80.0000}, + {Lat: 51.0036, Lon: -114.0161}, + {Lat: -16.4965, Lon: -68.1702}, + {Lat: -31.9369, Lon: 115.8453}, + {Lat: 42.0000, Lon: -87.5000}, + } var times []int64 var total int64 - + for _, query := range querys { start := time.Now() res, err := tz.Query(query) @@ -92,10 +93,10 @@ func main() { elapsed := time.Since(start) fmt.Println("Query Result: ", res, " took: ", elapsed) times = append(times, elapsed.Nanoseconds()) - total += elapsed.Nanoseconds() + total += elapsed.Nanoseconds() } fmt.Println("Average time per query: ", time.Duration(total/int64(len(times)))) tz.Close() - timezone.PrintMemUsage() + timezone.PrintMemUsage() } diff --git a/cmd/example.go b/cmd/example.go index e356c72..b3cf75a 100644 --- a/cmd/example.go +++ b/cmd/example.go @@ -1,23 +1,25 @@ package main + import ( "fmt" timezone "github.com/evanoberholster/timezoneLookup" ) + var tz timezone.TimezoneInterface func main() { tz, err := timezone.LoadTimezones(timezone.Config{ - DatabaseType:"boltdb", // memory or boltdb - DatabaseName:"timezone", // Name without suffix - Snappy: true, - Encoding: "msgpack", // json or msgpack - }) + DatabaseType: "boltdb", // memory or boltdb + DatabaseName: "timezone", // Name without suffix + Snappy: true, + Encoding: "msgpack", // json or msgpack + }) if err != nil { fmt.Println(err) } res, err := tz.Query(timezone.Coord{ - Lat: 5.261417, Lon: -3.925778,}) + Lat: 5.261417, Lon: -3.925778}) if err != nil { fmt.Println(err) } diff --git a/cmd/timezone.go b/cmd/timezone.go index 982c230..e051f5e 100644 --- a/cmd/timezone.go +++ b/cmd/timezone.go @@ -1,16 +1,17 @@ package main + import ( "flag" - "log" timezone "github.com/evanoberholster/timezoneLookup" + "log" ) var ( - snappy = flag.Bool("snappy", true, "Use Snappy compression (true/false)") + snappy = flag.Bool("snappy", true, "Use Snappy compression (true/false)") jsonFilename = flag.String("json", "combined-with-oceans.json", "GEOJSON Filename") - dbFilename = flag.String("db", "timezone", "Destination database filename") - storageType = flag.String("type", "boltdb", "Storage: boltdb or memory") - encoding = flag.String("encoding", "msgpack", "BoltDB encoding type: json or msgpack") + dbFilename = flag.String("db", "timezone", "Destination database filename") + storageType = flag.String("type", "boltdb", "Storage: boltdb or memory") + encoding = flag.String("encoding", "msgpack", "BoltDB encoding type: json or msgpack") ) func main() { @@ -28,7 +29,7 @@ func main() { log.Println("\"-db\" No database type specified") return } - + if *jsonFilename != "" { err := tz.CreateTimezones(*jsonFilename) if err != nil { @@ -43,5 +44,4 @@ func main() { tz.Close() } - -} \ No newline at end of file +} diff --git a/db.go b/db.go index 7558231..550f21c 100644 --- a/db.go +++ b/db.go @@ -1,27 +1,28 @@ package timezoneLookup + import ( - "os" - "errors" "encoding/binary" "encoding/json" - bolt "go.etcd.io/bbolt" + "errors" "github.com/golang/snappy" "github.com/vmihailenco/msgpack" + bolt "go.etcd.io/bbolt" + "os" ) -type Store struct { // Database struct - db *bolt.DB - pIndex []PolygonIndex - filename string - snappy bool - encoding string +type Store struct { // Database struct + db *bolt.DB + pIndex []PolygonIndex + filename string + snappy bool + encoding string } type PolygonIndex struct { - Id uint64 `json:"-"` - Tzid string `json:"tzid"` - Max Coord `json:"max"` - Min Coord `json:"min"` + Id uint64 `json:"-"` + Tzid string `json:"tzid"` + Max Coord `json:"max"` + Min Coord `json:"min"` } func BoltdbStorage(snappy bool, filename string, encoding string) TimezoneInterface { @@ -32,17 +33,17 @@ func BoltdbStorage(snappy bool, filename string, encoding string) TimezoneInterf } return &Store{ filename: filename, - pIndex: []PolygonIndex{}, - snappy: snappy, + pIndex: []PolygonIndex{}, + snappy: snappy, encoding: encoding, } } -func (s *Store)Close() { +func (s *Store) Close() { defer s.db.Close() } -func (s *Store)LoadTimezones() (error) { +func (s *Store) LoadTimezones() error { if _, err := os.Stat(s.filename); os.IsNotExist(err) { return errors.New(errNotExistDatabase) } @@ -50,11 +51,11 @@ func (s *Store)LoadTimezones() (error) { if err != nil { return err } - // Load polygon indexes + // Load polygon indexes return s.db.View(func(tx *bolt.Tx) error { // Assume bucket exists and has keys b := tx.Bucket([]byte("Index")) - + var err error b.ForEach(func(k, v []byte) error { var index PolygonIndex @@ -74,13 +75,13 @@ func (s *Store)LoadTimezones() (error) { }) } -func (s *Store)Query(q Coord) (string, error) { +func (s *Store) Query(q Coord) (string, error) { for _, i := range s.pIndex { if i.Min.Lat < q.Lat && i.Min.Lon < q.Lon && i.Max.Lat > q.Lat && i.Max.Lon > q.Lon { p, err := s.loadPolygon(i.Id) if err != nil { return i.Tzid, errors.New(errPolygonNotFound) - } + } if p.contains(q) { return i.Tzid, nil } @@ -89,7 +90,7 @@ func (s *Store)Query(q Coord) (string, error) { return "Error", errors.New(errTimezoneNotFound) } -func (s *Store)CreateTimezones(jsonFilename string) (error) { +func (s *Store) CreateTimezones(jsonFilename string) error { err := checkFilesExist(jsonFilename, s.filename) if err != nil { return err @@ -112,7 +113,7 @@ func (s *Store)CreateTimezones(jsonFilename string) (error) { return nil } -func checkFilesExist(src string, dest string) (error) { +func checkFilesExist(src string, dest string) error { if _, err := os.Stat(src); os.IsNotExist(err) { return errors.New(errNotExistGeoJSON) } @@ -122,21 +123,21 @@ func checkFilesExist(src string, dest string) (error) { return nil } -func (s *Store)createBuckets() (error) { +func (s *Store) createBuckets() error { return s.db.Update(func(tx *bolt.Tx) error { - _, err := tx.CreateBucket([]byte("Index")) - if err != nil { - return err - } - _, err = tx.CreateBucket([]byte("Polygon")) - if err != nil { - return err - } - return nil + _, err := tx.CreateBucket([]byte("Index")) + if err != nil { + return err + } + _, err = tx.CreateBucket([]byte("Polygon")) + if err != nil { + return err + } + return nil }) } -func (s *Store)InsertPolygons(tz Timezone) { +func (s *Store) InsertPolygons(tz Timezone) { for _, polygon := range tz.Polygons { s.db.Update(func(tx *bolt.Tx) error { b := tx.Bucket([]byte("Polygon")) @@ -144,52 +145,52 @@ func (s *Store)InsertPolygons(tz Timezone) { // Get ID number autoIncrement id, _ := b.NextSequence() - intId := int(id) - - // Create Polygon Index - index := PolygonIndex{ - Tzid: tz.Tzid, - Max: polygon.Max, - Min: polygon.Min, - } - var bufPolygon, bufIndex []byte - var err error - - if s.encoding == "msgpack" { - // Marshal Polygons + intId := int(id) + + // Create Polygon Index + index := PolygonIndex{ + Tzid: tz.Tzid, + Max: polygon.Max, + Min: polygon.Min, + } + var bufPolygon, bufIndex []byte + var err error + + if s.encoding == "msgpack" { + // Marshal Polygons bufPolygon, err = msgpack.Marshal(polygon) - if err != nil { - return err - } - // Marshal Polygon Index - bufIndex, err = msgpack.Marshal(index) - if err != nil { - return err - } + if err != nil { + return err + } + // Marshal Polygon Index + bufIndex, err = msgpack.Marshal(index) + if err != nil { + return err + } } else { - bufPolygon, err = json.Marshal(polygon) - if err != nil { - return err - } - bufIndex, err = json.Marshal(index) - if err != nil { - return err - } + bufPolygon, err = json.Marshal(polygon) + if err != nil { + return err + } + bufIndex, err = json.Marshal(index) + if err != nil { + return err + } + } + if s.snappy { + bufPolygon = snappy.Encode(nil, bufPolygon) } - if s.snappy { - bufPolygon = snappy.Encode(nil, bufPolygon) - } - // Write Polygon Index - err = i.Put(itob(intId), bufIndex) - if err != nil { - return err - } - return b.Put(itob(intId), bufPolygon) + // Write Polygon Index + err = i.Put(itob(intId), bufIndex) + if err != nil { + return err + } + return b.Put(itob(intId), bufPolygon) }) } } -func (s *Store)loadPolygon(id uint64) (Polygon, error) { +func (s *Store) loadPolygon(id uint64) (Polygon, error) { var polygon Polygon err := s.db.View(func(tx *bolt.Tx) error { b := tx.Bucket([]byte("Polygon")) @@ -212,17 +213,16 @@ func (s *Store)loadPolygon(id uint64) (Polygon, error) { // itob returns an 8-byte big endian representation of v. func itob(v int) []byte { - b := make([]byte, 8) - binary.BigEndian.PutUint64(b, uint64(v)) - return b + b := make([]byte, 8) + binary.BigEndian.PutUint64(b, uint64(v)) + return b } - -func (s *Store)OpenDB(path string) (error) { +func (s *Store) OpenDB(path string) error { var err error s.db, err = bolt.Open(path, 0666, nil) if err != nil { - return err + return err } return nil } diff --git a/memory.go b/memory.go index a0cccff..2b95e5b 100644 --- a/memory.go +++ b/memory.go @@ -1,15 +1,16 @@ -package timezoneLookup +package timezoneLookup + import ( - "os" "encoding/json" "errors" "github.com/golang/snappy" + "os" ) type Memory struct { // Memory struct - filename string - timezones []Timezone - snappy bool + filename string + timezones []Timezone + snappy bool } func MemoryStorage(snappy bool, filename string) *Memory { @@ -19,22 +20,22 @@ func MemoryStorage(snappy bool, filename string) *Memory { filename = filename + ".json" } return &Memory{ - filename: filename, + filename: filename, timezones: []Timezone{}, - snappy: snappy, + snappy: snappy, } } -func (m *Memory)Close() { +func (m *Memory) Close() { m.timezones = []Timezone{} } -func (m *Memory)LoadTimezones() (error) { +func (m *Memory) LoadTimezones() error { file, err := os.Open(m.filename) if err != nil { return err } - + var tzs []Timezone if m.snappy { data := snappy.NewReader(file) @@ -61,7 +62,7 @@ func (m *Memory)LoadTimezones() (error) { return nil } -func (m *Memory)Query(q Coord) (string, error) { +func (m *Memory) Query(q Coord) (string, error) { for _, tz := range m.timezones { for _, p := range tz.Polygons { if p.Min.Lat < q.Lat && p.Min.Lon < q.Lon && p.Max.Lat > q.Lat && p.Max.Lon > q.Lon { @@ -74,30 +75,30 @@ func (m *Memory)Query(q Coord) (string, error) { return "Error", errors.New(errTimezoneNotFound) } -func (m *Memory)writeTimezoneJSON(dbFilename string) (error) { - data, err := json.Marshal(m.timezones) - if err != nil { - return err - } +func (m *Memory) writeTimezoneJSON(dbFilename string) error { + data, err := json.Marshal(m.timezones) + if err != nil { + return err + } w, err := os.Create(dbFilename) - if err != nil { - return err - } - defer w.Close() - if m.snappy { - snap := snappy.NewBufferedWriter(w) + if err != nil { + return err + } + defer w.Close() + if m.snappy { + snap := snappy.NewBufferedWriter(w) _, err := snap.Write(data) if err != nil { return err } defer snap.Close() - } else { - _ , err = w.Write(data) - } - return err + } else { + _, err = w.Write(data) + } + return err } -func (m *Memory)CreateTimezones(jsonFilename string) (error) { +func (m *Memory) CreateTimezones(jsonFilename string) error { tzs, err := TimezonesFromGeoJSON(jsonFilename) if err != nil { return err @@ -108,4 +109,4 @@ func (m *Memory)CreateTimezones(jsonFilename string) (error) { return err } return nil -} \ No newline at end of file +} diff --git a/timezone.go b/timezone.go index b0da676..0cf3150 100644 --- a/timezone.go +++ b/timezone.go @@ -1,33 +1,34 @@ package timezoneLookup + import ( - "os" - "time" + "encoding/json" "errors" "fmt" + "os" "runtime" - "encoding/json" + "time" ) const ( WithSnappy = true - NoSnappy = false + NoSnappy = false // Errors - errNotExistGeoJSON = "Error: GeoJSON file does not exist" - errExistDatabase = "Error: Destination Database file already exists" - errNotExistDatabase = "Error: Database file does not exist" - errPolygonNotFound = "Error: Polygon for Timezone not found" - errTimezoneNotFound = "Error: Timezone not found" + errNotExistGeoJSON = "Error: GeoJSON file does not exist" + errExistDatabase = "Error: Destination Database file already exists" + errNotExistDatabase = "Error: Database file does not exist" + errPolygonNotFound = "Error: Polygon for Timezone not found" + errTimezoneNotFound = "Error: Timezone not found" errDatabaseTypeUknown = "Error: Database type unknown" ) type TimezoneInterface interface { - CreateTimezones(jsonFilename string) (error) - LoadTimezones() (error) - Query(q Coord) (string, error) + CreateTimezones(jsonFilename string) error + LoadTimezones() error + Query(q Coord) (string, error) Close() } - + type TimezoneGeoJSON struct { Type string `json:"type"` Features []struct { @@ -43,26 +44,26 @@ type TimezoneGeoJSON struct { } type Timezone struct { - Tzid string `json:"tzid"` - Polygons []Polygon `json:"polygons"` + Tzid string `json:"tzid"` + Polygons []Polygon `json:"polygons"` } type Polygon struct { - Max Coord `json:"max"` - Min Coord `json:"min"` - Coords []Coord `json:"coords"` + Max Coord `json:"max"` + Min Coord `json:"min"` + Coords []Coord `json:"coords"` } type Coord struct { - Lat float32 `json:"lat"` - Lon float32 `json:"lon"` -} + Lat float32 `json:"lat"` + Lon float32 `json:"lon"` +} type Config struct { - DatabaseName string - DatabaseType string - Snappy bool - Encoding string + DatabaseName string + DatabaseType string + Snappy bool + Encoding string } var Tz TimezoneInterface @@ -93,7 +94,7 @@ func TimezonesFromGeoJSON(filename string) ([]Timezone, error) { for dec.More() { var js TimezoneGeoJSON - + err := dec.Decode(&js) if err != nil { return timeZones, err @@ -101,10 +102,10 @@ func TimezonesFromGeoJSON(filename string) ([]Timezone, error) { for _, tz := range js.Features { t := Timezone{Tzid: tz.Properties.Tzid} switch tz.Geometry.Item { - case "Polygon": - t.decodePolygons(tz.Geometry.Coordinates) - case "MultiPolygon": - t.decodeMultiPolygons(tz.Geometry.Coordinates) + case "Polygon": + t.decodePolygons(tz.Geometry.Coordinates) + case "MultiPolygon": + t.decodeMultiPolygons(tz.Geometry.Coordinates) } timeZones = append(timeZones, t) } @@ -114,78 +115,85 @@ func TimezonesFromGeoJSON(filename string) ([]Timezone, error) { return timeZones, nil } -func (t *Timezone)decodePolygons(polys []interface{}) { //1 +func (t *Timezone) decodePolygons(polys []interface{}) { //1 for _, points := range polys { p := t.newPolygon() for _, point := range points.([]interface{}) { //3 - p.updatePolygon(point.([]interface{})) + p.updatePolygon(point.([]interface{})) } t.Polygons = append(t.Polygons, p) } } -func (t *Timezone)decodeMultiPolygons(polys []interface{}) { //1 +func (t *Timezone) decodeMultiPolygons(polys []interface{}) { //1 for _, v := range polys { p := t.newPolygon() for _, points := range v.([]interface{}) { // 2 for _, point := range points.([]interface{}) { //3 - p.updatePolygon(point.([]interface{})) + p.updatePolygon(point.([]interface{})) } } t.Polygons = append(t.Polygons, p) } } -func (t *Timezone)newPolygon() (Polygon) { +func (t *Timezone) newPolygon() Polygon { return Polygon{ - Max: Coord{ Lat: -90, Lon: -180, }, - Min: Coord{ Lat: 90, Lon: 180, }, - } + Max: Coord{Lat: -90, Lon: -180}, + Min: Coord{Lat: 90, Lon: 180}, + } } -func (p *Polygon)updatePolygon(xy []interface{}) { +func (p *Polygon) updatePolygon(xy []interface{}) { lon := float32(xy[0].(float64)) lat := float32(xy[1].(float64)) // Update max and min limits - if p.Max.Lat < lat { p.Max.Lat = lat } - if p.Max.Lon < lon { p.Max.Lon = lon } - if p.Min.Lat > lat { p.Min.Lat = lat } - if p.Min.Lon > lon { p.Min.Lon = lon } + if p.Max.Lat < lat { + p.Max.Lat = lat + } + if p.Max.Lon < lon { + p.Max.Lon = lon + } + if p.Min.Lat > lat { + p.Min.Lat = lat + } + if p.Min.Lon > lon { + p.Min.Lon = lon + } // add Coords to Polygon - p.Coords = append(p.Coords, Coord{Lat:lat, Lon:lon}) + p.Coords = append(p.Coords, Coord{Lat: lat, Lon: lon}) } -func (p *Polygon)contains(queryPt Coord) bool { - if len(p.Coords) < 3 { - return false - } - in := rayIntersectsSegment(queryPt, p.Coords[len(p.Coords)-1], p.Coords[0]) - for i := 1; i < len(p.Coords); i++ { - if rayIntersectsSegment(queryPt, p.Coords[i-1], p.Coords[i]) { - in = !in - } - } - return in +func (p *Polygon) contains(queryPt Coord) bool { + if len(p.Coords) < 3 { + return false + } + in := rayIntersectsSegment(queryPt, p.Coords[len(p.Coords)-1], p.Coords[0]) + for i := 1; i < len(p.Coords); i++ { + if rayIntersectsSegment(queryPt, p.Coords[i-1], p.Coords[i]) { + in = !in + } + } + return in } - func rayIntersectsSegment(p, a, b Coord) bool { - return (a.Lon > p.Lon) != (b.Lon > p.Lon) && - p.Lat < (b.Lat-a.Lat)*(p.Lon-a.Lon)/(b.Lon-a.Lon)+a.Lat + return (a.Lon > p.Lon) != (b.Lon > p.Lon) && + p.Lat < (b.Lat-a.Lat)*(p.Lon-a.Lon)/(b.Lon-a.Lon)+a.Lat } func PrintMemUsage() { - var m runtime.MemStats - runtime.ReadMemStats(&m) - // For info on each, see: https://golang.org/pkg/runtime/#MemStats - fmt.Printf("Allocated Memory = %v MiB", bToMb(m.Alloc)) - fmt.Printf("\tTotal Allocated Memory = %v MiB", bToMb(m.TotalAlloc)) - fmt.Printf("\tSystem Memory = %v MiB", bToMb(m.Sys)) - fmt.Printf("\tNumber of GC = %v\n", m.NumGC) + var m runtime.MemStats + runtime.ReadMemStats(&m) + // For info on each, see: https://golang.org/pkg/runtime/#MemStats + fmt.Printf("Allocated Memory = %v MiB", bToMb(m.Alloc)) + fmt.Printf("\tTotal Allocated Memory = %v MiB", bToMb(m.TotalAlloc)) + fmt.Printf("\tSystem Memory = %v MiB", bToMb(m.Sys)) + fmt.Printf("\tNumber of GC = %v\n", m.NumGC) } func bToMb(b uint64) uint64 { - return b / 1024 / 1024 + return b / 1024 / 1024 } From 50cdcb49a7774699649ea961c8f604d30a24519b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 09:35:26 +0200 Subject: [PATCH 02/12] go mod init --- go.mod | 17 +++++++++++++++++ go.sum | 26 ++++++++++++++++++++++++++ 2 files changed, 43 insertions(+) create mode 100644 go.mod create mode 100644 go.sum diff --git a/go.mod b/go.mod new file mode 100644 index 0000000..063ea04 --- /dev/null +++ b/go.mod @@ -0,0 +1,17 @@ +module github.com/evanoberholster/timezoneLookup + +go 1.17 + +require ( + github.com/golang/snappy v0.0.4 + github.com/vmihailenco/msgpack v4.0.4+incompatible + go.etcd.io/bbolt v1.3.6 +) + +require ( + github.com/golang/protobuf v1.3.1 // indirect + golang.org/x/net v0.0.0-20190603091049-60506f45cf65 // indirect + golang.org/x/sys v0.0.0-20200923182605-d9f96fdee20d // indirect + google.golang.org/appengine v1.6.7 // indirect + gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c // indirect +) diff --git a/go.sum b/go.sum new file mode 100644 index 0000000..ece0f93 --- /dev/null +++ b/go.sum @@ -0,0 +1,26 @@ +github.com/golang/protobuf v1.3.1 h1:YF8+flBXS5eO826T4nzqPrxfhQThhXl0YzfuUPu4SBg= +github.com/golang/protobuf v1.3.1/go.mod h1:6lQm79b+lXiMfvg/cZm0SGofjICqVBUtrP5yJMmIC1U= +github.com/golang/snappy v0.0.4 h1:yAGX7huGHXlcLOEtBnF4w7FQwA26wojNCwOYAEhLjQM= +github.com/golang/snappy v0.0.4/go.mod h1:/XxbfmMg8lxefKM7IXC3fBNl/7bRcc72aCRzEWrmP2Q= +github.com/kr/pretty v0.2.1 h1:Fmg33tUaq4/8ym9TJN1x7sLJnHVwhP33CNkpYV/7rwI= +github.com/kr/pretty v0.2.1/go.mod h1:ipq/a2n7PKx3OHsz4KJII5eveXtPO4qwEXGdVfWzfnI= +github.com/kr/pty v1.1.1/go.mod h1:pFQYn66WHrOpPYNljwOMqo10TkYh1fy3cYio2l3bCsQ= +github.com/kr/text v0.1.0 h1:45sCR5RtlFHMR4UwH9sdQ5TC8v0qDQCHnXt+kaKSTVE= +github.com/kr/text v0.1.0/go.mod h1:4Jbv+DJW3UT/LiOwJeYQe1efqtUx/iVham/4vfdArNI= +github.com/vmihailenco/msgpack v4.0.4+incompatible h1:dSLoQfGFAo3F6OoNhwUmLwVgaUXK79GlxNBwueZn0xI= +github.com/vmihailenco/msgpack v4.0.4+incompatible/go.mod h1:fy3FlTQTDXWkZ7Bh6AcGMlsjHatGryHQYUTf1ShIgkk= +go.etcd.io/bbolt v1.3.6 h1:/ecaJf0sk1l4l6V4awd65v2C3ILy7MSj+s/x1ADCIMU= +go.etcd.io/bbolt v1.3.6/go.mod h1:qXsaaIqmgQH0T+OPdb99Bf+PKfBBQVAdyD6TY9G8XM4= +golang.org/x/crypto v0.0.0-20190308221718-c2843e01d9a2/go.mod h1:djNgcEr1/C05ACkg1iLfiJU5Ep61QUkGW8qpdssI0+w= +golang.org/x/net v0.0.0-20190603091049-60506f45cf65 h1:+rhAzEzT3f4JtomfC371qB+0Ola2caSKcY69NUBZrRQ= +golang.org/x/net v0.0.0-20190603091049-60506f45cf65/go.mod h1:HSz+uSET+XFnRR8LxR5pz3Of3rY3CfYBVs4xY44aLks= +golang.org/x/sys v0.0.0-20190215142949-d0b11bdaac8a/go.mod h1:STP8DvDyc/dI5b8T5hshtkjS+E42TnysNCUPdjciGhY= +golang.org/x/sys v0.0.0-20200923182605-d9f96fdee20d h1:L/IKR6COd7ubZrs2oTnTi73IhgqJ71c9s80WsQnh0Es= +golang.org/x/sys v0.0.0-20200923182605-d9f96fdee20d/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs= +golang.org/x/text v0.3.0/go.mod h1:NqM8EUOU14njkJ3fqMW+pc6Ldnwhi/IjpwHt7yyuwOQ= +golang.org/x/text v0.3.2/go.mod h1:bEr9sfX3Q8Zfm5fL9x+3itogRgK3+ptLWKqgva+5dAk= +golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e/go.mod h1:n7NCudcB/nEzxVGmLbDWY5pfWTLqBcC2KZ6jyYvM4mQ= +google.golang.org/appengine v1.6.7 h1:FZR1q0exgwxzPzp/aF+VccGrSfxfPpkBqjIIEq3ru6c= +google.golang.org/appengine v1.6.7/go.mod h1:8WjMMxjGQR8xUklV/ARdw2HLXBOI7O7uCIDZVag1xfc= +gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c h1:Hei/4ADfdWqJk1ZMxUNpqntNwaWcugrBjAiHlqqRiVk= +gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c/go.mod h1:JHkPIbrfpd72SG/EVd6muEfDQjcINNoR0C8j2r3qZ4Q= From d2e291679b5e7ca548c7a67c57ae3482857ebb64 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 10:16:54 +0200 Subject: [PATCH 03/12] Add Copyright and SPDX-License-Identifier to all source files --- bench_test.go | 100 +++++++++++++++++++++++++++++++++++++++++++++++ cmd/benchmark.go | 9 ++++- cmd/example.go | 10 +++-- cmd/timezone.go | 52 +++++++++++++----------- db.go | 7 +++- example_test.go | 31 +++++++++++++++ memory.go | 7 +++- timezone.go | 4 ++ 8 files changed, 190 insertions(+), 30 deletions(-) create mode 100644 bench_test.go create mode 100644 example_test.go diff --git a/bench_test.go b/bench_test.go new file mode 100644 index 0000000..f9fd349 --- /dev/null +++ b/bench_test.go @@ -0,0 +1,100 @@ +// Copyright 2018 Evan Oberholster. +// +// SPDX-License-Identifier: MIT + +package timezoneLookup_test + +import ( + "fmt" + "testing" + + timezone "github.com/evanoberholster/timezoneLookup" +) + +func BenchmarkLookup(b *testing.B) { + tz, err := timezone.LoadTimezones(timezone.Config{ + DatabaseType: "boltdb", // memory or boltdb + DatabaseName: "timezone", // Name without suffix + Snappy: true, + Encoding: "msgpack", // json or msgpack + }) + if err != nil { + b.Fatal(err) + } + defer tz.Close() + + querys := []timezone.Coord{ + {Lat: 5.261417, Lon: -3.925778}, // Abijan Airport + {Lat: -15.678889, Lon: 34.973889}, // Blantyre Airport + {Lat: -12.65945, Lon: 18.25674}, + {Lat: 41.8976, Lon: -87.6205}, + {Lat: 47.6897, Lon: -122.4023}, + {Lat: 42.7235, Lon: -73.6931}, + {Lat: 42.5807, Lon: -83.0223}, + {Lat: 36.8381, Lon: -84.8500}, + {Lat: 40.1674, Lon: -85.3583}, + {Lat: 37.9643, Lon: -86.7453}, + {Lat: 38.6043, Lon: -90.2417}, + {Lat: 41.1591, Lon: -104.8261}, + {Lat: 35.1991, Lon: -111.6348}, + {Lat: 43.1432, Lon: -115.6750}, + {Lat: 47.5886, Lon: -122.3382}, + {Lat: 58.3168, Lon: -134.4397}, + {Lat: 21.4381, Lon: -158.0493}, + {Lat: 42.7000, Lon: -80.0000}, + {Lat: 51.0036, Lon: -114.0161}, + {Lat: -16.4965, Lon: -68.1702}, + {Lat: -31.9369, Lon: 115.8453}, + {Lat: 42.0000, Lon: -87.5000}, + {Lat: 41.8976, Lon: -87.6205}, + {Lat: 47.6897, Lon: -122.4023}, + {Lat: 42.7235, Lon: -73.6931}, + {Lat: 42.5807, Lon: -83.0223}, + {Lat: 36.8381, Lon: -84.8500}, + {Lat: 40.1674, Lon: -85.3583}, + {Lat: 37.9643, Lon: -86.7453}, + {Lat: 38.6043, Lon: -90.2417}, + {Lat: 41.1591, Lon: -104.8261}, + {Lat: 35.1991, Lon: -111.6348}, + {Lat: 43.1432, Lon: -115.6750}, + {Lat: 47.5886, Lon: -122.3382}, + {Lat: 58.3168, Lon: -134.4397}, + {Lat: 21.4381, Lon: -158.0493}, + {Lat: 42.7000, Lon: -80.0000}, + {Lat: 51.0036, Lon: -114.0161}, + {Lat: -16.4965, Lon: -68.1702}, + {Lat: -31.9369, Lon: 115.8453}, + {Lat: 42.0000, Lon: -87.5000}, + {Lat: 41.8976, Lon: -87.6205}, + {Lat: 47.6897, Lon: -122.4023}, + {Lat: 42.7235, Lon: -73.6931}, + {Lat: 42.5807, Lon: -83.0223}, + {Lat: 36.8381, Lon: -84.8500}, + {Lat: 40.1674, Lon: -85.3583}, + {Lat: 37.9643, Lon: -86.7453}, + {Lat: 38.6043, Lon: -90.2417}, + {Lat: 41.1591, Lon: -104.8261}, + {Lat: 35.1991, Lon: -111.6348}, + {Lat: 43.1432, Lon: -115.6750}, + {Lat: 47.5886, Lon: -122.3382}, + {Lat: 58.3168, Lon: -134.4397}, + {Lat: 21.4381, Lon: -158.0493}, + {Lat: 42.7000, Lon: -80.0000}, + {Lat: 51.0036, Lon: -114.0161}, + {Lat: -16.4965, Lon: -68.1702}, + {Lat: -31.9369, Lon: 115.8453}, + {Lat: 42.0000, Lon: -87.5000}, + } + + b.ResetTimer() + for i := 0; i < b.N; i++ { + for _, query := range querys { + _, err := tz.Query(query) + if err != nil { + fmt.Println(err) + } + } + } + b.StopTimer() + timezone.PrintMemUsage() +} diff --git a/cmd/benchmark.go b/cmd/benchmark.go index 799c645..9cdd1eb 100644 --- a/cmd/benchmark.go +++ b/cmd/benchmark.go @@ -1,9 +1,16 @@ +// +build: benchmark + +// Copyright 2018 Evan Oberholster. +// +// SPDX-License-Identifier: MIT + package main import ( "fmt" - timezone "github.com/evanoberholster/timezoneLookup" "time" + + timezone "github.com/evanoberholster/timezoneLookup" ) func main() { diff --git a/cmd/example.go b/cmd/example.go index b3cf75a..bfe607d 100644 --- a/cmd/example.go +++ b/cmd/example.go @@ -1,12 +1,15 @@ +// Copyright 2018 Evan Oberholster. +// +// SPDX-License-Identifier: MIT + package main import ( "fmt" + timezone "github.com/evanoberholster/timezoneLookup" ) -var tz timezone.TimezoneInterface - func main() { tz, err := timezone.LoadTimezones(timezone.Config{ DatabaseType: "boltdb", // memory or boltdb @@ -17,6 +20,7 @@ func main() { if err != nil { fmt.Println(err) } + defer tz.Close() res, err := tz.Query(timezone.Coord{ Lat: 5.261417, Lon: -3.925778}) @@ -24,6 +28,4 @@ func main() { fmt.Println(err) } fmt.Println("Query Result: ", res) - - tz.Close() } diff --git a/cmd/timezone.go b/cmd/timezone.go index e051f5e..1df49c2 100644 --- a/cmd/timezone.go +++ b/cmd/timezone.go @@ -1,9 +1,15 @@ +// Copyright 2018 Evan Oberholster. +// +// SPDX-License-Identifier: MIT + package main import ( + "errors" "flag" - timezone "github.com/evanoberholster/timezoneLookup" "log" + + timezone "github.com/evanoberholster/timezoneLookup" ) var ( @@ -15,33 +21,33 @@ var ( ) func main() { + if err := Main(); err != nil { + log.Fatalln(err) + } +} +func Main() error { flag.Parse() if *dbFilename == "" || *jsonFilename == "" { log.Printf("Options:\n\t -snappy=true\t Use Snappy compression\n\t -json=filename\t GEOJSON filename \n\t -db=filename\t Database destination\n\t -type=boltdb\t Type of Storage (boltdb or memory) ") + return nil + } + var tz timezone.TimezoneInterface + if *storageType == "memory" { + tz = timezone.MemoryStorage(*snappy, *dbFilename) + } else if *storageType == "boltdb" { + tz = timezone.BoltdbStorage(*snappy, *dbFilename, *encoding) } else { - var tz timezone.TimezoneInterface - if *storageType == "memory" { - tz = timezone.MemoryStorage(*snappy, *dbFilename) - } else if *storageType == "boltdb" { - tz = timezone.BoltdbStorage(*snappy, *dbFilename, *encoding) - } else { - log.Println("\"-db\" No database type specified") - return - } - - if *jsonFilename != "" { - err := tz.CreateTimezones(*jsonFilename) - if err != nil { - log.Println(err) - return - } - } else { - log.Println("\"-json\" No GeoJSON source file specified") - return - } - - tz.Close() + return errors.New("\"-db\" No database type specified") } + if *jsonFilename == "" { + return errors.New("\"-json\" No GeoJSON source file specified") + } + err := tz.CreateTimezones(*jsonFilename) + if err != nil { + return err + } + tz.Close() + return nil } diff --git a/db.go b/db.go index 550f21c..93364ad 100644 --- a/db.go +++ b/db.go @@ -1,13 +1,18 @@ +// Copyright 2018 Evan Oberholster. +// +// SPDX-License-Identifier: MIT + package timezoneLookup import ( "encoding/binary" "encoding/json" "errors" + "os" + "github.com/golang/snappy" "github.com/vmihailenco/msgpack" bolt "go.etcd.io/bbolt" - "os" ) type Store struct { // Database struct diff --git a/example_test.go b/example_test.go new file mode 100644 index 0000000..662821b --- /dev/null +++ b/example_test.go @@ -0,0 +1,31 @@ +// Copyright 2018 Evan Oberholster. +// +// SPDX-License-Identifier: MIT + +package timezoneLookup_test + +import ( + "fmt" + + timezone "github.com/evanoberholster/timezoneLookup" +) + +func ExampleQuery() { + tz, err := timezone.LoadTimezones(timezone.Config{ + DatabaseType: "boltdb", // memory or boltdb + DatabaseName: "timezone", // Name without suffix + Snappy: true, + Encoding: "msgpack", // json or msgpack + }) + if err != nil { + fmt.Println(err) + } + defer tz.Close() + + res, err := tz.Query(timezone.Coord{ + Lat: 5.261417, Lon: -3.925778}) + if err != nil { + fmt.Println(err) + } + fmt.Println("Query Result: ", res) +} diff --git a/memory.go b/memory.go index 2b95e5b..fa27034 100644 --- a/memory.go +++ b/memory.go @@ -1,10 +1,15 @@ +// Copyright 2018 Evan Oberholster. +// +// SPDX-License-Identifier: MIT + package timezoneLookup import ( "encoding/json" "errors" - "github.com/golang/snappy" "os" + + "github.com/golang/snappy" ) type Memory struct { // Memory struct diff --git a/timezone.go b/timezone.go index 0cf3150..ed331f0 100644 --- a/timezone.go +++ b/timezone.go @@ -1,3 +1,7 @@ +// Copyright 2018 Evan Oberholster. +// +// SPDX-License-Identifier: MIT + package timezoneLookup import ( From 9319a5328a7186efdb40f4cb27dd3c115306ec86 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 10:26:53 +0200 Subject: [PATCH 04/12] cmd/timezone.go: Download 2020d if not exist --- cmd/timezone.go | 38 ++++++++++++++++++++++++++++++++++++++ 1 file changed, 38 insertions(+) diff --git a/cmd/timezone.go b/cmd/timezone.go index 1df49c2..f45af39 100644 --- a/cmd/timezone.go +++ b/cmd/timezone.go @@ -5,9 +5,14 @@ package main import ( + "archive/zip" + "bytes" "errors" "flag" + "io" "log" + "net/http" + "os" timezone "github.com/evanoberholster/timezoneLookup" ) @@ -17,6 +22,7 @@ var ( jsonFilename = flag.String("json", "combined-with-oceans.json", "GEOJSON Filename") dbFilename = flag.String("db", "timezone", "Destination database filename") storageType = flag.String("type", "boltdb", "Storage: boltdb or memory") + jsonURL = flag.String("json-url", "https://github.com/evansiroky/timezone-boundary-builder/releases/download/2020d/timezones-with-oceans.geojson.zip", "Download GeoJSON file from here if not exist") encoding = flag.String("encoding", "msgpack", "BoltDB encoding type: json or msgpack") ) @@ -44,6 +50,38 @@ func Main() error { if *jsonFilename == "" { return errors.New("\"-json\" No GeoJSON source file specified") } + if _, err := os.Stat(*jsonFilename); err != nil && os.IsNotExist(err) { + log.Println("Downloading " + *jsonURL) + resp, err := http.Get(*jsonURL) + if err != nil { + return err + } + var buf bytes.Buffer + _, err = io.Copy(&buf, resp.Body) + resp.Body.Close() + if err != nil { + return err + } + zr, err := zip.NewReader(bytes.NewReader(buf.Bytes()), int64(buf.Len())) + if err != nil { + return err + } + sr, err := zr.Open("combined-with-oceans.json") + if err != nil { + return err + } + fh, err := os.Create(*jsonFilename) + if err != nil { + return err + } + defer fh.Close() + if _, err = io.Copy(fh, sr); err != nil { + return err + } + if err := fh.Close(); err != nil { + return err + } + } err := tz.CreateTimezones(*jsonFilename) if err != nil { return err From b1d5a48a027b7a85df5f2e14ded3d11e7653a989 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 10:31:02 +0200 Subject: [PATCH 05/12] Benchmark: Measure per query performance --- bench_test.go | 11 +++++------ db.go | 1 + 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/bench_test.go b/bench_test.go index f9fd349..03b56a3 100644 --- a/bench_test.go +++ b/bench_test.go @@ -86,15 +86,14 @@ func BenchmarkLookup(b *testing.B) { {Lat: 42.0000, Lon: -87.5000}, } + b.ReportAllocs() b.ResetTimer() for i := 0; i < b.N; i++ { - for _, query := range querys { - _, err := tz.Query(query) - if err != nil { - fmt.Println(err) - } + query := querys[i%len(querys)] + _, err := tz.Query(query) + if err != nil { + fmt.Println(err) } } b.StopTimer() - timezone.PrintMemUsage() } diff --git a/db.go b/db.go index 93364ad..605619e 100644 --- a/db.go +++ b/db.go @@ -11,6 +11,7 @@ import ( "os" "github.com/golang/snappy" + //"github.com/klauspost/compress/snappy" "github.com/vmihailenco/msgpack" bolt "go.etcd.io/bbolt" ) From 390c8bbcebfbbdc6cdba05ab4aa5f49d7a6a1a4f Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 10:42:09 +0200 Subject: [PATCH 06/12] BenchmarkLookup: Download 2020d if not exist --- bench_test.go | 7 +++++++ cmd/timezone.go | 1 + db.go | 5 ++--- go.mod | 3 +++ go.sum | 12 ++++++++++++ 5 files changed, 25 insertions(+), 3 deletions(-) diff --git a/bench_test.go b/bench_test.go index 03b56a3..03a8eed 100644 --- a/bench_test.go +++ b/bench_test.go @@ -6,12 +6,19 @@ package timezoneLookup_test import ( "fmt" + "os" + "os/exec" "testing" timezone "github.com/evanoberholster/timezoneLookup" ) func BenchmarkLookup(b *testing.B) { + if _, err := os.Stat("timezone.snap.db"); err != nil && os.IsNotExist(err) { + cmd := exec.Command("go", "run", "cmd/timezone.go") + cmd.Stdout, cmd.Stderr = os.Stdout, os.Stderr + _ = cmd.Run() + } tz, err := timezone.LoadTimezones(timezone.Config{ DatabaseType: "boltdb", // memory or boltdb DatabaseName: "timezone", // Name without suffix diff --git a/cmd/timezone.go b/cmd/timezone.go index f45af39..ede8f0d 100644 --- a/cmd/timezone.go +++ b/cmd/timezone.go @@ -74,6 +74,7 @@ func Main() error { if err != nil { return err } + defer func() { _ = os.Remove(fh.Name()) }() defer fh.Close() if _, err = io.Copy(fh, sr); err != nil { return err diff --git a/db.go b/db.go index 605619e..6f50c8f 100644 --- a/db.go +++ b/db.go @@ -10,9 +10,8 @@ import ( "errors" "os" - "github.com/golang/snappy" - //"github.com/klauspost/compress/snappy" - "github.com/vmihailenco/msgpack" + "github.com/klauspost/compress/snappy" + "github.com/vmihailenco/msgpack/v5" bolt "go.etcd.io/bbolt" ) diff --git a/go.mod b/go.mod index 063ea04..56c58b0 100644 --- a/go.mod +++ b/go.mod @@ -10,6 +10,9 @@ require ( require ( github.com/golang/protobuf v1.3.1 // indirect + github.com/klauspost/compress v1.13.6 // indirect + github.com/vmihailenco/msgpack/v5 v5.3.4 // indirect + github.com/vmihailenco/tagparser/v2 v2.0.0 // indirect golang.org/x/net v0.0.0-20190603091049-60506f45cf65 // indirect golang.org/x/sys v0.0.0-20200923182605-d9f96fdee20d // indirect google.golang.org/appengine v1.6.7 // indirect diff --git a/go.sum b/go.sum index ece0f93..8cf5b3e 100644 --- a/go.sum +++ b/go.sum @@ -1,14 +1,24 @@ +github.com/davecgh/go-spew v1.1.0/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38= github.com/golang/protobuf v1.3.1 h1:YF8+flBXS5eO826T4nzqPrxfhQThhXl0YzfuUPu4SBg= github.com/golang/protobuf v1.3.1/go.mod h1:6lQm79b+lXiMfvg/cZm0SGofjICqVBUtrP5yJMmIC1U= github.com/golang/snappy v0.0.4 h1:yAGX7huGHXlcLOEtBnF4w7FQwA26wojNCwOYAEhLjQM= github.com/golang/snappy v0.0.4/go.mod h1:/XxbfmMg8lxefKM7IXC3fBNl/7bRcc72aCRzEWrmP2Q= +github.com/klauspost/compress v1.13.6 h1:P76CopJELS0TiO2mebmnzgWaajssP/EszplttgQxcgc= +github.com/klauspost/compress v1.13.6/go.mod h1:/3/Vjq9QcHkK5uEr5lBEmyoZ1iFhe47etQ6QUkpK6sk= github.com/kr/pretty v0.2.1 h1:Fmg33tUaq4/8ym9TJN1x7sLJnHVwhP33CNkpYV/7rwI= github.com/kr/pretty v0.2.1/go.mod h1:ipq/a2n7PKx3OHsz4KJII5eveXtPO4qwEXGdVfWzfnI= github.com/kr/pty v1.1.1/go.mod h1:pFQYn66WHrOpPYNljwOMqo10TkYh1fy3cYio2l3bCsQ= github.com/kr/text v0.1.0 h1:45sCR5RtlFHMR4UwH9sdQ5TC8v0qDQCHnXt+kaKSTVE= github.com/kr/text v0.1.0/go.mod h1:4Jbv+DJW3UT/LiOwJeYQe1efqtUx/iVham/4vfdArNI= +github.com/pmezard/go-difflib v1.0.0/go.mod h1:iKH77koFhYxTK1pcRnkKkqfTogsbg7gZNVY4sRDYZ/4= +github.com/stretchr/objx v0.1.0/go.mod h1:HFkY916IF+rwdDfMAkV7OtwuqBVzrE8GR6GFx+wExME= +github.com/stretchr/testify v1.6.1/go.mod h1:6Fq8oRcR53rry900zMqJjRRixrwX3KX962/h/Wwjteg= github.com/vmihailenco/msgpack v4.0.4+incompatible h1:dSLoQfGFAo3F6OoNhwUmLwVgaUXK79GlxNBwueZn0xI= github.com/vmihailenco/msgpack v4.0.4+incompatible/go.mod h1:fy3FlTQTDXWkZ7Bh6AcGMlsjHatGryHQYUTf1ShIgkk= +github.com/vmihailenco/msgpack/v5 v5.3.4 h1:qMKAwOV+meBw2Y8k9cVwAy7qErtYCwBzZ2ellBfvnqc= +github.com/vmihailenco/msgpack/v5 v5.3.4/go.mod h1:7xyJ9e+0+9SaZT0Wt1RGleJXzli6Q/V5KbhBonMG9jc= +github.com/vmihailenco/tagparser/v2 v2.0.0 h1:y09buUbR+b5aycVFQs/g70pqKVZNBmxwAhO7/IwNM9g= +github.com/vmihailenco/tagparser/v2 v2.0.0/go.mod h1:Wri+At7QHww0WTrCBeu4J6bNtoV6mEfg5OIWRZA9qds= go.etcd.io/bbolt v1.3.6 h1:/ecaJf0sk1l4l6V4awd65v2C3ILy7MSj+s/x1ADCIMU= go.etcd.io/bbolt v1.3.6/go.mod h1:qXsaaIqmgQH0T+OPdb99Bf+PKfBBQVAdyD6TY9G8XM4= golang.org/x/crypto v0.0.0-20190308221718-c2843e01d9a2/go.mod h1:djNgcEr1/C05ACkg1iLfiJU5Ep61QUkGW8qpdssI0+w= @@ -22,5 +32,7 @@ golang.org/x/text v0.3.2/go.mod h1:bEr9sfX3Q8Zfm5fL9x+3itogRgK3+ptLWKqgva+5dAk= golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e/go.mod h1:n7NCudcB/nEzxVGmLbDWY5pfWTLqBcC2KZ6jyYvM4mQ= google.golang.org/appengine v1.6.7 h1:FZR1q0exgwxzPzp/aF+VccGrSfxfPpkBqjIIEq3ru6c= google.golang.org/appengine v1.6.7/go.mod h1:8WjMMxjGQR8xUklV/ARdw2HLXBOI7O7uCIDZVag1xfc= +gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405/go.mod h1:Co6ibVJAznAaIkqp8huTwlJQCZ016jof/cbN4VW5Yz0= gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c h1:Hei/4ADfdWqJk1ZMxUNpqntNwaWcugrBjAiHlqqRiVk= gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c/go.mod h1:JHkPIbrfpd72SG/EVd6muEfDQjcINNoR0C8j2r3qZ4Q= +gopkg.in/yaml.v3 v3.0.0-20200313102051-9f266ea9e77c/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM= From 7fe62edc725e4f2342a944a201a4c8db81d78ca6 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 10:56:42 +0200 Subject: [PATCH 07/12] Make encoding an enum --- bench_test.go | 2 +- cmd/benchmark.go | 3 ++- cmd/example.go | 3 +++ cmd/timezone.go | 16 ++++++++++++-- db.go | 56 +++++++++++++++++++++++++++++++++++++----------- example_test.go | 2 +- timezone.go | 2 +- 7 files changed, 66 insertions(+), 18 deletions(-) diff --git a/bench_test.go b/bench_test.go index 03a8eed..e4be12e 100644 --- a/bench_test.go +++ b/bench_test.go @@ -23,7 +23,7 @@ func BenchmarkLookup(b *testing.B) { DatabaseType: "boltdb", // memory or boltdb DatabaseName: "timezone", // Name without suffix Snappy: true, - Encoding: "msgpack", // json or msgpack + Encoding: timezone.EncMsgPack, // json or msgpack }) if err != nil { b.Fatal(err) diff --git a/cmd/benchmark.go b/cmd/benchmark.go index 9cdd1eb..d2ac449 100644 --- a/cmd/benchmark.go +++ b/cmd/benchmark.go @@ -1,4 +1,5 @@ -// +build: benchmark +//go:build benchmark +// +build benchmark // Copyright 2018 Evan Oberholster. // diff --git a/cmd/example.go b/cmd/example.go index bfe607d..bec56ad 100644 --- a/cmd/example.go +++ b/cmd/example.go @@ -1,3 +1,6 @@ +//go:build example +// +build example + // Copyright 2018 Evan Oberholster. // // SPDX-License-Identifier: MIT diff --git a/cmd/timezone.go b/cmd/timezone.go index ede8f0d..356da21 100644 --- a/cmd/timezone.go +++ b/cmd/timezone.go @@ -7,12 +7,14 @@ package main import ( "archive/zip" "bytes" + "context" "errors" "flag" "io" "log" "net/http" "os" + "os/signal" timezone "github.com/evanoberholster/timezoneLookup" ) @@ -42,7 +44,11 @@ func Main() error { if *storageType == "memory" { tz = timezone.MemoryStorage(*snappy, *dbFilename) } else if *storageType == "boltdb" { - tz = timezone.BoltdbStorage(*snappy, *dbFilename, *encoding) + e, err := timezone.EncodingFromString(*encoding) + if err != nil { + return err + } + tz = timezone.BoltdbStorage(*snappy, *dbFilename, e) } else { return errors.New("\"-db\" No database type specified") } @@ -50,9 +56,15 @@ func Main() error { if *jsonFilename == "" { return errors.New("\"-json\" No GeoJSON source file specified") } + ctx, cancel := signal.NotifyContext(context.Background(), os.Interrupt) + defer cancel() if _, err := os.Stat(*jsonFilename); err != nil && os.IsNotExist(err) { log.Println("Downloading " + *jsonURL) - resp, err := http.Get(*jsonURL) + req, err := http.NewRequest("GET", *jsonURL, nil) + if err != nil { + return err + } + resp, err := http.DefaultClient.Do(req.WithContext(ctx)) if err != nil { return err } diff --git a/db.go b/db.go index 6f50c8f..f70ce32 100644 --- a/db.go +++ b/db.go @@ -8,6 +8,7 @@ import ( "encoding/binary" "encoding/json" "errors" + "fmt" "os" "github.com/klauspost/compress/snappy" @@ -20,7 +21,7 @@ type Store struct { // Database struct pIndex []PolygonIndex filename string snappy bool - encoding string + encoding encoding } type PolygonIndex struct { @@ -30,7 +31,7 @@ type PolygonIndex struct { Min Coord `json:"min"` } -func BoltdbStorage(snappy bool, filename string, encoding string) TimezoneInterface { +func BoltdbStorage(snappy bool, filename string, encoding encoding) TimezoneInterface { if snappy { filename = filename + ".snap.db" } else { @@ -48,6 +49,33 @@ func (s *Store) Close() { defer s.db.Close() } +type encoding struct { + Type uint8 +} + +func (e encoding) String() string { + if e == EncMsgPack { + return "msgpack" + } + return "json" +} +func EncodingFromString(s string) (encoding, error) { + switch s { + case "msgpack": + return EncMsgPack, nil + case "json": + return EncJSON, nil + default: + return EncUnknown, fmt.Errorf("unknown encoding %q (neither msgpack, nor json)", s) + } +} + +var ( + EncUnknown = encoding{} + EncMsgPack = encoding{1} + EncJSON = encoding{2} +) + func (s *Store) LoadTimezones() error { if _, err := os.Stat(s.filename); os.IsNotExist(err) { return errors.New(errNotExistDatabase) @@ -61,10 +89,10 @@ func (s *Store) LoadTimezones() error { // Assume bucket exists and has keys b := tx.Bucket([]byte("Index")) - var err error - b.ForEach(func(k, v []byte) error { + return b.ForEach(func(k, v []byte) error { var index PolygonIndex - if s.encoding == "msgpack" { + var err error + if s.encoding == EncMsgPack { err = msgpack.Unmarshal(v, &index) } else { err = json.Unmarshal(v, &index) @@ -76,7 +104,6 @@ func (s *Store) LoadTimezones() error { s.pIndex = append(s.pIndex, index) return nil }) - return nil }) } @@ -113,7 +140,9 @@ func (s *Store) CreateTimezones(jsonFilename string) error { return err } for _, tz := range tzs { - s.InsertPolygons(tz) + if err := s.InsertPolygons(tz); err != nil { + return err + } } return nil } @@ -142,9 +171,9 @@ func (s *Store) createBuckets() error { }) } -func (s *Store) InsertPolygons(tz Timezone) { +func (s *Store) InsertPolygons(tz Timezone) error { for _, polygon := range tz.Polygons { - s.db.Update(func(tx *bolt.Tx) error { + if err := s.db.Update(func(tx *bolt.Tx) error { b := tx.Bucket([]byte("Polygon")) i := tx.Bucket([]byte("Index")) @@ -161,7 +190,7 @@ func (s *Store) InsertPolygons(tz Timezone) { var bufPolygon, bufIndex []byte var err error - if s.encoding == "msgpack" { + if s.encoding == EncMsgPack { // Marshal Polygons bufPolygon, err = msgpack.Marshal(polygon) if err != nil { @@ -191,8 +220,11 @@ func (s *Store) InsertPolygons(tz Timezone) { return err } return b.Put(itob(intId), bufPolygon) - }) + }); err != nil { + return err + } } + return nil } func (s *Store) loadPolygon(id uint64) (Polygon, error) { @@ -207,7 +239,7 @@ func (s *Store) loadPolygon(id uint64) (Polygon, error) { return err } } - if s.encoding == "msgpack" { + if s.encoding == EncMsgPack { return msgpack.Unmarshal(v, &polygon) } else { return json.Unmarshal(v, &polygon) diff --git a/example_test.go b/example_test.go index 662821b..159ea10 100644 --- a/example_test.go +++ b/example_test.go @@ -15,7 +15,7 @@ func ExampleQuery() { DatabaseType: "boltdb", // memory or boltdb DatabaseName: "timezone", // Name without suffix Snappy: true, - Encoding: "msgpack", // json or msgpack + Encoding: timezone.EncMsgPack, // json or msgpack }) if err != nil { fmt.Println(err) diff --git a/timezone.go b/timezone.go index ed331f0..1409e5b 100644 --- a/timezone.go +++ b/timezone.go @@ -67,7 +67,7 @@ type Config struct { DatabaseName string DatabaseType string Snappy bool - Encoding string + Encoding encoding } var Tz TimezoneInterface From a216d3dcd3f6a9b5fb54b65c2417bce199275a52 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 17:38:31 +0200 Subject: [PATCH 08/12] protobuf: twice as fast, 10% shorter than MsgPack, but allocates more --- bench_test.go | 41 ++++-- db.go | 148 +++++++++++++++------ go.mod | 3 +- go.sum | 6 + pb/timezone.pb.go | 333 ++++++++++++++++++++++++++++++++++++++++++++++ pb/timezone.proto | 26 ++++ timezone.go | 43 ++++++ 7 files changed, 542 insertions(+), 58 deletions(-) create mode 100644 pb/timezone.pb.go create mode 100644 pb/timezone.proto diff --git a/bench_test.go b/bench_test.go index e4be12e..3fb6f7a 100644 --- a/bench_test.go +++ b/bench_test.go @@ -14,22 +14,35 @@ import ( ) func BenchmarkLookup(b *testing.B) { - if _, err := os.Stat("timezone.snap.db"); err != nil && os.IsNotExist(err) { - cmd := exec.Command("go", "run", "cmd/timezone.go") - cmd.Stdout, cmd.Stderr = os.Stdout, os.Stderr - _ = cmd.Run() - } - tz, err := timezone.LoadTimezones(timezone.Config{ - DatabaseType: "boltdb", // memory or boltdb - DatabaseName: "timezone", // Name without suffix - Snappy: true, - Encoding: timezone.EncMsgPack, // json or msgpack - }) - if err != nil { - b.Fatal(err) + for _, e := range []string{"msgpack", "protobuf"} { + e := e + b.Run(e, func(b *testing.B) { + if _, err := os.Stat("timezone." + e + ".snap.db"); err != nil && os.IsNotExist(err) { + cmd := exec.Command("go", "run", "cmd/timezone.go", "-encoding="+e) + cmd.Stdout, cmd.Stderr = os.Stdout, os.Stderr + _ = cmd.Run() + } + enc, err := timezone.EncodingFromString(e) + if err != nil { + b.Fatal(err) + } + tz, err := timezone.LoadTimezones(timezone.Config{ + DatabaseType: "boltdb", // memory or boltdb + DatabaseName: "timezone", // Name without suffix + Snappy: true, + Encoding: enc, // json or msgpack + }) + if err != nil { + b.Fatal(err) + } + defer tz.Close() + + benchLookup(b, tz) + }) } - defer tz.Close() +} +func benchLookup(b *testing.B, tz timezone.TimezoneInterface) { querys := []timezone.Coord{ {Lat: 5.261417, Lon: -3.925778}, // Abijan Airport {Lat: -15.678889, Lon: 34.973889}, // Blantyre Airport diff --git a/db.go b/db.go index f70ce32..a096c63 100644 --- a/db.go +++ b/db.go @@ -11,9 +11,11 @@ import ( "fmt" "os" + "github.com/evanoberholster/timezoneLookup/pb" "github.com/klauspost/compress/snappy" "github.com/vmihailenco/msgpack/v5" bolt "go.etcd.io/bbolt" + "google.golang.org/protobuf/proto" ) type Store struct { // Database struct @@ -31,12 +33,24 @@ type PolygonIndex struct { Min Coord `json:"min"` } +func (dst *PolygonIndex) FromPB(src *pb.PolygonIndex) { + dst.Id, dst.Tzid = src.Id, src.Tzid + dst.Max.FromPB(src.Max) + dst.Min.FromPB(src.Min) +} +func (src *PolygonIndex) ToPB(dst *pb.PolygonIndex) { + dst.Reset() + dst.Id, dst.Tzid = src.Id, src.Tzid + dst.Max = src.Max.ToPB(dst.Max) + dst.Min = src.Min.ToPB(dst.Min) +} + func BoltdbStorage(snappy bool, filename string, encoding encoding) TimezoneInterface { + filename += "." + encoding.String() if snappy { - filename = filename + ".snap.db" - } else { - filename = filename + ".db" + filename += ".snap" } + filename += ".db" return &Store{ filename: filename, pIndex: []PolygonIndex{}, @@ -54,10 +68,16 @@ type encoding struct { } func (e encoding) String() string { - if e == EncMsgPack { + switch e { + case EncMsgPack: return "msgpack" + case EncJSON: + return "json" + case EncProtobuf: + return "protobuf" + default: + return "unknown" } - return "json" } func EncodingFromString(s string) (encoding, error) { switch s { @@ -65,15 +85,18 @@ func EncodingFromString(s string) (encoding, error) { return EncMsgPack, nil case "json": return EncJSON, nil + case "protobuf": + return EncProtobuf, nil default: return EncUnknown, fmt.Errorf("unknown encoding %q (neither msgpack, nor json)", s) } } var ( - EncUnknown = encoding{} - EncMsgPack = encoding{1} - EncJSON = encoding{2} + EncUnknown = encoding{} + EncMsgPack = encoding{1} + EncJSON = encoding{2} + EncProtobuf = encoding{3} ) func (s *Store) LoadTimezones() error { @@ -84,6 +107,24 @@ func (s *Store) LoadTimezones() error { if err != nil { return err } + var pbIndex pb.PolygonIndex + U := func(index *PolygonIndex, v []byte) error { + if err := proto.Unmarshal(v, &pbIndex); err != nil { + return err + } + index.FromPB(&pbIndex) + return nil + } + switch s.encoding { + case EncMsgPack: + U = func(index *PolygonIndex, v []byte) error { + return msgpack.Unmarshal(v, index) + } + case EncJSON: + U = func(index *PolygonIndex, v []byte) error { + return json.Unmarshal(v, index) + } + } // Load polygon indexes return s.db.View(func(tx *bolt.Tx) error { // Assume bucket exists and has keys @@ -91,13 +132,7 @@ func (s *Store) LoadTimezones() error { return b.ForEach(func(k, v []byte) error { var index PolygonIndex - var err error - if s.encoding == EncMsgPack { - err = msgpack.Unmarshal(v, &index) - } else { - err = json.Unmarshal(v, &index) - } - if err != nil { + if err := U(&index, v); err != nil { return err } index.Id = binary.BigEndian.Uint64(k) @@ -172,6 +207,39 @@ func (s *Store) createBuckets() error { } func (s *Store) InsertPolygons(tz Timezone) error { + var pbPoly pb.Polygon + var pbIndex pb.PolygonIndex + E := func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) { + polygon.ToPB(&pbPoly) + bufPolygon, err := proto.Marshal(&pbPoly) + if err != nil { + return nil, nil, err + } + index.ToPB(&pbIndex) + bufIndex, err := proto.Marshal(&pbIndex) + return bufPolygon, bufIndex, err + } + switch s.encoding { + case EncMsgPack: + E = func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) { + bufPolygon, err := msgpack.Marshal(polygon) + if err != nil { + return nil, nil, err + } + // Marshal Polygon Index + bufIndex, err := msgpack.Marshal(index) + return bufPolygon, bufIndex, err + } + case EncJSON: + E = func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) { + bufPolygon, err := json.Marshal(polygon) + if err != nil { + return nil, nil, err + } + bufIndex, err := json.Marshal(index) + return bufPolygon, bufIndex, err + } + } for _, polygon := range tz.Polygons { if err := s.db.Update(func(tx *bolt.Tx) error { b := tx.Bucket([]byte("Polygon")) @@ -187,29 +255,9 @@ func (s *Store) InsertPolygons(tz Timezone) error { Max: polygon.Max, Min: polygon.Min, } - var bufPolygon, bufIndex []byte - var err error - - if s.encoding == EncMsgPack { - // Marshal Polygons - bufPolygon, err = msgpack.Marshal(polygon) - if err != nil { - return err - } - // Marshal Polygon Index - bufIndex, err = msgpack.Marshal(index) - if err != nil { - return err - } - } else { - bufPolygon, err = json.Marshal(polygon) - if err != nil { - return err - } - bufIndex, err = json.Marshal(index) - if err != nil { - return err - } + bufPolygon, bufIndex, err := E(polygon, index) + if err != nil { + return err } if s.snappy { bufPolygon = snappy.Encode(nil, bufPolygon) @@ -228,6 +276,24 @@ func (s *Store) InsertPolygons(tz Timezone) error { } func (s *Store) loadPolygon(id uint64) (Polygon, error) { + var pbPoly pb.Polygon + U := func(polygon *Polygon, v []byte) error { + if err := proto.Unmarshal(v, &pbPoly); err != nil { + return err + } + polygon.FromPB(&pbPoly) + return nil + } + switch s.encoding { + case EncMsgPack: + U = func(polygon *Polygon, v []byte) error { + return msgpack.Unmarshal(v, polygon) + } + case EncJSON: + U = func(polygon *Polygon, v []byte) error { + return json.Unmarshal(v, polygon) + } + } var polygon Polygon err := s.db.View(func(tx *bolt.Tx) error { b := tx.Bucket([]byte("Polygon")) @@ -239,11 +305,7 @@ func (s *Store) loadPolygon(id uint64) (Polygon, error) { return err } } - if s.encoding == EncMsgPack { - return msgpack.Unmarshal(v, &polygon) - } else { - return json.Unmarshal(v, &polygon) - } + return U(&polygon, v) }) return polygon, err } diff --git a/go.mod b/go.mod index 56c58b0..424cc96 100644 --- a/go.mod +++ b/go.mod @@ -9,12 +9,13 @@ require ( ) require ( - github.com/golang/protobuf v1.3.1 // indirect + github.com/golang/protobuf v1.5.0 // indirect github.com/klauspost/compress v1.13.6 // indirect github.com/vmihailenco/msgpack/v5 v5.3.4 // indirect github.com/vmihailenco/tagparser/v2 v2.0.0 // indirect golang.org/x/net v0.0.0-20190603091049-60506f45cf65 // indirect golang.org/x/sys v0.0.0-20200923182605-d9f96fdee20d // indirect google.golang.org/appengine v1.6.7 // indirect + google.golang.org/protobuf v1.27.1 // indirect gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c // indirect ) diff --git a/go.sum b/go.sum index 8cf5b3e..1d3fac0 100644 --- a/go.sum +++ b/go.sum @@ -1,8 +1,10 @@ github.com/davecgh/go-spew v1.1.0/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38= github.com/golang/protobuf v1.3.1 h1:YF8+flBXS5eO826T4nzqPrxfhQThhXl0YzfuUPu4SBg= github.com/golang/protobuf v1.3.1/go.mod h1:6lQm79b+lXiMfvg/cZm0SGofjICqVBUtrP5yJMmIC1U= +github.com/golang/protobuf v1.5.0/go.mod h1:FsONVRAS9T7sI+LIUmWTfcYkHO4aIWwzhcaSAoJOfIk= github.com/golang/snappy v0.0.4 h1:yAGX7huGHXlcLOEtBnF4w7FQwA26wojNCwOYAEhLjQM= github.com/golang/snappy v0.0.4/go.mod h1:/XxbfmMg8lxefKM7IXC3fBNl/7bRcc72aCRzEWrmP2Q= +github.com/google/go-cmp v0.5.5/go.mod h1:v8dTdLbMG2kIc/vJvl+f65V22dbkXbowE6jgT/gNBxE= github.com/klauspost/compress v1.13.6 h1:P76CopJELS0TiO2mebmnzgWaajssP/EszplttgQxcgc= github.com/klauspost/compress v1.13.6/go.mod h1:/3/Vjq9QcHkK5uEr5lBEmyoZ1iFhe47etQ6QUkpK6sk= github.com/kr/pretty v0.2.1 h1:Fmg33tUaq4/8ym9TJN1x7sLJnHVwhP33CNkpYV/7rwI= @@ -30,8 +32,12 @@ golang.org/x/sys v0.0.0-20200923182605-d9f96fdee20d/go.mod h1:h1NjWce9XRLGQEsW7w golang.org/x/text v0.3.0/go.mod h1:NqM8EUOU14njkJ3fqMW+pc6Ldnwhi/IjpwHt7yyuwOQ= golang.org/x/text v0.3.2/go.mod h1:bEr9sfX3Q8Zfm5fL9x+3itogRgK3+ptLWKqgva+5dAk= golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e/go.mod h1:n7NCudcB/nEzxVGmLbDWY5pfWTLqBcC2KZ6jyYvM4mQ= +golang.org/x/xerrors v0.0.0-20191204190536-9bdfabe68543/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0= google.golang.org/appengine v1.6.7 h1:FZR1q0exgwxzPzp/aF+VccGrSfxfPpkBqjIIEq3ru6c= google.golang.org/appengine v1.6.7/go.mod h1:8WjMMxjGQR8xUklV/ARdw2HLXBOI7O7uCIDZVag1xfc= +google.golang.org/protobuf v1.26.0-rc.1/go.mod h1:jlhhOSvTdKEhbULTjvd4ARK9grFBp09yW+WbY/TyQbw= +google.golang.org/protobuf v1.27.1 h1:SnqbnDw1V7RiZcXPx5MEeqPv2s79L9i7BJUlG/+RurQ= +google.golang.org/protobuf v1.27.1/go.mod h1:9q0QmTI4eRPtz6boOQmLYwt+qCgq0jsYwAQnmE0givc= gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405/go.mod h1:Co6ibVJAznAaIkqp8huTwlJQCZ016jof/cbN4VW5Yz0= gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c h1:Hei/4ADfdWqJk1ZMxUNpqntNwaWcugrBjAiHlqqRiVk= gopkg.in/check.v1 v1.0.0-20201130134442-10cb98267c6c/go.mod h1:JHkPIbrfpd72SG/EVd6muEfDQjcINNoR0C8j2r3qZ4Q= diff --git a/pb/timezone.pb.go b/pb/timezone.pb.go new file mode 100644 index 0000000..16fca81 --- /dev/null +++ b/pb/timezone.pb.go @@ -0,0 +1,333 @@ +// Copyright 2021 Tamás Gulácsi. +// +// SPDX-License-Identifier: MIT + +// Code generated by protoc-gen-go. DO NOT EDIT. +// versions: +// protoc-gen-go v1.27.1 +// protoc v3.12.4 +// source: timezone.proto + +package pb + +import ( + protoreflect "google.golang.org/protobuf/reflect/protoreflect" + protoimpl "google.golang.org/protobuf/runtime/protoimpl" + reflect "reflect" + sync "sync" +) + +const ( + // Verify that this generated code is sufficiently up-to-date. + _ = protoimpl.EnforceVersion(20 - protoimpl.MinVersion) + // Verify that runtime/protoimpl is sufficiently up-to-date. + _ = protoimpl.EnforceVersion(protoimpl.MaxVersion - 20) +) + +type Coord struct { + state protoimpl.MessageState + sizeCache protoimpl.SizeCache + unknownFields protoimpl.UnknownFields + + Lat float32 `protobuf:"fixed32,1,opt,name=Lat,proto3" json:"Lat,omitempty"` + Lon float32 `protobuf:"fixed32,2,opt,name=Lon,proto3" json:"Lon,omitempty"` +} + +func (x *Coord) Reset() { + *x = Coord{} + if protoimpl.UnsafeEnabled { + mi := &file_timezone_proto_msgTypes[0] + ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x)) + ms.StoreMessageInfo(mi) + } +} + +func (x *Coord) String() string { + return protoimpl.X.MessageStringOf(x) +} + +func (*Coord) ProtoMessage() {} + +func (x *Coord) ProtoReflect() protoreflect.Message { + mi := &file_timezone_proto_msgTypes[0] + if protoimpl.UnsafeEnabled && x != nil { + ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x)) + if ms.LoadMessageInfo() == nil { + ms.StoreMessageInfo(mi) + } + return ms + } + return mi.MessageOf(x) +} + +// Deprecated: Use Coord.ProtoReflect.Descriptor instead. +func (*Coord) Descriptor() ([]byte, []int) { + return file_timezone_proto_rawDescGZIP(), []int{0} +} + +func (x *Coord) GetLat() float32 { + if x != nil { + return x.Lat + } + return 0 +} + +func (x *Coord) GetLon() float32 { + if x != nil { + return x.Lon + } + return 0 +} + +type Polygon struct { + state protoimpl.MessageState + sizeCache protoimpl.SizeCache + unknownFields protoimpl.UnknownFields + + Max *Coord `protobuf:"bytes,1,opt,name=Max,proto3" json:"Max,omitempty"` + Min *Coord `protobuf:"bytes,2,opt,name=Min,proto3" json:"Min,omitempty"` + Coords []*Coord `protobuf:"bytes,4,rep,name=Coords,proto3" json:"Coords,omitempty"` +} + +func (x *Polygon) Reset() { + *x = Polygon{} + if protoimpl.UnsafeEnabled { + mi := &file_timezone_proto_msgTypes[1] + ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x)) + ms.StoreMessageInfo(mi) + } +} + +func (x *Polygon) String() string { + return protoimpl.X.MessageStringOf(x) +} + +func (*Polygon) ProtoMessage() {} + +func (x *Polygon) ProtoReflect() protoreflect.Message { + mi := &file_timezone_proto_msgTypes[1] + if protoimpl.UnsafeEnabled && x != nil { + ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x)) + if ms.LoadMessageInfo() == nil { + ms.StoreMessageInfo(mi) + } + return ms + } + return mi.MessageOf(x) +} + +// Deprecated: Use Polygon.ProtoReflect.Descriptor instead. +func (*Polygon) Descriptor() ([]byte, []int) { + return file_timezone_proto_rawDescGZIP(), []int{1} +} + +func (x *Polygon) GetMax() *Coord { + if x != nil { + return x.Max + } + return nil +} + +func (x *Polygon) GetMin() *Coord { + if x != nil { + return x.Min + } + return nil +} + +func (x *Polygon) GetCoords() []*Coord { + if x != nil { + return x.Coords + } + return nil +} + +type PolygonIndex struct { + state protoimpl.MessageState + sizeCache protoimpl.SizeCache + unknownFields protoimpl.UnknownFields + + Id uint64 `protobuf:"varint,1,opt,name=Id,proto3" json:"Id,omitempty"` + Tzid string `protobuf:"bytes,2,opt,name=Tzid,proto3" json:"Tzid,omitempty"` + Max *Coord `protobuf:"bytes,3,opt,name=Max,proto3" json:"Max,omitempty"` + Min *Coord `protobuf:"bytes,4,opt,name=Min,proto3" json:"Min,omitempty"` +} + +func (x *PolygonIndex) Reset() { + *x = PolygonIndex{} + if protoimpl.UnsafeEnabled { + mi := &file_timezone_proto_msgTypes[2] + ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x)) + ms.StoreMessageInfo(mi) + } +} + +func (x *PolygonIndex) String() string { + return protoimpl.X.MessageStringOf(x) +} + +func (*PolygonIndex) ProtoMessage() {} + +func (x *PolygonIndex) ProtoReflect() protoreflect.Message { + mi := &file_timezone_proto_msgTypes[2] + if protoimpl.UnsafeEnabled && x != nil { + ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x)) + if ms.LoadMessageInfo() == nil { + ms.StoreMessageInfo(mi) + } + return ms + } + return mi.MessageOf(x) +} + +// Deprecated: Use PolygonIndex.ProtoReflect.Descriptor instead. +func (*PolygonIndex) Descriptor() ([]byte, []int) { + return file_timezone_proto_rawDescGZIP(), []int{2} +} + +func (x *PolygonIndex) GetId() uint64 { + if x != nil { + return x.Id + } + return 0 +} + +func (x *PolygonIndex) GetTzid() string { + if x != nil { + return x.Tzid + } + return "" +} + +func (x *PolygonIndex) GetMax() *Coord { + if x != nil { + return x.Max + } + return nil +} + +func (x *PolygonIndex) GetMin() *Coord { + if x != nil { + return x.Min + } + return nil +} + +var File_timezone_proto protoreflect.FileDescriptor + +var file_timezone_proto_rawDesc = []byte{ + 0x0a, 0x0e, 0x74, 0x69, 0x6d, 0x65, 0x7a, 0x6f, 0x6e, 0x65, 0x2e, 0x70, 0x72, 0x6f, 0x74, 0x6f, + 0x22, 0x2b, 0x0a, 0x05, 0x43, 0x6f, 0x6f, 0x72, 0x64, 0x12, 0x10, 0x0a, 0x03, 0x4c, 0x61, 0x74, + 0x18, 0x01, 0x20, 0x01, 0x28, 0x02, 0x52, 0x03, 0x4c, 0x61, 0x74, 0x12, 0x10, 0x0a, 0x03, 0x4c, + 0x6f, 0x6e, 0x18, 0x02, 0x20, 0x01, 0x28, 0x02, 0x52, 0x03, 0x4c, 0x6f, 0x6e, 0x22, 0x5d, 0x0a, + 0x07, 0x50, 0x6f, 0x6c, 0x79, 0x67, 0x6f, 0x6e, 0x12, 0x18, 0x0a, 0x03, 0x4d, 0x61, 0x78, 0x18, + 0x01, 0x20, 0x01, 0x28, 0x0b, 0x32, 0x06, 0x2e, 0x43, 0x6f, 0x6f, 0x72, 0x64, 0x52, 0x03, 0x4d, + 0x61, 0x78, 0x12, 0x18, 0x0a, 0x03, 0x4d, 0x69, 0x6e, 0x18, 0x02, 0x20, 0x01, 0x28, 0x0b, 0x32, + 0x06, 0x2e, 0x43, 0x6f, 0x6f, 0x72, 0x64, 0x52, 0x03, 0x4d, 0x69, 0x6e, 0x12, 0x1e, 0x0a, 0x06, + 0x43, 0x6f, 0x6f, 0x72, 0x64, 0x73, 0x18, 0x04, 0x20, 0x03, 0x28, 0x0b, 0x32, 0x06, 0x2e, 0x43, + 0x6f, 0x6f, 0x72, 0x64, 0x52, 0x06, 0x43, 0x6f, 0x6f, 0x72, 0x64, 0x73, 0x22, 0x66, 0x0a, 0x0c, + 0x50, 0x6f, 0x6c, 0x79, 0x67, 0x6f, 0x6e, 0x49, 0x6e, 0x64, 0x65, 0x78, 0x12, 0x0e, 0x0a, 0x02, + 0x49, 0x64, 0x18, 0x01, 0x20, 0x01, 0x28, 0x04, 0x52, 0x02, 0x49, 0x64, 0x12, 0x12, 0x0a, 0x04, + 0x54, 0x7a, 0x69, 0x64, 0x18, 0x02, 0x20, 0x01, 0x28, 0x09, 0x52, 0x04, 0x54, 0x7a, 0x69, 0x64, + 0x12, 0x18, 0x0a, 0x03, 0x4d, 0x61, 0x78, 0x18, 0x03, 0x20, 0x01, 0x28, 0x0b, 0x32, 0x06, 0x2e, + 0x43, 0x6f, 0x6f, 0x72, 0x64, 0x52, 0x03, 0x4d, 0x61, 0x78, 0x12, 0x18, 0x0a, 0x03, 0x4d, 0x69, + 0x6e, 0x18, 0x04, 0x20, 0x01, 0x28, 0x0b, 0x32, 0x06, 0x2e, 0x43, 0x6f, 0x6f, 0x72, 0x64, 0x52, + 0x03, 0x4d, 0x69, 0x6e, 0x42, 0x2e, 0x5a, 0x2c, 0x67, 0x69, 0x74, 0x68, 0x75, 0x62, 0x2e, 0x63, + 0x6f, 0x6d, 0x2f, 0x65, 0x76, 0x61, 0x6e, 0x6f, 0x62, 0x65, 0x72, 0x68, 0x6f, 0x6c, 0x73, 0x74, + 0x65, 0x72, 0x2f, 0x74, 0x69, 0x6d, 0x65, 0x7a, 0x6f, 0x6e, 0x65, 0x4c, 0x6f, 0x6f, 0x6b, 0x75, + 0x70, 0x2f, 0x70, 0x62, 0x62, 0x06, 0x70, 0x72, 0x6f, 0x74, 0x6f, 0x33, +} + +var ( + file_timezone_proto_rawDescOnce sync.Once + file_timezone_proto_rawDescData = file_timezone_proto_rawDesc +) + +func file_timezone_proto_rawDescGZIP() []byte { + file_timezone_proto_rawDescOnce.Do(func() { + file_timezone_proto_rawDescData = protoimpl.X.CompressGZIP(file_timezone_proto_rawDescData) + }) + return file_timezone_proto_rawDescData +} + +var file_timezone_proto_msgTypes = make([]protoimpl.MessageInfo, 3) +var file_timezone_proto_goTypes = []interface{}{ + (*Coord)(nil), // 0: Coord + (*Polygon)(nil), // 1: Polygon + (*PolygonIndex)(nil), // 2: PolygonIndex +} +var file_timezone_proto_depIdxs = []int32{ + 0, // 0: Polygon.Max:type_name -> Coord + 0, // 1: Polygon.Min:type_name -> Coord + 0, // 2: Polygon.Coords:type_name -> Coord + 0, // 3: PolygonIndex.Max:type_name -> Coord + 0, // 4: PolygonIndex.Min:type_name -> Coord + 5, // [5:5] is the sub-list for method output_type + 5, // [5:5] is the sub-list for method input_type + 5, // [5:5] is the sub-list for extension type_name + 5, // [5:5] is the sub-list for extension extendee + 0, // [0:5] is the sub-list for field type_name +} + +func init() { file_timezone_proto_init() } +func file_timezone_proto_init() { + if File_timezone_proto != nil { + return + } + if !protoimpl.UnsafeEnabled { + file_timezone_proto_msgTypes[0].Exporter = func(v interface{}, i int) interface{} { + switch v := v.(*Coord); i { + case 0: + return &v.state + case 1: + return &v.sizeCache + case 2: + return &v.unknownFields + default: + return nil + } + } + file_timezone_proto_msgTypes[1].Exporter = func(v interface{}, i int) interface{} { + switch v := v.(*Polygon); i { + case 0: + return &v.state + case 1: + return &v.sizeCache + case 2: + return &v.unknownFields + default: + return nil + } + } + file_timezone_proto_msgTypes[2].Exporter = func(v interface{}, i int) interface{} { + switch v := v.(*PolygonIndex); i { + case 0: + return &v.state + case 1: + return &v.sizeCache + case 2: + return &v.unknownFields + default: + return nil + } + } + } + type x struct{} + out := protoimpl.TypeBuilder{ + File: protoimpl.DescBuilder{ + GoPackagePath: reflect.TypeOf(x{}).PkgPath(), + RawDescriptor: file_timezone_proto_rawDesc, + NumEnums: 0, + NumMessages: 3, + NumExtensions: 0, + NumServices: 0, + }, + GoTypes: file_timezone_proto_goTypes, + DependencyIndexes: file_timezone_proto_depIdxs, + MessageInfos: file_timezone_proto_msgTypes, + }.Build() + File_timezone_proto = out.File + file_timezone_proto_rawDesc = nil + file_timezone_proto_goTypes = nil + file_timezone_proto_depIdxs = nil +} diff --git a/pb/timezone.proto b/pb/timezone.proto new file mode 100644 index 0000000..14ea824 --- /dev/null +++ b/pb/timezone.proto @@ -0,0 +1,26 @@ +// Copyright 2021 Tamás Gulácsi. +// +// SPDX-License-Identifier: MIT + +syntax = "proto3"; +option go_package = "github.com/evanoberholster/timezoneLookup/pb"; +//import "google/protobuf/timestamp.proto"; + +message Coord { + float Lat = 1; + float Lon = 2; +} + +message Polygon { + Coord Max = 1; + Coord Min = 2; + repeated Coord Coords = 4; +} + +message PolygonIndex { + uint64 Id = 1; + string Tzid = 2; + Coord Max = 3; + Coord Min = 4; +} + diff --git a/timezone.go b/timezone.go index 1409e5b..a298362 100644 --- a/timezone.go +++ b/timezone.go @@ -11,8 +11,13 @@ import ( "os" "runtime" "time" + + "github.com/evanoberholster/timezoneLookup/pb" ) +//go:generate go install google.golang.org/protobuf/cmd/protoc-gen-go@latest +//go:generate protoc --proto_path=pb --go_out=pb --go_opt=paths=source_relative pb/timezone.proto + const ( WithSnappy = true NoSnappy = false @@ -58,11 +63,49 @@ type Polygon struct { Coords []Coord `json:"coords"` } +func (dst *Polygon) FromPB(src *pb.Polygon) { + dst.Max.FromPB(src.Max) + dst.Min.FromPB(src.Min) + if cap(dst.Coords) < len(src.Coords) { + dst.Coords = make([]Coord, len(src.Coords)) + } else { + dst.Coords = dst.Coords[:len(src.Coords)] + } + for i, c := range src.Coords { + dst.Coords[i].FromPB(c) + } +} +func (src Polygon) ToPB(dst *pb.Polygon) { + dst.Reset() + dst.Max = src.Max.ToPB(dst.Max) + dst.Min = src.Min.ToPB(dst.Min) + if cap(dst.Coords) < len(src.Coords) { + dst.Coords = make([]*pb.Coord, len(src.Coords)) + } else { + dst.Coords = dst.Coords[:len(src.Coords)] + } + for i, c := range src.Coords { + dst.Coords[i] = c.ToPB(dst.Coords[i]) + } +} + type Coord struct { Lat float32 `json:"lat"` Lon float32 `json:"lon"` } +func (src Coord) ToPB(dst *pb.Coord) *pb.Coord { + if dst == nil { + return &pb.Coord{Lat: src.Lat, Lon: src.Lon} + } + dst.Reset() + dst.Lat, dst.Lon = src.Lat, src.Lon + return dst +} +func (dst *Coord) FromPB(src *pb.Coord) { + dst.Lat, dst.Lon = src.Lat, src.Lon +} + type Config struct { DatabaseName string DatabaseType string From 7231ede985e0a2e02ee4cac4348d537b79e06354 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 18:27:28 +0200 Subject: [PATCH 09/12] Faster Marshal by reusing buffer --- db.go | 75 +++++++++++++++++++++++++++++++++++------------------------ 1 file changed, 44 insertions(+), 31 deletions(-) diff --git a/db.go b/db.go index a096c63..ec5dcfe 100644 --- a/db.go +++ b/db.go @@ -5,6 +5,7 @@ package timezoneLookup import ( + "bytes" "encoding/binary" "encoding/json" "errors" @@ -108,13 +109,7 @@ func (s *Store) LoadTimezones() error { return err } var pbIndex pb.PolygonIndex - U := func(index *PolygonIndex, v []byte) error { - if err := proto.Unmarshal(v, &pbIndex); err != nil { - return err - } - index.FromPB(&pbIndex) - return nil - } + var U func(index *PolygonIndex, v []byte) error switch s.encoding { case EncMsgPack: U = func(index *PolygonIndex, v []byte) error { @@ -124,6 +119,14 @@ func (s *Store) LoadTimezones() error { U = func(index *PolygonIndex, v []byte) error { return json.Unmarshal(v, index) } + case EncProtobuf: + U = func(index *PolygonIndex, v []byte) error { + if err := proto.Unmarshal(v, &pbIndex); err != nil { + return err + } + index.FromPB(&pbIndex) + return nil + } } // Load polygon indexes return s.db.View(func(tx *bolt.Tx) error { @@ -207,36 +210,44 @@ func (s *Store) createBuckets() error { } func (s *Store) InsertPolygons(tz Timezone) error { - var pbPoly pb.Polygon - var pbIndex pb.PolygonIndex - E := func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) { - polygon.ToPB(&pbPoly) - bufPolygon, err := proto.Marshal(&pbPoly) - if err != nil { - return nil, nil, err - } - index.ToPB(&pbIndex) - bufIndex, err := proto.Marshal(&pbIndex) - return bufPolygon, bufIndex, err - } + var bufPolygon, bufIndex []byte + var E func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) switch s.encoding { case EncMsgPack: + eP := msgpack.NewEncoder(bytes.NewBuffer(bufPolygon)) + eI := msgpack.NewEncoder(bytes.NewBuffer(bufIndex)) E = func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) { - bufPolygon, err := msgpack.Marshal(polygon) - if err != nil { + bufPolygon, bufIndex = bufPolygon[:0], bufIndex[:0] + if err := eP.Encode(polygon); err != nil { return nil, nil, err } // Marshal Polygon Index - bufIndex, err := msgpack.Marshal(index) + err := eI.Encode(index) return bufPolygon, bufIndex, err } case EncJSON: + eP := json.NewEncoder(bytes.NewBuffer(bufPolygon)) + eI := json.NewEncoder(bytes.NewBuffer(bufIndex)) E = func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) { - bufPolygon, err := json.Marshal(polygon) + bufPolygon, bufIndex = bufPolygon[:0], bufIndex[:0] + if err := eP.Encode(polygon); err != nil { + return nil, nil, err + } + err := eI.Encode(index) + return bufPolygon, bufIndex, err + } + case EncProtobuf: + var pbPoly pb.Polygon + var pbIndex pb.PolygonIndex + var mo proto.MarshalOptions + E = func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) { + polygon.ToPB(&pbPoly) + bufPolygon, err := mo.MarshalAppend(bufPolygon[:0], &pbPoly) if err != nil { return nil, nil, err } - bufIndex, err := json.Marshal(index) + index.ToPB(&pbIndex) + bufIndex, err := mo.MarshalAppend(bufIndex[:0], &pbIndex) return bufPolygon, bufIndex, err } } @@ -277,13 +288,7 @@ func (s *Store) InsertPolygons(tz Timezone) error { func (s *Store) loadPolygon(id uint64) (Polygon, error) { var pbPoly pb.Polygon - U := func(polygon *Polygon, v []byte) error { - if err := proto.Unmarshal(v, &pbPoly); err != nil { - return err - } - polygon.FromPB(&pbPoly) - return nil - } + var U func(polygon *Polygon, v []byte) error switch s.encoding { case EncMsgPack: U = func(polygon *Polygon, v []byte) error { @@ -293,6 +298,14 @@ func (s *Store) loadPolygon(id uint64) (Polygon, error) { U = func(polygon *Polygon, v []byte) error { return json.Unmarshal(v, polygon) } + case EncProtobuf: + U = func(polygon *Polygon, v []byte) error { + if err := proto.Unmarshal(v, &pbPoly); err != nil { + return err + } + polygon.FromPB(&pbPoly) + return nil + } } var polygon Polygon err := s.db.View(func(tx *bolt.Tx) error { From abbb31958b975b7b6309214fc17e0990d1176e5f Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 18:38:30 +0200 Subject: [PATCH 10/12] memory: Reduce memory usage of Marshal by compressing on-the fly --- db.go | 2 +- go.mod | 1 + go.sum | 2 ++ memory.go | 32 +++++++++++++++----------------- timezone.go | 2 +- 5 files changed, 20 insertions(+), 19 deletions(-) diff --git a/db.go b/db.go index ec5dcfe..774303b 100644 --- a/db.go +++ b/db.go @@ -7,12 +7,12 @@ package timezoneLookup import ( "bytes" "encoding/binary" - "encoding/json" "errors" "fmt" "os" "github.com/evanoberholster/timezoneLookup/pb" + json "github.com/goccy/go-json" "github.com/klauspost/compress/snappy" "github.com/vmihailenco/msgpack/v5" bolt "go.etcd.io/bbolt" diff --git a/go.mod b/go.mod index 424cc96..9807e72 100644 --- a/go.mod +++ b/go.mod @@ -9,6 +9,7 @@ require ( ) require ( + github.com/goccy/go-json v0.7.10 // indirect github.com/golang/protobuf v1.5.0 // indirect github.com/klauspost/compress v1.13.6 // indirect github.com/vmihailenco/msgpack/v5 v5.3.4 // indirect diff --git a/go.sum b/go.sum index 1d3fac0..003cc46 100644 --- a/go.sum +++ b/go.sum @@ -1,4 +1,6 @@ github.com/davecgh/go-spew v1.1.0/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38= +github.com/goccy/go-json v0.7.10 h1:ulhbuNe1JqE68nMRXXTJRrUu0uhouf0VevLINxQq4Ec= +github.com/goccy/go-json v0.7.10/go.mod h1:6MelG93GURQebXPDq3khkgXZkazVtN9CRI+MGFi0w8I= github.com/golang/protobuf v1.3.1 h1:YF8+flBXS5eO826T4nzqPrxfhQThhXl0YzfuUPu4SBg= github.com/golang/protobuf v1.3.1/go.mod h1:6lQm79b+lXiMfvg/cZm0SGofjICqVBUtrP5yJMmIC1U= github.com/golang/protobuf v1.5.0/go.mod h1:FsONVRAS9T7sI+LIUmWTfcYkHO4aIWwzhcaSAoJOfIk= diff --git a/memory.go b/memory.go index fa27034..a928181 100644 --- a/memory.go +++ b/memory.go @@ -5,11 +5,12 @@ package timezoneLookup import ( - "encoding/json" "errors" + "io" "os" - "github.com/golang/snappy" + json "github.com/goccy/go-json" + "github.com/klauspost/compress/snappy" ) type Memory struct { // Memory struct @@ -20,10 +21,9 @@ type Memory struct { // Memory struct func MemoryStorage(snappy bool, filename string) *Memory { if snappy { - filename = filename + ".snap.json" - } else { - filename = filename + ".json" + filename += ".snap" } + filename += ".json" return &Memory{ filename: filename, timezones: []Timezone{}, @@ -46,7 +46,6 @@ func (m *Memory) LoadTimezones() error { data := snappy.NewReader(file) dec := json.NewDecoder(data) for dec.More() { - err := dec.Decode(&tzs) if err != nil { return err @@ -81,24 +80,23 @@ func (m *Memory) Query(q Coord) (string, error) { } func (m *Memory) writeTimezoneJSON(dbFilename string) error { - data, err := json.Marshal(m.timezones) - if err != nil { - return err - } w, err := os.Create(dbFilename) if err != nil { return err } defer w.Close() + sw := io.WriteCloser(w) if m.snappy { - snap := snappy.NewBufferedWriter(w) - _, err := snap.Write(data) - if err != nil { - return err + sw = snappy.NewBufferedWriter(w) + } + err = json.NewEncoder(sw).Encode(m.timezones) + if closeErr := sw.Close(); closeErr != nil && err == nil { + err = closeErr + } + if m.snappy { + if closeErr := w.Close(); closeErr != nil && err == nil { + err = closeErr } - defer snap.Close() - } else { - _, err = w.Write(data) } return err } diff --git a/timezone.go b/timezone.go index a298362..cbd0afe 100644 --- a/timezone.go +++ b/timezone.go @@ -5,7 +5,6 @@ package timezoneLookup import ( - "encoding/json" "errors" "fmt" "os" @@ -13,6 +12,7 @@ import ( "time" "github.com/evanoberholster/timezoneLookup/pb" + json "github.com/goccy/go-json" ) //go:generate go install google.golang.org/protobuf/cmd/protoc-gen-go@latest From 0879a3f022c1a4450865103dbc743c3f7a4ecac2 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 19:24:09 +0200 Subject: [PATCH 11/12] Fix InsertPolygons for MsgPack --- db.go | 20 ++++++++++++-------- 1 file changed, 12 insertions(+), 8 deletions(-) diff --git a/db.go b/db.go index 774303b..cca1fa4 100644 --- a/db.go +++ b/db.go @@ -214,27 +214,31 @@ func (s *Store) InsertPolygons(tz Timezone) error { var E func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) switch s.encoding { case EncMsgPack: - eP := msgpack.NewEncoder(bytes.NewBuffer(bufPolygon)) - eI := msgpack.NewEncoder(bytes.NewBuffer(bufIndex)) + pBuf, iBuf := bytes.NewBuffer(bufPolygon), bytes.NewBuffer(bufIndex) + eP := msgpack.NewEncoder(pBuf) + eI := msgpack.NewEncoder(iBuf) E = func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) { - bufPolygon, bufIndex = bufPolygon[:0], bufIndex[:0] + pBuf.Reset() if err := eP.Encode(polygon); err != nil { return nil, nil, err } // Marshal Polygon Index + iBuf.Reset() err := eI.Encode(index) - return bufPolygon, bufIndex, err + return pBuf.Bytes(), iBuf.Bytes(), err } case EncJSON: - eP := json.NewEncoder(bytes.NewBuffer(bufPolygon)) - eI := json.NewEncoder(bytes.NewBuffer(bufIndex)) + pBuf, iBuf := bytes.NewBuffer(bufPolygon), bytes.NewBuffer(bufIndex) + eP := json.NewEncoder(pBuf) + eI := json.NewEncoder(iBuf) E = func(polygon Polygon, index PolygonIndex) ([]byte, []byte, error) { - bufPolygon, bufIndex = bufPolygon[:0], bufIndex[:0] + pBuf.Reset() if err := eP.Encode(polygon); err != nil { return nil, nil, err } + iBuf.Reset() err := eI.Encode(index) - return bufPolygon, bufIndex, err + return pBuf.Bytes(), iBuf.Bytes(), err } case EncProtobuf: var pbPoly pb.Polygon From 58a16b0f31574a9f1a7a6ac7c48dedda3a53e371 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Tam=C3=A1s=20Gul=C3=A1csi?= Date: Sun, 17 Oct 2021 19:26:57 +0200 Subject: [PATCH 12/12] BenchmarkLookup: Benchmark memory, put files under testdata/ --- bench_test.go | 41 +++++++++++++++++++++++++++-------------- 1 file changed, 27 insertions(+), 14 deletions(-) diff --git a/bench_test.go b/bench_test.go index 3fb6f7a..f6786f8 100644 --- a/bench_test.go +++ b/bench_test.go @@ -8,32 +8,45 @@ import ( "fmt" "os" "os/exec" + "path/filepath" "testing" timezone "github.com/evanoberholster/timezoneLookup" ) func BenchmarkLookup(b *testing.B) { - for _, e := range []string{"msgpack", "protobuf"} { - e := e - b.Run(e, func(b *testing.B) { - if _, err := os.Stat("timezone." + e + ".snap.db"); err != nil && os.IsNotExist(err) { - cmd := exec.Command("go", "run", "cmd/timezone.go", "-encoding="+e) + _ = os.MkdirAll("testdata", 0755) + tzgo := filepath.Join("..", "cmd", "timezone.go") + for _, e := range []string{"msgpack", "protobuf", "json"} { + cfg := timezone.Config{ + DatabaseName: filepath.Join("testdata", "timezone"), + Snappy: true, + } + if e == "json" { + if _, err := os.Stat(cfg.DatabaseName + ".snap.json"); err != nil && os.IsNotExist(err) { + cmd := exec.Command("go", "run", tzgo, "-type=memory") cmd.Stdout, cmd.Stderr = os.Stdout, os.Stderr + cmd.Dir = "testdata" _ = cmd.Run() } - enc, err := timezone.EncodingFromString(e) - if err != nil { + cfg.DatabaseType = "memory" + } else { + if _, err := os.Stat(cfg.DatabaseName + "." + e + ".snap.db"); err != nil && os.IsNotExist(err) { + cmd := exec.Command("go", "run", tzgo, "-encoding="+e) + cmd.Stdout, cmd.Stderr = os.Stdout, os.Stderr + cmd.Dir = "testdata" + _ = cmd.Run() + } + var err error + if cfg.Encoding, err = timezone.EncodingFromString(e); err != nil { b.Fatal(err) } - tz, err := timezone.LoadTimezones(timezone.Config{ - DatabaseType: "boltdb", // memory or boltdb - DatabaseName: "timezone", // Name without suffix - Snappy: true, - Encoding: enc, // json or msgpack - }) + cfg.DatabaseType = "boltdb" + } + b.Run(e, func(b *testing.B) { + tz, err := timezone.LoadTimezones(cfg) if err != nil { - b.Fatal(err) + b.Fatalf("%q: %#v: %+v", e, cfg, err) } defer tz.Close()