moved fields to a collection map

This commit is contained in:
Josh Baker 2016-12-31 09:29:02 -07:00
parent d6ca25d14b
commit b9e61777e6
2 changed files with 161 additions and 79 deletions

View File

@ -14,7 +14,6 @@ const (
type itemT struct { type itemT struct {
id string id string
object geojson.Object object geojson.Object
fields []float64
} }
func (i *itemT) Less(item btree.Item, ctx interface{}) bool { func (i *itemT) Less(item btree.Item, ctx interface{}) bool {
@ -52,6 +51,7 @@ type Collection struct {
values *btree.BTree // items sorted by value+key values *btree.BTree // items sorted by value+key
index *index.Index // items geospatially indexed index *index.Index // items geospatially indexed
fieldMap map[string]int fieldMap map[string]int
fieldValues map[string][]float64
weight int weight int
points int points int
objects int // geometry count objects int // geometry count
@ -64,13 +64,32 @@ var counter uint64
func New() *Collection { func New() *Collection {
col := &Collection{ col := &Collection{
index: index.New(), index: index.New(),
items: btree.New(48, idOrdered), items: btree.New(128, idOrdered),
values: btree.New(48, valueOrdered), values: btree.New(128, valueOrdered),
fieldMap: make(map[string]int), fieldMap: make(map[string]int),
} }
return col return col
} }
// setFieldValues records values as the field values of the object identified
// by id, overwriting whatever was stored for that id before. The slice is
// stored as given, without copying. The backing map is created on the first
// write.
func (c *Collection) setFieldValues(id string, values []float64) {
	store := c.fieldValues
	if store == nil {
		store = make(map[string][]float64)
		c.fieldValues = store
	}
	store[id] = values
}
// getFieldValues returns the field values stored for id, or nil when nothing
// has been stored for it. The stored slice itself is returned, not a copy.
// Indexing a nil map yields the zero value, so an unallocated map needs no
// special case.
func (c *Collection) getFieldValues(id string) (values []float64) {
	values = c.fieldValues[id]
	return values
}
// deleteFieldValues discards any field values stored for id. Nothing happens
// when no values are stored or the map was never allocated: the built-in
// delete is a no-op on a nil map and on absent keys.
func (c *Collection) deleteFieldValues(id string) {
	delete(c.fieldValues, id)
}
// Count returns the number of objects in collection. // Count returns the number of objects in collection.
func (c *Collection) Count() int { func (c *Collection) Count() int {
return c.objects + c.nobjects return c.objects + c.nobjects
@ -122,13 +141,13 @@ func (c *Collection) ReplaceOrInsert(id string, obj geojson.Object, fields []str
c.points -= oldItem.object.PositionCount() c.points -= oldItem.object.PositionCount()
// decrement the weights // decrement the weights
c.weight -= len(oldItem.fields) * 8 c.weight -= len(c.getFieldValues(id)) * 8
c.weight -= oldItem.object.Weight() + len(oldItem.id) c.weight -= oldItem.object.Weight() + len(oldItem.id)
// references // references
oldObject = oldItem.object oldObject = oldItem.object
oldFields = oldItem.fields oldFields = c.getFieldValues(id)
newItem.fields = oldFields newFields = oldFields
} }
// insert the new item into the rtree or strings tree. // insert the new item into the rtree or strings tree.
if obj.IsGeometry() { if obj.IsGeometry() {
@ -142,30 +161,37 @@ func (c *Collection) ReplaceOrInsert(id string, obj geojson.Object, fields []str
c.points += obj.PositionCount() c.points += obj.PositionCount()
// add the new weights // add the new weights
c.weight += len(newItem.fields) * 8 c.weight += len(newFields) * 8
c.weight += obj.Weight() + len(id) c.weight += obj.Weight() + len(id)
if fields == nil { if fields == nil {
if len(values) > 0 { if len(values) > 0 {
// directly set the field values, update weight // directly set the field values, update weight
c.weight -= len(newItem.fields) * 8 c.weight -= len(newFields) * 8
newItem.fields = values newFields = values
c.weight += len(newItem.fields) * 8 c.setFieldValues(id, newFields)
c.weight += len(newFields) * 8
} }
} else { } else {
if len(fields) == 0 {
panic("if fields is empty, make it nil")
}
// map field name to value // map field name to value
for i, field := range fields { for i, field := range fields {
c.setField(newItem, field, values[i]) c.setField(newItem, field, values[i])
} }
newFields = c.getFieldValues(id)
} }
return oldObject, oldFields, newItem.fields return oldObject, oldFields, newFields
} }
func (c *Collection) remove(id string) (item *itemT, ok bool) { // Remove removes an object and returns it.
// If the object does not exist then the 'ok' return value will be false.
func (c *Collection) Remove(id string) (obj geojson.Object, fields []float64, ok bool) {
i := c.items.Delete(&itemT{id: id}) i := c.items.Delete(&itemT{id: id})
if i == nil { if i == nil {
return nil, false return nil, nil, false
} }
item = i.(*itemT) item := i.(*itemT)
if item.object.IsGeometry() { if item.object.IsGeometry() {
c.index.Remove(item) c.index.Remove(item)
c.objects-- c.objects--
@ -173,50 +199,23 @@ func (c *Collection) remove(id string) (item *itemT, ok bool) {
c.values.Delete(item) c.values.Delete(item)
c.nobjects-- c.nobjects--
} }
c.weight -= len(item.fields) * 8 fields = c.getFieldValues(id)
c.deleteFieldValues(id)
c.weight -= len(fields) * 8
c.weight -= item.object.Weight() + len(item.id) c.weight -= item.object.Weight() + len(item.id)
c.points -= item.object.PositionCount() c.points -= item.object.PositionCount()
return item, true return item.object, fields, true
}
func (c *Collection) insert(id string, obj geojson.Object) (item *itemT) {
item = &itemT{id: id, object: obj}
if obj.IsGeometry() {
c.index.Insert(item)
c.objects++
} else {
c.values.ReplaceOrInsert(item)
c.nobjects++
}
c.items.ReplaceOrInsert(item)
c.weight += obj.Weight() + len(id)
c.points += obj.PositionCount()
return item
}
// Remove removes an object and returns it.
// If the object does not exist then the 'ok' return value will be false.
func (c *Collection) Remove(id string) (obj geojson.Object, fields []float64, ok bool) {
item, ok := c.remove(id)
if !ok {
return nil, nil, false
}
return item.object, item.fields, true
}
func (c *Collection) get(id string) (obj geojson.Object, fields []float64, ok bool) {
i := c.items.Get(&itemT{id: id})
if i == nil {
return nil, nil, false
}
item := i.(*itemT)
return item.object, item.fields, true
} }
// Get returns an object. // Get returns an object.
// If the object does not exist then the 'ok' return value will be false. // If the object does not exist then the 'ok' return value will be false.
func (c *Collection) Get(id string) (obj geojson.Object, fields []float64, ok bool) { func (c *Collection) Get(id string) (obj geojson.Object, fields []float64, ok bool) {
return c.get(id) i := c.items.Get(&itemT{id: id})
if i == nil {
return nil, nil, false
}
item := i.(*itemT)
return item.object, c.getFieldValues(id), true
} }
// SetField set a field value for an object and returns that object. // SetField set a field value for an object and returns that object.
@ -229,7 +228,7 @@ func (c *Collection) SetField(id, field string, value float64) (obj geojson.Obje
} }
item := i.(*itemT) item := i.(*itemT)
updated = c.setField(item, field, value) updated = c.setField(item, field, value)
return item.object, item.fields, updated, true return item.object, c.getFieldValues(id), updated, true
} }
func (c *Collection) setField(item *itemT, field string, value float64) (updated bool) { func (c *Collection) setField(item *itemT, field string, value float64) (updated bool) {
@ -238,13 +237,15 @@ func (c *Collection) setField(item *itemT, field string, value float64) (updated
idx = len(c.fieldMap) idx = len(c.fieldMap)
c.fieldMap[field] = idx c.fieldMap[field] = idx
} }
c.weight -= len(item.fields) * 8 fields := c.getFieldValues(item.id)
for idx >= len(item.fields) { c.weight -= len(fields) * 8
item.fields = append(item.fields, 0) for idx >= len(fields) {
fields = append(fields, 0)
} }
c.weight += len(item.fields) * 8 c.weight += len(fields) * 8
ovalue := item.fields[idx] ovalue := fields[idx]
item.fields[idx] = value fields[idx] = value
c.setFieldValues(item.id, fields)
return ovalue != value return ovalue != value
} }
@ -271,7 +272,7 @@ func (c *Collection) Scan(cursor uint64, desc bool,
iter := func(item btree.Item) bool { iter := func(item btree.Item) bool {
if i >= cursor { if i >= cursor {
iitm := item.(*itemT) iitm := item.(*itemT)
active = iterator(iitm.id, iitm.object, iitm.fields) active = iterator(iitm.id, iitm.object, c.getFieldValues(iitm.id))
} }
i++ i++
return active return active
@ -293,7 +294,7 @@ func (c *Collection) ScanRange(cursor uint64, start, end string, desc bool,
iter := func(item btree.Item) bool { iter := func(item btree.Item) bool {
if i >= cursor { if i >= cursor {
iitm := item.(*itemT) iitm := item.(*itemT)
active = iterator(iitm.id, iitm.object, iitm.fields) active = iterator(iitm.id, iitm.object, c.getFieldValues(iitm.id))
} }
i++ i++
return active return active
@ -316,7 +317,7 @@ func (c *Collection) SearchValues(cursor uint64, desc bool,
iter := func(item btree.Item) bool { iter := func(item btree.Item) bool {
if i >= cursor { if i >= cursor {
iitm := item.(*itemT) iitm := item.(*itemT)
active = iterator(iitm.id, iitm.object, iitm.fields) active = iterator(iitm.id, iitm.object, c.getFieldValues(iitm.id))
} }
i++ i++
return active return active
@ -338,7 +339,7 @@ func (c *Collection) SearchValuesRange(cursor uint64, start, end string, desc bo
iter := func(item btree.Item) bool { iter := func(item btree.Item) bool {
if i >= cursor { if i >= cursor {
iitm := item.(*itemT) iitm := item.(*itemT)
active = iterator(iitm.id, iitm.object, iitm.fields) active = iterator(iitm.id, iitm.object, c.getFieldValues(iitm.id))
} }
i++ i++
return active return active
@ -360,7 +361,7 @@ func (c *Collection) ScanGreaterOrEqual(id string, cursor uint64, desc bool,
iter := func(item btree.Item) bool { iter := func(item btree.Item) bool {
if i >= cursor { if i >= cursor {
iitm := item.(*itemT) iitm := item.(*itemT)
active = iterator(iitm.id, iitm.object, iitm.fields) active = iterator(iitm.id, iitm.object, c.getFieldValues(iitm.id))
} }
i++ i++
return active return active
@ -380,7 +381,7 @@ func (c *Collection) geoSearch(cursor uint64, bbox geojson.BBox, iterator func(i
if !ok { if !ok {
return true // just ignore return true // just ignore
} }
if !iterator(iitm.id, iitm.object, iitm.fields) { if !iterator(iitm.id, iitm.object, c.getFieldValues(iitm.id)) {
return false return false
} }
return true return true

View File

@ -90,20 +90,101 @@ func TestManyCollections(t *testing.T) {
}) })
} }
// testPointItem pairs an object id with the geojson object stored under it.
// The benchmarks in this file build it with unkeyed composite literals, so
// the field order (id, then object) must not change.
type testPointItem struct {
// id is the key handed to the collection.
id string
// object is the value stored under id.
object geojson.Object
}
func BenchmarkInsert(t *testing.B) { func BenchmarkInsert(t *testing.B) {
rand.Seed(time.Now().UnixNano()) rand.Seed(time.Now().UnixNano())
ids := make([]string, t.N) items := make([]testPointItem, t.N)
points := make([]geojson.Object, t.N)
for i := 0; i < t.N; i++ { for i := 0; i < t.N; i++ {
points[i] = geojson.SimplePoint{ items[i] = testPointItem{
fmt.Sprintf("%d", i),
geojson.SimplePoint{
Y: rand.Float64()*180 - 90, Y: rand.Float64()*180 - 90,
X: rand.Float64()*360 - 180, X: rand.Float64()*360 - 180,
},
} }
ids[i] = fmt.Sprintf("%d", i)
} }
col := New() col := New()
t.ResetTimer() t.ResetTimer()
for i := 0; i < t.N; i++ { for i := 0; i < t.N; i++ {
col.ReplaceOrInsert(ids[i], points[i], nil, nil) col.ReplaceOrInsert(items[i].id, items[i].object, nil, nil)
}
}
// BenchmarkReplace measures ReplaceOrInsert when every id already exists in
// the collection, visiting the ids in random order.
//
// The collection is pre-populated with t.N randomly placed points, and the
// visiting order is generated before the timer is reset, so only the replace
// calls (and their sanity check) are timed.
func BenchmarkReplace(t *testing.B) {
	rand.Seed(time.Now().UnixNano())
	items := make([]testPointItem, t.N)
	for i := 0; i < t.N; i++ {
		items[i] = testPointItem{
			fmt.Sprintf("%d", i),
			geojson.SimplePoint{
				Y: rand.Float64()*180 - 90,
				X: rand.Float64()*360 - 180,
			},
		}
	}
	col := New()
	for i := 0; i < t.N; i++ {
		col.ReplaceOrInsert(items[i].id, items[i].object, nil, nil)
	}
	// Build the permutation up front: rand.Perm allocates and shuffles t.N
	// ints, which must not be charged to the operation being measured.
	order := rand.Perm(t.N)
	t.ResetTimer()
	for _, i := range order {
		// Replacing an id with the same object must hand back that object as
		// the previous value.
		o, _, _ := col.ReplaceOrInsert(items[i].id, items[i].object, nil, nil)
		if o != items[i].object {
			t.Fatal("shoot!")
		}
	}
}
// BenchmarkGet measures Get for ids that exist in the collection, looked up
// in random order.
//
// The collection is pre-populated with t.N randomly placed points, and the
// lookup order is generated before the timer is reset, so only the Get calls
// (and their sanity check) are timed.
func BenchmarkGet(t *testing.B) {
	rand.Seed(time.Now().UnixNano())
	items := make([]testPointItem, t.N)
	for i := 0; i < t.N; i++ {
		items[i] = testPointItem{
			fmt.Sprintf("%d", i),
			geojson.SimplePoint{
				Y: rand.Float64()*180 - 90,
				X: rand.Float64()*360 - 180,
			},
		}
	}
	col := New()
	for i := 0; i < t.N; i++ {
		col.ReplaceOrInsert(items[i].id, items[i].object, nil, nil)
	}
	// Build the permutation up front: rand.Perm allocates and shuffles t.N
	// ints, which must not be charged to the operation being measured.
	order := rand.Perm(t.N)
	t.ResetTimer()
	for _, i := range order {
		// Every id was inserted above, so Get must return the stored object.
		o, _, _ := col.Get(items[i].id)
		if o != items[i].object {
			t.Fatal("shoot!")
		}
	}
}
// BenchmarkRemove measures Remove for ids that exist in the collection,
// removed in random order. The collection is first filled with t.N randomly
// placed points; each id is removed exactly once and the returned object is
// checked against the one that was inserted.
func BenchmarkRemove(t *testing.B) {
rand.Seed(time.Now().UnixNano())
items := make([]testPointItem, t.N)
for i := 0; i < t.N; i++ {
items[i] = testPointItem{
fmt.Sprintf("%d", i),
geojson.SimplePoint{
Y: rand.Float64()*180 - 90,
X: rand.Float64()*360 - 180,
},
}
}
col := New()
// Populate the collection before timing starts.
for i := 0; i < t.N; i++ {
col.ReplaceOrInsert(items[i].id, items[i].object, nil, nil)
}
t.ResetTimer()
// NOTE(review): rand.Perm is evaluated after ResetTimer, so building the
// permutation is part of the timed region.
for _, i := range rand.Perm(t.N) {
o, _, _ := col.Remove(items[i].id)
if o != items[i].object {
t.Fatal("shoot!")
}
} }
} }