about summary refs log tree commit diff
diff options
context:
space:
mode:
author Chris Lu <chris.lu@gmail.com> 2018-12-15 05:55:56 -0800
committer Chris Lu <chris.lu@gmail.com> 2018-12-15 05:55:56 -0800
commit 42cb9b76c4851a59a479fb1e0e7cc53551ab7d82 (patch)
tree a57d3cae8d96ade2543804092132e9fa4faf20b0
parent 21315f709de9520ae8dc8cd7a8998802ee89af72 (diff)
download seaweedfs-42cb9b76c4851a59a479fb1e0e7cc53551ab7d82.tar.xz
seaweedfs-42cb9b76c4851a59a479fb1e0e7cc53551ab7d82.zip
reduce needle map memory usage by 25%
-rw-r--r-- weed/storage/needle/compact_map.go 69
-rw-r--r-- weed/storage/needle/compact_map_perf_test.go 9
-rw-r--r-- weed/storage/needle/compact_map_test.go 18
3 files changed, 63 insertions, 33 deletions
diff --git a/weed/storage/needle/compact_map.go b/weed/storage/needle/compact_map.go
index 2b0b7532e..7c4b6d72c 100644
--- a/weed/storage/needle/compact_map.go
+++ b/weed/storage/needle/compact_map.go
@@ -10,21 +10,31 @@ const (
batch = 100000
)
+type SectionalNeedleId uint32
+
+const SectionalNeedleIdLimit = 1<<32 - 1
+
+type SectionalNeedleValue struct {
+ Key SectionalNeedleId
+ Offset Offset `comment:"Volume offset"` //since aligned to 8 bytes, range is 4G*8=32G
+ Size uint32 `comment:"Size of the data portion"`
+}
+
type CompactSection struct {
sync.RWMutex
- values []NeedleValue
+ values []SectionalNeedleValue
overflow Overflow
start NeedleId
end NeedleId
counter int
}
-type Overflow []NeedleValue
+type Overflow []SectionalNeedleValue
func NewCompactSection(start NeedleId) *CompactSection {
return &CompactSection{
- values: make([]NeedleValue, batch),
- overflow: Overflow(make([]NeedleValue, 0)),
+ values: make([]SectionalNeedleValue, batch),
+ overflow: Overflow(make([]SectionalNeedleValue, 0)),
start: start,
}
}
@@ -35,22 +45,23 @@ func (cs *CompactSection) Set(key NeedleId, offset Offset, size uint32) (oldOffs
if key > cs.end {
cs.end = key
}
- if i := cs.binarySearchValues(key); i >= 0 {
+ skey := SectionalNeedleId(key - cs.start)
+ if i := cs.binarySearchValues(skey); i >= 0 {
oldOffset, oldSize = cs.values[i].Offset, cs.values[i].Size
//println("key", key, "old size", ret)
cs.values[i].Offset, cs.values[i].Size = offset, size
} else {
needOverflow := cs.counter >= batch
- needOverflow = needOverflow || cs.counter > 0 && cs.values[cs.counter-1].Key > key
+ needOverflow = needOverflow || cs.counter > 0 && cs.values[cs.counter-1].Key > skey
if needOverflow {
//println("start", cs.start, "counter", cs.counter, "key", key)
- if oldValue, found := cs.overflow.findOverflowEntry(key); found {
+ if oldValue, found := cs.overflow.findOverflowEntry(skey); found {
oldOffset, oldSize = oldValue.Offset, oldValue.Size
}
- cs.overflow = cs.overflow.setOverflowEntry(NeedleValue{Key: key, Offset: offset, Size: size})
+ cs.overflow = cs.overflow.setOverflowEntry(SectionalNeedleValue{Key: skey, Offset: offset, Size: size})
} else {
p := &cs.values[cs.counter]
- p.Key, p.Offset, p.Size = key, offset, size
+ p.Key, p.Offset, p.Size = skey, offset, size
//println("added index", cs.counter, "key", key, cs.values[cs.counter].Key)
cs.counter++
}
@@ -61,16 +72,17 @@ func (cs *CompactSection) Set(key NeedleId, offset Offset, size uint32) (oldOffs
//return old entry size
func (cs *CompactSection) Delete(key NeedleId) uint32 {
+ skey := SectionalNeedleId(key - cs.start)
cs.Lock()
ret := uint32(0)
- if i := cs.binarySearchValues(key); i >= 0 {
+ if i := cs.binarySearchValues(skey); i >= 0 {
if cs.values[i].Size > 0 {
ret = cs.values[i].Size
cs.values[i].Size = 0
}
}
- if v, found := cs.overflow.findOverflowEntry(key); found {
- cs.overflow = cs.overflow.deleteOverflowEntry(key)
+ if v, found := cs.overflow.findOverflowEntry(skey); found {
+ cs.overflow = cs.overflow.deleteOverflowEntry(skey)
ret = v.Size
}
cs.Unlock()
@@ -78,18 +90,21 @@ func (cs *CompactSection) Delete(key NeedleId) uint32 {
}
func (cs *CompactSection) Get(key NeedleId) (*NeedleValue, bool) {
cs.RLock()
- if v, ok := cs.overflow.findOverflowEntry(key); ok {
+ skey := SectionalNeedleId(key - cs.start)
+ if v, ok := cs.overflow.findOverflowEntry(skey); ok {
cs.RUnlock()
- return &v, true
+ nv := v.toNeedleValue(cs)
+ return &nv, true
}
- if i := cs.binarySearchValues(key); i >= 0 {
+ if i := cs.binarySearchValues(skey); i >= 0 {
cs.RUnlock()
- return &cs.values[i], true
+ nv := cs.values[i].toNeedleValue(cs)
+ return &nv, true
}
cs.RUnlock()
return nil, false
}
-func (cs *CompactSection) binarySearchValues(key NeedleId) int {
+func (cs *CompactSection) binarySearchValues(key SectionalNeedleId) int {
l, h := 0, cs.counter-1
if h >= 0 && cs.values[h].Key < key {
return -2
@@ -122,7 +137,7 @@ func NewCompactMap() *CompactMap {
func (cm *CompactMap) Set(key NeedleId, offset Offset, size uint32) (oldOffset Offset, oldSize uint32) {
x := cm.binarySearchCompactSection(key)
- if x < 0 {
+ if x < 0 || (key-cm.list[x].start) > SectionalNeedleIdLimit {
//println(x, "creating", len(cm.list), "section, starting", key)
cs := NewCompactSection(key)
cm.list = append(cm.list, cs)
@@ -185,14 +200,14 @@ func (cm *CompactMap) Visit(visit func(NeedleValue) error) error {
for _, cs := range cm.list {
cs.RLock()
for _, v := range cs.overflow {
- if err := visit(v); err != nil {
+ if err := visit(v.toNeedleValue(cs)); err != nil {
cs.RUnlock()
return err
}
}
for _, v := range cs.values {
if _, found := cs.overflow.findOverflowEntry(v.Key); !found {
- if err := visit(v); err != nil {
+ if err := visit(v.toNeedleValue(cs)); err != nil {
cs.RUnlock()
return err
}
@@ -203,7 +218,7 @@ func (cm *CompactMap) Visit(visit func(NeedleValue) error) error {
return nil
}
-func (o Overflow) deleteOverflowEntry(key NeedleId) Overflow {
+func (o Overflow) deleteOverflowEntry(key SectionalNeedleId) Overflow {
length := len(o)
deleteCandidate := sort.Search(length, func(i int) bool {
return o[i].Key >= key
@@ -217,7 +232,7 @@ func (o Overflow) deleteOverflowEntry(key NeedleId) Overflow {
return o
}
-func (o Overflow) setOverflowEntry(needleValue NeedleValue) Overflow {
+func (o Overflow) setOverflowEntry(needleValue SectionalNeedleValue) Overflow {
insertCandidate := sort.Search(len(o), func(i int) bool {
return o[i].Key >= needleValue.Key
})
@@ -233,7 +248,7 @@ func (o Overflow) setOverflowEntry(needleValue NeedleValue) Overflow {
return o
}
-func (o Overflow) findOverflowEntry(key NeedleId) (nv NeedleValue, found bool) {
+func (o Overflow) findOverflowEntry(key SectionalNeedleId) (nv SectionalNeedleValue, found bool) {
foundCandidate := sort.Search(len(o), func(i int) bool {
return o[i].Key >= key
})
@@ -242,3 +257,11 @@ func (o Overflow) findOverflowEntry(key NeedleId) (nv NeedleValue, found bool) {
}
return nv, false
}
+
+func (snv SectionalNeedleValue) toNeedleValue(cs *CompactSection) NeedleValue {
+ return NeedleValue{NeedleId(snv.Key) + cs.start, snv.Offset, snv.Size}
+}
+
+func (nv NeedleValue) toSectionalNeedleValue(cs *CompactSection) SectionalNeedleValue {
+ return SectionalNeedleValue{SectionalNeedleId(nv.Key - cs.start), nv.Offset, nv.Size}
+}
diff --git a/weed/storage/needle/compact_map_perf_test.go b/weed/storage/needle/compact_map_perf_test.go
index fe0a9179a..cd21cc184 100644
--- a/weed/storage/needle/compact_map_perf_test.go
+++ b/weed/storage/needle/compact_map_perf_test.go
@@ -6,6 +6,7 @@ import (
"os"
"runtime"
"testing"
+ "time"
. "github.com/chrislusf/seaweedfs/weed/storage/types"
"github.com/chrislusf/seaweedfs/weed/util"
@@ -28,6 +29,7 @@ func TestMemoryUsage(t *testing.T) {
var maps []*CompactMap
+ startTime := time.Now()
for i := 0; i < 10; i++ {
indexFile, ie := os.OpenFile("../../../test/sample.idx", os.O_RDWR|os.O_RDONLY, 0644)
if ie != nil {
@@ -38,6 +40,9 @@ func TestMemoryUsage(t *testing.T) {
indexFile.Close()
PrintMemUsage()
+ now := time.Now()
+ fmt.Printf("\tTaken = %v\n", now.Sub(startTime))
+ startTime = now
}
}
@@ -67,13 +72,15 @@ func loadNewNeedleMap(file *os.File) *CompactMap {
}
func PrintMemUsage() {
+
+ runtime.GC()
var m runtime.MemStats
runtime.ReadMemStats(&m)
// For info on each, see: https://golang.org/pkg/runtime/#MemStats
fmt.Printf("Alloc = %v MiB", bToMb(m.Alloc))
fmt.Printf("\tTotalAlloc = %v MiB", bToMb(m.TotalAlloc))
fmt.Printf("\tSys = %v MiB", bToMb(m.Sys))
- fmt.Printf("\tNumGC = %v\n", m.NumGC)
+ fmt.Printf("\tNumGC = %v", m.NumGC)
}
func bToMb(b uint64) uint64 {
return b / 1024 / 1024
diff --git a/weed/storage/needle/compact_map_test.go b/weed/storage/needle/compact_map_test.go
index 77b96e230..1320e81ba 100644
--- a/weed/storage/needle/compact_map_test.go
+++ b/weed/storage/needle/compact_map_test.go
@@ -78,19 +78,19 @@ func TestCompactMap(t *testing.T) {
}
func TestOverflow(t *testing.T) {
- o := Overflow(make([]NeedleValue, 0))
+ o := Overflow(make([]SectionalNeedleValue, 0))
- o = o.setOverflowEntry(NeedleValue{Key: 1, Offset: 12, Size: 12})
- o = o.setOverflowEntry(NeedleValue{Key: 2, Offset: 12, Size: 12})
- o = o.setOverflowEntry(NeedleValue{Key: 3, Offset: 12, Size: 12})
- o = o.setOverflowEntry(NeedleValue{Key: 4, Offset: 12, Size: 12})
- o = o.setOverflowEntry(NeedleValue{Key: 5, Offset: 12, Size: 12})
+ o = o.setOverflowEntry(SectionalNeedleValue{Key: 1, Offset: 12, Size: 12})
+ o = o.setOverflowEntry(SectionalNeedleValue{Key: 2, Offset: 12, Size: 12})
+ o = o.setOverflowEntry(SectionalNeedleValue{Key: 3, Offset: 12, Size: 12})
+ o = o.setOverflowEntry(SectionalNeedleValue{Key: 4, Offset: 12, Size: 12})
+ o = o.setOverflowEntry(SectionalNeedleValue{Key: 5, Offset: 12, Size: 12})
if o[2].Key != 3 {
t.Fatalf("expecting o[2] has key 3: %+v", o[2].Key)
}
- o = o.setOverflowEntry(NeedleValue{Key: 3, Offset: 24, Size: 24})
+ o = o.setOverflowEntry(SectionalNeedleValue{Key: 3, Offset: 24, Size: 24})
if o[2].Key != 3 {
t.Fatalf("expecting o[2] has key 3: %+v", o[2].Key)
@@ -123,13 +123,13 @@ func TestOverflow(t *testing.T) {
}
println()
- o = o.setOverflowEntry(NeedleValue{Key: 4, Offset: 44, Size: 44})
+ o = o.setOverflowEntry(SectionalNeedleValue{Key: 4, Offset: 44, Size: 44})
for i, x := range o {
println("overflow[", i, "]:", x.Key)
}
println()
- o = o.setOverflowEntry(NeedleValue{Key: 1, Offset: 11, Size: 11})
+ o = o.setOverflowEntry(SectionalNeedleValue{Key: 1, Offset: 11, Size: 11})
for i, x := range o {
println("overflow[", i, "]:", x.Key)