Put an upper limit on walk pool sizes (#9848)

Fixes potentially infinite allocations, especially in FS mode, 
since lookups live up to 30 minutes. Limit walk pool sizes to 50 
max parameter entries and 4 concurrent operations with the same
parameters.

Fixes #9835
master
Klaus Post 4 years ago committed by GitHub
parent 1813ff9dfa
commit 8aae8b1d27
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
  1. 43
      cmd/merge-walk-pool.go
  2. 56
      cmd/merge-walk-pool_test.go
  3. 49
      cmd/tree-walk-pool.go
  4. 54
      cmd/tree-walk-pool_test.go

@ -35,6 +35,7 @@ type mergeWalkVersions struct {
// mergeWalk - represents the go routine that does the merge walk. // mergeWalk - represents the go routine that does the merge walk.
type mergeWalk struct { type mergeWalk struct {
added time.Time
entryChs []FileInfoCh entryChs []FileInfoCh
endWalkCh chan struct{} // To signal when mergeWalk go-routine should end. endWalkCh chan struct{} // To signal when mergeWalk go-routine should end.
endTimerCh chan<- struct{} // To signal when timer go-routine should end. endTimerCh chan<- struct{} // To signal when timer go-routine should end.
@ -160,7 +161,7 @@ func NewMergeWalkPool(timeout time.Duration) *MergeWalkPool {
// Release - selects a mergeWalk from the pool based on the input // Release - selects a mergeWalk from the pool based on the input
// listParams, removes it from the pool, and returns the MergeWalkResult // listParams, removes it from the pool, and returns the MergeWalkResult
// channel. // channel.
// Returns nil if listParams does not have an asccociated mergeWalk. // Returns nil if listParams does not have an associated mergeWalk.
func (t *MergeWalkPool) Release(params listParams) ([]FileInfoCh, chan struct{}) { func (t *MergeWalkPool) Release(params listParams) ([]FileInfoCh, chan struct{}) {
t.Lock() t.Lock()
defer t.Unlock() defer t.Unlock()
@ -169,6 +170,7 @@ func (t *MergeWalkPool) Release(params listParams) ([]FileInfoCh, chan struct{})
if len(walks) > 0 { if len(walks) > 0 {
// Pop out the first valid walk entry. // Pop out the first valid walk entry.
walk := walks[0] walk := walks[0]
walks[0] = mergeWalk{} // clear references.
walks = walks[1:] walks = walks[1:]
if len(walks) > 0 { if len(walks) > 0 {
t.pool[params] = walks t.pool[params] = walks
@ -195,17 +197,54 @@ func (t *MergeWalkPool) Set(params listParams, resultChs []FileInfoCh, endWalkCh
t.Lock() t.Lock()
defer t.Unlock() defer t.Unlock()
// If we are above the limit delete at least one entry from the pool.
if len(t.pool) > treeWalkEntryLimit {
age := time.Now()
var oldest listParams
for k, v := range t.pool {
if len(v) == 0 {
delete(t.pool, k)
continue
}
// The first element is the oldest, so we only check that.
if v[0].added.Before(age) {
oldest = k
}
}
// Invalidate and delete oldest.
if walks, ok := t.pool[oldest]; ok {
walk := walks[0]
walks[0] = mergeWalk{} // clear references.
walks = walks[1:]
if len(walks) > 0 {
t.pool[params] = walks
} else {
delete(t.pool, params)
}
walk.endTimerCh <- struct{}{}
}
}
// Should be a buffered channel so that Release() never blocks. // Should be a buffered channel so that Release() never blocks.
endTimerCh := make(chan struct{}, 1) endTimerCh := make(chan struct{}, 1)
walkInfo := mergeWalk{ walkInfo := mergeWalk{
added: UTCNow(),
entryChs: resultChs, entryChs: resultChs,
endWalkCh: endWalkCh, endWalkCh: endWalkCh,
endTimerCh: endTimerCh, endTimerCh: endTimerCh,
} }
// Append new walk info. // Append new walk info.
t.pool[params] = append(t.pool[params], walkInfo) walks := t.pool[params]
if len(walks) < treeWalkSameEntryLimit {
t.pool[params] = append(walks, walkInfo)
} else {
// We are at limit, invalidate oldest, move list down and add new as last.
walks[0].endTimerCh <- struct{}{}
copy(walks, walks[1:])
walks[len(walks)-1] = walkInfo
}
// Timer go-routine which times out after t.timeOut seconds. // Timer go-routine which times out after t.timeOut seconds.
go func(endTimerCh <-chan struct{}, walkInfo mergeWalk) { go func(endTimerCh <-chan struct{}, walkInfo mergeWalk) {

@ -74,7 +74,7 @@ func TestManyMergeWalksSameParam(t *testing.T) {
break break
default: default:
// Create many treeWalk go-routines for the same params. // Create many treeWalk go-routines for the same params.
for i := 0; i < 10; i++ { for i := 0; i < treeWalkSameEntryLimit; i++ {
endWalkCh := make(chan struct{}) endWalkCh := make(chan struct{})
walkChs := make([]FileInfoCh, 0) walkChs := make([]FileInfoCh, 0)
tw.Set(params, walkChs, endWalkCh) tw.Set(params, walkChs, endWalkCh)
@ -82,16 +82,62 @@ func TestManyMergeWalksSameParam(t *testing.T) {
tw.Lock() tw.Lock()
if walks, ok := tw.pool[params]; ok { if walks, ok := tw.pool[params]; ok {
if len(walks) != 10 { if len(walks) != treeWalkSameEntryLimit {
t.Error("There aren't as many walks as were Set") t.Error("There aren't as many walks as were Set")
} }
} }
tw.Unlock() tw.Unlock()
for i := 0; i < 10; i++ { for i := 0; i < treeWalkSameEntryLimit; i++ {
tw.Lock() tw.Lock()
if walks, ok := tw.pool[params]; ok { if walks, ok := tw.pool[params]; ok {
// Before ith Release we should have 10-i treeWalk go-routines. // Before ith Release we should have n-i treeWalk go-routines.
if 10-i != len(walks) { if treeWalkSameEntryLimit-i != len(walks) {
t.Error("There aren't as many walks as were Set")
}
}
tw.Unlock()
tw.Release(params)
}
}
}
// Test if multiple merge walkers for the same listParams are managed as expected by the pool
// but that treeWalkSameEntryLimit is respected.
func TestManyMergeWalksSameParamPrune(t *testing.T) {
// Create a treeWalkPool.
tw := NewMergeWalkPool(5 * time.Second)
// Create sample params.
params := listParams{
bucket: "test-bucket",
}
select {
// This timeout is an upper-bound. This is started
// before the first treeWalk go-routine's timeout period starts.
case <-time.After(5 * time.Second):
break
default:
// Create many treeWalk go-routines for the same params.
for i := 0; i < treeWalkSameEntryLimit*4; i++ {
endWalkCh := make(chan struct{})
walkChs := make([]FileInfoCh, 0)
tw.Set(params, walkChs, endWalkCh)
}
tw.Lock()
if walks, ok := tw.pool[params]; ok {
if len(walks) > treeWalkSameEntryLimit {
t.Error("There aren't as many walks as were Set")
}
}
tw.Unlock()
for i := 0; i < treeWalkSameEntryLimit; i++ {
tw.Lock()
if walks, ok := tw.pool[params]; ok {
// Before ith Release we should have n-i treeWalk go-routines.
if treeWalkSameEntryLimit-i != len(walks) {
t.Error("There aren't as many walks as were Set") t.Error("There aren't as many walks as were Set")
} }
} }

@ -25,7 +25,9 @@ import (
// Global lookup timeout. // Global lookup timeout.
const ( const (
globalLookupTimeout = time.Minute * 30 // 30minutes. globalLookupTimeout = time.Minute * 30 // 30minutes.
treeWalkEntryLimit = 50
treeWalkSameEntryLimit = 4
) )
// listParams - list object params used for list object map // listParams - list object params used for list object map
@ -44,6 +46,7 @@ var errWalkAbort = errors.New("treeWalk abort")
// treeWalk - represents the go routine that does the file tree walk. // treeWalk - represents the go routine that does the file tree walk.
type treeWalk struct { type treeWalk struct {
added time.Time
resultCh chan TreeWalkResult resultCh chan TreeWalkResult
endWalkCh chan struct{} // To signal when treeWalk go-routine should end. endWalkCh chan struct{} // To signal when treeWalk go-routine should end.
endTimerCh chan<- struct{} // To signal when timer go-routine should end. endTimerCh chan<- struct{} // To signal when timer go-routine should end.
@ -72,7 +75,7 @@ func NewTreeWalkPool(timeout time.Duration) *TreeWalkPool {
// Release - selects a treeWalk from the pool based on the input // Release - selects a treeWalk from the pool based on the input
// listParams, removes it from the pool, and returns the TreeWalkResult // listParams, removes it from the pool, and returns the TreeWalkResult
// channel. // channel.
// Returns nil if listParams does not have an asccociated treeWalk. // Returns nil if listParams does not have an associated treeWalk.
func (t *TreeWalkPool) Release(params listParams) (resultCh chan TreeWalkResult, endWalkCh chan struct{}) { func (t *TreeWalkPool) Release(params listParams) (resultCh chan TreeWalkResult, endWalkCh chan struct{}) {
t.Lock() t.Lock()
defer t.Unlock() defer t.Unlock()
@ -81,6 +84,7 @@ func (t *TreeWalkPool) Release(params listParams) (resultCh chan TreeWalkResult,
if len(walks) > 0 { if len(walks) > 0 {
// Pop out the first valid walk entry. // Pop out the first valid walk entry.
walk := walks[0] walk := walks[0]
walks[0] = treeWalk{} // clear references.
walks = walks[1:] walks = walks[1:]
if len(walks) > 0 { if len(walks) > 0 {
t.pool[params] = walks t.pool[params] = walks
@ -100,22 +104,59 @@ func (t *TreeWalkPool) Release(params listParams) (resultCh chan TreeWalkResult,
// 1) time.After() expires after t.timeOut seconds. // 1) time.After() expires after t.timeOut seconds.
// The expiration is needed so that the treeWalk go-routine resources are freed after a timeout // The expiration is needed so that the treeWalk go-routine resources are freed after a timeout
// if the S3 client does only partial listing of objects. // if the S3 client does only partial listing of objects.
// 2) Relase() signals the timer go-routine to end on endTimerCh. // 2) Release() signals the timer go-routine to end on endTimerCh.
// During listing the timer should not timeout and end the treeWalk go-routine, hence the // During listing the timer should not timeout and end the treeWalk go-routine, hence the
// timer go-routine should be ended. // timer go-routine should be ended.
func (t *TreeWalkPool) Set(params listParams, resultCh chan TreeWalkResult, endWalkCh chan struct{}) { func (t *TreeWalkPool) Set(params listParams, resultCh chan TreeWalkResult, endWalkCh chan struct{}) {
t.Lock() t.Lock()
defer t.Unlock() defer t.Unlock()
// If we are above the limit delete at least one entry from the pool.
if len(t.pool) > treeWalkEntryLimit {
age := time.Now()
var oldest listParams
for k, v := range t.pool {
if len(v) == 0 {
delete(t.pool, k)
continue
}
// The first element is the oldest, so we only check that.
if v[0].added.Before(age) {
oldest = k
}
}
// Invalidate and delete oldest.
if walks, ok := t.pool[oldest]; ok {
walk := walks[0]
walks[0] = treeWalk{} // clear references.
walks = walks[1:]
if len(walks) > 0 {
t.pool[params] = walks
} else {
delete(t.pool, params)
}
walk.endTimerCh <- struct{}{}
}
}
// Should be a buffered channel so that Release() never blocks. // Should be a buffered channel so that Release() never blocks.
endTimerCh := make(chan struct{}, 1) endTimerCh := make(chan struct{}, 1)
walkInfo := treeWalk{ walkInfo := treeWalk{
added: UTCNow(),
resultCh: resultCh, resultCh: resultCh,
endWalkCh: endWalkCh, endWalkCh: endWalkCh,
endTimerCh: endTimerCh, endTimerCh: endTimerCh,
} }
// Append new walk info. // Append new walk info.
t.pool[params] = append(t.pool[params], walkInfo) walks := t.pool[params]
if len(walks) < treeWalkSameEntryLimit {
t.pool[params] = append(walks, walkInfo)
} else {
// We are at limit, invalidate oldest, move list down and add new as last.
walks[0].endTimerCh <- struct{}{}
copy(walks, walks[1:])
walks[len(walks)-1] = walkInfo
}
// Timer go-routine which times out after t.timeOut seconds. // Timer go-routine which times out after t.timeOut seconds.
go func(endTimerCh <-chan struct{}) { go func(endTimerCh <-chan struct{}) {

@ -74,7 +74,7 @@ func TestManyWalksSameParam(t *testing.T) {
break break
default: default:
// Create many treeWalk go-routines for the same params. // Create many treeWalk go-routines for the same params.
for i := 0; i < 10; i++ { for i := 0; i < treeWalkSameEntryLimit; i++ {
resultCh := make(chan TreeWalkResult) resultCh := make(chan TreeWalkResult)
endWalkCh := make(chan struct{}) endWalkCh := make(chan struct{})
tw.Set(params, resultCh, endWalkCh) tw.Set(params, resultCh, endWalkCh)
@ -82,16 +82,16 @@ func TestManyWalksSameParam(t *testing.T) {
tw.Lock() tw.Lock()
if walks, ok := tw.pool[params]; ok { if walks, ok := tw.pool[params]; ok {
if len(walks) != 10 { if len(walks) != treeWalkSameEntryLimit {
t.Error("There aren't as many walks as were Set") t.Error("There aren't as many walks as were Set")
} }
} }
tw.Unlock() tw.Unlock()
for i := 0; i < 10; i++ { for i := 0; i < treeWalkSameEntryLimit; i++ {
tw.Lock() tw.Lock()
if walks, ok := tw.pool[params]; ok { if walks, ok := tw.pool[params]; ok {
// Before ith Release we should have 10-i treeWalk go-routines. // Before ith Release we should have n-i treeWalk go-routines.
if 10-i != len(walks) { if treeWalkSameEntryLimit-i != len(walks) {
t.Error("There aren't as many walks as were Set") t.Error("There aren't as many walks as were Set")
} }
} }
@ -99,5 +99,49 @@ func TestManyWalksSameParam(t *testing.T) {
tw.Release(params) tw.Release(params)
} }
} }
}
// Test if multiple tree walkers for the same listParams are managed as expected by the pool
// but that treeWalkSameEntryLimit is respected.
func TestManyWalksSameParamPrune(t *testing.T) {
// Create a treeWalkPool.
tw := NewTreeWalkPool(5 * time.Second)
// Create sample params.
params := listParams{
bucket: "test-bucket",
}
select {
// This timeout is an upper-bound. This is started
// before the first treeWalk go-routine's timeout period starts.
case <-time.After(5 * time.Second):
break
default:
// Create many treeWalk go-routines for the same params.
for i := 0; i < treeWalkSameEntryLimit*4; i++ {
resultCh := make(chan TreeWalkResult)
endWalkCh := make(chan struct{})
tw.Set(params, resultCh, endWalkCh)
}
tw.Lock()
if walks, ok := tw.pool[params]; ok {
if len(walks) != treeWalkSameEntryLimit {
t.Error("There aren't as many walks as were Set")
}
}
tw.Unlock()
for i := 0; i < treeWalkSameEntryLimit; i++ {
tw.Lock()
if walks, ok := tw.pool[params]; ok {
// Before ith Release we should have n-i treeWalk go-routines.
if treeWalkSameEntryLimit-i != len(walks) {
t.Error("There aren't as many walks as were Set")
}
}
tw.Unlock()
tw.Release(params)
}
}
} }

Loading…
Cancel
Save