VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
package fairshare
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
"reflect"
|
|
|
|
"sync"
|
|
|
|
"testing"
|
|
|
|
"time"
|
|
|
|
)
|
|
|
|
|
|
|
|
func TestJobManager_NewJobManager(t *testing.T) {
|
|
|
|
testCases := []struct {
|
|
|
|
name string
|
|
|
|
numWorkers int
|
|
|
|
expectedNumWorkers int
|
|
|
|
}{
|
|
|
|
{
|
|
|
|
name: "",
|
|
|
|
numWorkers: 0,
|
|
|
|
expectedNumWorkers: 1,
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "",
|
|
|
|
numWorkers: 5,
|
|
|
|
expectedNumWorkers: 5,
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "",
|
|
|
|
numWorkers: 5,
|
|
|
|
expectedNumWorkers: 5,
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "",
|
|
|
|
numWorkers: 5,
|
|
|
|
expectedNumWorkers: 5,
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "",
|
|
|
|
numWorkers: 5,
|
|
|
|
expectedNumWorkers: 5,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
l := newTestLogger("jobmanager-test")
|
|
|
|
for tcNum, tc := range testCases {
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager(tc.name, tc.numWorkers, l, nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
|
|
|
|
if tc.name != "" && tc.name != j.name {
|
|
|
|
t.Errorf("tc %d: expected name %s, got %s", tcNum, tc.name, j.name)
|
|
|
|
}
|
|
|
|
if j.queues == nil {
|
|
|
|
t.Errorf("tc %d: queues not set up properly", tcNum)
|
|
|
|
}
|
|
|
|
if j.queuesIndex == nil {
|
|
|
|
t.Errorf("tc %d: queues index not set up properly", tcNum)
|
|
|
|
}
|
|
|
|
if j.quit == nil {
|
|
|
|
t.Errorf("tc %d: quit channel not set up properly", tcNum)
|
|
|
|
}
|
|
|
|
if j.workerPool.numWorkers != tc.expectedNumWorkers {
|
|
|
|
t.Errorf("tc %d: expected %d workers, got %d", tcNum, tc.expectedNumWorkers, j.workerPool.numWorkers)
|
|
|
|
}
|
|
|
|
if j.logger == nil {
|
|
|
|
t.Errorf("tc %d: logger not set up properly", tcNum)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestJobManager_Start(t *testing.T) {
|
|
|
|
numJobs := 10
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager("job-mgr-test", 3, newTestLogger("jobmanager-test"), nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
|
|
|
|
var wg sync.WaitGroup
|
|
|
|
wg.Add(numJobs)
|
|
|
|
j.Start()
|
|
|
|
defer j.Stop()
|
|
|
|
|
|
|
|
doneCh := make(chan struct{})
|
|
|
|
timeout := time.After(5 * time.Second)
|
|
|
|
go func() {
|
|
|
|
wg.Wait()
|
|
|
|
doneCh <- struct{}{}
|
|
|
|
}()
|
|
|
|
|
|
|
|
ex := func(_ string) error {
|
|
|
|
wg.Done()
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
onFail := func(_ error) {}
|
|
|
|
|
|
|
|
for i := 0; i < numJobs; i++ {
|
|
|
|
// distribute jobs between 3 queues in the job manager
|
|
|
|
job := newTestJob(t, fmt.Sprintf("test-job-%d", i), ex, onFail)
|
|
|
|
j.AddJob(&job, fmt.Sprintf("queue-%d", i%3))
|
|
|
|
}
|
|
|
|
|
|
|
|
select {
|
|
|
|
case <-doneCh:
|
|
|
|
break
|
|
|
|
case <-timeout:
|
|
|
|
t.Fatal("timed out")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestJobManager_StartAndPause(t *testing.T) {
|
|
|
|
numJobs := 10
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager("job-mgr-test", 3, newTestLogger("jobmanager-test"), nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
|
|
|
|
var wg sync.WaitGroup
|
|
|
|
wg.Add(numJobs)
|
|
|
|
j.Start()
|
|
|
|
defer j.Stop()
|
|
|
|
|
|
|
|
doneCh := make(chan struct{})
|
|
|
|
timeout := time.After(5 * time.Second)
|
|
|
|
go func() {
|
|
|
|
wg.Wait()
|
|
|
|
doneCh <- struct{}{}
|
|
|
|
}()
|
|
|
|
|
|
|
|
ex := func(_ string) error {
|
|
|
|
wg.Done()
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
onFail := func(_ error) {}
|
|
|
|
|
|
|
|
for i := 0; i < numJobs; i++ {
|
|
|
|
// distribute jobs between 3 queues in the job manager
|
|
|
|
job := newTestJob(t, fmt.Sprintf("test-job-%d", i), ex, onFail)
|
|
|
|
j.AddJob(&job, fmt.Sprintf("queue-%d", i%3))
|
|
|
|
}
|
|
|
|
|
|
|
|
select {
|
|
|
|
case <-doneCh:
|
|
|
|
break
|
|
|
|
case <-timeout:
|
|
|
|
t.Fatal("timed out")
|
|
|
|
}
|
|
|
|
|
|
|
|
// now that the work queue is empty, let's add more jobs and make sure
|
|
|
|
// we pick up where we left off
|
|
|
|
|
|
|
|
for i := 0; i < 5; i++ {
|
|
|
|
numAdditionalJobs := 5
|
|
|
|
wg.Add(numAdditionalJobs)
|
|
|
|
|
|
|
|
timeout = time.After(5 * time.Second)
|
|
|
|
go func() {
|
|
|
|
wg.Wait()
|
|
|
|
doneCh <- struct{}{}
|
|
|
|
}()
|
|
|
|
|
|
|
|
for i := numJobs; i < numJobs+numAdditionalJobs; i++ {
|
|
|
|
// distribute jobs between 3 queues in the job manager
|
|
|
|
job := newTestJob(t, fmt.Sprintf("test-job-%d", i), ex, onFail)
|
|
|
|
j.AddJob(&job, fmt.Sprintf("queue-%d", i%3))
|
|
|
|
}
|
|
|
|
|
|
|
|
select {
|
|
|
|
case <-doneCh:
|
|
|
|
break
|
|
|
|
case <-timeout:
|
|
|
|
t.Fatal("timed out")
|
|
|
|
}
|
|
|
|
|
|
|
|
numJobs += numAdditionalJobs
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestJobManager_Stop(t *testing.T) {
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager("job-mgr-test", 5, newTestLogger("jobmanager-test"), nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
|
|
|
|
j.Start()
|
|
|
|
|
|
|
|
doneCh := make(chan struct{})
|
|
|
|
timeout := time.After(5 * time.Second)
|
|
|
|
go func() {
|
|
|
|
j.Stop()
|
2021-02-25 21:33:02 +00:00
|
|
|
j.wg.Wait()
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
doneCh <- struct{}{}
|
|
|
|
}()
|
|
|
|
|
|
|
|
select {
|
|
|
|
case <-doneCh:
|
|
|
|
break
|
|
|
|
case <-timeout:
|
|
|
|
t.Fatal("timed out")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestFairshare_StopMultiple(t *testing.T) {
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager("job-mgr-test", 5, newTestLogger("jobmanager-test"), nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
|
|
|
|
j.Start()
|
|
|
|
|
|
|
|
doneCh := make(chan struct{})
|
|
|
|
timeout := time.After(5 * time.Second)
|
|
|
|
go func() {
|
|
|
|
j.Stop()
|
2021-02-25 21:33:02 +00:00
|
|
|
j.wg.Wait()
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
doneCh <- struct{}{}
|
|
|
|
}()
|
|
|
|
|
|
|
|
select {
|
|
|
|
case <-doneCh:
|
|
|
|
break
|
|
|
|
case <-timeout:
|
|
|
|
t.Fatal("timed out")
|
|
|
|
}
|
|
|
|
|
|
|
|
// essentially, we don't want to panic here
|
|
|
|
var r interface{}
|
|
|
|
go func() {
|
|
|
|
t.Helper()
|
|
|
|
|
|
|
|
defer func() {
|
|
|
|
r = recover()
|
|
|
|
doneCh <- struct{}{}
|
|
|
|
}()
|
|
|
|
|
|
|
|
j.Stop()
|
2021-02-25 21:33:02 +00:00
|
|
|
j.wg.Wait()
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
}()
|
|
|
|
|
|
|
|
select {
|
|
|
|
case <-doneCh:
|
|
|
|
break
|
|
|
|
case <-timeout:
|
|
|
|
t.Fatal("timed out")
|
|
|
|
}
|
|
|
|
|
|
|
|
if r != nil {
|
|
|
|
t.Fatalf("panic during second stop: %v", r)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestJobManager_AddJob(t *testing.T) {
|
|
|
|
testCases := []struct {
|
|
|
|
name string
|
|
|
|
queueID string
|
|
|
|
}{
|
|
|
|
{
|
|
|
|
name: "test1",
|
|
|
|
queueID: "q1",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "test2",
|
|
|
|
queueID: "q1",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "test3",
|
|
|
|
queueID: "q1",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "test4",
|
|
|
|
queueID: "q2",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "test5",
|
|
|
|
queueID: "q3",
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager("job-mgr-test", 3, newTestLogger("jobmanager-test"), nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
|
|
|
|
expectedCount := make(map[string]int)
|
|
|
|
for _, tc := range testCases {
|
|
|
|
if _, ok := expectedCount[tc.queueID]; !ok {
|
|
|
|
expectedCount[tc.queueID] = 1
|
|
|
|
} else {
|
|
|
|
expectedCount[tc.queueID]++
|
|
|
|
}
|
|
|
|
|
|
|
|
job := newDefaultTestJob(t, tc.name)
|
|
|
|
j.AddJob(&job, tc.queueID)
|
|
|
|
}
|
|
|
|
|
|
|
|
if len(expectedCount) != len(j.queues) {
|
|
|
|
t.Fatalf("expected %d queues, got %d", len(expectedCount), len(j.queues))
|
|
|
|
}
|
|
|
|
|
|
|
|
for k, v := range j.queues {
|
|
|
|
if v.Len() != expectedCount[k] {
|
|
|
|
t.Fatalf("queue %s has bad count. expected %d, got %d", k, expectedCount[k], v.Len())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestJobManager_GetPendingJobCount(t *testing.T) {
|
|
|
|
numJobs := 15
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager("test-job-mgr", 3, newTestLogger("jobmanager-test"), nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
|
|
|
|
for i := 0; i < numJobs; i++ {
|
|
|
|
job := newDefaultTestJob(t, fmt.Sprintf("job-%d", i))
|
|
|
|
j.AddJob(&job, fmt.Sprintf("queue-%d", i%4))
|
|
|
|
}
|
|
|
|
|
|
|
|
pendingJobs := j.GetPendingJobCount()
|
|
|
|
if pendingJobs != numJobs {
|
|
|
|
t.Errorf("expected %d jobs, got %d", numJobs, pendingJobs)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestJobManager_GetWorkQueueLengths(t *testing.T) {
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager("test-job-mgr", 3, newTestLogger("jobmanager-test"), nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
|
|
|
|
expected := make(map[string]int)
|
|
|
|
for i := 0; i < 25; i++ {
|
|
|
|
queueID := fmt.Sprintf("queue-%d", i%4)
|
|
|
|
job := newDefaultTestJob(t, fmt.Sprintf("job-%d", i))
|
|
|
|
|
|
|
|
j.AddJob(&job, queueID)
|
|
|
|
|
|
|
|
if _, ok := expected[queueID]; !ok {
|
2021-06-25 20:06:49 +00:00
|
|
|
expected[queueID] = 0
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
}
|
2021-06-25 20:06:49 +00:00
|
|
|
|
|
|
|
expected[queueID]++
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
pendingJobs := j.GetWorkQueueLengths()
|
|
|
|
if !reflect.DeepEqual(pendingJobs, expected) {
|
|
|
|
t.Errorf("expected %v job count, got %v", expected, pendingJobs)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestJobManager_removeLastQueueAccessed(t *testing.T) {
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager("job-mgr-test", 1, newTestLogger("jobmanager-test"), nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
|
|
|
|
testCases := []struct {
|
|
|
|
lastQueueAccessed int
|
|
|
|
updatedLastQueueAccessed int
|
|
|
|
len int
|
|
|
|
expectedQueues []string
|
|
|
|
}{
|
|
|
|
{
|
|
|
|
// remove with bad index (too low)
|
|
|
|
lastQueueAccessed: -1,
|
|
|
|
updatedLastQueueAccessed: -1,
|
|
|
|
len: 3,
|
|
|
|
expectedQueues: []string{"queue-0", "queue-1", "queue-2"},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
// remove with bad index (too high)
|
|
|
|
lastQueueAccessed: 3,
|
|
|
|
updatedLastQueueAccessed: 3,
|
|
|
|
len: 3,
|
|
|
|
expectedQueues: []string{"queue-0", "queue-1", "queue-2"},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
// remove queue-1 (index 1)
|
|
|
|
lastQueueAccessed: 1,
|
|
|
|
updatedLastQueueAccessed: 0,
|
|
|
|
len: 2,
|
|
|
|
expectedQueues: []string{"queue-0", "queue-2"},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
// remove queue-0 (index 0)
|
|
|
|
lastQueueAccessed: 0,
|
|
|
|
updatedLastQueueAccessed: 0,
|
|
|
|
len: 1,
|
|
|
|
expectedQueues: []string{"queue-2"},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
// remove queue-1 (index 1)
|
|
|
|
lastQueueAccessed: 0,
|
|
|
|
updatedLastQueueAccessed: -1,
|
|
|
|
len: 0,
|
|
|
|
expectedQueues: []string{},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
j.l.Lock()
|
|
|
|
defer j.l.Unlock()
|
2021-06-25 20:06:49 +00:00
|
|
|
|
|
|
|
j.addQueue("queue-0")
|
|
|
|
j.addQueue("queue-1")
|
|
|
|
j.addQueue("queue-2")
|
|
|
|
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
for _, tc := range testCases {
|
|
|
|
j.lastQueueAccessed = tc.lastQueueAccessed
|
|
|
|
j.removeLastQueueAccessed()
|
|
|
|
|
|
|
|
if j.lastQueueAccessed != tc.updatedLastQueueAccessed {
|
|
|
|
t.Errorf("last queue access update failed. expected %d, got %d", tc.updatedLastQueueAccessed, j.lastQueueAccessed)
|
|
|
|
}
|
|
|
|
if len(j.queuesIndex) != tc.len {
|
|
|
|
t.Fatalf("queue index update failed. expected %d elements, found %v", tc.len, j.queues)
|
|
|
|
}
|
|
|
|
if len(j.queues) != len(tc.expectedQueues) {
|
|
|
|
t.Fatalf("bad amount of queues. expected %d, found %v", len(tc.expectedQueues), j.queues)
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, q := range tc.expectedQueues {
|
|
|
|
if _, ok := j.queues[q]; !ok {
|
|
|
|
t.Errorf("bad queue. expected %s in %v", q, j.queues)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-25 20:06:49 +00:00
|
|
|
func TestJobManager_EndToEnd(t *testing.T) {
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
testCases := []struct {
|
|
|
|
name string
|
|
|
|
queueID string
|
|
|
|
}{
|
|
|
|
{
|
|
|
|
name: "job-1",
|
|
|
|
queueID: "queue-1",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "job-2",
|
|
|
|
queueID: "queue-2",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "job-3",
|
|
|
|
queueID: "queue-1",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "job-4",
|
|
|
|
queueID: "queue-3",
|
|
|
|
},
|
|
|
|
{
|
|
|
|
name: "job-5",
|
|
|
|
queueID: "queue-3",
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
// we add the jobs before starting the workers, so we'd expect the round
|
|
|
|
// robin to pick the least-recently-added job from each queue, and cycle
|
|
|
|
// through queues in a round-robin fashion. jobs would appear on the queues
|
|
|
|
// as illustrated below, and we expect to round robin as:
|
|
|
|
// queue-1 -> queue-2 -> queue-3 -> queue-1 ...
|
|
|
|
//
|
|
|
|
// queue-1 [job-3, job-1]
|
|
|
|
// queue-2 [job-2]
|
|
|
|
// queue-3 [job-5, job-4]
|
|
|
|
|
|
|
|
// ... where jobs are pushed to the left side and popped from the right side
|
|
|
|
|
|
|
|
expectedOrder := []string{"job-1", "job-2", "job-4", "job-3", "job-5"}
|
|
|
|
|
|
|
|
resultsCh := make(chan string)
|
|
|
|
defer close(resultsCh)
|
|
|
|
|
|
|
|
var mu sync.Mutex
|
|
|
|
order := make([]string, 0)
|
|
|
|
|
|
|
|
go func() {
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case res, ok := <-resultsCh:
|
|
|
|
if !ok {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
mu.Lock()
|
|
|
|
order = append(order, res)
|
|
|
|
mu.Unlock()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
|
|
|
|
var wg sync.WaitGroup
|
|
|
|
ex := func(name string) error {
|
|
|
|
resultsCh <- name
|
|
|
|
time.Sleep(50 * time.Millisecond)
|
|
|
|
wg.Done()
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
onFail := func(_ error) {}
|
|
|
|
|
2021-06-25 20:06:49 +00:00
|
|
|
// use one worker to guarantee ordering
|
|
|
|
j := NewJobManager("test-job-mgr", 1, newTestLogger("jobmanager-test"), nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
for _, tc := range testCases {
|
|
|
|
wg.Add(1)
|
|
|
|
job := newTestJob(t, tc.name, ex, onFail)
|
|
|
|
j.AddJob(&job, tc.queueID)
|
|
|
|
}
|
|
|
|
|
|
|
|
j.Start()
|
|
|
|
defer j.Stop()
|
|
|
|
|
2021-06-25 20:06:49 +00:00
|
|
|
doneCh := make(chan struct{})
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
go func() {
|
|
|
|
wg.Wait()
|
|
|
|
doneCh <- struct{}{}
|
|
|
|
}()
|
|
|
|
|
2021-06-25 20:06:49 +00:00
|
|
|
timeout := time.After(5 * time.Second)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
select {
|
|
|
|
case <-doneCh:
|
|
|
|
break
|
|
|
|
case <-timeout:
|
|
|
|
t.Fatal("timed out")
|
|
|
|
}
|
|
|
|
|
|
|
|
mu.Lock()
|
|
|
|
defer mu.Unlock()
|
|
|
|
if !reflect.DeepEqual(order, expectedOrder) {
|
|
|
|
t.Fatalf("results out of order. \nexpected: %v\ngot: %v", expectedOrder, order)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-25 20:06:49 +00:00
|
|
|
func TestFairshare_StressTest(t *testing.T) {
|
|
|
|
var wg sync.WaitGroup
|
|
|
|
ex := func(name string) error {
|
|
|
|
wg.Done()
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
onFail := func(_ error) {}
|
|
|
|
|
|
|
|
j := NewJobManager("test-job-mgr", 15, nil, nil)
|
|
|
|
j.Start()
|
|
|
|
defer j.Stop()
|
|
|
|
|
|
|
|
for i := 0; i < 3000; i++ {
|
|
|
|
wg.Add(1)
|
|
|
|
job := newTestJob(t, fmt.Sprintf("a-job-%d", i), ex, onFail)
|
|
|
|
j.AddJob(&job, "a")
|
|
|
|
}
|
|
|
|
for i := 0; i < 4000; i++ {
|
|
|
|
wg.Add(1)
|
|
|
|
job := newTestJob(t, fmt.Sprintf("b-job-%d", i), ex, onFail)
|
|
|
|
j.AddJob(&job, "b")
|
|
|
|
}
|
|
|
|
for i := 0; i < 3000; i++ {
|
|
|
|
wg.Add(1)
|
|
|
|
job := newTestJob(t, fmt.Sprintf("c-job-%d", i), ex, onFail)
|
|
|
|
j.AddJob(&job, "c")
|
|
|
|
}
|
|
|
|
|
|
|
|
doneCh := make(chan struct{})
|
|
|
|
go func() {
|
|
|
|
wg.Wait()
|
|
|
|
doneCh <- struct{}{}
|
|
|
|
}()
|
|
|
|
|
|
|
|
timeout := time.After(5 * time.Second)
|
|
|
|
select {
|
|
|
|
case <-doneCh:
|
|
|
|
break
|
|
|
|
case <-timeout:
|
|
|
|
t.Fatal("timed out")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
func TestFairshare_nilLoggerJobManager(t *testing.T) {
|
2021-02-27 00:00:39 +00:00
|
|
|
j := NewJobManager("test-job-mgr", 1, nil, nil)
|
VAULT-1401 and 1402 - preliminary fair sharing (#1701) (#10917)
* basic pool and start testing
* refactor a bit for testing
* workFunc, start/stop safety, testing
* cleanup function for worker quit, more tests
* redo public/private members
* improve tests, export types, switch uuid package
* fix loop capture bug, cleanup
* cleanup tests
* update worker pool file name, other improvements
* add job manager prototype
* remove remnants
* add functions to wait for job manager and worker pool to stop, other fixes
* test job manager functionality, fix bugs
* encapsulate how jobs are distributed to workers
* make worker job channel read only
* add job interface, more testing, fixes
* set name for dispatcher
* fix test races
* dispatcher and job manager constructors don't return errors
* logger now dependency injected
* make some members private, test fcn to get worker pool size
* make GetNumWorkers public
* Update helper/fairshare/jobmanager_test.go
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
* make workerpool private
* remove custom worker names
* concurrency improvements
* remove worker pool cleanup function
* remove cleanup func from job manager, remove non blocking stop from fairshare
* stop fairshare when started in tests
* stop leaking job manager goroutine
* prototype channel for waking up to assign work
* fix typo/bug and add tests
* improve job manager wake up, fix test typo
* put channel drain back
* better start/pause test for job manager
* go mod vendor
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
Co-authored-by: Brian Kassouf <briankassouf@users.noreply.github.com>
2021-02-12 21:51:52 +00:00
|
|
|
if j.logger == nil {
|
|
|
|
t.Error("logger not set up properly")
|
|
|
|
}
|
|
|
|
}
|
2021-06-25 20:06:49 +00:00
|
|
|
|
|
|
|
func TestFairshare_getNextQueue(t *testing.T) {
|
|
|
|
j := NewJobManager("test-job-mgr", 18, nil, nil)
|
|
|
|
|
|
|
|
for i := 0; i < 10; i++ {
|
|
|
|
job := newDefaultTestJob(t, fmt.Sprintf("job-%d", i))
|
|
|
|
j.AddJob(&job, "a")
|
|
|
|
j.AddJob(&job, "b")
|
|
|
|
j.AddJob(&job, "c")
|
|
|
|
}
|
|
|
|
|
|
|
|
j.l.Lock()
|
|
|
|
defer j.l.Unlock()
|
|
|
|
|
|
|
|
// fake out some number of workers with various remaining work scenario
|
|
|
|
// no queue can be assigned more than 6 workers
|
|
|
|
j.workerCount["a"] = 1
|
|
|
|
j.workerCount["b"] = 2
|
|
|
|
j.workerCount["c"] = 5
|
|
|
|
|
|
|
|
expectedOrder := []string{"a", "b", "c", "a", "b", "a", "b", "a", "b", "a"}
|
|
|
|
|
|
|
|
for _, expectedQueueID := range expectedOrder {
|
|
|
|
queueID, canAssignWorker := j.getNextQueue()
|
|
|
|
|
|
|
|
if !canAssignWorker {
|
|
|
|
t.Fatalf("expected have work true, got false for queue %q", queueID)
|
|
|
|
}
|
|
|
|
if queueID != expectedQueueID {
|
|
|
|
t.Errorf("expected queueID %q, got %q", expectedQueueID, queueID)
|
|
|
|
}
|
|
|
|
|
|
|
|
// simulate a worker being added to that queue
|
|
|
|
j.workerCount[queueID]++
|
|
|
|
}
|
|
|
|
|
|
|
|
// queues are saturated with work, we shouldn't be able to find a queue
|
|
|
|
// eligible for a worker (and last accessed queue shouldn't update)
|
|
|
|
expectedLastQueueAccessed := j.lastQueueAccessed
|
|
|
|
queueID, canAssignWork := j.getNextQueue()
|
|
|
|
if canAssignWork {
|
|
|
|
t.Error("should not be able to assign work with all queues saturated")
|
|
|
|
}
|
|
|
|
if queueID != "" {
|
|
|
|
t.Errorf("expected no queueID, got %s", queueID)
|
|
|
|
}
|
|
|
|
if j.lastQueueAccessed != expectedLastQueueAccessed {
|
|
|
|
t.Errorf("expected no last queue accessed update. had %d, got %d", expectedLastQueueAccessed, j.lastQueueAccessed)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestJobManager_pruneEmptyQueues(t *testing.T) {
|
|
|
|
j := NewJobManager("test-job-mgr", 18, nil, nil)
|
|
|
|
|
|
|
|
// add a few jobs to test out queue pruning
|
|
|
|
// for test simplicity, we'll keep the number of workers per queue at 0
|
|
|
|
testJob := newDefaultTestJob(t, "job-0")
|
|
|
|
j.AddJob(&testJob, "a")
|
|
|
|
j.AddJob(&testJob, "a")
|
|
|
|
j.AddJob(&testJob, "b")
|
|
|
|
|
|
|
|
job, queueID := j.getNextJob()
|
|
|
|
if queueID != "a" || job == nil {
|
|
|
|
t.Fatalf("bad next job: queueID %s, job: %#v", queueID, job)
|
|
|
|
}
|
|
|
|
|
|
|
|
j.l.RLock()
|
|
|
|
if _, ok := j.queues["a"]; !ok {
|
|
|
|
t.Error("expected queue 'a' to exist")
|
|
|
|
}
|
|
|
|
if _, ok := j.queues["b"]; !ok {
|
|
|
|
t.Error("expected queue 'b' to exist")
|
|
|
|
}
|
|
|
|
j.l.RUnlock()
|
|
|
|
|
|
|
|
job, queueID = j.getNextJob()
|
|
|
|
if queueID != "b" || job == nil {
|
|
|
|
t.Fatalf("bad next job: queueID %s, job: %#v", queueID, job)
|
|
|
|
}
|
|
|
|
|
|
|
|
j.l.RLock()
|
|
|
|
if _, ok := j.queues["a"]; !ok {
|
|
|
|
t.Error("expected queue 'a' to exist")
|
|
|
|
}
|
|
|
|
if _, ok := j.queues["b"]; ok {
|
|
|
|
t.Error("expected queue 'b' to be pruned")
|
|
|
|
}
|
|
|
|
j.l.RUnlock()
|
|
|
|
|
|
|
|
job, queueID = j.getNextJob()
|
|
|
|
if queueID != "a" || job == nil {
|
|
|
|
t.Fatalf("bad next job: queueID %s, job: %#v", queueID, job)
|
|
|
|
}
|
|
|
|
|
|
|
|
j.l.RLock()
|
|
|
|
if _, ok := j.queues["a"]; ok {
|
|
|
|
t.Error("expected queue 'a' to be pruned")
|
|
|
|
}
|
|
|
|
if _, ok := j.queues["b"]; ok {
|
|
|
|
t.Error("expected queue 'b' to be pruned")
|
|
|
|
}
|
|
|
|
j.l.RUnlock()
|
|
|
|
|
|
|
|
job, queueID = j.getNextJob()
|
|
|
|
if job != nil {
|
|
|
|
t.Errorf("expected no more jobs (out of queues). queueID: %s, job: %#v", queueID, job)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestFairshare_WorkerCount_IncrementAndDecrement(t *testing.T) {
|
|
|
|
j := NewJobManager("test-job-mgr", 18, nil, nil)
|
|
|
|
|
|
|
|
job := newDefaultTestJob(t, "job-0")
|
|
|
|
j.AddJob(&job, "a")
|
|
|
|
j.AddJob(&job, "b")
|
|
|
|
j.AddJob(&job, "c")
|
|
|
|
|
|
|
|
// test to make sure increment works
|
|
|
|
j.incrementWorkerCount("a")
|
|
|
|
workerCounts := j.GetWorkerCounts()
|
|
|
|
if workerCounts["a"] != 1 {
|
|
|
|
t.Fatalf("expected 1 worker on 'a', got %d", workerCounts["a"])
|
|
|
|
}
|
|
|
|
if workerCounts["b"] != 0 {
|
|
|
|
t.Fatalf("expected 0 workers on 'b', got %d", workerCounts["b"])
|
|
|
|
}
|
|
|
|
if workerCounts["c"] != 0 {
|
|
|
|
t.Fatalf("expected 0 workers on 'c', got %d", workerCounts["c"])
|
|
|
|
}
|
|
|
|
|
|
|
|
// test to make sure decrement works (when there is still work for the queue)
|
|
|
|
j.decrementWorkerCount("a")
|
|
|
|
workerCounts = j.GetWorkerCounts()
|
|
|
|
if workerCounts["a"] != 0 {
|
|
|
|
t.Fatalf("expected 0 workers on 'a', got %d", workerCounts["a"])
|
|
|
|
}
|
|
|
|
|
|
|
|
// add a worker to queue "a" and remove all work to ensure worker count gets
|
|
|
|
// cleared out for "a"
|
|
|
|
j.incrementWorkerCount("a")
|
|
|
|
j.l.Lock()
|
|
|
|
delete(j.queues, "a")
|
|
|
|
j.l.Unlock()
|
|
|
|
|
|
|
|
j.decrementWorkerCount("a")
|
|
|
|
workerCounts = j.GetWorkerCounts()
|
|
|
|
if _, ok := workerCounts["a"]; ok {
|
|
|
|
t.Fatalf("expected no worker count for 'a', got %#v", workerCounts)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestFairshare_queueWorkersSaturated(t *testing.T) {
|
|
|
|
j := NewJobManager("test-job-mgr", 20, nil, nil)
|
|
|
|
|
|
|
|
job := newDefaultTestJob(t, "job-0")
|
|
|
|
j.AddJob(&job, "a")
|
|
|
|
j.AddJob(&job, "b")
|
|
|
|
|
|
|
|
// no more than 9 workers can be assigned to a single queue in this example
|
|
|
|
for i := 0; i < 8; i++ {
|
|
|
|
j.incrementWorkerCount("a")
|
|
|
|
j.incrementWorkerCount("b")
|
|
|
|
|
|
|
|
j.l.RLock()
|
|
|
|
if j.queueWorkersSaturated("a") {
|
|
|
|
j.l.RUnlock()
|
|
|
|
t.Fatalf("queue 'a' falsely saturated: %#v", j.GetWorkerCounts())
|
|
|
|
}
|
|
|
|
if j.queueWorkersSaturated("b") {
|
|
|
|
j.l.RUnlock()
|
|
|
|
t.Fatalf("queue 'b' falsely saturated: %#v", j.GetWorkerCounts())
|
|
|
|
}
|
|
|
|
j.l.RUnlock()
|
|
|
|
}
|
|
|
|
|
|
|
|
// adding the 9th and 10th workers should saturate the number of workers we
|
|
|
|
// can have per queue
|
|
|
|
for i := 8; i < 10; i++ {
|
|
|
|
j.incrementWorkerCount("a")
|
|
|
|
j.incrementWorkerCount("b")
|
|
|
|
|
|
|
|
j.l.RLock()
|
|
|
|
if !j.queueWorkersSaturated("a") {
|
|
|
|
j.l.RUnlock()
|
|
|
|
t.Fatalf("queue 'a' falsely unsaturated: %#v", j.GetWorkerCounts())
|
|
|
|
}
|
|
|
|
if !j.queueWorkersSaturated("b") {
|
|
|
|
j.l.RUnlock()
|
|
|
|
t.Fatalf("queue 'b' falsely unsaturated: %#v", j.GetWorkerCounts())
|
|
|
|
}
|
|
|
|
j.l.RUnlock()
|
|
|
|
}
|
|
|
|
}
|