initial working release
commit 6482410063
11 changed files with 556 additions and 0 deletions

README.md (new file, 29 lines added)
@@ -0,0 +1,29 @@
# gtq - the go task queue

## what?

a simple goroutine scheduler for longer-running goroutines, allowing you
to put them into priority buckets, and get roughly fair queuing of which
tasks will be processed next.

## why?

goroutines are awesome, and typically super fast. but what if you need to
queue up a lot of longer-running work in the background? and what if you
want some control over which chunks of work get executed next?

gtq provides simple task queuing and scheduling for longer-running goroutines.
in this case, "long" means on the order of 1ms or more, since many simple
goroutines finish in a matter of ns.

## how?

We use simple ring-buffer-backed FIFO queues for each priority level, and
track task completion statistics in a rolling window for each of them. A
scheduler then looks at those statistics, in relation to each queue's
priority level, and decides which queue to pull from next to feed the task
runners.

Overhead for this process is typically < 1000ns, so it's not suitable for
typical short-lived goroutines, but that kind of goroutine doesn't really
need scheduling anyway.

## usage

TODO
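The usage section above is still marked TODO; the following is a minimal sketch of driving the API added in this commit, inferred from taskqueue.go and its tests rather than from any documented example. The polling drain at the end mirrors what BenchmarkTaskQueue does; it is an assumption, not an official shutdown pattern.

package main

import (
	"fmt"
	"time"

	"github.com/nergdron/gtq"
)

func main() {
	// 0 workers means "use runtime.GOMAXPROCS(0)".
	tq := gtq.NewTaskQueue(0)

	// queue some work at two priority levels; higher numbers are intended
	// to receive more processing time.
	for i := 0; i < 100; i++ {
		n := i
		tq.Add(func() {
			fmt.Println("low-priority task", n)
			time.Sleep(time.Millisecond)
		}, 1)
		tq.Add(func() {
			fmt.Println("high-priority task", n)
			time.Sleep(time.Millisecond)
		}, 2)
	}

	tq.Start(nil) // nil selects the built-in SimpleScheduler.

	// crude drain: poll until the priority queues are empty, as the
	// benchmark does, then pause the scheduler.
	for tq.Length() > 0 {
		time.Sleep(10 * time.Millisecond)
	}
	tq.Stop()
}

Passing nil to Start selects the built-in SimpleScheduler; a custom Scheduler function can be passed instead.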

go.mod (new file, 8 lines added)
@@ -0,0 +1,8 @@
module github.com/nergdron/gtq

go 1.12

require (
	gopkg.in/eapache/queue.v1 v1.1.0
	gopkg.in/yaml.v2 v2.2.2
)

go.sum (new file, 5 lines added)
@@ -0,0 +1,5 @@
gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405/go.mod h1:Co6ibVJAznAaIkqp8huTwlJQCZ016jof/cbN4VW5Yz0=
gopkg.in/eapache/queue.v1 v1.1.0 h1:EldqoJEGtXYiVCMRo2C9mePO2UUGnYn2+qLmlQSqPdc=
gopkg.in/eapache/queue.v1 v1.1.0/go.mod h1:wNtmx1/O7kZSR9zNT1TTOJ7GLpm3Vn7srzlfylFbQwU=
gopkg.in/yaml.v2 v2.2.2 h1:ZCJp+EgiOT7lHqUV2J862kp8Qj64Jo6az82+3Td9dZw=
gopkg.in/yaml.v2 v2.2.2/go.mod h1:hI93XBmqTisBFMUTm0b8Fm+jr3Dg1NNxqwp+5A1VGuI=

queue.go (new file, 71 lines added)
@@ -0,0 +1,71 @@
package gtq

import (
	"gopkg.in/eapache/queue.v1"
	"sync"
)

// NewQueue initializes and returns a new Queue.
func NewQueue() (q *Queue) {
	return &Queue{
		queue: queue.New(),
		Done:  NewStat(0),
	}
}

// Queue wraps eapache/queue with locking for thread safety. It also bundles in
// a Stat, used by schedulers to help pick which tasks to execute next.
type Queue struct {
	queue *queue.Queue
	mutex sync.Mutex
	// Done tracks the task removal rate from the queue.
	Done *Stat
}

// Add puts an element on the end of the queue.
func (q *Queue) Add(task func()) {
	q.mutex.Lock()
	defer q.mutex.Unlock()
	q.queue.Add(task)
}

// Get returns the element at index i in the queue.
// This method accepts both positive and negative index values.
// Index 0 refers to the first element, and index -1 refers to the last.
// Out-of-range indexes return nil.
func (q *Queue) Get(i int) (task func()) {
	q.mutex.Lock()
	defer q.mutex.Unlock()
	length := q.queue.Length()
	if length < 1 || i > length-1 || i < -length {
		return nil
	}
	return q.queue.Get(i).(func())
}

// Length returns the number of elements currently stored in the queue.
func (q *Queue) Length() int {
	q.mutex.Lock()
	defer q.mutex.Unlock()
	return q.queue.Length()
}

// Peek returns the element at the head of the queue, or nil if the queue is
// empty.
func (q *Queue) Peek() (task func()) {
	q.mutex.Lock()
	defer q.mutex.Unlock()
	if q.queue.Length() < 1 {
		return nil
	}
	return q.queue.Peek().(func())
}

// Remove removes and returns the element from the front of the queue, or nil
// if the queue is empty.
func (q *Queue) Remove() (task func()) {
	q.mutex.Lock()
	defer q.mutex.Unlock()
	if q.queue.Length() < 1 {
		return nil
	}
	task = q.queue.Remove().(func())
	q.Done.Add(1)
	return task
}
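Queue can also be used on its own as a thread-safe FIFO of func() tasks. A small hypothetical sketch of that (not part of this commit), showing how Peek, Remove, and the bundled Done stat interact:

package main

import (
	"fmt"

	"github.com/nergdron/gtq"
)

func main() {
	q := gtq.NewQueue()
	q.Add(func() { fmt.Println("first") })
	q.Add(func() { fmt.Println("second") })

	// Peek inspects the head of the queue without removing it.
	if task := q.Peek(); task != nil {
		task() // prints "first"
	}

	// Remove pops tasks in FIFO order; each removal ticks the Done stat.
	for task := q.Remove(); task != nil; task = q.Remove() {
		task()
	}
	fmt.Println("removed so far:", q.Done.Total()) // 2
}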

queue_test.go (new file, 87 lines added)
@@ -0,0 +1,87 @@
package gtq

import (
	"runtime"
	"sync"
	"testing"
	"time"
)

// testQ is shared across the tests in this file; TestParallelQueueRemove
// relies on TestParallelQueueAdd having populated it first.
var testQ = NewQueue()

func testAdd(n int) {
	for i := 0; i < n; i++ {
		testQ.Add(func() {
			// sleep for 1ns: the smallest possible piece of "work".
			time.Sleep(1)
		})
	}
}

func testRemove(wg *sync.WaitGroup, removed chan int) {
	defer wg.Done()
	var i int
	for testQ.Remove() != nil {
		i++
	}
	removed <- i
}

func TestParallelQueueAdd(t *testing.T) {
	max := runtime.GOMAXPROCS(0)
	var wg sync.WaitGroup
	for n := 0; n < max; n++ {
		wg.Add(1)
		go func() {
			defer wg.Done()
			testAdd(1000000)
		}()
	}
	wg.Wait()
	t.Log("Queue size is", testQ.Length())
	targetSize := max * 1000000
	if testQ.Length() != targetSize {
		t.Error("Queue size should be", targetSize)
	}
}

func TestParallelQueueRemove(t *testing.T) {
	target := testQ.Length()
	var wg sync.WaitGroup
	max := runtime.GOMAXPROCS(0)
	removed := make(chan int, max)
	for n := 0; n < max; n++ {
		wg.Add(1)
		go testRemove(&wg, removed)
	}
	wg.Wait()
	close(removed)
	var total int
	for count := range removed {
		total += count
	}
	if total != target {
		t.Error("removed", total, "but expected", target)
	}
	t.Log("removed", total)
}

func BenchmarkParallelQueue(b *testing.B) {
	testQ = NewQueue()
	b.ResetTimer()
	max := runtime.GOMAXPROCS(0)
	var wg1, wg2 sync.WaitGroup
	removed := make(chan int, max)
	// adders and removers run concurrently; a remover exits as soon as it
	// sees an empty queue, so this measures mixed throughput rather than
	// exact counts.
	for i := 0; i < max; i++ {
		wg1.Add(1)
		wg2.Add(1)
		go func() {
			testAdd(b.N / (max * 2))
			wg1.Done()
		}()
		go func() {
			testRemove(&wg2, removed)
		}()
	}
	wg1.Wait()
	wg2.Wait()
}

scheduler.go (new file, 39 lines added)
@@ -0,0 +1,39 @@
package gtq

import (
	"sort"
)

// Scheduler is a function run by a TaskQueue's scheduling goroutine. It
// examines the Queues, chooses which tasks to run next, and pushes them onto
// the task runners' channel. It returns true if enough work was queued to
// keep the runners busy, or false if the TaskQueue should back off briefly.
type Scheduler func(tq *TaskQueue) bool

// SimpleScheduler is the simplest possible implementation: it drains every
// queue completely, highest priority first.
func SimpleScheduler(tq *TaskQueue) bool {
	pc := tq.PriorityCounts()
	// sort priorities, highest first.
	prios := make([]uint, 0, len(pc))
	for k := range pc {
		prios = append(prios, k)
	}
	sort.Sort(sort.Reverse(UIntSlice(prios)))

	var queued uint
	for _, prio := range prios {
		q, ok := tq.queues.Load(prio)
		if !ok {
			continue
		}
		for q.(*Queue).Length() > 0 {
			task := q.(*Queue).Remove()
			tq.nextTask <- task
			queued++
		}
	}
	// report whether we queued enough work to keep all the runners busy.
	return queued >= (tq.numJobs * 2)
}
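Because Scheduler is just a function type, alternative policies can be passed to TaskQueue.Start. The sketch below is hypothetical (not in this commit) and would have to live inside package gtq, since it touches the unexported queues, nextTask, and numJobs fields; it drains only the single highest non-empty priority per pass instead of everything:

package gtq

// StrictScheduler is a hypothetical alternative policy: per pass it drains
// only the highest non-empty priority queue, starving lower priorities while
// higher-priority work exists.
func StrictScheduler(tq *TaskQueue) bool {
	pc := tq.PriorityCounts()
	var best uint
	var found bool
	for prio, count := range pc {
		if count > 0 && (!found || prio > best) {
			best = prio
			found = true
		}
	}
	if !found {
		return false
	}
	q, ok := tq.queues.Load(best)
	if !ok {
		return false
	}
	var queued uint
	for q.(*Queue).Length() > 0 {
		tq.nextTask <- q.(*Queue).Remove()
		queued++
	}
	return queued >= tq.numJobs*2
}

It would be selected with tq.Start(StrictScheduler) instead of tq.Start(nil).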

stats.go (new file, 118 lines added)
@@ -0,0 +1,118 @@
package gtq

import (
	"gopkg.in/yaml.v2"
	"sync"
	"time"
)

// Counter is an incrementing statistical value, with a Start time for rate
// calculation.
type Counter struct {
	Start time.Time
	Value uint64
}

// Stat tracks a rolling count for a queue priority level, grouped into
// timeslice buckets.
type Stat struct {
	timeSlices   []Counter
	currentSlice int
	window       time.Duration
	mutex        sync.Mutex
}

// NewStat initializes and returns a new Stat. window determines the size of
// the rolling statistics timeframe that is captured, which in turn determines
// how finely grained stats collection and task scheduling can be. window
// defaults to 1 second.
func NewStat(window time.Duration) (s *Stat) {
	s = &Stat{window: window}
	if s.window == 0 {
		s.window = time.Second
	}
	// default to 10 timeslice buckets, maybe make configurable later.
	s.timeSlices = make([]Counter, 10)
	return s
}

// Add increments the current timeslice's counter by val.
func (s *Stat) Add(val uint64) {
	s.mutex.Lock()
	defer s.mutex.Unlock()
	// roll over to the next timeslice if the slice duration has been exceeded,
	// resetting the reused bucket so old values aren't double counted.
	sliceLength := s.window / time.Duration(len(s.timeSlices))
	now := time.Now()
	elapsed := now.Sub(s.timeSlices[s.currentSlice].Start)
	if elapsed > sliceLength {
		s.currentSlice = (s.currentSlice + 1) % len(s.timeSlices)
		s.timeSlices[s.currentSlice].Start = now
		s.timeSlices[s.currentSlice].Value = 0
	}
	s.timeSlices[s.currentSlice].Value += val
}

// Total returns the current rolling total for this Stat.
func (s *Stat) Total() (t uint64) {
	s.mutex.Lock()
	defer s.mutex.Unlock()
	for _, slice := range s.timeSlices {
		t += slice.Value
	}
	return t
}

// Start returns the start time of the oldest timeslice still in use, i.e. the
// start of the current statistics window.
func (s *Stat) Start() (start time.Time) {
	s.mutex.Lock()
	defer s.mutex.Unlock()
	n := len(s.timeSlices)
	// the oldest slice is the one just after the current slice, wrapping around.
	for i := 1; i <= n; i++ {
		slice := s.timeSlices[(s.currentSlice+i)%n]
		if slice.Start.After(time.Time{}) {
			return slice.Start
		}
	}
	return start
}

// Duration returns the size of the current statistics window in this Stat.
// This will fluctuate between 90-100% of the window size set when the Stat
// was created, as internal buckets roll over.
func (s *Stat) Duration() time.Duration {
	return time.Since(s.Start())
}

// Rate returns the flow rate of this counter: the current rolling total
// divided by the current statistics duration, in events per second.
func (s *Stat) Rate() (r float64) {
	return float64(s.Total()) / (float64(s.Duration()) / float64(time.Second))
}

// QueueStats is a report of formatted Stat data about a specific priority
// queue, captured at a point in time.
type QueueStats struct {
	Start    time.Time
	Duration time.Duration
	Count    uint64
	Rate     float64
}

func (qs *QueueStats) String() string {
	b, _ := yaml.Marshal(qs)
	return string(b)
}

// Stats returns the current time usage statistics for all active task
// priority levels.
func (tq *TaskQueue) Stats() (stats map[uint]*QueueStats) {
	stats = make(map[uint]*QueueStats)
	tq.mutex.Lock()
	defer tq.mutex.Unlock()
	tq.queues.Range(func(prio, q interface{}) bool {
		stat := q.(*Queue).Done
		qs := &QueueStats{
			Start:    stat.Start(),
			Duration: stat.Duration(),
			Count:    stat.Total(),
			Rate:     stat.Rate(),
		}
		stats[prio.(uint)] = qs
		return true
	})
	return stats
}
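A short hypothetical sketch of reading these counters, both for a standalone Stat and via TaskQueue.Stats(); the loop counts and sleep lengths are arbitrary:

package main

import (
	"fmt"
	"time"

	"github.com/nergdron/gtq"
)

func main() {
	// a standalone Stat with the default 1s window, split into 10 buckets.
	s := gtq.NewStat(0)
	for i := 0; i < 500; i++ {
		s.Add(1)
		time.Sleep(time.Millisecond)
	}
	fmt.Printf("%d events over %v = %.0f events/sec\n",
		s.Total(), s.Duration(), s.Rate())

	// per-priority stats for a running TaskQueue come from Stats().
	tq := gtq.NewTaskQueue(0)
	tq.Add(func() {}, 1)
	tq.Start(nil)
	time.Sleep(10 * time.Millisecond)
	for prio, qs := range tq.Stats() {
		fmt.Println("priority", prio, qs)
	}
	tq.Stop()
}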

stats_test.go (new file, 22 lines added)
@@ -0,0 +1,22 @@
package gtq

import (
	"math/rand"
	"testing"
	"time"
)

var testStat = NewStat(0)

func TestStat(t *testing.T) {
	total := int64(10000)
	perOp := int64(time.Second) / total
	for i := int64(0); i < total; i++ {
		testStat.Add(1)
		// random sleep to introduce some flow rate variation to capture.
		time.Sleep(time.Duration(rand.Float64() * float64(perOp)))
	}
	t.Log("completed", testStat.Total(), "ops in", testStat.Duration(),
		"for a total rate of", int64(testStat.Rate()), "ops/sec",
	)
}

taskqueue.go (new file, 101 lines added)
@@ -0,0 +1,101 @@
package gtq

import (
	"runtime"
	"sync"
	"time"
)

// TaskQueue manages multiple Queues with different priorities.
// Task clients request tasks to run from it, and it decides which task to
// hand out, dividing processing time roughly in proportion to the priority
// numbers. Items at priority 2 will be given twice as much processing time
// as items at priority 1, for instance.
type TaskQueue struct {
	queues sync.Map
	// task runners read off this channel, the scheduler pushes onto it.
	nextTask chan func()
	// guards running, and will also be needed when cleaning up unused
	// priorities.
	mutex   sync.Mutex
	running bool
	numJobs uint
}

// NewTaskQueue returns an initialized TaskQueue.
// numJobs specifies how many task workers you want running simultaneously;
// if 0, it defaults to runtime.GOMAXPROCS(0).
func NewTaskQueue(numJobs uint) (tq *TaskQueue) {
	if numJobs == 0 {
		numJobs = uint(runtime.GOMAXPROCS(0))
	}
	tq = &TaskQueue{
		// make sure we can buffer at least one extra job per worker.
		nextTask: make(chan func(), numJobs*2),
		numJobs:  numJobs,
	}
	return tq
}

// Add a task to the TaskQueue with a given priority.
func (tq *TaskQueue) Add(task func(), priority uint) {
	q, _ := tq.queues.LoadOrStore(priority, NewQueue())
	q.(*Queue).Add(task)
}

// Length returns the number of tasks across all priorities.
func (tq *TaskQueue) Length() (length uint) {
	tq.mutex.Lock()
	defer tq.mutex.Unlock()
	tq.queues.Range(func(_, q interface{}) bool {
		length += uint(q.(*Queue).Length())
		return true
	})
	return length
}

// PriorityCounts returns a map where the key is an active priority level,
// and the value is the number of tasks left at that priority.
func (tq *TaskQueue) PriorityCounts() (pc map[uint]int) {
	pc = make(map[uint]int)
	tq.mutex.Lock()
	defer tq.mutex.Unlock()
	tq.queues.Range(func(prio, q interface{}) bool {
		pc[prio.(uint)] = q.(*Queue).Length()
		return true
	})
	return pc
}

// Start launches the task workers and the scheduler goroutine, and begins
// processing tasks.
func (tq *TaskQueue) Start(scheduler Scheduler) {
	tq.mutex.Lock()
	tq.running = true
	tq.mutex.Unlock()
	// start workers!
	var j uint
	for j = 0; j < tq.numJobs; j++ {
		go func() {
			for job := range tq.nextTask {
				job()
			}
		}()
	}
	if scheduler == nil {
		scheduler = SimpleScheduler
	}
	go func() {
		for {
			tq.mutex.Lock()
			running := tq.running
			tq.mutex.Unlock()
			if !running {
				return
			}
			if !scheduler(tq) {
				// nothing (or not much) to schedule; back off briefly.
				time.Sleep(1 * time.Millisecond)
			}
		}
	}()
}

// Stop pauses processing of tasks. TaskQueue state is retained.
func (tq *TaskQueue) Stop() {
	tq.mutex.Lock()
	defer tq.mutex.Unlock()
	tq.running = false
}
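Length and PriorityCounts give a point-in-time view of the backlog, which is what schedulers and any monitoring code key off. A hypothetical sketch of inspecting the backlog before starting the workers (task bodies and counts are arbitrary):

package main

import (
	"fmt"
	"time"

	"github.com/nergdron/gtq"
)

func main() {
	tq := gtq.NewTaskQueue(0)
	for i := 0; i < 900; i++ {
		// spread tasks across priorities 0, 1 and 2.
		tq.Add(func() { time.Sleep(time.Millisecond) }, uint(i%3))
	}

	// snapshot the backlog before the workers start.
	fmt.Println("total queued:", tq.Length())
	for prio, n := range tq.PriorityCounts() {
		fmt.Println("priority", prio, "has", n, "tasks waiting")
	}

	tq.Start(nil)
	for tq.Length() > 0 {
		time.Sleep(10 * time.Millisecond)
	}
	tq.Stop()
}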

taskqueue_test.go (new file, 51 lines added)
@@ -0,0 +1,51 @@
package gtq

import (
	"runtime"
	"sync"
	"testing"
	"time"
)

var numTestPrios = 10
var tq *TaskQueue

func testTQAdd(n int) {
	workers := runtime.GOMAXPROCS(0)
	var wg sync.WaitGroup
	for i := 0; i < workers; i++ {
		wg.Add(1)
		go func() {
			for i := 0; i < n; i++ {
				// simplest possible task
				tq.Add(func() {
					time.Sleep(0)
				}, uint(i%numTestPrios))
			}
			wg.Done()
		}()
	}
	wg.Wait()
}

func TestTaskQueueAdd(t *testing.T) {
	tq = NewTaskQueue(0)
	testTQAdd(1000000)
	expected := 1000000 * runtime.GOMAXPROCS(0)
	added := tq.Length()
	if uint(expected) != added {
		t.Error("expected to add", expected, "but added", added)
	} else {
		t.Log("added", added)
	}
}

func BenchmarkTaskQueue(b *testing.B) {
	tq = NewTaskQueue(0)
	testTQAdd(b.N / runtime.GOMAXPROCS(0))
	tq.Start(nil)
	for tq.Length() > 0 {
		time.Sleep(10 * time.Millisecond)
	}
	tq.Stop()
}

uintslice.go (new file, 25 lines added)
@@ -0,0 +1,25 @@
package gtq

// UIntSlice wraps []uint to fulfill sort.Interface, as demonstrated
// for other types in the sort package.
type UIntSlice []uint

// Len helps fulfill sort.Interface.
func (list UIntSlice) Len() int {
	return len(list)
}

// Less helps fulfill sort.Interface. It must be a strict "less than"
// comparison for sorting to behave correctly.
func (list UIntSlice) Less(i, j int) bool {
	return list[i] < list[j]
}

// Swap helps fulfill sort.Interface.
func (list UIntSlice) Swap(i, j int) {
	list[i], list[j] = list[j], list[i]
}
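For context, this type exists only so the scheduler can sort its priority keys. A hypothetical sketch of it in use, alongside the sort.Slice form that has been available since Go 1.8 and could replace it:

package main

import (
	"fmt"
	"sort"

	"github.com/nergdron/gtq"
)

func main() {
	prios := []uint{3, 1, 2}

	// UIntSlice satisfies sort.Interface, so sort.Sort gives ascending order;
	// the scheduler wraps it in sort.Reverse to get highest-priority-first.
	sort.Sort(gtq.UIntSlice(prios))
	fmt.Println(prios) // [1 2 3]

	// equivalent since Go 1.8, without the named helper type:
	sort.Slice(prios, func(i, j int) bool { return prios[i] < prios[j] })
}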