-
Notifications
You must be signed in to change notification settings - Fork 122
/
pool.go
228 lines (204 loc) · 5.83 KB
/
pool.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
package pool
import (
"io"
"runtime"
"sync"
"sync/atomic"
)
// searchAlone runs f, which may return nil, until count elements are found
func searchAlone(f func() interface{}, count int) []interface{} {
results := make([]interface{}, count)
for i := 0; i < len(results); i++ {
results[i] = nil
for ; results[i] == nil; results[i] = f() {
}
}
return results
}
// parallelizeAlone calculates the result of f count times
func parallelizeAlone(f func(int) interface{}, count int) []interface{} {
results := make([]interface{}, count)
for i := 0; i < len(results); i++ {
results[i] = f(i)
}
return results
}
// command is used to trigger our latent workers to do something.
//
// The idea is that a worker is told to either calculate a function once,
// or keep calculating a function until it returns a non nil result.
type command struct {
search bool
// This counter indicates the number of results that still need to be produced.
ctr *int64
// This channel is used to signal that the counter was modified
ctrChanged chan<- struct{}
// This is the index we evaluate our function at, when not searching
i int
f func(int) interface{}
// This is the array where we put results
results []interface{}
}
// workerSearch is the subroutine called when doing a search command.
//
// We need to keep searching for successful queries of f while *ctr > 0.
// When we find a successful result, we decrement *ctr.
func workerSearch(results []interface{}, ctrChanged chan<- struct{}, f func(int) interface{}, ctr *int64) {
for atomic.LoadInt64(ctr) > 0 {
res := f(0)
if res == nil {
continue
}
i := atomic.AddInt64(ctr, -1)
if i >= 0 {
results[i] = res
}
ctrChanged <- struct{}{}
}
}
// worker starts up a new worker, listening to commands, and producing results
func worker(commands <-chan command) {
for c := range commands {
if c.search {
workerSearch(c.results, c.ctrChanged, c.f, c.ctr)
} else {
c.results[c.i] = c.f(c.i)
atomic.AddInt64(c.ctr, -1)
c.ctrChanged <- struct{}{}
}
}
}
// Pool represents a pool of workers, used for parallelizing functions.
//
// Functions needing a *Pool will work with a nil receiver, doing the equivalent
// work on the current thread instead.
//
// By creating a pool, you avoid the overhead of spinning up goroutines for
// each new operation.
//
// A Pool is only ever intended to be used from a single goroutine, and might cause deadlocks
// if used by multiple goroutines concurrently.
type Pool struct {
// The common channel used to send commands to the workers.
//
// This effectively makes a work stealing pool.
commands chan command
// This holds the number of workers we've created
workerCount int
}
// NewPool creates a new pool, with a certain number of workers.
//
// If count ⩽ 0, this will use the number of available CPUs instead.
func NewPool(count int) *Pool {
var p Pool
if count <= 0 {
count = runtime.NumCPU()
}
p.commands = make(chan command)
p.workerCount = count
for i := 0; i < count; i++ {
go worker(p.commands)
}
return &p
}
// TearDown cleanly tears down a pool, closing channels, etc.
func (p *Pool) TearDown() {
if p != nil {
close(p.commands)
}
}
// Search queries the function f, until count successes are found.
//
// f is supposed to try a single candidate, returning nil if that candidate isn't
// successful.
//
// The result will be an array containing the first count successes.
func (p *Pool) Search(count int, f func() interface{}) []interface{} {
if p == nil {
return searchAlone(f, count)
}
results := make([]interface{}, count)
ctr := int64(count)
ctrChanged := make(chan struct{})
cmd := command{
search: true,
ctr: &ctr,
ctrChanged: ctrChanged,
f: func(i int) interface{} { return f() },
results: results,
}
cmdI := 0
for cmdI < p.workerCount {
select {
case p.commands <- cmd:
cmdI++
case <-ctrChanged:
}
}
for atomic.LoadInt64(&ctr) > 0 {
<-ctrChanged
}
return results
}
// Parallelize calls a function count times, passing in indices from 0..count-1.
//
// The result will be a slice containing [f(0), f(1), ..., f(count - 1)].
func (p *Pool) Parallelize(count int, f func(int) interface{}) []interface{} {
if p == nil {
return parallelizeAlone(f, count)
}
results := make([]interface{}, count)
ctr := int64(count)
ctrChanged := make(chan struct{})
cmdI := 0
for cmdI < count {
cmd := command{
search: false,
i: cmdI,
ctr: &ctr,
ctrChanged: ctrChanged,
f: f,
results: results,
}
// We won't be able to send all the commands without blocking, so we make
// sure to interleave picking off the results of workers to free them up
// to receive our commands
select {
case p.commands <- cmd:
cmdI++
case <-ctrChanged:
}
}
for atomic.LoadInt64(&ctr) > 0 {
<-ctrChanged
}
return results
}
// LockedReader wraps an io.Reader to be safe for concurrent reads.
//
// This type implements io.Reader, returning the same output.
//
// This means acquiring a lock whenever a read happens, so be aware of that
// for performance or concurrency reasons.
type LockedReader struct {
reader io.Reader
m sync.Mutex
}
// NewLockedReader creates a LockedReader by wrapping an underlying value.
func NewLockedReader(r io.Reader) *LockedReader {
// Intentionally not initializing m, since the zero value is ok
return &LockedReader{reader: r}
}
// Read implements io.Reader for LockedReader
//
// The behavior is to return the same output as the underlying reader. The difference
// is that it's safe to call this function concurrently.
//
// Naturally, when calling this function concurrently, what value ends up getting
// read is raced, but you won't end up reading the same value twice, or otherwise
// messing up the state of the reader.
func (r *LockedReader) Read(p []byte) (int, error) {
r.m.Lock()
defer r.m.Unlock()
return r.reader.Read(p)
}