@@ -2,43 +2,47 @@ package mfs
2
2
3
3
import (
4
4
"context"
5
+ "errors"
6
+ "sync"
5
7
"time"
6
8
7
9
cid "github.com/ipfs/go-cid"
8
10
)
9
11
12
+ // closeTimeout is how long to wait for current publishing to finish before
13
+ // shutting down the republisher.
14
+ const closeTimeout = 5 * time .Second
15
+
10
16
// PubFunc is the user-defined function that determines exactly what
11
17
// logic entails "publishing" a `Cid` value.
12
18
type PubFunc func (context.Context , cid.Cid ) error
13
19
14
20
// Republisher manages when to publish a given entry.
15
21
type Republisher struct {
16
- TimeoutLong time.Duration
17
- TimeoutShort time.Duration
18
- RetryTimeout time.Duration
19
- pubfunc PubFunc
20
-
22
+ pubfunc PubFunc
21
23
update chan cid.Cid
22
24
immediatePublish chan chan struct {}
23
25
24
- ctx context.Context
25
- cancel func ()
26
+ cancel func ()
27
+ closeOnce sync.Once
28
+ stopped chan struct {}
26
29
}
27
30
28
31
// NewRepublisher creates a new Republisher object to republish the given root
29
32
// using the given short and long time intervals.
30
- func NewRepublisher (ctx context.Context , pf PubFunc , tshort , tlong time.Duration ) * Republisher {
31
- ctx , cancel := context .WithCancel (ctx )
32
- return & Republisher {
33
- TimeoutShort : tshort ,
34
- TimeoutLong : tlong ,
35
- RetryTimeout : tlong ,
33
+ func NewRepublisher (pf PubFunc , tshort , tlong time.Duration , lastPublished cid.Cid ) * Republisher {
34
+ ctx , cancel := context .WithCancel (context .Background ())
35
+ rp := & Republisher {
36
36
update : make (chan cid.Cid , 1 ),
37
37
pubfunc : pf ,
38
38
immediatePublish : make (chan chan struct {}),
39
- ctx : ctx ,
40
39
cancel : cancel ,
40
+ stopped : make (chan struct {}),
41
41
}
42
+
43
+ go rp .run (ctx , tshort , tlong , lastPublished )
44
+
45
+ return rp
42
46
}
43
47
44
48
// WaitPub waits for the current value to be published (or returns early
@@ -58,10 +62,22 @@ func (rp *Republisher) WaitPub(ctx context.Context) error {
58
62
}
59
63
}
60
64
65
+ // Close tells the republisher to stop and waits for it to stop.
61
66
func (rp * Republisher ) Close () error {
62
- // TODO(steb): Wait for `Run` to stop
63
- err := rp .WaitPub (rp .ctx )
64
- rp .cancel ()
67
+ var err error
68
+ rp .closeOnce .Do (func () {
69
+ // Wait a short amount of time for any current publishing to finish.
70
+ ctx , cancel := context .WithTimeout (context .Background (), closeTimeout )
71
+ err = rp .WaitPub (ctx )
72
+ if errors .Is (err , context .DeadlineExceeded ) {
73
+ err = errors .New ("mfs/republisher: timed out waiting to publish during close" )
74
+ }
75
+ cancel ()
76
+ // Shutdown the publisher.
77
+ rp .cancel ()
78
+ })
79
+ // Wait for pblisher to stop and then return.
80
+ <- rp .stopped
65
81
return err
66
82
}
67
83
@@ -82,22 +98,28 @@ func (rp *Republisher) Update(c cid.Cid) {
82
98
}
83
99
84
100
// Run contains the core logic of the `Republisher`. It calls the user-defined
85
- // `pubfunc` function whenever the `Cid` value is updated to a *new* value. The
86
- // complexity comes from the fact that `pubfunc` may be slow so we need to batch
87
- // updates.
101
+ // `pubfunc` function whenever the `Cid` value is updated to a *new* value.
102
+ // Since calling the `pubfunc` may be slow, updates are batched
88
103
//
89
104
// Algorithm:
90
- // 1. When we receive the first update after publishing, we set a `longer` timer.
91
- // 2. When we receive any update, we reset the `quick` timer.
92
- // 3. If either the `quick` timeout or the `longer` timeout elapses,
93
- // we call `publish` with the latest updated value.
105
+ // 1. When receiving the first update after publishing, set a `longer` timer
106
+ // 2. When receiving any update, reset the `quick` timer
107
+ // 3. If either the `quick` timeout or the `longer` timeout elapses, call
108
+ // `publish` with the latest updated value.
109
+ //
110
+ // The `longer` timer ensures that publishing is delayed by at most that
111
+ // duration. The `quick` timer allows publishing sooner if there are no more
112
+ // updates available.
94
113
//
95
- // The `longer` timer ensures that we delay publishing by at most
96
- // `TimeoutLong`. The `quick` timer allows us to publish sooner if
97
- // it looks like there are no more updates coming down the pipe.
114
+ // In other words, the quick timeout means there are no more values to put into
115
+ // the "batch", so do update. The long timeout means there are that the "batch"
116
+ // is full, so do update, even though there are still values (no quick timeout
117
+ // yet) arriving.
98
118
//
99
- // Note: If a publish fails, we retry repeatedly every TimeoutRetry.
100
- func (rp * Republisher ) Run (lastPublished cid.Cid ) {
119
+ // If a publish fails, retry repeatedly every `longer` timeout.
120
+ func (rp * Republisher ) run (ctx context.Context , timeoutShort , timeoutLong time.Duration , lastPublished cid.Cid ) {
121
+ defer close (rp .stopped )
122
+
101
123
quick := time .NewTimer (0 )
102
124
if ! quick .Stop () {
103
125
<- quick .C
@@ -107,12 +129,13 @@ func (rp *Republisher) Run(lastPublished cid.Cid) {
107
129
<- longer .C
108
130
}
109
131
132
+ immediatePublish := rp .immediatePublish
110
133
var toPublish cid.Cid
111
- for rp .ctx .Err () == nil {
112
- var waiter chan struct {}
134
+ var waiter chan struct {}
113
135
136
+ for {
114
137
select {
115
- case <- rp . ctx .Done ():
138
+ case <- ctx .Done ():
116
139
return
117
140
case newValue := <- rp .update :
118
141
// Skip already published values.
@@ -123,19 +146,20 @@ func (rp *Republisher) Run(lastPublished cid.Cid) {
123
146
break
124
147
}
125
148
126
- // If we aren't already waiting to publish something,
127
- // reset the long timeout.
149
+ // If not already waiting to publish something, reset the long
150
+ // timeout.
128
151
if ! toPublish .Defined () {
129
- longer .Reset (rp . TimeoutLong )
152
+ longer .Reset (timeoutLong )
130
153
}
131
154
132
155
// Always reset the short timeout.
133
- quick .Reset (rp . TimeoutShort )
156
+ quick .Reset (timeoutShort )
134
157
135
158
// Finally, set the new value to publish.
136
159
toPublish = newValue
160
+ // Wait for a newer value or the quick timer.
137
161
continue
138
- case waiter = <- rp . immediatePublish :
162
+ case waiter = <- immediatePublish :
139
163
// Make sure to grab the *latest* value to publish.
140
164
select {
141
165
case toPublish = <- rp .update :
@@ -147,60 +171,62 @@ func (rp *Republisher) Run(lastPublished cid.Cid) {
147
171
toPublish = cid .Undef
148
172
}
149
173
case <- quick .C :
174
+ // Waited a short time for more updates and no more received.
150
175
case <- longer .C :
176
+ // Keep getting updates and now it is time to send what has been
177
+ // received so far.
151
178
}
152
179
153
180
// Cleanup, publish, and close waiters.
154
181
155
- // 1. Stop any timers. Don't use the `if !t.Stop() { ... }`
156
- // idiom as these timers may not be running.
157
-
182
+ // 1. Stop any timers.
158
183
quick .Stop ()
184
+ longer .Stop ()
185
+
186
+ // Do not use the `if !t.Stop() { ... }` idiom as these timers may not
187
+ // be running.
188
+ //
189
+ // TODO: remove after go1.23 required.
159
190
select {
160
191
case <- quick .C :
161
192
default :
162
193
}
163
-
164
- longer .Stop ()
165
194
select {
166
195
case <- longer .C :
167
196
default :
168
197
}
169
198
170
- // 2. If we have a value to publish, publish it now.
199
+ // 2. If there is a value to publish then publish it now.
171
200
if toPublish .Defined () {
172
- var timer * time.Timer
173
- for {
174
- err := rp .pubfunc (rp .ctx , toPublish )
175
- if err == nil {
176
- break
177
- }
178
-
179
- if timer == nil {
180
- timer = time .NewTimer (rp .RetryTimeout )
181
- defer timer .Stop ()
182
- } else {
183
- timer .Reset (rp .RetryTimeout )
184
- }
185
-
186
- // Keep retrying until we succeed or we abort.
187
- // TODO(steb): We could try pulling new values
188
- // off `update` but that's not critical (and
189
- // complicates this code a bit). We'll pull off
190
- // a new value on the next loop through.
191
- select {
192
- case <- timer .C :
193
- case <- rp .ctx .Done ():
194
- return
195
- }
201
+ err := rp .pubfunc (ctx , toPublish )
202
+ if err != nil {
203
+ // Republish failed, so retry after waiting for long timeout.
204
+ //
205
+ // Instead of entering a retry loop here, go back to waiting
206
+ // for more values and retrying to publish after the lomg
207
+ // timeout. Keep using the current waiter until it has been
208
+ // notified of a successful publish.
209
+ //
210
+ // Reset the long timer as it effectively becomes the retry
211
+ // timeout.
212
+ longer .Reset (timeoutLong )
213
+ // Stop reading waiters from immediatePublish while retrying,
214
+ // This causes the current waiter to be notified only after a
215
+ // successful call to pubfunc, and is what constitutes a retry.
216
+ immediatePublish = nil
217
+ continue
196
218
}
197
219
lastPublished = toPublish
198
220
toPublish = cid .Undef
221
+ // Resume reading waiters,
222
+ immediatePublish = rp .immediatePublish
199
223
}
200
224
201
- // 3. Trigger anything waiting in `WaitPub`.
225
+ // 3. Notify anything waiting in `WaitPub` on successful call to
226
+ // pubfunc or if nothing to publish.
202
227
if waiter != nil {
203
228
close (waiter )
229
+ waiter = nil
204
230
}
205
231
}
206
232
}
0 commit comments