watch.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482
  1. // Copyright 2016 CoreOS, Inc.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. package clientv3
  15. import (
  16. "fmt"
  17. "sync"
  18. "github.com/coreos/etcd/Godeps/_workspace/src/golang.org/x/net/context"
  19. "github.com/coreos/etcd/Godeps/_workspace/src/google.golang.org/grpc"
  20. pb "github.com/coreos/etcd/etcdserver/etcdserverpb"
  21. storagepb "github.com/coreos/etcd/storage/storagepb"
  22. )
  23. type Watcher interface {
  24. // Watch watches on a single key. The watched events will be returned
  25. // through the returned channel.
  26. // If the watch is slow or the required rev is compacted, the watch request
  27. // might be canceled from the server-side and the chan will be closed.
  28. Watch(cxt context.Context, key string, rev int64) <-chan WatchResponse
  29. // Watch watches on a prefix. The watched events will be returned
  30. // through the returned channel.
  31. // If the watch is slow or the required rev is compacted, the watch request
  32. // might be canceled from the server-side and the chan will be closed.
  33. WatchPrefix(cxt context.Context, prefix string, rev int64) <-chan WatchResponse
  34. // Close closes the watcher and cancels all watch requests.
  35. Close() error
  36. }
// WatchResponse is one batch of events delivered on a watch channel, together
// with the header of the server response that carried them.
type WatchResponse struct {
	// Header is a copy of the response header sent by the server.
	Header pb.ResponseHeader
	// Events are the events carried by that server response.
	Events []*storagepb.Event
}
// watcher implements the Watcher interface
type watcher struct {
	// c is the client the watcher was created from; it is used to retry the
	// connection when a watch client cannot be opened
	c *Client
	// conn is the grpc connection backing remote; it is replaced when the
	// connection is retried
	conn *grpc.ClientConn
	// remote is the watch service client built on top of conn
	remote pb.WatchClient

	// ctx controls internal remote.Watch requests
	ctx    context.Context
	cancel context.CancelFunc

	// streams holds all active watchers
	streams map[int64]*watcherStream
	// mu protects the streams map
	mu sync.RWMutex

	// reqc sends a watch request from Watch() to the main goroutine
	reqc chan *watchRequest
	// respc receives data from the watch client
	respc chan *pb.WatchResponse
	// stopc is sent to the main goroutine to stop all processing
	stopc chan struct{}
	// donec closes to broadcast shutdown
	donec chan struct{}
	// errc transmits errors from grpc Recv; run() also posts its final
	// result here, which Close() returns
	errc chan error
}
// watchRequest is issued by the subscriber to start a new watcher
type watchRequest struct {
	// ctx is the subscriber's context; when it is done, a pending request is
	// abandoned and an established stream is shut down
	ctx context.Context
	// key is the single key to watch; when empty, prefix is used instead
	key string
	// prefix is the key prefix to watch; only used when key is empty
	prefix string
	// rev is the revision the watch starts from
	rev int64
	// retc receives a chan WatchResponse once the watcher is established
	// (or nil if the server rejected the request)
	retc chan chan WatchResponse
}
// watcherStream represents a registered watcher
type watcherStream struct {
	// initReq is a copy of the request that created the stream; it is
	// replayed to rebuild the watcher on a new watch client
	initReq watchRequest

	// outc publishes watch responses to subscriber
	outc chan<- WatchResponse
	// recvc buffers watch responses before publishing
	recvc chan *WatchResponse
	// id is the watch id assigned by the server; it is rewritten when the
	// stream is re-created on a new watch client
	id int64

	// lastRev is revision last successfully sent over outc
	lastRev int64
	// resumec indicates the stream must recover at a given revision
	resumec chan int64
}
  86. func NewWatcher(c *Client) Watcher {
  87. ctx, cancel := context.WithCancel(context.Background())
  88. conn := c.ActiveConnection()
  89. w := &watcher{
  90. c: c,
  91. conn: conn,
  92. remote: pb.NewWatchClient(conn),
  93. ctx: ctx,
  94. cancel: cancel,
  95. streams: make(map[int64]*watcherStream),
  96. respc: make(chan *pb.WatchResponse),
  97. reqc: make(chan *watchRequest),
  98. stopc: make(chan struct{}),
  99. donec: make(chan struct{}),
  100. errc: make(chan error, 1),
  101. }
  102. go w.run()
  103. return w
  104. }
  105. func (w *watcher) Watch(ctx context.Context, key string, rev int64) <-chan WatchResponse {
  106. return w.watch(ctx, key, "", rev)
  107. }
  108. func (w *watcher) WatchPrefix(ctx context.Context, prefix string, rev int64) <-chan WatchResponse {
  109. return w.watch(ctx, "", prefix, rev)
  110. }
  111. func (w *watcher) Close() error {
  112. select {
  113. case w.stopc <- struct{}{}:
  114. case <-w.donec:
  115. }
  116. <-w.donec
  117. return <-w.errc
  118. }
  119. // watch posts a watch request to run() and waits for a new watcher channel
  120. func (w *watcher) watch(ctx context.Context, key, prefix string, rev int64) <-chan WatchResponse {
  121. retc := make(chan chan WatchResponse, 1)
  122. wr := &watchRequest{ctx: ctx, key: key, prefix: prefix, rev: rev, retc: retc}
  123. // submit request
  124. select {
  125. case w.reqc <- wr:
  126. case <-wr.ctx.Done():
  127. return nil
  128. case <-w.donec:
  129. return nil
  130. }
  131. // receive channel
  132. select {
  133. case ret := <-retc:
  134. return ret
  135. case <-ctx.Done():
  136. return nil
  137. case <-w.donec:
  138. return nil
  139. }
  140. }
  141. func (w *watcher) addStream(resp *pb.WatchResponse, pendingReq *watchRequest) {
  142. if pendingReq == nil {
  143. // no pending request; ignore
  144. return
  145. } else if resp.WatchId == -1 || resp.Compacted {
  146. // failed; no channel
  147. pendingReq.retc <- nil
  148. return
  149. }
  150. ret := make(chan WatchResponse)
  151. ws := &watcherStream{
  152. initReq: *pendingReq,
  153. id: resp.WatchId,
  154. outc: ret,
  155. // buffered so unlikely to block on sending while holding mu
  156. recvc: make(chan *WatchResponse, 4),
  157. resumec: make(chan int64),
  158. }
  159. w.mu.Lock()
  160. w.streams[ws.id] = ws
  161. w.mu.Unlock()
  162. // send messages to subscriber
  163. go w.serveStream(ws)
  164. // pass back the subscriber channel for the watcher
  165. pendingReq.retc <- ret
  166. }
// closeStream closes the watcher resources and removes it.
// Both call sites in this file hold w.mu for writing while calling it, which
// is what protects the map delete below.
// NOTE(review): the channels are closed unconditionally, so closing the same
// stream twice would panic — confirm callers cannot both reach this for one
// stream.
func (w *watcher) closeStream(ws *watcherStream) {
	// cancels request stream; subscriber receives nil channel
	close(ws.initReq.retc)
	// close subscriber's channel
	close(ws.outc)
	// shutdown serveStream
	close(ws.recvc)
	// unregister under the stream's current watch id
	delete(w.streams, ws.id)
}
  177. // run is the root of the goroutines for managing a watcher client
  178. func (w *watcher) run() {
  179. defer func() {
  180. close(w.donec)
  181. w.cancel()
  182. }()
  183. // start a stream with the etcd grpc server
  184. wc, wcerr := w.newWatchClient()
  185. if wcerr != nil {
  186. w.errc <- wcerr
  187. return
  188. }
  189. var pendingReq, failedReq *watchRequest
  190. curReqC := w.reqc
  191. cancelSet := make(map[int64]struct{})
  192. for {
  193. select {
  194. // Watch() requested
  195. case pendingReq = <-curReqC:
  196. // no more watch requests until there's a response
  197. curReqC = nil
  198. if err := wc.Send(pendingReq.toPB()); err == nil {
  199. // pendingReq now waits on w.respc
  200. break
  201. }
  202. failedReq = pendingReq
  203. // New events from the watch client
  204. case pbresp := <-w.respc:
  205. switch {
  206. case pbresp.Canceled:
  207. delete(cancelSet, pbresp.WatchId)
  208. case pbresp.Compacted:
  209. w.mu.Lock()
  210. if ws, ok := w.streams[pbresp.WatchId]; ok {
  211. w.closeStream(ws)
  212. }
  213. w.mu.Unlock()
  214. case pbresp.Created:
  215. // response to pending req, try to add
  216. w.addStream(pbresp, pendingReq)
  217. pendingReq = nil
  218. curReqC = w.reqc
  219. default:
  220. // dispatch to appropriate watch stream
  221. if ok := w.dispatchEvent(pbresp); ok {
  222. break
  223. }
  224. // watch response on unexpected watch id; cancel id
  225. if _, ok := cancelSet[pbresp.WatchId]; ok {
  226. break
  227. }
  228. cancelSet[pbresp.WatchId] = struct{}{}
  229. cr := &pb.WatchRequest_CancelRequest{
  230. CancelRequest: &pb.WatchCancelRequest{
  231. WatchId: pbresp.WatchId,
  232. },
  233. }
  234. req := &pb.WatchRequest{RequestUnion: cr}
  235. wc.Send(req)
  236. }
  237. // watch client failed to recv; spawn another if possible
  238. // TODO report watch client errors from errc?
  239. case <-w.errc:
  240. if wc, wcerr = w.newWatchClient(); wcerr != nil {
  241. w.errc <- wcerr
  242. return
  243. }
  244. curReqC = w.reqc
  245. if pendingReq != nil {
  246. failedReq = pendingReq
  247. }
  248. cancelSet = make(map[int64]struct{})
  249. case <-w.stopc:
  250. w.errc <- nil
  251. return
  252. }
  253. // send failed; queue for retry
  254. if failedReq != nil {
  255. go func() {
  256. select {
  257. case w.reqc <- pendingReq:
  258. case <-pendingReq.ctx.Done():
  259. case <-w.donec:
  260. }
  261. }()
  262. failedReq = nil
  263. pendingReq = nil
  264. }
  265. }
  266. }
  267. // dispatchEvent sends a WatchResponse to the appropriate watcher stream
  268. func (w *watcher) dispatchEvent(pbresp *pb.WatchResponse) bool {
  269. w.mu.RLock()
  270. defer w.mu.RUnlock()
  271. ws, ok := w.streams[pbresp.WatchId]
  272. if ok {
  273. wr := &WatchResponse{*pbresp.Header, pbresp.Events}
  274. ws.recvc <- wr
  275. }
  276. return ok
  277. }
  278. // serveWatchClient forwards messages from the grpc stream to run()
  279. func (w *watcher) serveWatchClient(wc pb.Watch_WatchClient) {
  280. for {
  281. resp, err := wc.Recv()
  282. if err != nil {
  283. select {
  284. case w.errc <- err:
  285. case <-w.donec:
  286. }
  287. return
  288. }
  289. select {
  290. case w.respc <- resp:
  291. case <-w.donec:
  292. return
  293. }
  294. }
  295. }
  296. // serveStream forwards watch responses from run() to the subscriber
  297. func (w *watcher) serveStream(ws *watcherStream) {
  298. emptyWr := &WatchResponse{}
  299. wrs := []*WatchResponse{}
  300. resuming := false
  301. closing := false
  302. for !closing {
  303. curWr := emptyWr
  304. outc := ws.outc
  305. if len(wrs) > 0 {
  306. curWr = wrs[0]
  307. } else {
  308. outc = nil
  309. }
  310. select {
  311. case outc <- *curWr:
  312. newRev := wrs[0].Events[len(wrs[0].Events)-1].Kv.ModRevision
  313. if newRev != ws.lastRev {
  314. ws.lastRev = newRev
  315. }
  316. wrs[0] = nil
  317. wrs = wrs[1:]
  318. case wr, ok := <-ws.recvc:
  319. if !ok {
  320. // shutdown from closeStream
  321. return
  322. }
  323. // resume up to last seen event if disconnected
  324. if resuming {
  325. resuming = false
  326. // trim events already seen
  327. for i := 0; i < len(wr.Events); i++ {
  328. if wr.Events[i].Kv.ModRevision > ws.lastRev {
  329. wr.Events = wr.Events[i:]
  330. break
  331. }
  332. }
  333. // only forward new events
  334. if wr.Events[0].Kv.ModRevision == ws.lastRev {
  335. break
  336. }
  337. }
  338. // TODO don't keep buffering if subscriber stops reading
  339. wrs = append(wrs, wr)
  340. case resumeRev := <-ws.resumec:
  341. if resumeRev != ws.lastRev {
  342. panic("unexpected resume revision")
  343. }
  344. wrs = nil
  345. resuming = true
  346. case <-w.donec:
  347. closing = true
  348. case <-ws.initReq.ctx.Done():
  349. closing = true
  350. }
  351. }
  352. w.mu.Lock()
  353. w.closeStream(ws)
  354. w.mu.Unlock()
  355. // lazily send cancel message if events on missing id
  356. }
  357. func (w *watcher) newWatchClient() (pb.Watch_WatchClient, error) {
  358. ws, rerr := w.resume()
  359. if rerr != nil {
  360. return nil, rerr
  361. }
  362. go w.serveWatchClient(ws)
  363. return ws, nil
  364. }
  365. // resume creates a new WatchClient with all current watchers reestablished
  366. func (w *watcher) resume() (ws pb.Watch_WatchClient, err error) {
  367. for {
  368. if ws, err = w.openWatchClient(); err != nil {
  369. break
  370. } else if err = w.resumeWatchers(ws); err == nil {
  371. break
  372. }
  373. }
  374. return ws, err
  375. }
  376. // openWatchClient retries opening a watchclient until retryConnection fails
  377. func (w *watcher) openWatchClient() (ws pb.Watch_WatchClient, err error) {
  378. for {
  379. if ws, err = w.remote.Watch(w.ctx); ws != nil {
  380. break
  381. } else if isRPCError(err) {
  382. return nil, err
  383. }
  384. newConn, nerr := w.c.retryConnection(w.conn, nil)
  385. if nerr != nil {
  386. return nil, nerr
  387. }
  388. w.conn = newConn
  389. w.remote = pb.NewWatchClient(w.conn)
  390. }
  391. return ws, nil
  392. }
  393. // resumeWatchers rebuilds every registered watcher on a new client
  394. func (w *watcher) resumeWatchers(wc pb.Watch_WatchClient) error {
  395. streams := []*watcherStream{}
  396. w.mu.RLock()
  397. for _, ws := range w.streams {
  398. streams = append(streams, ws)
  399. }
  400. w.mu.RUnlock()
  401. for _, ws := range streams {
  402. // reconstruct watcher from initial request
  403. if ws.lastRev != 0 {
  404. ws.initReq.rev = ws.lastRev
  405. }
  406. if err := wc.Send(ws.initReq.toPB()); err != nil {
  407. return err
  408. }
  409. // wait for request ack
  410. resp, err := wc.Recv()
  411. if err != nil {
  412. return err
  413. } else if len(resp.Events) != 0 || resp.Created != true {
  414. return fmt.Errorf("watcher: unexpected response (%+v)", resp)
  415. }
  416. // id may be different since new remote watcher; update map
  417. w.mu.Lock()
  418. delete(w.streams, ws.id)
  419. ws.id = resp.WatchId
  420. w.streams[ws.id] = ws
  421. w.mu.Unlock()
  422. ws.resumec <- ws.lastRev
  423. }
  424. return nil
  425. }
  426. // toPB converts an internal watch request structure to its protobuf messagefunc (wr *watchRequest)
  427. func (wr *watchRequest) toPB() *pb.WatchRequest {
  428. req := &pb.WatchCreateRequest{StartRevision: wr.rev}
  429. if wr.key != "" {
  430. req.Key = []byte(wr.key)
  431. } else {
  432. req.Prefix = []byte(wr.prefix)
  433. }
  434. cr := &pb.WatchRequest_CreateRequest{CreateRequest: req}
  435. return &pb.WatchRequest{RequestUnion: cr}
  436. }