policies.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701
  1. // Copyright (c) 2012 The gocql Authors. All rights reserved.
  2. // Use of this source code is governed by a BSD-style
  3. // license that can be found in the LICENSE file.
  4. //This file will be the future home for more policies
  5. package gocql
  6. import (
  7. "fmt"
  8. "math"
  9. "math/rand"
  10. "net"
  11. "sync"
  12. "sync/atomic"
  13. "time"
  14. "github.com/hailocab/go-hostpool"
  15. )
  16. // cowHostList implements a copy on write host list, its equivalent type is []*HostInfo
  17. type cowHostList struct {
  18. list atomic.Value
  19. mu sync.Mutex
  20. }
  21. func (c *cowHostList) String() string {
  22. return fmt.Sprintf("%+v", c.get())
  23. }
  24. func (c *cowHostList) get() []*HostInfo {
  25. // TODO(zariel): should we replace this with []*HostInfo?
  26. l, ok := c.list.Load().(*[]*HostInfo)
  27. if !ok {
  28. return nil
  29. }
  30. return *l
  31. }
  32. func (c *cowHostList) set(list []*HostInfo) {
  33. c.mu.Lock()
  34. c.list.Store(&list)
  35. c.mu.Unlock()
  36. }
  37. // add will add a host if it not already in the list
  38. func (c *cowHostList) add(host *HostInfo) bool {
  39. c.mu.Lock()
  40. l := c.get()
  41. if n := len(l); n == 0 {
  42. l = []*HostInfo{host}
  43. } else {
  44. newL := make([]*HostInfo, n+1)
  45. for i := 0; i < n; i++ {
  46. if host.Equal(l[i]) {
  47. c.mu.Unlock()
  48. return false
  49. }
  50. newL[i] = l[i]
  51. }
  52. newL[n] = host
  53. l = newL
  54. }
  55. c.list.Store(&l)
  56. c.mu.Unlock()
  57. return true
  58. }
  59. func (c *cowHostList) update(host *HostInfo) {
  60. c.mu.Lock()
  61. l := c.get()
  62. if len(l) == 0 {
  63. c.mu.Unlock()
  64. return
  65. }
  66. found := false
  67. newL := make([]*HostInfo, len(l))
  68. for i := range l {
  69. if host.Equal(l[i]) {
  70. newL[i] = host
  71. found = true
  72. } else {
  73. newL[i] = l[i]
  74. }
  75. }
  76. if found {
  77. c.list.Store(&newL)
  78. }
  79. c.mu.Unlock()
  80. }
  81. func (c *cowHostList) remove(ip net.IP) bool {
  82. c.mu.Lock()
  83. l := c.get()
  84. size := len(l)
  85. if size == 0 {
  86. c.mu.Unlock()
  87. return false
  88. }
  89. found := false
  90. newL := make([]*HostInfo, 0, size)
  91. for i := 0; i < len(l); i++ {
  92. if !l[i].ConnectAddress().Equal(ip) {
  93. newL = append(newL, l[i])
  94. } else {
  95. found = true
  96. }
  97. }
  98. if !found {
  99. c.mu.Unlock()
  100. return false
  101. }
  102. newL = newL[:size-1 : size-1]
  103. c.list.Store(&newL)
  104. c.mu.Unlock()
  105. return true
  106. }
  107. // RetryableQuery is an interface that represents a query or batch statement that
  108. // exposes the correct functions for the retry policy logic to evaluate correctly.
  109. type RetryableQuery interface {
  110. Attempts() int
  111. GetConsistency() Consistency
  112. }
  113. // RetryPolicy interface is used by gocql to determine if a query can be attempted
  114. // again after a retryable error has been received. The interface allows gocql
  115. // users to implement their own logic to determine if a query can be attempted
  116. // again.
  117. //
  118. // See SimpleRetryPolicy as an example of implementing and using a RetryPolicy
  119. // interface.
  120. type RetryPolicy interface {
  121. Attempt(RetryableQuery) bool
  122. }
  123. // SimpleRetryPolicy has simple logic for attempting a query a fixed number of times.
  124. //
  125. // See below for examples of usage:
  126. //
  127. // //Assign to the cluster
  128. // cluster.RetryPolicy = &gocql.SimpleRetryPolicy{NumRetries: 3}
  129. //
  130. // //Assign to a query
  131. // query.RetryPolicy(&gocql.SimpleRetryPolicy{NumRetries: 1})
  132. //
  133. type SimpleRetryPolicy struct {
  134. NumRetries int //Number of times to retry a query
  135. }
  136. // Attempt tells gocql to attempt the query again based on query.Attempts being less
  137. // than the NumRetries defined in the policy.
  138. func (s *SimpleRetryPolicy) Attempt(q RetryableQuery) bool {
  139. return q.Attempts() <= s.NumRetries
  140. }
  141. // ExponentialBackoffRetryPolicy sleeps between attempts
  142. type ExponentialBackoffRetryPolicy struct {
  143. NumRetries int
  144. Min, Max time.Duration
  145. }
  146. func (e *ExponentialBackoffRetryPolicy) Attempt(q RetryableQuery) bool {
  147. if q.Attempts() > e.NumRetries {
  148. return false
  149. }
  150. time.Sleep(e.napTime(q.Attempts()))
  151. return true
  152. }
  153. func (e *ExponentialBackoffRetryPolicy) napTime(attempts int) time.Duration {
  154. if e.Min <= 0 {
  155. e.Min = 100 * time.Millisecond
  156. }
  157. if e.Max <= 0 {
  158. e.Max = 10 * time.Second
  159. }
  160. minFloat := float64(e.Min)
  161. napDuration := minFloat * math.Pow(2, float64(attempts-1))
  162. // add some jitter
  163. napDuration += rand.Float64()*minFloat - (minFloat / 2)
  164. if napDuration > float64(e.Max) {
  165. return time.Duration(e.Max)
  166. }
  167. return time.Duration(napDuration)
  168. }
  169. type HostStateNotifier interface {
  170. AddHost(host *HostInfo)
  171. RemoveHost(host *HostInfo)
  172. HostUp(host *HostInfo)
  173. HostDown(host *HostInfo)
  174. }
  175. type KeyspaceUpdateEvent struct {
  176. Keyspace string
  177. Change string
  178. }
  179. // HostSelectionPolicy is an interface for selecting
  180. // the most appropriate host to execute a given query.
  181. type HostSelectionPolicy interface {
  182. HostStateNotifier
  183. SetPartitioner
  184. KeyspaceChanged(KeyspaceUpdateEvent)
  185. Init(*Session)
  186. //Pick returns an iteration function over selected hosts
  187. Pick(ExecutableQuery) NextHost
  188. }
  189. // SelectedHost is an interface returned when picking a host from a host
  190. // selection policy.
  191. type SelectedHost interface {
  192. Info() *HostInfo
  193. Mark(error)
  194. }
  195. type selectedHost HostInfo
  196. func (host *selectedHost) Info() *HostInfo {
  197. return (*HostInfo)(host)
  198. }
  199. func (host *selectedHost) Mark(err error) {}
  200. // NextHost is an iteration function over picked hosts
  201. type NextHost func() SelectedHost
  202. // RoundRobinHostPolicy is a round-robin load balancing policy, where each host
  203. // is tried sequentially for each query.
  204. func RoundRobinHostPolicy() HostSelectionPolicy {
  205. return &roundRobinHostPolicy{}
  206. }
  207. type roundRobinHostPolicy struct {
  208. hosts cowHostList
  209. pos uint32
  210. mu sync.RWMutex
  211. }
  212. func (r *roundRobinHostPolicy) KeyspaceChanged(KeyspaceUpdateEvent) {}
  213. func (r *roundRobinHostPolicy) SetPartitioner(partitioner string) {}
  214. func (r *roundRobinHostPolicy) Init(*Session) {}
  215. func (r *roundRobinHostPolicy) Pick(qry ExecutableQuery) NextHost {
  216. // i is used to limit the number of attempts to find a host
  217. // to the number of hosts known to this policy
  218. var i int
  219. return func() SelectedHost {
  220. hosts := r.hosts.get()
  221. if len(hosts) == 0 {
  222. return nil
  223. }
  224. // always increment pos to evenly distribute traffic in case of
  225. // failures
  226. pos := atomic.AddUint32(&r.pos, 1) - 1
  227. if i >= len(hosts) {
  228. return nil
  229. }
  230. host := hosts[(pos)%uint32(len(hosts))]
  231. i++
  232. return (*selectedHost)(host)
  233. }
  234. }
  235. func (r *roundRobinHostPolicy) AddHost(host *HostInfo) {
  236. r.hosts.add(host)
  237. }
  238. func (r *roundRobinHostPolicy) RemoveHost(host *HostInfo) {
  239. r.hosts.remove(host.ConnectAddress())
  240. }
  241. func (r *roundRobinHostPolicy) HostUp(host *HostInfo) {
  242. r.AddHost(host)
  243. }
  244. func (r *roundRobinHostPolicy) HostDown(host *HostInfo) {
  245. r.RemoveHost(host)
  246. }
  247. func ShuffleReplicas() func(*tokenAwareHostPolicy) {
  248. return func(t *tokenAwareHostPolicy) {
  249. t.shuffleReplicas = true
  250. }
  251. }
  252. // TokenAwareHostPolicy is a token aware host selection policy, where hosts are
  253. // selected based on the partition key, so queries are sent to the host which
  254. // owns the partition. Fallback is used when routing information is not available.
  255. func TokenAwareHostPolicy(fallback HostSelectionPolicy, opts ...func(*tokenAwareHostPolicy)) HostSelectionPolicy {
  256. p := &tokenAwareHostPolicy{fallback: fallback}
  257. for _, opt := range opts {
  258. opt(p)
  259. }
  260. return p
  261. }
  262. type keyspaceMeta struct {
  263. replicas map[string]map[token][]*HostInfo
  264. }
  265. type tokenAwareHostPolicy struct {
  266. hosts cowHostList
  267. mu sync.RWMutex
  268. partitioner string
  269. fallback HostSelectionPolicy
  270. session *Session
  271. tokenRing atomic.Value // *tokenRing
  272. keyspaces atomic.Value // *keyspaceMeta
  273. shuffleReplicas bool
  274. }
  275. func (t *tokenAwareHostPolicy) Init(s *Session) {
  276. t.session = s
  277. }
  278. func (t *tokenAwareHostPolicy) KeyspaceChanged(update KeyspaceUpdateEvent) {
  279. meta, _ := t.keyspaces.Load().(*keyspaceMeta)
  280. var size = 1
  281. if meta != nil {
  282. size = len(meta.replicas)
  283. }
  284. newMeta := &keyspaceMeta{
  285. replicas: make(map[string]map[token][]*HostInfo, size),
  286. }
  287. ks, err := t.session.KeyspaceMetadata(update.Keyspace)
  288. if err == nil {
  289. strat := getStrategy(ks)
  290. tr := t.tokenRing.Load().(*tokenRing)
  291. if tr != nil {
  292. newMeta.replicas[update.Keyspace] = strat.replicaMap(t.hosts.get(), tr.tokens)
  293. }
  294. }
  295. if meta != nil {
  296. for ks, replicas := range meta.replicas {
  297. if ks != update.Keyspace {
  298. newMeta.replicas[ks] = replicas
  299. }
  300. }
  301. }
  302. t.keyspaces.Store(newMeta)
  303. }
  304. func (t *tokenAwareHostPolicy) SetPartitioner(partitioner string) {
  305. t.mu.Lock()
  306. defer t.mu.Unlock()
  307. if t.partitioner != partitioner {
  308. t.fallback.SetPartitioner(partitioner)
  309. t.partitioner = partitioner
  310. t.resetTokenRing(partitioner)
  311. }
  312. }
  313. func (t *tokenAwareHostPolicy) AddHost(host *HostInfo) {
  314. t.hosts.add(host)
  315. t.fallback.AddHost(host)
  316. t.mu.RLock()
  317. partitioner := t.partitioner
  318. t.mu.RUnlock()
  319. t.resetTokenRing(partitioner)
  320. }
  321. func (t *tokenAwareHostPolicy) RemoveHost(host *HostInfo) {
  322. t.hosts.remove(host.ConnectAddress())
  323. t.fallback.RemoveHost(host)
  324. t.mu.RLock()
  325. partitioner := t.partitioner
  326. t.mu.RUnlock()
  327. t.resetTokenRing(partitioner)
  328. }
  329. func (t *tokenAwareHostPolicy) HostUp(host *HostInfo) {
  330. // TODO: need to avoid doing all the work on AddHost on hostup/down
  331. // because it now expensive to calculate the replica map for each
  332. // token
  333. t.AddHost(host)
  334. }
  335. func (t *tokenAwareHostPolicy) HostDown(host *HostInfo) {
  336. t.RemoveHost(host)
  337. }
  338. func (t *tokenAwareHostPolicy) resetTokenRing(partitioner string) {
  339. if partitioner == "" {
  340. // partitioner not yet set
  341. return
  342. }
  343. // create a new token ring
  344. hosts := t.hosts.get()
  345. tokenRing, err := newTokenRing(partitioner, hosts)
  346. if err != nil {
  347. Logger.Printf("Unable to update the token ring due to error: %s", err)
  348. return
  349. }
  350. // replace the token ring
  351. t.tokenRing.Store(tokenRing)
  352. }
  353. func (t *tokenAwareHostPolicy) getReplicas(keyspace string, token token) ([]*HostInfo, bool) {
  354. meta, _ := t.keyspaces.Load().(*keyspaceMeta)
  355. if meta == nil {
  356. return nil, false
  357. }
  358. tokens, ok := meta.replicas[keyspace][token]
  359. return tokens, ok
  360. }
  361. func (t *tokenAwareHostPolicy) Pick(qry ExecutableQuery) NextHost {
  362. if qry == nil {
  363. return t.fallback.Pick(qry)
  364. }
  365. routingKey, err := qry.GetRoutingKey()
  366. if err != nil {
  367. return t.fallback.Pick(qry)
  368. } else if routingKey == nil {
  369. return t.fallback.Pick(qry)
  370. }
  371. tr, _ := t.tokenRing.Load().(*tokenRing)
  372. if tr == nil {
  373. return t.fallback.Pick(qry)
  374. }
  375. token := tr.partitioner.Hash(routingKey)
  376. primaryEndpoint := tr.GetHostForToken(token)
  377. if primaryEndpoint == nil || token == nil {
  378. return t.fallback.Pick(qry)
  379. }
  380. replicas, ok := t.getReplicas(qry.Keyspace(), token)
  381. if !ok {
  382. replicas = []*HostInfo{primaryEndpoint}
  383. } else if t.shuffleReplicas {
  384. replicas = shuffleHosts(replicas)
  385. }
  386. var (
  387. fallbackIter NextHost
  388. i int
  389. )
  390. used := make(map[*HostInfo]bool)
  391. return func() SelectedHost {
  392. for i < len(replicas) {
  393. h := replicas[i]
  394. i++
  395. if !h.IsUp() {
  396. // TODO: need a way to handle host distance, as we may want to not
  397. // use hosts in specific DC's
  398. continue
  399. }
  400. used[h] = true
  401. return (*selectedHost)(h)
  402. }
  403. if fallbackIter == nil {
  404. // fallback
  405. fallbackIter = t.fallback.Pick(qry)
  406. }
  407. // filter the token aware selected hosts from the fallback hosts
  408. for fallbackHost := fallbackIter(); fallbackHost != nil; fallbackHost = fallbackIter() {
  409. if !used[fallbackHost.Info()] {
  410. return fallbackHost
  411. }
  412. }
  413. return nil
  414. }
  415. }
  416. // HostPoolHostPolicy is a host policy which uses the bitly/go-hostpool library
  417. // to distribute queries between hosts and prevent sending queries to
  418. // unresponsive hosts. When creating the host pool that is passed to the policy
  419. // use an empty slice of hosts as the hostpool will be populated later by gocql.
  420. // See below for examples of usage:
  421. //
  422. // // Create host selection policy using a simple host pool
  423. // cluster.PoolConfig.HostSelectionPolicy = HostPoolHostPolicy(hostpool.New(nil))
  424. //
  425. // // Create host selection policy using an epsilon greedy pool
  426. // cluster.PoolConfig.HostSelectionPolicy = HostPoolHostPolicy(
  427. // hostpool.NewEpsilonGreedy(nil, 0, &hostpool.LinearEpsilonValueCalculator{}),
  428. // )
  429. //
  430. func HostPoolHostPolicy(hp hostpool.HostPool) HostSelectionPolicy {
  431. return &hostPoolHostPolicy{hostMap: map[string]*HostInfo{}, hp: hp}
  432. }
  433. type hostPoolHostPolicy struct {
  434. hp hostpool.HostPool
  435. mu sync.RWMutex
  436. hostMap map[string]*HostInfo
  437. }
  438. func (r *hostPoolHostPolicy) Init(*Session) {}
  439. func (r *hostPoolHostPolicy) KeyspaceChanged(KeyspaceUpdateEvent) {}
  440. func (r *hostPoolHostPolicy) SetPartitioner(string) {}
  441. func (r *hostPoolHostPolicy) SetHosts(hosts []*HostInfo) {
  442. peers := make([]string, len(hosts))
  443. hostMap := make(map[string]*HostInfo, len(hosts))
  444. for i, host := range hosts {
  445. ip := host.ConnectAddress().String()
  446. peers[i] = ip
  447. hostMap[ip] = host
  448. }
  449. r.mu.Lock()
  450. r.hp.SetHosts(peers)
  451. r.hostMap = hostMap
  452. r.mu.Unlock()
  453. }
  454. func (r *hostPoolHostPolicy) AddHost(host *HostInfo) {
  455. ip := host.ConnectAddress().String()
  456. r.mu.Lock()
  457. defer r.mu.Unlock()
  458. // If the host addr is present and isn't nil return
  459. if h, ok := r.hostMap[ip]; ok && h != nil {
  460. return
  461. }
  462. // otherwise, add the host to the map
  463. r.hostMap[ip] = host
  464. // and construct a new peer list to give to the HostPool
  465. hosts := make([]string, 0, len(r.hostMap))
  466. for addr := range r.hostMap {
  467. hosts = append(hosts, addr)
  468. }
  469. r.hp.SetHosts(hosts)
  470. }
  471. func (r *hostPoolHostPolicy) RemoveHost(host *HostInfo) {
  472. ip := host.ConnectAddress().String()
  473. r.mu.Lock()
  474. defer r.mu.Unlock()
  475. if _, ok := r.hostMap[ip]; !ok {
  476. return
  477. }
  478. delete(r.hostMap, ip)
  479. hosts := make([]string, 0, len(r.hostMap))
  480. for _, host := range r.hostMap {
  481. hosts = append(hosts, host.ConnectAddress().String())
  482. }
  483. r.hp.SetHosts(hosts)
  484. }
  485. func (r *hostPoolHostPolicy) HostUp(host *HostInfo) {
  486. r.AddHost(host)
  487. }
  488. func (r *hostPoolHostPolicy) HostDown(host *HostInfo) {
  489. r.RemoveHost(host)
  490. }
  491. func (r *hostPoolHostPolicy) Pick(qry ExecutableQuery) NextHost {
  492. return func() SelectedHost {
  493. r.mu.RLock()
  494. defer r.mu.RUnlock()
  495. if len(r.hostMap) == 0 {
  496. return nil
  497. }
  498. hostR := r.hp.Get()
  499. host, ok := r.hostMap[hostR.Host()]
  500. if !ok {
  501. return nil
  502. }
  503. return selectedHostPoolHost{
  504. policy: r,
  505. info: host,
  506. hostR: hostR,
  507. }
  508. }
  509. }
  510. // selectedHostPoolHost is a host returned by the hostPoolHostPolicy and
  511. // implements the SelectedHost interface
  512. type selectedHostPoolHost struct {
  513. policy *hostPoolHostPolicy
  514. info *HostInfo
  515. hostR hostpool.HostPoolResponse
  516. }
  517. func (host selectedHostPoolHost) Info() *HostInfo {
  518. return host.info
  519. }
  520. func (host selectedHostPoolHost) Mark(err error) {
  521. ip := host.info.ConnectAddress().String()
  522. host.policy.mu.RLock()
  523. defer host.policy.mu.RUnlock()
  524. if _, ok := host.policy.hostMap[ip]; !ok {
  525. // host was removed between pick and mark
  526. return
  527. }
  528. host.hostR.Mark(err)
  529. }
  530. type dcAwareRR struct {
  531. local string
  532. pos uint32
  533. mu sync.RWMutex
  534. localHosts cowHostList
  535. remoteHosts cowHostList
  536. }
  537. // DCAwareRoundRobinPolicy is a host selection policies which will prioritize and
  538. // return hosts which are in the local datacentre before returning hosts in all
  539. // other datercentres
  540. func DCAwareRoundRobinPolicy(localDC string) HostSelectionPolicy {
  541. return &dcAwareRR{local: localDC}
  542. }
  543. func (r *dcAwareRR) Init(*Session) {}
  544. func (r *dcAwareRR) KeyspaceChanged(KeyspaceUpdateEvent) {}
  545. func (d *dcAwareRR) SetPartitioner(p string) {}
  546. func (d *dcAwareRR) AddHost(host *HostInfo) {
  547. if host.DataCenter() == d.local {
  548. d.localHosts.add(host)
  549. } else {
  550. d.remoteHosts.add(host)
  551. }
  552. }
  553. func (d *dcAwareRR) RemoveHost(host *HostInfo) {
  554. if host.DataCenter() == d.local {
  555. d.localHosts.remove(host.ConnectAddress())
  556. } else {
  557. d.remoteHosts.remove(host.ConnectAddress())
  558. }
  559. }
  560. func (d *dcAwareRR) HostUp(host *HostInfo) { d.AddHost(host) }
  561. func (d *dcAwareRR) HostDown(host *HostInfo) { d.RemoveHost(host) }
  562. func (d *dcAwareRR) Pick(q ExecutableQuery) NextHost {
  563. var i int
  564. return func() SelectedHost {
  565. var hosts []*HostInfo
  566. localHosts := d.localHosts.get()
  567. remoteHosts := d.remoteHosts.get()
  568. if len(localHosts) != 0 {
  569. hosts = localHosts
  570. } else {
  571. hosts = remoteHosts
  572. }
  573. if len(hosts) == 0 {
  574. return nil
  575. }
  576. // always increment pos to evenly distribute traffic in case of
  577. // failures
  578. pos := atomic.AddUint32(&d.pos, 1) - 1
  579. if i >= len(localHosts)+len(remoteHosts) {
  580. return nil
  581. }
  582. host := hosts[(pos)%uint32(len(hosts))]
  583. i++
  584. return (*selectedHost)(host)
  585. }
  586. }