policies.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697
  1. // Copyright (c) 2012 The gocql Authors. All rights reserved.
  2. // Use of this source code is governed by a BSD-style
  3. // license that can be found in the LICENSE file.
  4. //This file will be the future home for more policies
  5. package gocql
  6. import (
  7. "fmt"
  8. "math"
  9. "math/rand"
  10. "net"
  11. "sync"
  12. "sync/atomic"
  13. "time"
  14. "github.com/hailocab/go-hostpool"
  15. )
  16. // cowHostList implements a copy on write host list, its equivalent type is []*HostInfo
  17. type cowHostList struct {
  18. list atomic.Value
  19. mu sync.Mutex
  20. }
  21. func (c *cowHostList) String() string {
  22. return fmt.Sprintf("%+v", c.get())
  23. }
  24. func (c *cowHostList) get() []*HostInfo {
  25. // TODO(zariel): should we replace this with []*HostInfo?
  26. l, ok := c.list.Load().(*[]*HostInfo)
  27. if !ok {
  28. return nil
  29. }
  30. return *l
  31. }
  32. func (c *cowHostList) set(list []*HostInfo) {
  33. c.mu.Lock()
  34. c.list.Store(&list)
  35. c.mu.Unlock()
  36. }
  37. // add will add a host if it not already in the list
  38. func (c *cowHostList) add(host *HostInfo) bool {
  39. c.mu.Lock()
  40. l := c.get()
  41. if n := len(l); n == 0 {
  42. l = []*HostInfo{host}
  43. } else {
  44. newL := make([]*HostInfo, n+1)
  45. for i := 0; i < n; i++ {
  46. if host.Equal(l[i]) {
  47. c.mu.Unlock()
  48. return false
  49. }
  50. newL[i] = l[i]
  51. }
  52. newL[n] = host
  53. l = newL
  54. }
  55. c.list.Store(&l)
  56. c.mu.Unlock()
  57. return true
  58. }
  59. func (c *cowHostList) update(host *HostInfo) {
  60. c.mu.Lock()
  61. l := c.get()
  62. if len(l) == 0 {
  63. c.mu.Unlock()
  64. return
  65. }
  66. found := false
  67. newL := make([]*HostInfo, len(l))
  68. for i := range l {
  69. if host.Equal(l[i]) {
  70. newL[i] = host
  71. found = true
  72. } else {
  73. newL[i] = l[i]
  74. }
  75. }
  76. if found {
  77. c.list.Store(&newL)
  78. }
  79. c.mu.Unlock()
  80. }
  81. func (c *cowHostList) remove(ip net.IP) bool {
  82. c.mu.Lock()
  83. l := c.get()
  84. size := len(l)
  85. if size == 0 {
  86. c.mu.Unlock()
  87. return false
  88. }
  89. found := false
  90. newL := make([]*HostInfo, 0, size)
  91. for i := 0; i < len(l); i++ {
  92. if !l[i].ConnectAddress().Equal(ip) {
  93. newL = append(newL, l[i])
  94. } else {
  95. found = true
  96. }
  97. }
  98. if !found {
  99. c.mu.Unlock()
  100. return false
  101. }
  102. newL = newL[:size-1 : size-1]
  103. c.list.Store(&newL)
  104. c.mu.Unlock()
  105. return true
  106. }
  107. // RetryableQuery is an interface that represents a query or batch statement that
  108. // exposes the correct functions for the retry policy logic to evaluate correctly.
  109. type RetryableQuery interface {
  110. Attempts() int
  111. GetConsistency() Consistency
  112. }
  113. // RetryPolicy interface is used by gocql to determine if a query can be attempted
  114. // again after a retryable error has been received. The interface allows gocql
  115. // users to implement their own logic to determine if a query can be attempted
  116. // again.
  117. //
  118. // See SimpleRetryPolicy as an example of implementing and using a RetryPolicy
  119. // interface.
  120. type RetryPolicy interface {
  121. Attempt(RetryableQuery) bool
  122. }
  123. // SimpleRetryPolicy has simple logic for attempting a query a fixed number of times.
  124. //
  125. // See below for examples of usage:
  126. //
  127. // //Assign to the cluster
  128. // cluster.RetryPolicy = &gocql.SimpleRetryPolicy{NumRetries: 3}
  129. //
  130. // //Assign to a query
  131. // query.RetryPolicy(&gocql.SimpleRetryPolicy{NumRetries: 1})
  132. //
  133. type SimpleRetryPolicy struct {
  134. NumRetries int //Number of times to retry a query
  135. }
  136. // Attempt tells gocql to attempt the query again based on query.Attempts being less
  137. // than the NumRetries defined in the policy.
  138. func (s *SimpleRetryPolicy) Attempt(q RetryableQuery) bool {
  139. return q.Attempts() <= s.NumRetries
  140. }
  141. // ExponentialBackoffRetryPolicy sleeps between attempts
  142. type ExponentialBackoffRetryPolicy struct {
  143. NumRetries int
  144. Min, Max time.Duration
  145. }
  146. func (e *ExponentialBackoffRetryPolicy) Attempt(q RetryableQuery) bool {
  147. if q.Attempts() > e.NumRetries {
  148. return false
  149. }
  150. time.Sleep(e.napTime(q.Attempts()))
  151. return true
  152. }
  153. func (e *ExponentialBackoffRetryPolicy) napTime(attempts int) time.Duration {
  154. if e.Min <= 0 {
  155. e.Min = 100 * time.Millisecond
  156. }
  157. if e.Max <= 0 {
  158. e.Max = 10 * time.Second
  159. }
  160. minFloat := float64(e.Min)
  161. napDuration := minFloat * math.Pow(2, float64(attempts-1))
  162. // add some jitter
  163. napDuration += rand.Float64()*minFloat - (minFloat / 2)
  164. if napDuration > float64(e.Max) {
  165. return time.Duration(e.Max)
  166. }
  167. return time.Duration(napDuration)
  168. }
  169. type HostStateNotifier interface {
  170. AddHost(host *HostInfo)
  171. RemoveHost(host *HostInfo)
  172. HostUp(host *HostInfo)
  173. HostDown(host *HostInfo)
  174. }
  175. type KeyspaceUpdateEvent struct {
  176. Keyspace string
  177. Change string
  178. }
  179. // HostSelectionPolicy is an interface for selecting
  180. // the most appropriate host to execute a given query.
  181. type HostSelectionPolicy interface {
  182. HostStateNotifier
  183. SetPartitioner
  184. KeyspaceChanged(KeyspaceUpdateEvent)
  185. Init(*Session)
  186. //Pick returns an iteration function over selected hosts
  187. Pick(ExecutableQuery) NextHost
  188. }
  189. // SelectedHost is an interface returned when picking a host from a host
  190. // selection policy.
  191. type SelectedHost interface {
  192. Info() *HostInfo
  193. Mark(error)
  194. }
  195. type selectedHost HostInfo
  196. func (host *selectedHost) Info() *HostInfo {
  197. return (*HostInfo)(host)
  198. }
  199. func (host *selectedHost) Mark(err error) {}
  200. // NextHost is an iteration function over picked hosts
  201. type NextHost func() SelectedHost
  202. // RoundRobinHostPolicy is a round-robin load balancing policy, where each host
  203. // is tried sequentially for each query.
  204. func RoundRobinHostPolicy() HostSelectionPolicy {
  205. return &roundRobinHostPolicy{}
  206. }
  207. type roundRobinHostPolicy struct {
  208. hosts cowHostList
  209. pos uint32
  210. mu sync.RWMutex
  211. }
  212. func (r *roundRobinHostPolicy) KeyspaceChanged(KeyspaceUpdateEvent) {}
  213. func (r *roundRobinHostPolicy) SetPartitioner(partitioner string) {}
  214. func (r *roundRobinHostPolicy) Init(*Session) {}
  215. func (r *roundRobinHostPolicy) Pick(qry ExecutableQuery) NextHost {
  216. // i is used to limit the number of attempts to find a host
  217. // to the number of hosts known to this policy
  218. var i int
  219. return func() SelectedHost {
  220. hosts := r.hosts.get()
  221. if len(hosts) == 0 {
  222. return nil
  223. }
  224. // always increment pos to evenly distribute traffic in case of
  225. // failures
  226. pos := atomic.AddUint32(&r.pos, 1) - 1
  227. if i >= len(hosts) {
  228. return nil
  229. }
  230. host := hosts[(pos)%uint32(len(hosts))]
  231. i++
  232. return (*selectedHost)(host)
  233. }
  234. }
  235. func (r *roundRobinHostPolicy) AddHost(host *HostInfo) {
  236. r.hosts.add(host)
  237. }
  238. func (r *roundRobinHostPolicy) RemoveHost(host *HostInfo) {
  239. r.hosts.remove(host.ConnectAddress())
  240. }
  241. func (r *roundRobinHostPolicy) HostUp(host *HostInfo) {
  242. r.AddHost(host)
  243. }
  244. func (r *roundRobinHostPolicy) HostDown(host *HostInfo) {
  245. r.RemoveHost(host)
  246. }
  247. func ShuffleReplicas() func(*tokenAwareHostPolicy) {
  248. return func(t *tokenAwareHostPolicy) {
  249. t.shuffleReplicas = true
  250. }
  251. }
  252. // TokenAwareHostPolicy is a token aware host selection policy, where hosts are
  253. // selected based on the partition key, so queries are sent to the host which
  254. // owns the partition. Fallback is used when routing information is not available.
  255. func TokenAwareHostPolicy(fallback HostSelectionPolicy, opts ...func(*tokenAwareHostPolicy)) HostSelectionPolicy {
  256. p := &tokenAwareHostPolicy{fallback: fallback}
  257. for _, opt := range opts {
  258. opt(p)
  259. }
  260. return p
  261. }
  262. type keyspaceMeta struct {
  263. replicas map[string]map[token][]*HostInfo
  264. }
  265. type tokenAwareHostPolicy struct {
  266. hosts cowHostList
  267. mu sync.RWMutex
  268. partitioner string
  269. fallback HostSelectionPolicy
  270. session *Session
  271. tokenRing atomic.Value // *tokenRing
  272. keyspaces atomic.Value // *keyspaceMeta
  273. shuffleReplicas bool
  274. }
  275. func (t *tokenAwareHostPolicy) Init(s *Session) {
  276. t.session = s
  277. }
  278. func (t *tokenAwareHostPolicy) KeyspaceChanged(update KeyspaceUpdateEvent) {
  279. meta, _ := t.keyspaces.Load().(*keyspaceMeta)
  280. // TODO: avoid recaulating things which havnt changed
  281. newMeta := &keyspaceMeta{
  282. replicas: make(map[string]map[token][]*HostInfo, len(meta.replicas)),
  283. }
  284. ks, err := t.session.KeyspaceMetadata(update.Keyspace)
  285. if err == nil {
  286. strat := getStrategy(ks)
  287. tr := t.tokenRing.Load().(*tokenRing)
  288. if tr != nil {
  289. newMeta.replicas[update.Keyspace] = strat.replicaMap(t.hosts.get(), tr.tokens)
  290. }
  291. }
  292. if meta != nil {
  293. for ks, replicas := range meta.replicas {
  294. if ks != update.Keyspace {
  295. newMeta.replicas[ks] = replicas
  296. }
  297. }
  298. }
  299. t.keyspaces.Store(newMeta)
  300. }
  301. func (t *tokenAwareHostPolicy) SetPartitioner(partitioner string) {
  302. t.mu.Lock()
  303. defer t.mu.Unlock()
  304. if t.partitioner != partitioner {
  305. t.fallback.SetPartitioner(partitioner)
  306. t.partitioner = partitioner
  307. t.resetTokenRing(partitioner)
  308. }
  309. }
  310. func (t *tokenAwareHostPolicy) AddHost(host *HostInfo) {
  311. t.hosts.add(host)
  312. t.fallback.AddHost(host)
  313. t.mu.RLock()
  314. partitioner := t.partitioner
  315. t.mu.RUnlock()
  316. t.resetTokenRing(partitioner)
  317. }
  318. func (t *tokenAwareHostPolicy) RemoveHost(host *HostInfo) {
  319. t.hosts.remove(host.ConnectAddress())
  320. t.fallback.RemoveHost(host)
  321. t.mu.RLock()
  322. partitioner := t.partitioner
  323. t.mu.RUnlock()
  324. t.resetTokenRing(partitioner)
  325. }
  326. func (t *tokenAwareHostPolicy) HostUp(host *HostInfo) {
  327. // TODO: need to avoid doing all the work on AddHost on hostup/down
  328. // because it now expensive to calculate the replica map for each
  329. // token
  330. t.AddHost(host)
  331. }
  332. func (t *tokenAwareHostPolicy) HostDown(host *HostInfo) {
  333. t.RemoveHost(host)
  334. }
  335. func (t *tokenAwareHostPolicy) resetTokenRing(partitioner string) {
  336. if partitioner == "" {
  337. // partitioner not yet set
  338. return
  339. }
  340. // create a new token ring
  341. hosts := t.hosts.get()
  342. tokenRing, err := newTokenRing(partitioner, hosts)
  343. if err != nil {
  344. Logger.Printf("Unable to update the token ring due to error: %s", err)
  345. return
  346. }
  347. // replace the token ring
  348. t.tokenRing.Store(tokenRing)
  349. }
  350. func (t *tokenAwareHostPolicy) getReplicas(keyspace string, token token) ([]*HostInfo, bool) {
  351. meta, _ := t.keyspaces.Load().(*keyspaceMeta)
  352. if meta == nil {
  353. return nil, false
  354. }
  355. tokens, ok := meta.replicas[keyspace][token]
  356. return tokens, ok
  357. }
  358. func (t *tokenAwareHostPolicy) Pick(qry ExecutableQuery) NextHost {
  359. if qry == nil {
  360. return t.fallback.Pick(qry)
  361. }
  362. routingKey, err := qry.GetRoutingKey()
  363. if err != nil {
  364. return t.fallback.Pick(qry)
  365. } else if routingKey == nil {
  366. return t.fallback.Pick(qry)
  367. }
  368. tr, _ := t.tokenRing.Load().(*tokenRing)
  369. if tr == nil {
  370. return t.fallback.Pick(qry)
  371. }
  372. token := tr.partitioner.Hash(routingKey)
  373. primaryEndpoint := tr.GetHostForToken(token)
  374. if primaryEndpoint == nil || token == nil {
  375. return t.fallback.Pick(qry)
  376. }
  377. replicas, ok := t.getReplicas(qry.Keyspace(), token)
  378. if !ok {
  379. replicas = []*HostInfo{primaryEndpoint}
  380. } else if t.shuffleReplicas {
  381. replicas = shuffleHosts(replicas)
  382. }
  383. var (
  384. fallbackIter NextHost
  385. i int
  386. )
  387. used := make(map[*HostInfo]bool)
  388. return func() SelectedHost {
  389. for i < len(replicas) {
  390. h := replicas[i]
  391. i++
  392. if !h.IsUp() {
  393. // TODO: need a way to handle host distance, as we may want to not
  394. // use hosts in specific DC's
  395. continue
  396. }
  397. used[h] = true
  398. return (*selectedHost)(h)
  399. }
  400. if fallbackIter == nil {
  401. // fallback
  402. fallbackIter = t.fallback.Pick(qry)
  403. }
  404. // filter the token aware selected hosts from the fallback hosts
  405. for fallbackHost := fallbackIter(); fallbackHost != nil; fallbackHost = fallbackIter() {
  406. if !used[fallbackHost.Info()] {
  407. return fallbackHost
  408. }
  409. }
  410. return nil
  411. }
  412. }
  413. // HostPoolHostPolicy is a host policy which uses the bitly/go-hostpool library
  414. // to distribute queries between hosts and prevent sending queries to
  415. // unresponsive hosts. When creating the host pool that is passed to the policy
  416. // use an empty slice of hosts as the hostpool will be populated later by gocql.
  417. // See below for examples of usage:
  418. //
  419. // // Create host selection policy using a simple host pool
  420. // cluster.PoolConfig.HostSelectionPolicy = HostPoolHostPolicy(hostpool.New(nil))
  421. //
  422. // // Create host selection policy using an epsilon greedy pool
  423. // cluster.PoolConfig.HostSelectionPolicy = HostPoolHostPolicy(
  424. // hostpool.NewEpsilonGreedy(nil, 0, &hostpool.LinearEpsilonValueCalculator{}),
  425. // )
  426. //
  427. func HostPoolHostPolicy(hp hostpool.HostPool) HostSelectionPolicy {
  428. return &hostPoolHostPolicy{hostMap: map[string]*HostInfo{}, hp: hp}
  429. }
  430. type hostPoolHostPolicy struct {
  431. hp hostpool.HostPool
  432. mu sync.RWMutex
  433. hostMap map[string]*HostInfo
  434. }
  435. func (r *hostPoolHostPolicy) Init(*Session) {}
  436. func (r *hostPoolHostPolicy) KeyspaceChanged(KeyspaceUpdateEvent) {}
  437. func (r *hostPoolHostPolicy) SetPartitioner(string) {}
  438. func (r *hostPoolHostPolicy) SetHosts(hosts []*HostInfo) {
  439. peers := make([]string, len(hosts))
  440. hostMap := make(map[string]*HostInfo, len(hosts))
  441. for i, host := range hosts {
  442. ip := host.ConnectAddress().String()
  443. peers[i] = ip
  444. hostMap[ip] = host
  445. }
  446. r.mu.Lock()
  447. r.hp.SetHosts(peers)
  448. r.hostMap = hostMap
  449. r.mu.Unlock()
  450. }
  451. func (r *hostPoolHostPolicy) AddHost(host *HostInfo) {
  452. ip := host.ConnectAddress().String()
  453. r.mu.Lock()
  454. defer r.mu.Unlock()
  455. // If the host addr is present and isn't nil return
  456. if h, ok := r.hostMap[ip]; ok && h != nil {
  457. return
  458. }
  459. // otherwise, add the host to the map
  460. r.hostMap[ip] = host
  461. // and construct a new peer list to give to the HostPool
  462. hosts := make([]string, 0, len(r.hostMap))
  463. for addr := range r.hostMap {
  464. hosts = append(hosts, addr)
  465. }
  466. r.hp.SetHosts(hosts)
  467. }
  468. func (r *hostPoolHostPolicy) RemoveHost(host *HostInfo) {
  469. ip := host.ConnectAddress().String()
  470. r.mu.Lock()
  471. defer r.mu.Unlock()
  472. if _, ok := r.hostMap[ip]; !ok {
  473. return
  474. }
  475. delete(r.hostMap, ip)
  476. hosts := make([]string, 0, len(r.hostMap))
  477. for _, host := range r.hostMap {
  478. hosts = append(hosts, host.ConnectAddress().String())
  479. }
  480. r.hp.SetHosts(hosts)
  481. }
  482. func (r *hostPoolHostPolicy) HostUp(host *HostInfo) {
  483. r.AddHost(host)
  484. }
  485. func (r *hostPoolHostPolicy) HostDown(host *HostInfo) {
  486. r.RemoveHost(host)
  487. }
  488. func (r *hostPoolHostPolicy) Pick(qry ExecutableQuery) NextHost {
  489. return func() SelectedHost {
  490. r.mu.RLock()
  491. defer r.mu.RUnlock()
  492. if len(r.hostMap) == 0 {
  493. return nil
  494. }
  495. hostR := r.hp.Get()
  496. host, ok := r.hostMap[hostR.Host()]
  497. if !ok {
  498. return nil
  499. }
  500. return selectedHostPoolHost{
  501. policy: r,
  502. info: host,
  503. hostR: hostR,
  504. }
  505. }
  506. }
  507. // selectedHostPoolHost is a host returned by the hostPoolHostPolicy and
  508. // implements the SelectedHost interface
  509. type selectedHostPoolHost struct {
  510. policy *hostPoolHostPolicy
  511. info *HostInfo
  512. hostR hostpool.HostPoolResponse
  513. }
  514. func (host selectedHostPoolHost) Info() *HostInfo {
  515. return host.info
  516. }
  517. func (host selectedHostPoolHost) Mark(err error) {
  518. ip := host.info.ConnectAddress().String()
  519. host.policy.mu.RLock()
  520. defer host.policy.mu.RUnlock()
  521. if _, ok := host.policy.hostMap[ip]; !ok {
  522. // host was removed between pick and mark
  523. return
  524. }
  525. host.hostR.Mark(err)
  526. }
  527. type dcAwareRR struct {
  528. local string
  529. pos uint32
  530. mu sync.RWMutex
  531. localHosts cowHostList
  532. remoteHosts cowHostList
  533. }
  534. // DCAwareRoundRobinPolicy is a host selection policies which will prioritize and
  535. // return hosts which are in the local datacentre before returning hosts in all
  536. // other datercentres
  537. func DCAwareRoundRobinPolicy(localDC string) HostSelectionPolicy {
  538. return &dcAwareRR{local: localDC}
  539. }
  540. func (r *dcAwareRR) Init(*Session) {}
  541. func (r *dcAwareRR) KeyspaceChanged(KeyspaceUpdateEvent) {}
  542. func (d *dcAwareRR) SetPartitioner(p string) {}
  543. func (d *dcAwareRR) AddHost(host *HostInfo) {
  544. if host.DataCenter() == d.local {
  545. d.localHosts.add(host)
  546. } else {
  547. d.remoteHosts.add(host)
  548. }
  549. }
  550. func (d *dcAwareRR) RemoveHost(host *HostInfo) {
  551. if host.DataCenter() == d.local {
  552. d.localHosts.remove(host.ConnectAddress())
  553. } else {
  554. d.remoteHosts.remove(host.ConnectAddress())
  555. }
  556. }
  557. func (d *dcAwareRR) HostUp(host *HostInfo) { d.AddHost(host) }
  558. func (d *dcAwareRR) HostDown(host *HostInfo) { d.RemoveHost(host) }
  559. func (d *dcAwareRR) Pick(q ExecutableQuery) NextHost {
  560. var i int
  561. return func() SelectedHost {
  562. var hosts []*HostInfo
  563. localHosts := d.localHosts.get()
  564. remoteHosts := d.remoteHosts.get()
  565. if len(localHosts) != 0 {
  566. hosts = localHosts
  567. } else {
  568. hosts = remoteHosts
  569. }
  570. if len(hosts) == 0 {
  571. return nil
  572. }
  573. // always increment pos to evenly distribute traffic in case of
  574. // failures
  575. pos := atomic.AddUint32(&d.pos, 1) - 1
  576. if i >= len(localHosts)+len(remoteHosts) {
  577. return nil
  578. }
  579. host := hosts[(pos)%uint32(len(hosts))]
  580. i++
  581. return (*selectedHost)(host)
  582. }
  583. }