policies.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616
  1. // Copyright (c) 2012 The gocql Authors. All rights reserved.
  2. // Use of this source code is governed by a BSD-style
  3. // license that can be found in the LICENSE file.
  4. //This file will be the future home for more policies
  5. package gocql
  6. import (
  7. "fmt"
  8. "math"
  9. "math/rand"
  10. "net"
  11. "sync"
  12. "sync/atomic"
  13. "time"
  14. "github.com/hailocab/go-hostpool"
  15. )
// cowHostList implements a copy on write host list, its equivalent type is []*HostInfo.
type cowHostList struct {
	// list holds the current snapshot; the methods of this type store it as a
	// *[]*HostInfo and get() reads it back with that type assertion.
	list atomic.Value

	// mu is taken by every method of this type that stores into list.
	mu sync.Mutex
}
  21. func (c *cowHostList) String() string {
  22. return fmt.Sprintf("%+v", c.get())
  23. }
  24. func (c *cowHostList) get() []*HostInfo {
  25. // TODO(zariel): should we replace this with []*HostInfo?
  26. l, ok := c.list.Load().(*[]*HostInfo)
  27. if !ok {
  28. return nil
  29. }
  30. return *l
  31. }
  32. func (c *cowHostList) set(list []*HostInfo) {
  33. c.mu.Lock()
  34. c.list.Store(&list)
  35. c.mu.Unlock()
  36. }
  37. // add will add a host if it not already in the list
  38. func (c *cowHostList) add(host *HostInfo) bool {
  39. c.mu.Lock()
  40. l := c.get()
  41. if n := len(l); n == 0 {
  42. l = []*HostInfo{host}
  43. } else {
  44. newL := make([]*HostInfo, n+1)
  45. for i := 0; i < n; i++ {
  46. if host.Equal(l[i]) {
  47. c.mu.Unlock()
  48. return false
  49. }
  50. newL[i] = l[i]
  51. }
  52. newL[n] = host
  53. l = newL
  54. }
  55. c.list.Store(&l)
  56. c.mu.Unlock()
  57. return true
  58. }
  59. func (c *cowHostList) update(host *HostInfo) {
  60. c.mu.Lock()
  61. l := c.get()
  62. if len(l) == 0 {
  63. c.mu.Unlock()
  64. return
  65. }
  66. found := false
  67. newL := make([]*HostInfo, len(l))
  68. for i := range l {
  69. if host.Equal(l[i]) {
  70. newL[i] = host
  71. found = true
  72. } else {
  73. newL[i] = l[i]
  74. }
  75. }
  76. if found {
  77. c.list.Store(&newL)
  78. }
  79. c.mu.Unlock()
  80. }
  81. func (c *cowHostList) remove(ip net.IP) bool {
  82. c.mu.Lock()
  83. l := c.get()
  84. size := len(l)
  85. if size == 0 {
  86. c.mu.Unlock()
  87. return false
  88. }
  89. found := false
  90. newL := make([]*HostInfo, 0, size)
  91. for i := 0; i < len(l); i++ {
  92. if !l[i].ConnectAddress().Equal(ip) {
  93. newL = append(newL, l[i])
  94. } else {
  95. found = true
  96. }
  97. }
  98. if !found {
  99. c.mu.Unlock()
  100. return false
  101. }
  102. newL = newL[:size-1 : size-1]
  103. c.list.Store(&newL)
  104. c.mu.Unlock()
  105. return true
  106. }
// RetryableQuery is an interface that represents a query or batch statement that
// exposes the correct functions for the retry policy logic to evaluate correctly.
type RetryableQuery interface {
	// Attempts is the count the retry policies in this file compare against
	// their NumRetries setting.
	Attempts() int

	// GetConsistency reports a Consistency value; presumably the consistency
	// level of the query — confirm against the implementations.
	GetConsistency() Consistency
}
// RetryPolicy interface is used by gocql to determine if a query can be attempted
// again after a retryable error has been received. The interface allows gocql
// users to implement their own logic to determine if a query can be attempted
// again.
//
// See SimpleRetryPolicy as an example of implementing and using a RetryPolicy
// interface.
type RetryPolicy interface {
	// Attempt reports whether the given query should be attempted again.
	Attempt(RetryableQuery) bool
}
// SimpleRetryPolicy has simple logic for attempting a query a fixed number of times.
//
// See below for examples of usage:
//
//	//Assign to the cluster
//	cluster.RetryPolicy = &gocql.SimpleRetryPolicy{NumRetries: 3}
//
//	//Assign to a query
//	query.RetryPolicy(&gocql.SimpleRetryPolicy{NumRetries: 1})
type SimpleRetryPolicy struct {
	NumRetries int //Number of times to retry a query
}
  136. // Attempt tells gocql to attempt the query again based on query.Attempts being less
  137. // than the NumRetries defined in the policy.
  138. func (s *SimpleRetryPolicy) Attempt(q RetryableQuery) bool {
  139. return q.Attempts() <= s.NumRetries
  140. }
// ExponentialBackoffRetryPolicy sleeps between attempts.
type ExponentialBackoffRetryPolicy struct {
	// NumRetries is the attempt count above which Attempt stops retrying.
	NumRetries int

	// Min scales the backoff and Max caps it; napTime substitutes 100ms and
	// 10s respectively when a value is not positive.
	Min, Max time.Duration
}
  146. func (e *ExponentialBackoffRetryPolicy) Attempt(q RetryableQuery) bool {
  147. if q.Attempts() > e.NumRetries {
  148. return false
  149. }
  150. time.Sleep(e.napTime(q.Attempts()))
  151. return true
  152. }
  153. func (e *ExponentialBackoffRetryPolicy) napTime(attempts int) time.Duration {
  154. if e.Min <= 0 {
  155. e.Min = 100 * time.Millisecond
  156. }
  157. if e.Max <= 0 {
  158. e.Max = 10 * time.Second
  159. }
  160. minFloat := float64(e.Min)
  161. napDuration := minFloat * math.Pow(2, float64(attempts-1))
  162. // add some jitter
  163. napDuration += rand.Float64()*minFloat - (minFloat / 2)
  164. if napDuration > float64(e.Max) {
  165. return time.Duration(e.Max)
  166. }
  167. return time.Duration(napDuration)
  168. }
// HostStateNotifier is the set of host lifecycle callbacks implemented by the
// host selection policies in this file. In each of those policies HostUp
// delegates to AddHost and HostDown delegates to RemoveHost.
type HostStateNotifier interface {
	AddHost(host *HostInfo)
	RemoveHost(host *HostInfo)
	HostUp(host *HostInfo)
	HostDown(host *HostInfo)
}
// HostSelectionPolicy is an interface for selecting
// the most appropriate host to execute a given query.
type HostSelectionPolicy interface {
	HostStateNotifier
	// SetPartitioner is an interface declared outside this section of the
	// file; the policies here satisfy it with a SetPartitioner(string) method.
	SetPartitioner
	//Pick returns an iteration function over selected hosts
	Pick(ExecutableQuery) NextHost
}
// SelectedHost is an interface returned when picking a host from a host
// selection policy.
type SelectedHost interface {
	// Info returns the HostInfo of the selected host.
	Info() *HostInfo
	// Mark passes an error value back to the policy that selected the host.
	// Of the implementations in this file, only the host-pool one acts on it.
	Mark(error)
}
  189. type selectedHost HostInfo
  190. func (host *selectedHost) Info() *HostInfo {
  191. return (*HostInfo)(host)
  192. }
  193. func (host *selectedHost) Mark(err error) {}
// NextHost is an iteration function over picked hosts. The iterators built in
// this file return nil when they have no host to offer.
type NextHost func() SelectedHost
  196. // RoundRobinHostPolicy is a round-robin load balancing policy, where each host
  197. // is tried sequentially for each query.
  198. func RoundRobinHostPolicy() HostSelectionPolicy {
  199. return &roundRobinHostPolicy{}
  200. }
// roundRobinHostPolicy is the policy returned by RoundRobinHostPolicy.
type roundRobinHostPolicy struct {
	// hosts is the list Pick rotates through.
	hosts cowHostList

	// pos is the rotation counter; Pick advances it with atomic.AddUint32.
	pos uint32

	// mu is not referenced by any method visible in this section of the file.
	mu sync.RWMutex
}
// SetPartitioner does nothing; this policy ignores the partitioner name.
func (r *roundRobinHostPolicy) SetPartitioner(partitioner string) {
	// noop
}
  209. func (r *roundRobinHostPolicy) Pick(qry ExecutableQuery) NextHost {
  210. // i is used to limit the number of attempts to find a host
  211. // to the number of hosts known to this policy
  212. var i int
  213. return func() SelectedHost {
  214. hosts := r.hosts.get()
  215. if len(hosts) == 0 {
  216. return nil
  217. }
  218. // always increment pos to evenly distribute traffic in case of
  219. // failures
  220. pos := atomic.AddUint32(&r.pos, 1) - 1
  221. if i >= len(hosts) {
  222. return nil
  223. }
  224. host := hosts[(pos)%uint32(len(hosts))]
  225. i++
  226. return (*selectedHost)(host)
  227. }
  228. }
// AddHost adds host to the rotation list. The result of the underlying add
// (false when the host was already present) is discarded.
func (r *roundRobinHostPolicy) AddHost(host *HostInfo) {
	r.hosts.add(host)
}
// RemoveHost removes the entries matching host's connect address from the
// rotation list. Whether anything was removed is not reported.
func (r *roundRobinHostPolicy) RemoveHost(host *HostInfo) {
	r.hosts.remove(host.ConnectAddress())
}
// HostUp treats a host coming up the same as a newly added host.
func (r *roundRobinHostPolicy) HostUp(host *HostInfo) {
	r.AddHost(host)
}
// HostDown treats a host going down the same as a removed host.
func (r *roundRobinHostPolicy) HostDown(host *HostInfo) {
	r.RemoveHost(host)
}
  241. // TokenAwareHostPolicy is a token aware host selection policy, where hosts are
  242. // selected based on the partition key, so queries are sent to the host which
  243. // owns the partition. Fallback is used when routing information is not available.
  244. func TokenAwareHostPolicy(fallback HostSelectionPolicy) HostSelectionPolicy {
  245. return &tokenAwareHostPolicy{fallback: fallback}
  246. }
// tokenAwareHostPolicy is the policy returned by TokenAwareHostPolicy.
type tokenAwareHostPolicy struct {
	// hosts is the host list the token ring is built from.
	hosts cowHostList

	// mu is write-locked by SetPartitioner, AddHost and RemoveHost and
	// read-locked by Pick while it consults tokenRing.
	mu sync.RWMutex

	// partitioner is the partitioner name; empty until SetPartitioner is called.
	partitioner string

	// tokenRing is rebuilt by resetTokenRing from partitioner and hosts.
	tokenRing *tokenRing

	// fallback receives every host/partitioner notification as well and is
	// used by Pick when no token-based host can be chosen.
	fallback HostSelectionPolicy
}
  254. func (t *tokenAwareHostPolicy) SetPartitioner(partitioner string) {
  255. t.mu.Lock()
  256. defer t.mu.Unlock()
  257. if t.partitioner != partitioner {
  258. t.fallback.SetPartitioner(partitioner)
  259. t.partitioner = partitioner
  260. t.resetTokenRing()
  261. }
  262. }
// AddHost adds host to this policy's list and to the fallback policy, then
// rebuilds the token ring. The whole sequence runs under the write lock.
func (t *tokenAwareHostPolicy) AddHost(host *HostInfo) {
	t.mu.Lock()
	defer t.mu.Unlock()
	t.hosts.add(host)
	t.fallback.AddHost(host)
	// the ring is rebuilt whether or not add reported a new host
	t.resetTokenRing()
}
// RemoveHost removes host (matched by connect address) from this policy's
// list and from the fallback policy, then rebuilds the token ring. The whole
// sequence runs under the write lock.
func (t *tokenAwareHostPolicy) RemoveHost(host *HostInfo) {
	t.mu.Lock()
	defer t.mu.Unlock()
	t.hosts.remove(host.ConnectAddress())
	t.fallback.RemoveHost(host)
	// the ring is rebuilt whether or not remove found the host
	t.resetTokenRing()
}
// HostUp treats a host coming up the same as a newly added host.
func (t *tokenAwareHostPolicy) HostUp(host *HostInfo) {
	t.AddHost(host)
}
// HostDown treats a host going down the same as a removed host.
func (t *tokenAwareHostPolicy) HostDown(host *HostInfo) {
	t.RemoveHost(host)
}
  283. func (t *tokenAwareHostPolicy) resetTokenRing() {
  284. if t.partitioner == "" {
  285. // partitioner not yet set
  286. return
  287. }
  288. // create a new token ring
  289. hosts := t.hosts.get()
  290. tokenRing, err := newTokenRing(t.partitioner, hosts)
  291. if err != nil {
  292. Logger.Printf("Unable to update the token ring due to error: %s", err)
  293. return
  294. }
  295. // replace the token ring
  296. t.tokenRing = tokenRing
  297. }
  298. func (t *tokenAwareHostPolicy) Pick(qry ExecutableQuery) NextHost {
  299. if qry == nil {
  300. return t.fallback.Pick(qry)
  301. }
  302. routingKey, err := qry.GetRoutingKey()
  303. if err != nil {
  304. return t.fallback.Pick(qry)
  305. }
  306. if routingKey == nil {
  307. return t.fallback.Pick(qry)
  308. }
  309. t.mu.RLock()
  310. // TODO retrieve a list of hosts based on the replication strategy
  311. host := t.tokenRing.GetHostForPartitionKey(routingKey)
  312. t.mu.RUnlock()
  313. if host == nil {
  314. return t.fallback.Pick(qry)
  315. }
  316. // scope these variables for the same lifetime as the iterator function
  317. var (
  318. hostReturned bool
  319. fallbackIter NextHost
  320. )
  321. return func() SelectedHost {
  322. if !hostReturned {
  323. hostReturned = true
  324. return (*selectedHost)(host)
  325. }
  326. // fallback
  327. if fallbackIter == nil {
  328. fallbackIter = t.fallback.Pick(qry)
  329. }
  330. fallbackHost := fallbackIter()
  331. // filter the token aware selected hosts from the fallback hosts
  332. if fallbackHost != nil && fallbackHost.Info() == host {
  333. fallbackHost = fallbackIter()
  334. }
  335. return fallbackHost
  336. }
  337. }
  338. // HostPoolHostPolicy is a host policy which uses the bitly/go-hostpool library
  339. // to distribute queries between hosts and prevent sending queries to
  340. // unresponsive hosts. When creating the host pool that is passed to the policy
  341. // use an empty slice of hosts as the hostpool will be populated later by gocql.
  342. // See below for examples of usage:
  343. //
  344. // // Create host selection policy using a simple host pool
  345. // cluster.PoolConfig.HostSelectionPolicy = HostPoolHostPolicy(hostpool.New(nil))
  346. //
  347. // // Create host selection policy using an epsilon greedy pool
  348. // cluster.PoolConfig.HostSelectionPolicy = HostPoolHostPolicy(
  349. // hostpool.NewEpsilonGreedy(nil, 0, &hostpool.LinearEpsilonValueCalculator{}),
  350. // )
  351. //
  352. func HostPoolHostPolicy(hp hostpool.HostPool) HostSelectionPolicy {
  353. return &hostPoolHostPolicy{hostMap: map[string]*HostInfo{}, hp: hp}
  354. }
// hostPoolHostPolicy is the policy returned by HostPoolHostPolicy.
type hostPoolHostPolicy struct {
	// hp is the host pool that chooses among the known addresses.
	hp hostpool.HostPool

	// mu guards hostMap and the calls into hp made by this type's methods.
	mu sync.RWMutex

	// hostMap maps a host's connect address (as a string) to its HostInfo.
	hostMap map[string]*HostInfo
}
  360. func (r *hostPoolHostPolicy) SetHosts(hosts []*HostInfo) {
  361. peers := make([]string, len(hosts))
  362. hostMap := make(map[string]*HostInfo, len(hosts))
  363. for i, host := range hosts {
  364. ip := host.ConnectAddress().String()
  365. peers[i] = ip
  366. hostMap[ip] = host
  367. }
  368. r.mu.Lock()
  369. r.hp.SetHosts(peers)
  370. r.hostMap = hostMap
  371. r.mu.Unlock()
  372. }
  373. func (r *hostPoolHostPolicy) AddHost(host *HostInfo) {
  374. ip := host.ConnectAddress().String()
  375. r.mu.Lock()
  376. defer r.mu.Unlock()
  377. // If the host addr is present and isn't nil return
  378. if h, ok := r.hostMap[ip]; ok && h != nil {
  379. return
  380. }
  381. // otherwise, add the host to the map
  382. r.hostMap[ip] = host
  383. // and construct a new peer list to give to the HostPool
  384. hosts := make([]string, 0, len(r.hostMap))
  385. for addr := range r.hostMap {
  386. hosts = append(hosts, addr)
  387. }
  388. r.hp.SetHosts(hosts)
  389. }
  390. func (r *hostPoolHostPolicy) RemoveHost(host *HostInfo) {
  391. ip := host.ConnectAddress().String()
  392. r.mu.Lock()
  393. defer r.mu.Unlock()
  394. if _, ok := r.hostMap[ip]; !ok {
  395. return
  396. }
  397. delete(r.hostMap, ip)
  398. hosts := make([]string, 0, len(r.hostMap))
  399. for _, host := range r.hostMap {
  400. hosts = append(hosts, host.ConnectAddress().String())
  401. }
  402. r.hp.SetHosts(hosts)
  403. }
// HostUp treats a host coming up the same as a newly added host.
func (r *hostPoolHostPolicy) HostUp(host *HostInfo) {
	r.AddHost(host)
}
// HostDown treats a host going down the same as a removed host.
func (r *hostPoolHostPolicy) HostDown(host *HostInfo) {
	r.RemoveHost(host)
}
// SetPartitioner does nothing; this policy ignores the partitioner name.
func (r *hostPoolHostPolicy) SetPartitioner(partitioner string) {
	// noop
}
  413. func (r *hostPoolHostPolicy) Pick(qry ExecutableQuery) NextHost {
  414. return func() SelectedHost {
  415. r.mu.RLock()
  416. defer r.mu.RUnlock()
  417. if len(r.hostMap) == 0 {
  418. return nil
  419. }
  420. hostR := r.hp.Get()
  421. host, ok := r.hostMap[hostR.Host()]
  422. if !ok {
  423. return nil
  424. }
  425. return selectedHostPoolHost{
  426. policy: r,
  427. info: host,
  428. hostR: hostR,
  429. }
  430. }
  431. }
// selectedHostPoolHost is a host returned by the hostPoolHostPolicy and
// implements the SelectedHost interface
type selectedHostPoolHost struct {
	// policy is the policy that produced this selection; Mark consults its
	// host map.
	policy *hostPoolHostPolicy

	// info is the selected host.
	info *HostInfo

	// hostR is the host pool's response for this selection; Mark forwards
	// the error to it.
	hostR hostpool.HostPoolResponse
}
// Info returns the HostInfo stored for the selected host.
func (host selectedHostPoolHost) Info() *HostInfo {
	return host.info
}
  442. func (host selectedHostPoolHost) Mark(err error) {
  443. ip := host.info.ConnectAddress().String()
  444. host.policy.mu.RLock()
  445. defer host.policy.mu.RUnlock()
  446. if _, ok := host.policy.hostMap[ip]; !ok {
  447. // host was removed between pick and mark
  448. return
  449. }
  450. host.hostR.Mark(err)
  451. }
// dcAwareRR is the policy returned by DCAwareRoundRobinPolicy.
type dcAwareRR struct {
	// local is the datacentre name that host.DataCenter() is compared with
	// to classify a host as local.
	local string

	// pos is the rotation counter; Pick advances it with atomic.AddUint32.
	pos uint32

	// mu is not referenced by any method visible in this section of the file.
	mu sync.RWMutex

	// localHosts holds the hosts whose datacentre equals local.
	localHosts cowHostList

	// remoteHosts holds all other hosts.
	remoteHosts cowHostList
}
  459. // DCAwareRoundRobinPolicy is a host selection policies which will prioritize and
  460. // return hosts which are in the local datacentre before returning hosts in all
  461. // other datercentres
  462. func DCAwareRoundRobinPolicy(localDC string) HostSelectionPolicy {
  463. return &dcAwareRR{
  464. local: localDC,
  465. }
  466. }
  467. func (d *dcAwareRR) AddHost(host *HostInfo) {
  468. if host.DataCenter() == d.local {
  469. d.localHosts.add(host)
  470. } else {
  471. d.remoteHosts.add(host)
  472. }
  473. }
  474. func (d *dcAwareRR) RemoveHost(host *HostInfo) {
  475. if host.DataCenter() == d.local {
  476. d.localHosts.remove(host.ConnectAddress())
  477. } else {
  478. d.remoteHosts.remove(host.ConnectAddress())
  479. }
  480. }
// HostUp treats a host coming up the same as a newly added host.
func (d *dcAwareRR) HostUp(host *HostInfo) {
	d.AddHost(host)
}
// HostDown treats a host going down the same as a removed host.
func (d *dcAwareRR) HostDown(host *HostInfo) {
	d.RemoveHost(host)
}
// SetPartitioner does nothing; this policy ignores the partitioner name.
func (d *dcAwareRR) SetPartitioner(p string) {}
  488. func (d *dcAwareRR) Pick(q ExecutableQuery) NextHost {
  489. var i int
  490. return func() SelectedHost {
  491. var hosts []*HostInfo
  492. localHosts := d.localHosts.get()
  493. remoteHosts := d.remoteHosts.get()
  494. if len(localHosts) != 0 {
  495. hosts = localHosts
  496. } else {
  497. hosts = remoteHosts
  498. }
  499. if len(hosts) == 0 {
  500. return nil
  501. }
  502. // always increment pos to evenly distribute traffic in case of
  503. // failures
  504. pos := atomic.AddUint32(&d.pos, 1) - 1
  505. if i >= len(localHosts)+len(remoteHosts) {
  506. return nil
  507. }
  508. host := hosts[(pos)%uint32(len(hosts))]
  509. i++
  510. return (*selectedHost)(host)
  511. }
  512. }