conn.go 17 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786
  1. // Copyright (c) 2012 The gocql Authors. All rights reserved.
  2. // Use of this source code is governed by a BSD-style
  3. // license that can be found in the LICENSE file.
  4. package gocql
  5. import (
  6. "bufio"
  7. "crypto/tls"
  8. "errors"
  9. "fmt"
  10. "io"
  11. "log"
  12. "net"
  13. "strconv"
  14. "strings"
  15. "sync"
  16. "sync/atomic"
  17. "time"
  18. )
  // JoinHostPort returns an address string of the form "host:port" that can be
  // used by gocql.Conn to form a connection with a host.
  //
  // Surrounding whitespace is trimmed from addr. If addr already parses as a
  // host:port pair it is returned unchanged; otherwise port is appended with
  // net.JoinHostPort, which brackets IPv6 literals as required. An IPv6 literal
  // that is already bracketed but carries no port (for example "[::1]") has its
  // brackets stripped first so that they are not doubled.
  func JoinHostPort(addr string, port int) string {
  	addr = strings.TrimSpace(addr)
  	if _, _, err := net.SplitHostPort(addr); err == nil {
  		// Already a complete host:port pair.
  		return addr
  	}
  	if n := len(addr); n >= 2 && addr[0] == '[' && addr[n-1] == ']' {
  		// net.JoinHostPort adds its own brackets around anything containing
  		// a colon, so hand it the bare literal.
  		addr = addr[1 : n-1]
  	}
  	return net.JoinHostPort(addr, strconv.Itoa(port))
  }
  // Authenticator drives the client side of the authentication exchange that
  // runs while a connection is being started.
  type Authenticator interface {
  	// Challenge is handed the data sent by the server (initially the name of
  	// the authenticator class the server asked for, afterwards the payload
  	// of each challenge) and returns the response to send back together
  	// with the Authenticator that should handle the rest of the exchange.
  	Challenge(req []byte) (resp []byte, auth Authenticator, err error)

  	// Success is handed the data carried by the server's final
  	// authentication-success message.
  	Success(data []byte) error
  }
  // PasswordAuthenticator holds the credentials used to answer a
  // username/password authentication request.
  type PasswordAuthenticator struct {
  	Username, Password string
  }
  36. func (p PasswordAuthenticator) Challenge(req []byte) ([]byte, Authenticator, error) {
  37. if string(req) != "org.apache.cassandra.auth.PasswordAuthenticator" {
  38. return nil, nil, fmt.Errorf("unexpected authenticator %q", req)
  39. }
  40. resp := make([]byte, 2+len(p.Username)+len(p.Password))
  41. resp[0] = 0
  42. copy(resp[1:], p.Username)
  43. resp[len(p.Username)+1] = 0
  44. copy(resp[2+len(p.Username):], p.Password)
  45. return resp, nil, nil
  46. }
  47. func (p PasswordAuthenticator) Success(data []byte) error {
  48. return nil
  49. }
  // SslOptions configures TLS for connections. It embeds tls.Config, so the
  // standard TLS settings can be set directly on it.
  type SslOptions struct {
  	tls.Config

  	// CertPath and KeyPath are optional depending on the server
  	// configuration. Leave both empty to avoid using a client certificate.
  	CertPath, KeyPath string

  	// CaPath is optional depending on the server configuration.
  	CaPath string

  	// EnableHostVerification should be turned on to verify the hostname and
  	// the server certificate (for example a wildcard certificate for a
  	// Cassandra cluster). It is basically the inverse of InsecureSkipVerify;
  	// see http://golang.org/pkg/crypto/tls/ for details on that option.
  	EnableHostVerification bool
  }
  63. type ConnConfig struct {
  64. ProtoVersion int
  65. CQLVersion string
  66. Timeout time.Duration
  67. NumStreams int
  68. Compressor Compressor
  69. Authenticator Authenticator
  70. Keepalive time.Duration
  71. tlsConfig *tls.Config
  72. }
  73. type ConnErrorHandler interface {
  74. HandleError(conn *Conn, err error, closed bool)
  75. }
  // TimeoutLimit is how many timeouts are allowed to occur on a connection
  // before it is closed and restarted. It prevents a single query timeout from
  // killing a connection that may be serving other queries just fine.
  //
  // The default is 10. It must not be changed concurrently with queries.
  var TimeoutLimit = int64(10)
  81. // Conn is a single connection to a Cassandra node. It can be used to execute
  82. // queries, but users are usually advised to use a more reliable, higher
  83. // level API.
  84. type Conn struct {
  85. conn net.Conn
  86. r *bufio.Reader
  87. timeout time.Duration
  88. headerBuf []byte
  89. uniq chan int
  90. calls []callReq
  91. errorHandler ConnErrorHandler
  92. compressor Compressor
  93. auth Authenticator
  94. addr string
  95. version uint8
  96. currentKeyspace string
  97. started bool
  98. closed int32
  99. quit chan struct{}
  100. timeouts int64
  101. }
  102. // Connect establishes a connection to a Cassandra node.
  103. // You must also call the Serve method before you can execute any queries.
  104. func Connect(addr string, cfg ConnConfig, errorHandler ConnErrorHandler) (*Conn, error) {
  105. var (
  106. err error
  107. conn net.Conn
  108. )
  109. dialer := &net.Dialer{
  110. Timeout: cfg.Timeout,
  111. }
  112. if cfg.tlsConfig != nil {
  113. // the TLS config is safe to be reused by connections but it must not
  114. // be modified after being used.
  115. conn, err = tls.DialWithDialer(dialer, "tcp", addr, cfg.tlsConfig)
  116. } else {
  117. conn, err = dialer.Dial("tcp", addr)
  118. }
  119. if err != nil {
  120. return nil, err
  121. }
  122. // going to default to proto 2
  123. if cfg.ProtoVersion < protoVersion1 || cfg.ProtoVersion > protoVersion3 {
  124. log.Printf("unsupported protocol version: %d using 2\n", cfg.ProtoVersion)
  125. cfg.ProtoVersion = 2
  126. }
  127. headerSize := 8
  128. maxStreams := 128
  129. if cfg.ProtoVersion > protoVersion2 {
  130. maxStreams = 32768
  131. headerSize = 9
  132. }
  133. if cfg.NumStreams <= 0 || cfg.NumStreams > maxStreams {
  134. cfg.NumStreams = maxStreams
  135. }
  136. c := &Conn{
  137. conn: conn,
  138. r: bufio.NewReader(conn),
  139. uniq: make(chan int, cfg.NumStreams),
  140. calls: make([]callReq, cfg.NumStreams),
  141. timeout: cfg.Timeout,
  142. version: uint8(cfg.ProtoVersion),
  143. addr: conn.RemoteAddr().String(),
  144. errorHandler: errorHandler,
  145. compressor: cfg.Compressor,
  146. auth: cfg.Authenticator,
  147. headerBuf: make([]byte, headerSize),
  148. quit: make(chan struct{}),
  149. }
  150. if cfg.Keepalive > 0 {
  151. c.setKeepalive(cfg.Keepalive)
  152. }
  153. for i := 0; i < cfg.NumStreams; i++ {
  154. c.calls[i].resp = make(chan error)
  155. c.uniq <- i
  156. }
  157. go c.serve()
  158. if err := c.startup(&cfg); err != nil {
  159. conn.Close()
  160. return nil, err
  161. }
  162. c.started = true
  163. return c, nil
  164. }
  165. func (c *Conn) Write(p []byte) (int, error) {
  166. if c.timeout > 0 {
  167. c.conn.SetWriteDeadline(time.Now().Add(c.timeout))
  168. }
  169. return c.conn.Write(p)
  170. }
  171. func (c *Conn) Read(p []byte) (n int, err error) {
  172. const maxAttempts = 5
  173. for i := 0; i < maxAttempts; i++ {
  174. var nn int
  175. if c.timeout > 0 {
  176. c.conn.SetReadDeadline(time.Now().Add(c.timeout))
  177. }
  178. nn, err = io.ReadFull(c.r, p[n:])
  179. n += nn
  180. if err == nil {
  181. break
  182. }
  183. if verr, ok := err.(net.Error); !ok || !verr.Temporary() {
  184. break
  185. }
  186. }
  187. return
  188. }
  189. func (c *Conn) startup(cfg *ConnConfig) error {
  190. m := map[string]string{
  191. "CQL_VERSION": cfg.CQLVersion,
  192. }
  193. if c.compressor != nil {
  194. m["COMPRESSION"] = c.compressor.Name()
  195. }
  196. frame, err := c.exec(&writeStartupFrame{opts: m}, nil)
  197. if err != nil {
  198. return err
  199. }
  200. switch v := frame.(type) {
  201. case error:
  202. return v
  203. case *readyFrame:
  204. return nil
  205. case *authenticateFrame:
  206. return c.authenticateHandshake(v)
  207. default:
  208. return NewErrProtocol("Unknown type of response to startup frame: %s", v)
  209. }
  210. }
  211. func (c *Conn) authenticateHandshake(authFrame *authenticateFrame) error {
  212. if c.auth == nil {
  213. return fmt.Errorf("authentication required (using %q)", authFrame.class)
  214. }
  215. resp, challenger, err := c.auth.Challenge([]byte(authFrame.class))
  216. if err != nil {
  217. return err
  218. }
  219. req := &writeAuthResponseFrame{data: resp}
  220. for {
  221. frame, err := c.exec(req, nil)
  222. if err != nil {
  223. return err
  224. }
  225. switch v := frame.(type) {
  226. case error:
  227. return v
  228. case *authSuccessFrame:
  229. if challenger != nil {
  230. return challenger.Success(v.data)
  231. }
  232. return nil
  233. case *authChallengeFrame:
  234. resp, challenger, err = challenger.Challenge(v.data)
  235. if err != nil {
  236. return err
  237. }
  238. req = &writeAuthResponseFrame{
  239. data: resp,
  240. }
  241. default:
  242. return fmt.Errorf("unknown frame response during authentication: %v", v)
  243. }
  244. }
  245. }
  246. func (c *Conn) closeWithError(err error) {
  247. if !atomic.CompareAndSwapInt32(&c.closed, 0, 1) {
  248. return
  249. }
  250. if err != nil {
  251. // we should attempt to deliver the error back to the caller if it
  252. // exists
  253. for id := 0; id < len(c.calls); id++ {
  254. req := &c.calls[id]
  255. // we need to send the error to all waiting queries, put the state
  256. // of this conn into not active so that it can not execute any queries.
  257. if err != nil {
  258. select {
  259. case req.resp <- err:
  260. default:
  261. }
  262. }
  263. }
  264. }
  265. // if error was nil then unblock the quit channel
  266. close(c.quit)
  267. c.conn.Close()
  268. if c.started && err != nil {
  269. c.errorHandler.HandleError(c, err, true)
  270. }
  271. }
  272. func (c *Conn) Close() {
  273. c.closeWithError(nil)
  274. }
  275. // Serve starts the stream multiplexer for this connection, which is required
  276. // to execute any queries. This method runs as long as the connection is
  277. // open and is therefore usually called in a separate goroutine.
  278. func (c *Conn) serve() {
  279. var (
  280. err error
  281. )
  282. for {
  283. err = c.recv()
  284. if err != nil {
  285. break
  286. }
  287. }
  288. c.closeWithError(err)
  289. }
  290. func (c *Conn) recv() error {
  291. // not safe for concurrent reads
  292. // read a full header, ignore timeouts, as this is being ran in a loop
  293. // TODO: TCP level deadlines? or just query level deadlines?
  294. if c.timeout > 0 {
  295. c.conn.SetReadDeadline(time.Time{})
  296. }
  297. // were just reading headers over and over and copy bodies
  298. head, err := readHeader(c.r, c.headerBuf)
  299. if err != nil {
  300. return err
  301. }
  302. call := &c.calls[head.stream]
  303. err = call.framer.readFrame(&head)
  304. if err != nil {
  305. // only net errors should cause the connection to be closed. Though
  306. // cassandra returning corrupt frames will be returned here as well.
  307. if _, ok := err.(net.Error); ok {
  308. return err
  309. }
  310. }
  311. // we either, return a response to the caller, the caller timedout, or the
  312. // connection has closed. Either way we should never block indefinatly here
  313. select {
  314. case call.resp <- err:
  315. case <-call.timeout:
  316. c.releaseStream(head.stream)
  317. case <-c.quit:
  318. }
  319. return nil
  320. }
  321. type callReq struct {
  322. // could use a waitgroup but this allows us to do timeouts on the read/send
  323. resp chan error
  324. framer *framer
  325. timeout chan struct{} // indicates to recv() that a call has timedout
  326. }
  327. func (c *Conn) releaseStream(stream int) {
  328. call := &c.calls[stream]
  329. framerPool.Put(call.framer)
  330. call.framer = nil
  331. select {
  332. case c.uniq <- stream:
  333. case <-c.quit:
  334. }
  335. }
  336. func (c *Conn) handleTimeout() {
  337. if atomic.AddInt64(&c.timeouts, 1) > TimeoutLimit {
  338. c.closeWithError(ErrTooManyTimeouts)
  339. }
  340. }
  341. func (c *Conn) exec(req frameWriter, tracer Tracer) (frame, error) {
  342. // TODO: move tracer onto conn
  343. var stream int
  344. select {
  345. case stream = <-c.uniq:
  346. case <-c.quit:
  347. return nil, ErrConnectionClosed
  348. }
  349. // resp is basically a waiting semaphore protecting the framer
  350. framer := newFramer(c, c, c.compressor, c.version)
  351. call := &c.calls[stream]
  352. call.framer = framer
  353. call.timeout = make(chan struct{})
  354. if tracer != nil {
  355. framer.trace()
  356. }
  357. err := req.writeFrame(framer, stream)
  358. if err != nil {
  359. return nil, err
  360. }
  361. select {
  362. case err := <-call.resp:
  363. // dont release the stream if detect a timeout as another request can reuse
  364. // that stream and get a response for the old request, which we have no
  365. // easy way of detecting.
  366. defer c.releaseStream(stream)
  367. if err != nil {
  368. return nil, err
  369. }
  370. case <-time.After(c.timeout):
  371. close(call.timeout)
  372. c.handleTimeout()
  373. return nil, ErrTimeoutNoResponse
  374. case <-c.quit:
  375. return nil, ErrConnectionClosed
  376. }
  377. if v := framer.header.version.version(); v != c.version {
  378. return nil, NewErrProtocol("unexpected protocol version in response: got %d expected %d", v, c.version)
  379. }
  380. frame, err := framer.parseFrame()
  381. if err != nil {
  382. return nil, err
  383. }
  384. if len(framer.traceID) > 0 {
  385. tracer.Trace(framer.traceID)
  386. }
  387. return frame, nil
  388. }
  389. func (c *Conn) prepareStatement(stmt string, trace Tracer) (*resultPreparedFrame, error) {
  390. stmtsLRU.Lock()
  391. if stmtsLRU.lru == nil {
  392. initStmtsLRU(defaultMaxPreparedStmts)
  393. }
  394. stmtCacheKey := c.addr + c.currentKeyspace + stmt
  395. if val, ok := stmtsLRU.lru.Get(stmtCacheKey); ok {
  396. stmtsLRU.Unlock()
  397. flight := val.(*inflightPrepare)
  398. flight.wg.Wait()
  399. return flight.info, flight.err
  400. }
  401. flight := new(inflightPrepare)
  402. flight.wg.Add(1)
  403. stmtsLRU.lru.Add(stmtCacheKey, flight)
  404. stmtsLRU.Unlock()
  405. prep := &writePrepareFrame{
  406. statement: stmt,
  407. }
  408. resp, err := c.exec(prep, trace)
  409. if err != nil {
  410. flight.err = err
  411. flight.wg.Done()
  412. return nil, err
  413. }
  414. switch x := resp.(type) {
  415. case *resultPreparedFrame:
  416. flight.info = x
  417. case error:
  418. flight.err = x
  419. default:
  420. flight.err = NewErrProtocol("Unknown type in response to prepare frame: %s", x)
  421. }
  422. flight.wg.Done()
  423. if flight.err != nil {
  424. stmtsLRU.Lock()
  425. stmtsLRU.lru.Remove(stmtCacheKey)
  426. stmtsLRU.Unlock()
  427. }
  428. return flight.info, flight.err
  429. }
  430. func (c *Conn) executeQuery(qry *Query) *Iter {
  431. params := queryParams{
  432. consistency: qry.cons,
  433. }
  434. // frame checks that it is not 0
  435. params.serialConsistency = qry.serialCons
  436. params.defaultTimestamp = qry.defaultTimestamp
  437. if len(qry.pageState) > 0 {
  438. params.pagingState = qry.pageState
  439. }
  440. if qry.pageSize > 0 {
  441. params.pageSize = qry.pageSize
  442. }
  443. var frame frameWriter
  444. if qry.shouldPrepare() {
  445. // Prepare all DML queries. Other queries can not be prepared.
  446. info, err := c.prepareStatement(qry.stmt, qry.trace)
  447. if err != nil {
  448. return &Iter{err: err}
  449. }
  450. var values []interface{}
  451. if qry.binding == nil {
  452. values = qry.values
  453. } else {
  454. binding := &QueryInfo{
  455. Id: info.preparedID,
  456. Args: info.reqMeta.columns,
  457. Rval: info.respMeta.columns,
  458. }
  459. values, err = qry.binding(binding)
  460. if err != nil {
  461. return &Iter{err: err}
  462. }
  463. }
  464. if len(values) != len(info.reqMeta.columns) {
  465. return &Iter{err: ErrQueryArgLength}
  466. }
  467. params.values = make([]queryValues, len(values))
  468. for i := 0; i < len(values); i++ {
  469. val, err := Marshal(info.reqMeta.columns[i].TypeInfo, values[i])
  470. if err != nil {
  471. return &Iter{err: err}
  472. }
  473. v := &params.values[i]
  474. v.value = val
  475. // TODO: handle query binding names
  476. }
  477. frame = &writeExecuteFrame{
  478. preparedID: info.preparedID,
  479. params: params,
  480. }
  481. } else {
  482. frame = &writeQueryFrame{
  483. statement: qry.stmt,
  484. params: params,
  485. }
  486. }
  487. resp, err := c.exec(frame, qry.trace)
  488. if err != nil {
  489. return &Iter{err: err}
  490. }
  491. switch x := resp.(type) {
  492. case *resultVoidFrame:
  493. return &Iter{}
  494. case *resultRowsFrame:
  495. iter := &Iter{
  496. meta: x.meta,
  497. rows: x.rows,
  498. }
  499. if len(x.meta.pagingState) > 0 {
  500. iter.next = &nextIter{
  501. qry: *qry,
  502. pos: int((1 - qry.prefetch) * float64(len(iter.rows))),
  503. }
  504. iter.next.qry.pageState = x.meta.pagingState
  505. if iter.next.pos < 1 {
  506. iter.next.pos = 1
  507. }
  508. }
  509. return iter
  510. case *resultKeyspaceFrame, *resultSchemaChangeFrame:
  511. return &Iter{}
  512. case *RequestErrUnprepared:
  513. stmtsLRU.Lock()
  514. stmtCacheKey := c.addr + c.currentKeyspace + qry.stmt
  515. if _, ok := stmtsLRU.lru.Get(stmtCacheKey); ok {
  516. stmtsLRU.lru.Remove(stmtCacheKey)
  517. stmtsLRU.Unlock()
  518. return c.executeQuery(qry)
  519. }
  520. stmtsLRU.Unlock()
  521. return &Iter{err: x}
  522. case error:
  523. return &Iter{err: x}
  524. default:
  525. return &Iter{err: NewErrProtocol("Unknown type in response to execute query: %s", x)}
  526. }
  527. }
  528. func (c *Conn) Pick(qry *Query) *Conn {
  529. if c.Closed() {
  530. return nil
  531. }
  532. return c
  533. }
  534. func (c *Conn) Closed() bool {
  535. return atomic.LoadInt32(&c.closed) == 1
  536. }
  537. func (c *Conn) Address() string {
  538. return c.addr
  539. }
  540. func (c *Conn) AvailableStreams() int {
  541. return len(c.uniq)
  542. }
  543. func (c *Conn) UseKeyspace(keyspace string) error {
  544. q := &writeQueryFrame{statement: `USE "` + keyspace + `"`}
  545. q.params.consistency = Any
  546. resp, err := c.exec(q, nil)
  547. if err != nil {
  548. return err
  549. }
  550. switch x := resp.(type) {
  551. case *resultKeyspaceFrame:
  552. case error:
  553. return x
  554. default:
  555. return NewErrProtocol("unknown frame in response to USE: %v", x)
  556. }
  557. c.currentKeyspace = keyspace
  558. return nil
  559. }
  560. func (c *Conn) executeBatch(batch *Batch) error {
  561. if c.version == protoVersion1 {
  562. return ErrUnsupported
  563. }
  564. n := len(batch.Entries)
  565. req := &writeBatchFrame{
  566. typ: batch.Type,
  567. statements: make([]batchStatment, n),
  568. consistency: batch.Cons,
  569. serialConsistency: batch.serialCons,
  570. defaultTimestamp: batch.defaultTimestamp,
  571. }
  572. stmts := make(map[string]string)
  573. for i := 0; i < n; i++ {
  574. entry := &batch.Entries[i]
  575. b := &req.statements[i]
  576. if len(entry.Args) > 0 || entry.binding != nil {
  577. info, err := c.prepareStatement(entry.Stmt, nil)
  578. if err != nil {
  579. return err
  580. }
  581. var args []interface{}
  582. if entry.binding == nil {
  583. args = entry.Args
  584. } else {
  585. binding := &QueryInfo{
  586. Id: info.preparedID,
  587. Args: info.reqMeta.columns,
  588. Rval: info.respMeta.columns,
  589. }
  590. args, err = entry.binding(binding)
  591. if err != nil {
  592. return err
  593. }
  594. }
  595. if len(args) != len(info.reqMeta.columns) {
  596. return ErrQueryArgLength
  597. }
  598. b.preparedID = info.preparedID
  599. stmts[string(info.preparedID)] = entry.Stmt
  600. b.values = make([]queryValues, len(info.reqMeta.columns))
  601. for j := 0; j < len(info.reqMeta.columns); j++ {
  602. val, err := Marshal(info.reqMeta.columns[j].TypeInfo, args[j])
  603. if err != nil {
  604. return err
  605. }
  606. b.values[j].value = val
  607. // TODO: add names
  608. }
  609. } else {
  610. b.statement = entry.Stmt
  611. }
  612. }
  613. // TODO: should batch support tracing?
  614. resp, err := c.exec(req, nil)
  615. if err != nil {
  616. return err
  617. }
  618. switch x := resp.(type) {
  619. case *resultVoidFrame:
  620. return nil
  621. case *RequestErrUnprepared:
  622. stmt, found := stmts[string(x.StatementId)]
  623. if found {
  624. stmtsLRU.Lock()
  625. stmtsLRU.lru.Remove(c.addr + c.currentKeyspace + stmt)
  626. stmtsLRU.Unlock()
  627. }
  628. if found {
  629. return c.executeBatch(batch)
  630. } else {
  631. return x
  632. }
  633. case error:
  634. return x
  635. default:
  636. return NewErrProtocol("Unknown type in response to batch statement: %s", x)
  637. }
  638. }
  639. func (c *Conn) setKeepalive(d time.Duration) error {
  640. if tc, ok := c.conn.(*net.TCPConn); ok {
  641. err := tc.SetKeepAlivePeriod(d)
  642. if err != nil {
  643. return err
  644. }
  645. return tc.SetKeepAlive(true)
  646. }
  647. return nil
  648. }
  649. type inflightPrepare struct {
  650. info *resultPreparedFrame
  651. err error
  652. wg sync.WaitGroup
  653. }
  // Errors returned by connection operations.
  var (
  	// ErrQueryArgLength is returned when the number of supplied values does
  	// not match the number of columns of the prepared statement.
  	ErrQueryArgLength = errors.New("gocql: query argument length mismatch")

  	// ErrTimeoutNoResponse is returned when no response arrives within the
  	// timeout period.
  	ErrTimeoutNoResponse = errors.New("gocql: no response received from cassandra within timeout period")

  	// ErrTooManyTimeouts is the error a connection is closed with after too
  	// many query timeouts.
  	ErrTooManyTimeouts = errors.New("gocql: too many query timeouts on the connection")

  	// ErrConnectionClosed is returned when the connection is closed while a
  	// request is waiting for a stream or a response.
  	ErrConnectionClosed = errors.New("gocql: connection closed waiting for response")
  )