broker.go 8.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380
  1. package sarama
  2. import (
  3. "fmt"
  4. "io"
  5. "net"
  6. "strconv"
  7. "sync"
  8. "sync/atomic"
  9. "time"
  10. )
  11. // Broker represents a single Kafka broker connection. All operations on this object are entirely concurrency-safe.
  12. type Broker struct {
  13. id int32
  14. addr string
  15. conf *Config
  16. correlationID int32
  17. conn net.Conn
  18. connErr error
  19. lock sync.Mutex
  20. opened int32
  21. responses chan responsePromise
  22. done chan bool
  23. }
  24. type responsePromise struct {
  25. correlationID int32
  26. packets chan []byte
  27. errors chan error
  28. }
  29. // NewBroker creates and returns a Broker targetting the given host:port address.
  30. // This does not attempt to actually connect, you have to call Open() for that.
  31. func NewBroker(addr string) *Broker {
  32. return &Broker{id: -1, addr: addr}
  33. }
  34. // Open tries to connect to the Broker if it is not already connected or connecting, but does not block
  35. // waiting for the connection to complete. This means that any subsequent operations on the broker will
  36. // block waiting for the connection to succeed or fail. To get the effect of a fully synchronous Open call,
  37. // follow it by a call to Connected(). The only errors Open will return directly are ConfigurationError or
  38. // AlreadyConnected. If conf is nil, the result of NewConfig() is used.
  39. func (b *Broker) Open(conf *Config) error {
  40. if conf == nil {
  41. conf = NewConfig()
  42. }
  43. err := conf.Validate()
  44. if err != nil {
  45. return err
  46. }
  47. if !atomic.CompareAndSwapInt32(&b.opened, 0, 1) {
  48. return ErrAlreadyConnected
  49. }
  50. b.lock.Lock()
  51. if b.conn != nil {
  52. b.lock.Unlock()
  53. Logger.Printf("Failed to connect to broker %s: %s\n", b.addr, ErrAlreadyConnected)
  54. return ErrAlreadyConnected
  55. }
  56. go withRecover(func() {
  57. defer b.lock.Unlock()
  58. dialer := net.Dialer{
  59. Timeout: conf.Net.DialTimeout,
  60. KeepAlive: conf.Net.KeepAlive,
  61. }
  62. b.conn, b.connErr = dialer.Dial("tcp", b.addr)
  63. if b.connErr != nil {
  64. b.conn = nil
  65. atomic.StoreInt32(&b.opened, 0)
  66. Logger.Printf("Failed to connect to broker %s: %s\n", b.addr, b.connErr)
  67. return
  68. }
  69. b.conf = conf
  70. b.done = make(chan bool)
  71. b.responses = make(chan responsePromise, b.conf.Net.MaxOpenRequests-1)
  72. if b.id >= 0 {
  73. Logger.Printf("Connected to broker at %s (registered as #%d)\n", b.addr, b.id)
  74. } else {
  75. Logger.Printf("Connected to broker at %s (unregistered)\n", b.addr)
  76. }
  77. go withRecover(b.responseReceiver)
  78. })
  79. return nil
  80. }
  81. // Connected returns true if the broker is connected and false otherwise. If the broker is not
  82. // connected but it had tried to connect, the error from that connection attempt is also returned.
  83. func (b *Broker) Connected() (bool, error) {
  84. b.lock.Lock()
  85. defer b.lock.Unlock()
  86. return b.conn != nil, b.connErr
  87. }
  88. func (b *Broker) Close() error {
  89. b.lock.Lock()
  90. defer b.lock.Unlock()
  91. if b.conn == nil {
  92. return ErrNotConnected
  93. }
  94. close(b.responses)
  95. <-b.done
  96. err := b.conn.Close()
  97. b.conn = nil
  98. b.connErr = nil
  99. b.done = nil
  100. b.responses = nil
  101. atomic.StoreInt32(&b.opened, 0)
  102. if err == nil {
  103. Logger.Printf("Closed connection to broker %s\n", b.addr)
  104. } else {
  105. Logger.Printf("Error while closing connection to broker %s: %s\n", b.addr, err)
  106. }
  107. return err
  108. }
  109. // ID returns the broker ID retrieved from Kafka's metadata, or -1 if that is not known.
  110. func (b *Broker) ID() int32 {
  111. return b.id
  112. }
  113. // Addr returns the broker address as either retrieved from Kafka's metadata or passed to NewBroker.
  114. func (b *Broker) Addr() string {
  115. return b.addr
  116. }
  117. func (b *Broker) GetMetadata(request *MetadataRequest) (*MetadataResponse, error) {
  118. response := new(MetadataResponse)
  119. err := b.sendAndReceive(request, response)
  120. if err != nil {
  121. return nil, err
  122. }
  123. return response, nil
  124. }
  125. func (b *Broker) GetConsumerMetadata(request *ConsumerMetadataRequest) (*ConsumerMetadataResponse, error) {
  126. response := new(ConsumerMetadataResponse)
  127. err := b.sendAndReceive(request, response)
  128. if err != nil {
  129. return nil, err
  130. }
  131. return response, nil
  132. }
  133. func (b *Broker) GetAvailableOffsets(request *OffsetRequest) (*OffsetResponse, error) {
  134. response := new(OffsetResponse)
  135. err := b.sendAndReceive(request, response)
  136. if err != nil {
  137. return nil, err
  138. }
  139. return response, nil
  140. }
  141. func (b *Broker) Produce(request *ProduceRequest) (*ProduceResponse, error) {
  142. var response *ProduceResponse
  143. var err error
  144. if request.RequiredAcks == NoResponse {
  145. err = b.sendAndReceive(request, nil)
  146. } else {
  147. response = new(ProduceResponse)
  148. err = b.sendAndReceive(request, response)
  149. }
  150. if err != nil {
  151. return nil, err
  152. }
  153. return response, nil
  154. }
  155. func (b *Broker) Fetch(request *FetchRequest) (*FetchResponse, error) {
  156. response := new(FetchResponse)
  157. err := b.sendAndReceive(request, response)
  158. if err != nil {
  159. return nil, err
  160. }
  161. return response, nil
  162. }
  163. func (b *Broker) CommitOffset(request *OffsetCommitRequest) (*OffsetCommitResponse, error) {
  164. response := new(OffsetCommitResponse)
  165. err := b.sendAndReceive(request, response)
  166. if err != nil {
  167. return nil, err
  168. }
  169. return response, nil
  170. }
  171. func (b *Broker) FetchOffset(request *OffsetFetchRequest) (*OffsetFetchResponse, error) {
  172. response := new(OffsetFetchResponse)
  173. err := b.sendAndReceive(request, response)
  174. if err != nil {
  175. return nil, err
  176. }
  177. return response, nil
  178. }
  179. func (b *Broker) send(req requestEncoder, promiseResponse bool) (*responsePromise, error) {
  180. b.lock.Lock()
  181. defer b.lock.Unlock()
  182. if b.conn == nil {
  183. if b.connErr != nil {
  184. return nil, b.connErr
  185. }
  186. return nil, ErrNotConnected
  187. }
  188. fullRequest := request{b.correlationID, b.conf.ClientID, req}
  189. buf, err := encode(&fullRequest)
  190. if err != nil {
  191. return nil, err
  192. }
  193. err = b.conn.SetWriteDeadline(time.Now().Add(b.conf.Net.WriteTimeout))
  194. if err != nil {
  195. return nil, err
  196. }
  197. _, err = b.conn.Write(buf)
  198. if err != nil {
  199. return nil, err
  200. }
  201. b.correlationID++
  202. if !promiseResponse {
  203. return nil, nil
  204. }
  205. promise := responsePromise{fullRequest.correlationID, make(chan []byte), make(chan error)}
  206. b.responses <- promise
  207. return &promise, nil
  208. }
  209. func (b *Broker) sendAndReceive(req requestEncoder, res decoder) error {
  210. promise, err := b.send(req, res != nil)
  211. if err != nil {
  212. return err
  213. }
  214. if promise == nil {
  215. return nil
  216. }
  217. select {
  218. case buf := <-promise.packets:
  219. return decode(buf, res)
  220. case err = <-promise.errors:
  221. return err
  222. }
  223. }
  224. func (b *Broker) decode(pd packetDecoder) (err error) {
  225. b.id, err = pd.getInt32()
  226. if err != nil {
  227. return err
  228. }
  229. host, err := pd.getString()
  230. if err != nil {
  231. return err
  232. }
  233. port, err := pd.getInt32()
  234. if err != nil {
  235. return err
  236. }
  237. b.addr = fmt.Sprint(host, ":", port)
  238. return nil
  239. }
  240. func (b *Broker) encode(pe packetEncoder) (err error) {
  241. host, portstr, err := net.SplitHostPort(b.addr)
  242. if err != nil {
  243. return err
  244. }
  245. port, err := strconv.Atoi(portstr)
  246. if err != nil {
  247. return err
  248. }
  249. pe.putInt32(b.id)
  250. err = pe.putString(host)
  251. if err != nil {
  252. return err
  253. }
  254. pe.putInt32(int32(port))
  255. return nil
  256. }
  257. func (b *Broker) responseReceiver() {
  258. header := make([]byte, 8)
  259. for response := range b.responses {
  260. err := b.conn.SetReadDeadline(time.Now().Add(b.conf.Net.ReadTimeout))
  261. if err != nil {
  262. response.errors <- err
  263. continue
  264. }
  265. _, err = io.ReadFull(b.conn, header)
  266. if err != nil {
  267. response.errors <- err
  268. continue
  269. }
  270. decodedHeader := responseHeader{}
  271. err = decode(header, &decodedHeader)
  272. if err != nil {
  273. response.errors <- err
  274. continue
  275. }
  276. if decodedHeader.correlationID != response.correlationID {
  277. // TODO if decoded ID < cur ID, discard until we catch up
  278. // TODO if decoded ID > cur ID, save it so when cur ID catches up we have a response
  279. response.errors <- PacketDecodingError{fmt.Sprintf("CorrelationID didn't match, wanted %d, got %d", response.correlationID, decodedHeader.correlationID)}
  280. continue
  281. }
  282. buf := make([]byte, decodedHeader.length-4)
  283. _, err = io.ReadFull(b.conn, buf)
  284. if err != nil {
  285. // XXX: the above ReadFull call inherits the same ReadDeadline set at the top of this loop, so it may
  286. // fail with a timeout error. If this happens, our connection is permanently toast since we will no longer
  287. // be aligned correctly on the stream (we'll be reading garbage Kafka headers from the middle of data).
  288. // Can we/should we fail harder in that case?
  289. response.errors <- err
  290. continue
  291. }
  292. response.packets <- buf
  293. }
  294. close(b.done)
  295. }