broker.go 9.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403
  1. package sarama
  2. import (
  3. "fmt"
  4. "io"
  5. "net"
  6. "strconv"
  7. "sync"
  8. "time"
  9. )
  // BrokerConfig bundles the tunable options that are handed to Broker.Open.
  type BrokerConfig struct {
  	// MaxOpenRequests is how many outstanding requests the broker is allowed
  	// to have before further attempts to send block.
  	MaxOpenRequests int

  	// DialTimeout is how long to wait for the initial connection to succeed
  	// before timing out and returning an error.
  	DialTimeout time.Duration

  	// ReadTimeout is how long to wait for a response before timing out and
  	// returning an error.
  	ReadTimeout time.Duration

  	// WriteTimeout is how long to wait for a transmit to succeed before
  	// timing out and returning an error.
  	WriteTimeout time.Duration
  }
  17. // NewBrokerConfig returns a new broker configuration with sane defaults.
  18. func NewBrokerConfig() *BrokerConfig {
  19. return &BrokerConfig{
  20. MaxOpenRequests: 4,
  21. DialTimeout: 1 * time.Minute,
  22. ReadTimeout: 1 * time.Minute,
  23. WriteTimeout: 1 * time.Minute,
  24. }
  25. }
  26. // Validate checks a BrokerConfig instance. This will return a
  27. // ConfigurationError if the specified values don't make sense.
  28. func (config *BrokerConfig) Validate() error {
  29. if config.MaxOpenRequests < 0 {
  30. return ConfigurationError("Invalid MaxOpenRequests")
  31. }
  32. if config.ReadTimeout <= 0 {
  33. return ConfigurationError("Invalid ReadTimeout")
  34. }
  35. if config.WriteTimeout <= 0 {
  36. return ConfigurationError("Invalid WriteTimeout")
  37. }
  38. return nil
  39. }
  40. // Broker represents a single Kafka broker connection. All operations on this object are entirely concurrency-safe.
  41. type Broker struct {
  42. id int32
  43. addr string
  44. conf *BrokerConfig
  45. correlationID int32
  46. conn net.Conn
  47. connErr error
  48. lock sync.Mutex
  49. responses chan responsePromise
  50. done chan bool
  51. }
  // responsePromise is the hand-off between a caller waiting for a reply and
  // responseReceiver: send queues one per request that expects a response, and
  // responseReceiver completes it on exactly one of the two channels.
  type responsePromise struct {
  	// correlationID is the ID of the request this promise belongs to.
  	correlationID int32

  	// packets receives the raw response body on success.
  	packets chan []byte

  	// errors receives the failure when the response could not be read.
  	errors chan error
  }
  57. // NewBroker creates and returns a Broker targetting the given host:port address.
  58. // This does not attempt to actually connect, you have to call Open() for that.
  59. func NewBroker(addr string) *Broker {
  60. return &Broker{id: -1, addr: addr}
  61. }
  62. // Open tries to connect to the Broker. It takes the broker lock synchronously, then spawns a goroutine which
  63. // connects and releases the lock. This means any subsequent operations on the broker will block waiting for
  64. // the connection to finish. To get the effect of a fully synchronous Open call, follow it by a call to Connected().
  65. // The only errors Open will return directly are ConfigurationError or AlreadyConnected. If conf is nil, the result of
  66. // NewBrokerConfig() is used.
  67. func (b *Broker) Open(conf *BrokerConfig) error {
  68. if conf == nil {
  69. conf = NewBrokerConfig()
  70. }
  71. err := conf.Validate()
  72. if err != nil {
  73. return err
  74. }
  75. b.lock.Lock()
  76. if b.conn != nil {
  77. b.lock.Unlock()
  78. Logger.Printf("Failed to connect to broker %s\n", b.addr)
  79. Logger.Println(AlreadyConnected)
  80. return AlreadyConnected
  81. }
  82. go withRecover(func() {
  83. defer b.lock.Unlock()
  84. b.conn, b.connErr = net.DialTimeout("tcp", b.addr, conf.DialTimeout)
  85. if b.connErr != nil {
  86. Logger.Printf("Failed to connect to broker %s\n", b.addr)
  87. Logger.Println(b.connErr)
  88. return
  89. }
  90. b.conf = conf
  91. b.done = make(chan bool)
  92. b.responses = make(chan responsePromise, b.conf.MaxOpenRequests)
  93. Logger.Printf("Connected to broker %s\n", b.addr)
  94. go withRecover(b.responseReceiver)
  95. })
  96. return nil
  97. }
  98. // Connected returns true if the broker is connected and false otherwise. If the broker is not
  99. // connected but it had tried to connect, the error from that connection attempt is also returned.
  100. func (b *Broker) Connected() (bool, error) {
  101. b.lock.Lock()
  102. defer b.lock.Unlock()
  103. return b.conn != nil, b.connErr
  104. }
  105. func (b *Broker) Close() (err error) {
  106. b.lock.Lock()
  107. defer b.lock.Unlock()
  108. defer func() {
  109. if err == nil {
  110. Logger.Printf("Closed connection to broker %s\n", b.addr)
  111. } else {
  112. Logger.Printf("Failed to close connection to broker %s.\n", b.addr)
  113. Logger.Println(err)
  114. }
  115. }()
  116. if b.conn == nil {
  117. return NotConnected
  118. }
  119. close(b.responses)
  120. <-b.done
  121. err = b.conn.Close()
  122. b.conn = nil
  123. b.connErr = nil
  124. b.done = nil
  125. b.responses = nil
  126. return
  127. }
  128. // ID returns the broker ID retrieved from Kafka's metadata, or -1 if that is not known.
  129. func (b *Broker) ID() int32 {
  130. return b.id
  131. }
  132. // Addr returns the broker address as either retrieved from Kafka's metadata or passed to NewBroker.
  133. func (b *Broker) Addr() string {
  134. return b.addr
  135. }
  136. func (b *Broker) GetMetadata(clientID string, request *MetadataRequest) (*MetadataResponse, error) {
  137. response := new(MetadataResponse)
  138. err := b.sendAndReceive(clientID, request, response)
  139. if err != nil {
  140. return nil, err
  141. }
  142. return response, nil
  143. }
  144. func (b *Broker) GetConsumerMetadata(clientID string, request *ConsumerMetadataRequest) (*ConsumerMetadataResponse, error) {
  145. response := new(ConsumerMetadataResponse)
  146. err := b.sendAndReceive(clientID, request, response)
  147. if err != nil {
  148. return nil, err
  149. }
  150. return response, nil
  151. }
  152. func (b *Broker) GetAvailableOffsets(clientID string, request *OffsetRequest) (*OffsetResponse, error) {
  153. response := new(OffsetResponse)
  154. err := b.sendAndReceive(clientID, request, response)
  155. if err != nil {
  156. return nil, err
  157. }
  158. return response, nil
  159. }
  160. func (b *Broker) Produce(clientID string, request *ProduceRequest) (*ProduceResponse, error) {
  161. var response *ProduceResponse
  162. var err error
  163. if request.RequiredAcks == NoResponse {
  164. err = b.sendAndReceive(clientID, request, nil)
  165. } else {
  166. response = new(ProduceResponse)
  167. err = b.sendAndReceive(clientID, request, response)
  168. }
  169. if err != nil {
  170. return nil, err
  171. }
  172. return response, nil
  173. }
  174. func (b *Broker) Fetch(clientID string, request *FetchRequest) (*FetchResponse, error) {
  175. response := new(FetchResponse)
  176. err := b.sendAndReceive(clientID, request, response)
  177. if err != nil {
  178. return nil, err
  179. }
  180. return response, nil
  181. }
  182. func (b *Broker) CommitOffset(clientID string, request *OffsetCommitRequest) (*OffsetCommitResponse, error) {
  183. response := new(OffsetCommitResponse)
  184. err := b.sendAndReceive(clientID, request, response)
  185. if err != nil {
  186. return nil, err
  187. }
  188. return response, nil
  189. }
  190. func (b *Broker) FetchOffset(clientID string, request *OffsetFetchRequest) (*OffsetFetchResponse, error) {
  191. response := new(OffsetFetchResponse)
  192. err := b.sendAndReceive(clientID, request, response)
  193. if err != nil {
  194. return nil, err
  195. }
  196. return response, nil
  197. }
  198. func (b *Broker) send(clientID string, req requestEncoder, promiseResponse bool) (*responsePromise, error) {
  199. b.lock.Lock()
  200. defer b.lock.Unlock()
  201. if b.conn == nil {
  202. if b.connErr != nil {
  203. return nil, b.connErr
  204. }
  205. return nil, NotConnected
  206. }
  207. fullRequest := request{b.correlationID, clientID, req}
  208. buf, err := encode(&fullRequest)
  209. if err != nil {
  210. return nil, err
  211. }
  212. err = b.conn.SetWriteDeadline(time.Now().Add(b.conf.WriteTimeout))
  213. if err != nil {
  214. return nil, err
  215. }
  216. _, err = b.conn.Write(buf)
  217. if err != nil {
  218. return nil, err
  219. }
  220. b.correlationID++
  221. if !promiseResponse {
  222. return nil, nil
  223. }
  224. promise := responsePromise{fullRequest.correlationID, make(chan []byte), make(chan error)}
  225. b.responses <- promise
  226. return &promise, nil
  227. }
  228. func (b *Broker) sendAndReceive(clientID string, req requestEncoder, res decoder) error {
  229. promise, err := b.send(clientID, req, res != nil)
  230. if err != nil {
  231. return err
  232. }
  233. if promise == nil {
  234. return nil
  235. }
  236. select {
  237. case buf := <-promise.packets:
  238. return decode(buf, res)
  239. case err = <-promise.errors:
  240. return err
  241. }
  242. }
  243. func (b *Broker) decode(pd packetDecoder) (err error) {
  244. b.id, err = pd.getInt32()
  245. if err != nil {
  246. return err
  247. }
  248. host, err := pd.getString()
  249. if err != nil {
  250. return err
  251. }
  252. port, err := pd.getInt32()
  253. if err != nil {
  254. return err
  255. }
  256. b.addr = fmt.Sprint(host, ":", port)
  257. return nil
  258. }
  259. func (b *Broker) encode(pe packetEncoder) (err error) {
  260. host, portstr, err := net.SplitHostPort(b.addr)
  261. if err != nil {
  262. return err
  263. }
  264. port, err := strconv.Atoi(portstr)
  265. if err != nil {
  266. return err
  267. }
  268. pe.putInt32(b.id)
  269. err = pe.putString(host)
  270. if err != nil {
  271. return err
  272. }
  273. pe.putInt32(int32(port))
  274. return nil
  275. }
  276. func (b *Broker) responseReceiver() {
  277. header := make([]byte, 8)
  278. for response := range b.responses {
  279. err := b.conn.SetReadDeadline(time.Now().Add(b.conf.ReadTimeout))
  280. if err != nil {
  281. response.errors <- err
  282. continue
  283. }
  284. _, err = io.ReadFull(b.conn, header)
  285. if err != nil {
  286. response.errors <- err
  287. continue
  288. }
  289. decodedHeader := responseHeader{}
  290. err = decode(header, &decodedHeader)
  291. if err != nil {
  292. response.errors <- err
  293. continue
  294. }
  295. if decodedHeader.correlationID != response.correlationID {
  296. // TODO if decoded ID < cur ID, discard until we catch up
  297. // TODO if decoded ID > cur ID, save it so when cur ID catches up we have a response
  298. response.errors <- DecodingError{
  299. Info: fmt.Sprintf("CorrelationID didn't match, wanted %d, got %d", response.correlationID, decodedHeader.correlationID),
  300. }
  301. continue
  302. }
  303. buf := make([]byte, decodedHeader.length-4)
  304. _, err = io.ReadFull(b.conn, buf)
  305. if err != nil {
  306. // XXX: the above ReadFull call inherits the same ReadDeadline set at the top of this loop, so it may
  307. // fail with a timeout error. If this happens, our connection is permanently toast since we will no longer
  308. // be aligned correctly on the stream (we'll be reading garbage Kafka headers from the middle of data).
  309. // Can we/should we fail harder in that case?
  310. response.errors <- err
  311. continue
  312. }
  313. response.packets <- buf
  314. }
  315. close(b.done)
  316. }