broker.go 8.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384
  1. package sarama
  2. import (
  3. "fmt"
  4. "io"
  5. "net"
  6. "strconv"
  7. "sync"
  8. "time"
  9. )
// BrokerConfig is used to pass multiple configuration options to Broker.Open.
type BrokerConfig struct {
	// MaxOpenRequests is how many outstanding requests the broker is allowed to
	// have before blocking attempts to send. Open uses it as the buffer size of
	// the channel of pending response promises.
	MaxOpenRequests int
	// ReadTimeout is how long to wait for a response before timing out and
	// returning an error. The response receiver applies it as a read deadline
	// on the connection for each pending response.
	ReadTimeout time.Duration
}
  15. // NewBrokerConfig returns a new broker configuration with sane defaults.
  16. func NewBrokerConfig() *BrokerConfig {
  17. return &BrokerConfig{
  18. MaxOpenRequests: 4,
  19. ReadTimeout: 1 * time.Minute,
  20. }
  21. }
  22. // Validates a BrokerConfig instance. This will return a
  23. // ConfigurationError if the specified values don't make sense.
  24. func (config *BrokerConfig) Validate() error {
  25. if config.MaxOpenRequests < 0 {
  26. return ConfigurationError("Invalid MaxOpenRequests")
  27. }
  28. if config.ReadTimeout <= 0 {
  29. return ConfigurationError("Invalid ReadTimeout")
  30. }
  31. return nil
  32. }
// Broker represents a single Kafka broker connection. All operations on this object are entirely concurrency-safe.
// NOTE(review): Open, Connected, Close and send take lock; ID, Addr and decode access id/addr without it —
// confirm the concurrency claim against the callers.
type Broker struct {
	// id is the broker ID; NewBroker sets it to -1 and decode overwrites it.
	id int32
	// addr is the host:port address handed to net.Dial by Open.
	addr string

	// conf is the configuration stored by Open once the dial has succeeded.
	conf *BrokerConfig
	// correlationID is stamped on each outgoing request and incremented after a successful write.
	correlationID int32
	// conn is the live connection, or nil while the broker is not connected.
	conn net.Conn
	// connErr is the error (if any) from the most recent dial attempt.
	connErr error
	// lock guards the connection state; Open holds it until the dial goroutine finishes.
	lock sync.Mutex

	// responses queues one promise per request that expects a reply; it is drained by responseReceiver.
	responses chan responsePromise
	// done is closed by responseReceiver once responses has been closed and drained.
	done chan bool
}
// responsePromise is the hand-off between send and responseReceiver for a
// single request: exactly one of packets or errors receives a value once the
// receiver has tried to read the matching response.
type responsePromise struct {
	// correlationID is the ID the request was sent with; the receiver compares
	// it against the ID found in the response header.
	correlationID int32
	// packets delivers the raw response body on success.
	packets chan []byte
	// errors delivers the failure when the response could not be read or matched.
	errors chan error
}
  50. // NewBroker creates and returns a Broker targetting the given host:port address.
  51. // This does not attempt to actually connect, you have to call Open() for that.
  52. func NewBroker(addr string) *Broker {
  53. return &Broker{id: -1, addr: addr}
  54. }
  55. // Open tries to connect to the Broker. It takes the broker lock synchronously, then spawns a goroutine which
  56. // connects and releases the lock. This means any subsequent operations on the broker will block waiting for
  57. // the connection to finish. To get the effect of a fully synchronous Open call, follow it by a call to Connected().
  58. // The only errors Open will return directly are ConfigurationError or AlreadyConnected. If conf is nil, the result of
  59. // NewBrokerConfig() is used.
  60. func (b *Broker) Open(conf *BrokerConfig) error {
  61. if conf == nil {
  62. conf = NewBrokerConfig()
  63. }
  64. err := conf.Validate()
  65. if err != nil {
  66. return err
  67. }
  68. b.lock.Lock()
  69. if b.conn != nil {
  70. b.lock.Unlock()
  71. Logger.Printf("Failed to connect to broker %s\n", b.addr)
  72. Logger.Println(AlreadyConnected)
  73. return AlreadyConnected
  74. }
  75. go withRecover(func() {
  76. defer b.lock.Unlock()
  77. b.conn, b.connErr = net.Dial("tcp", b.addr)
  78. if b.connErr != nil {
  79. Logger.Printf("Failed to connect to broker %s\n", b.addr)
  80. Logger.Println(b.connErr)
  81. return
  82. }
  83. b.conf = conf
  84. b.done = make(chan bool)
  85. b.responses = make(chan responsePromise, b.conf.MaxOpenRequests)
  86. Logger.Printf("Connected to broker %s\n", b.addr)
  87. go withRecover(b.responseReceiver)
  88. })
  89. return nil
  90. }
  91. // Connected returns true if the broker is connected and false otherwise. If the broker is not
  92. // connected but it had tried to connect, the error from that connection attempt is also returned.
  93. func (b *Broker) Connected() (bool, error) {
  94. b.lock.Lock()
  95. defer b.lock.Unlock()
  96. return b.conn != nil, b.connErr
  97. }
  98. func (b *Broker) Close() (err error) {
  99. b.lock.Lock()
  100. defer b.lock.Unlock()
  101. defer func() {
  102. if err == nil {
  103. Logger.Printf("Closed connection to broker %s\n", b.addr)
  104. } else {
  105. Logger.Printf("Failed to close connection to broker %s.\n", b.addr)
  106. Logger.Println(err)
  107. }
  108. }()
  109. if b.conn == nil {
  110. return NotConnected
  111. }
  112. close(b.responses)
  113. <-b.done
  114. err = b.conn.Close()
  115. b.conn = nil
  116. b.connErr = nil
  117. b.done = nil
  118. b.responses = nil
  119. return
  120. }
// ID returns the broker ID retrieved from Kafka's metadata, or -1 if that is not known.
// NewBroker initialises the ID to -1 and decode overwrites it. The field is read
// here without taking the broker lock.
func (b *Broker) ID() int32 {
	return b.id
}
// Addr returns the broker address as either retrieved from Kafka's metadata or passed to NewBroker.
// This is the same string Open dials. The field is read here without taking the
// broker lock.
func (b *Broker) Addr() string {
	return b.addr
}
  129. func (b *Broker) GetMetadata(clientID string, request *MetadataRequest) (*MetadataResponse, error) {
  130. response := new(MetadataResponse)
  131. err := b.sendAndReceive(clientID, request, response)
  132. if err != nil {
  133. return nil, err
  134. }
  135. return response, nil
  136. }
  137. func (b *Broker) GetConsumerMetadata(clientID string, request *ConsumerMetadataRequest) (*ConsumerMetadataResponse, error) {
  138. response := new(ConsumerMetadataResponse)
  139. err := b.sendAndReceive(clientID, request, response)
  140. if err != nil {
  141. return nil, err
  142. }
  143. return response, nil
  144. }
  145. func (b *Broker) GetAvailableOffsets(clientID string, request *OffsetRequest) (*OffsetResponse, error) {
  146. response := new(OffsetResponse)
  147. err := b.sendAndReceive(clientID, request, response)
  148. if err != nil {
  149. return nil, err
  150. }
  151. return response, nil
  152. }
  153. func (b *Broker) Produce(clientID string, request *ProduceRequest) (*ProduceResponse, error) {
  154. var response *ProduceResponse
  155. var err error
  156. if request.RequiredAcks == NoResponse {
  157. err = b.sendAndReceive(clientID, request, nil)
  158. } else {
  159. response = new(ProduceResponse)
  160. err = b.sendAndReceive(clientID, request, response)
  161. }
  162. if err != nil {
  163. return nil, err
  164. }
  165. return response, nil
  166. }
  167. func (b *Broker) Fetch(clientID string, request *FetchRequest) (*FetchResponse, error) {
  168. response := new(FetchResponse)
  169. err := b.sendAndReceive(clientID, request, response)
  170. if err != nil {
  171. return nil, err
  172. }
  173. return response, nil
  174. }
  175. func (b *Broker) CommitOffset(clientID string, request *OffsetCommitRequest) (*OffsetCommitResponse, error) {
  176. response := new(OffsetCommitResponse)
  177. err := b.sendAndReceive(clientID, request, response)
  178. if err != nil {
  179. return nil, err
  180. }
  181. return response, nil
  182. }
  183. func (b *Broker) FetchOffset(clientID string, request *OffsetFetchRequest) (*OffsetFetchResponse, error) {
  184. response := new(OffsetFetchResponse)
  185. err := b.sendAndReceive(clientID, request, response)
  186. if err != nil {
  187. return nil, err
  188. }
  189. return response, nil
  190. }
  191. func (b *Broker) send(clientID string, req requestEncoder, promiseResponse bool) (*responsePromise, error) {
  192. b.lock.Lock()
  193. defer b.lock.Unlock()
  194. if b.conn == nil {
  195. if b.connErr != nil {
  196. return nil, b.connErr
  197. }
  198. return nil, NotConnected
  199. }
  200. fullRequest := request{b.correlationID, clientID, req}
  201. buf, err := encode(&fullRequest)
  202. if err != nil {
  203. return nil, err
  204. }
  205. _, err = b.conn.Write(buf)
  206. if err != nil {
  207. return nil, err
  208. }
  209. b.correlationID++
  210. if !promiseResponse {
  211. return nil, nil
  212. }
  213. promise := responsePromise{fullRequest.correlationID, make(chan []byte), make(chan error)}
  214. b.responses <- promise
  215. return &promise, nil
  216. }
  217. func (b *Broker) sendAndReceive(clientID string, req requestEncoder, res decoder) error {
  218. promise, err := b.send(clientID, req, res != nil)
  219. if err != nil {
  220. return err
  221. }
  222. if promise == nil {
  223. return nil
  224. }
  225. select {
  226. case buf := <-promise.packets:
  227. return decode(buf, res)
  228. case err = <-promise.errors:
  229. return err
  230. }
  231. }
  232. func (b *Broker) decode(pd packetDecoder) (err error) {
  233. b.id, err = pd.getInt32()
  234. if err != nil {
  235. return err
  236. }
  237. host, err := pd.getString()
  238. if err != nil {
  239. return err
  240. }
  241. port, err := pd.getInt32()
  242. if err != nil {
  243. return err
  244. }
  245. b.addr = fmt.Sprint(host, ":", port)
  246. return nil
  247. }
  248. func (b *Broker) encode(pe packetEncoder) (err error) {
  249. host, portstr, err := net.SplitHostPort(b.addr)
  250. if err != nil {
  251. return err
  252. }
  253. port, err := strconv.Atoi(portstr)
  254. if err != nil {
  255. return err
  256. }
  257. pe.putInt32(b.id)
  258. err = pe.putString(host)
  259. if err != nil {
  260. return err
  261. }
  262. pe.putInt32(int32(port))
  263. return nil
  264. }
  265. func (b *Broker) responseReceiver() {
  266. header := make([]byte, 8)
  267. for response := range b.responses {
  268. b.conn.SetReadDeadline(time.Now().Add(b.conf.ReadTimeout))
  269. _, err := io.ReadFull(b.conn, header)
  270. if err != nil {
  271. response.errors <- err
  272. continue
  273. }
  274. decodedHeader := responseHeader{}
  275. err = decode(header, &decodedHeader)
  276. if err != nil {
  277. response.errors <- err
  278. continue
  279. }
  280. if decodedHeader.correlationID != response.correlationID {
  281. // TODO if decoded ID < cur ID, discard until we catch up
  282. // TODO if decoded ID > cur ID, save it so when cur ID catches up we have a response
  283. response.errors <- DecodingError{Info: "CorrelationID didn't match"}
  284. continue
  285. }
  286. buf := make([]byte, decodedHeader.length-4)
  287. _, err = io.ReadFull(b.conn, buf)
  288. if err != nil {
  289. // XXX: the above ReadFull call inherits the same ReadDeadline set at the top of this loop, so it may
  290. // fail with a timeout error. If this happens, our connection is permanently toast since we will no longer
  291. // be aligned correctly on the stream (we'll be reading garbage Kafka headers from the middle of data).
  292. // Can we/should we fail harder in that case?
  293. response.errors <- err
  294. continue
  295. }
  296. response.packets <- buf
  297. }
  298. close(b.done)
  299. }