github.com/hack0072008/kafka-go@v1.0.1/consumergroup.go

     1  package kafka
     2  
     3  import (
     4  	"bufio"
     5  	"bytes"
     6  	"context"
     7  	"errors"
     8  	"fmt"
     9  	"io"
    10  	"math"
    11  	"net"
    12  	"strconv"
    13  	"strings"
    14  	"sync"
    15  	"time"
    16  )
    17  
    18  // ErrGroupClosed is returned by ConsumerGroup.Next when the group has already
    19  // been closed.
    20  var ErrGroupClosed = errors.New("consumer group is closed")
    21  
     22  // ErrGenerationEnded is returned by the Err method of the context.Context
     23  // issued by Generation's Start function once the generation has ended.
    24  var ErrGenerationEnded = errors.New("consumer group generation has ended")
    25  
    26  const (
    27  	// defaultProtocolType holds the default protocol type documented in the
    28  	// kafka protocol
    29  	//
    30  	// See https://cwiki.apache.org/confluence/display/KAFKA/A+Guide+To+The+Kafka+Protocol#AGuideToTheKafkaProtocol-GroupMembershipAPI
    31  	defaultProtocolType = "consumer"
    32  
    33  	// defaultHeartbeatInterval contains the default time between heartbeats.  If
    34  	// the coordinator does not receive a heartbeat within the session timeout interval,
    35  	// the consumer will be considered dead and the coordinator will rebalance the
    36  	// group.
    37  	//
    38  	// As a rule, the heartbeat interval should be no greater than 1/3 the session timeout
    39  	defaultHeartbeatInterval = 3 * time.Second
    40  
    41  	// defaultSessionTimeout contains the default interval the coordinator will wait
    42  	// for a heartbeat before marking a consumer as dead
    43  	defaultSessionTimeout = 30 * time.Second
    44  
    45  	// defaultRebalanceTimeout contains the amount of time the coordinator will wait
    46  	// for consumers to issue a join group once a rebalance has been requested
    47  	defaultRebalanceTimeout = 30 * time.Second
    48  
    49  	// defaultJoinGroupBackoff is the amount of time to wait after a failed
    50  	// consumer group generation before attempting to re-join.
    51  	defaultJoinGroupBackoff = 5 * time.Second
    52  
     53  	// defaultRetentionTime holds the length of time the consumer group will be
    54  	// saved by kafka.  This value tells the broker to use its configured value.
    55  	defaultRetentionTime = -1 * time.Millisecond
    56  
     57  	// defaultPartitionWatchTime contains the amount of time kafka-go will wait
     58  	// between queries to the brokers when looking for partition changes.
    59  	defaultPartitionWatchTime = 5 * time.Second
    60  
    61  	// defaultTimeout is the deadline to set when interacting with the
    62  	// consumer group coordinator.
    63  	defaultTimeout = 5 * time.Second
    64  )
    65  
    66  // ConsumerGroupConfig is a configuration object used to create new instances of
    67  // ConsumerGroup.
    68  type ConsumerGroupConfig struct {
    69  	// ID is the consumer group ID.  It must not be empty.
    70  	ID string
    71  
    72  	// The list of broker addresses used to connect to the kafka cluster.  It
    73  	// must not be empty.
    74  	Brokers []string
    75  
     76  	// A dialer used to open connections to the kafka server. This field is
     77  	// optional; if nil, the default dialer is used instead.
    78  	Dialer *Dialer
    79  
    80  	// Topics is the list of topics that will be consumed by this group.  It
    81  	// will usually have a single value, but it is permitted to have multiple
    82  	// for more complex use cases.
    83  	Topics []string
    84  
    85  	// GroupBalancers is the priority-ordered list of client-side consumer group
    86  	// balancing strategies that will be offered to the coordinator.  The first
    87  	// strategy that all group members support will be chosen by the leader.
    88  	//
    89  	// Default: [Range, RoundRobin]
    90  	GroupBalancers []GroupBalancer
    91  
    92  	// HeartbeatInterval sets the optional frequency at which the reader sends the consumer
    93  	// group heartbeat update.
    94  	//
    95  	// Default: 3s
    96  	HeartbeatInterval time.Duration
    97  
    98  	// PartitionWatchInterval indicates how often a reader checks for partition changes.
     99  	// If a reader sees a partition change (such as a partition add), it will rebalance
    100  	// the group, picking up new partitions.
   101  	//
   102  	// Default: 5s
   103  	PartitionWatchInterval time.Duration
   104  
    105  	// WatchPartitionChanges is used to inform kafka-go that a consumer group should
    106  	// poll the brokers and rebalance if any partition changes happen to the topic.
   107  	WatchPartitionChanges bool
   108  
   109  	// SessionTimeout optionally sets the length of time that may pass without a heartbeat
   110  	// before the coordinator considers the consumer dead and initiates a rebalance.
   111  	//
   112  	// Default: 30s
   113  	SessionTimeout time.Duration
   114  
   115  	// RebalanceTimeout optionally sets the length of time the coordinator will wait
   116  	// for members to join as part of a rebalance.  For kafka servers under higher
   117  	// load, it may be useful to set this value higher.
   118  	//
   119  	// Default: 30s
   120  	RebalanceTimeout time.Duration
   121  
   122  	// JoinGroupBackoff optionally sets the length of time to wait before re-joining
   123  	// the consumer group after an error.
   124  	//
   125  	// Default: 5s
   126  	JoinGroupBackoff time.Duration
   127  
   128  	// RetentionTime optionally sets the length of time the consumer group will
   129  	// be saved by the broker.  -1 will disable the setting and leave the
   130  	// retention up to the broker's offsets.retention.minutes property.  By
   131  	// default, that setting is 1 day for kafka < 2.0 and 7 days for kafka >=
   132  	// 2.0.
   133  	//
   134  	// Default: -1
   135  	RetentionTime time.Duration
   136  
    137  	// StartOffset determines where the consumer group should begin
   138  	// consuming when it finds a partition without a committed offset.  If
   139  	// non-zero, it must be set to one of FirstOffset or LastOffset.
   140  	//
   141  	// Default: FirstOffset
   142  	StartOffset int64
   143  
   144  	// If not nil, specifies a logger used to report internal changes within the
   145  	// reader.
   146  	Logger Logger
   147  
   148  	// ErrorLogger is the logger used to report errors. If nil, the reader falls
   149  	// back to using Logger instead.
   150  	ErrorLogger Logger
   151  
   152  	// Timeout is the network timeout used when communicating with the consumer
   153  	// group coordinator.  This value should not be too small since errors
   154  	// communicating with the broker will generally cause a consumer group
    155  	// rebalance, and it's undesirable for a transient network error to introduce
   156  	// that overhead.  Similarly, it should not be too large or the consumer
   157  	// group may be slow to respond to the coordinator failing over to another
   158  	// broker.
   159  	//
   160  	// Default: 5s
   161  	Timeout time.Duration
   162  
   163  	// connect is a function for dialing the coordinator.  This is provided for
   164  	// unit testing to mock broker connections.
   165  	connect func(dialer *Dialer, brokers ...string) (coordinator, error)
   166  }
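
         // A minimal configuration sketch; the group ID, broker address, and topic
         // below are placeholders rather than values required by this package.  All
         // other fields fall back to the defaults applied by Validate.
         //
         //	cfg := ConsumerGroupConfig{
         //		ID:      "example-group",
         //		Brokers: []string{"localhost:9092"},
         //		Topics:  []string{"example-topic"},
         //	}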
   167  
    168  // Validate validates ConsumerGroupConfig properties and sets relevant
    169  // defaults.
   170  func (config *ConsumerGroupConfig) Validate() error {
   171  
   172  	if len(config.Brokers) == 0 {
   173  		return errors.New("cannot create a consumer group with an empty list of broker addresses")
   174  	}
   175  
   176  	if len(config.Topics) == 0 {
   177  		return errors.New("cannot create a consumer group without a topic")
   178  	}
   179  
   180  	if config.ID == "" {
   181  		return errors.New("cannot create a consumer group without an ID")
   182  	}
   183  
   184  	if config.Dialer == nil {
   185  		config.Dialer = DefaultDialer
   186  	}
   187  
   188  	if len(config.GroupBalancers) == 0 {
   189  		config.GroupBalancers = []GroupBalancer{
   190  			RangeGroupBalancer{},
   191  			RoundRobinGroupBalancer{},
   192  		}
   193  	}
   194  
   195  	if config.HeartbeatInterval == 0 {
   196  		config.HeartbeatInterval = defaultHeartbeatInterval
   197  	}
   198  
   199  	if config.SessionTimeout == 0 {
   200  		config.SessionTimeout = defaultSessionTimeout
   201  	}
   202  
   203  	if config.PartitionWatchInterval == 0 {
   204  		config.PartitionWatchInterval = defaultPartitionWatchTime
   205  	}
   206  
   207  	if config.RebalanceTimeout == 0 {
   208  		config.RebalanceTimeout = defaultRebalanceTimeout
   209  	}
   210  
   211  	if config.JoinGroupBackoff == 0 {
   212  		config.JoinGroupBackoff = defaultJoinGroupBackoff
   213  	}
   214  
   215  	if config.RetentionTime == 0 {
   216  		config.RetentionTime = defaultRetentionTime
   217  	}
   218  
   219  	if config.HeartbeatInterval < 0 || (config.HeartbeatInterval/time.Millisecond) >= math.MaxInt32 {
    220  		return fmt.Errorf("HeartbeatInterval out of bounds: %d", config.HeartbeatInterval)
   221  	}
   222  
   223  	if config.SessionTimeout < 0 || (config.SessionTimeout/time.Millisecond) >= math.MaxInt32 {
    224  		return fmt.Errorf("SessionTimeout out of bounds: %d", config.SessionTimeout)
   225  	}
   226  
   227  	if config.RebalanceTimeout < 0 || (config.RebalanceTimeout/time.Millisecond) >= math.MaxInt32 {
    228  		return fmt.Errorf("RebalanceTimeout out of bounds: %d", config.RebalanceTimeout)
   229  	}
   230  
   231  	if config.JoinGroupBackoff < 0 || (config.JoinGroupBackoff/time.Millisecond) >= math.MaxInt32 {
    232  		return fmt.Errorf("JoinGroupBackoff out of bounds: %d", config.JoinGroupBackoff)
   233  	}
   234  
   235  	if config.RetentionTime < 0 && config.RetentionTime != defaultRetentionTime {
    236  		return fmt.Errorf("RetentionTime out of bounds: %d", config.RetentionTime)
   237  	}
   238  
   239  	if config.PartitionWatchInterval < 0 || (config.PartitionWatchInterval/time.Millisecond) >= math.MaxInt32 {
    240  		return fmt.Errorf("PartitionWatchInterval out of bounds: %d", config.PartitionWatchInterval)
   241  	}
   242  
   243  	if config.StartOffset == 0 {
   244  		config.StartOffset = FirstOffset
   245  	}
   246  
   247  	if config.StartOffset != FirstOffset && config.StartOffset != LastOffset {
    248  		return fmt.Errorf("StartOffset is not valid: %d", config.StartOffset)
   249  	}
   250  
   251  	if config.Timeout == 0 {
   252  		config.Timeout = defaultTimeout
   253  	}
   254  
   255  	if config.connect == nil {
   256  		config.connect = makeConnect(*config)
   257  	}
   258  
   259  	return nil
   260  }
   261  
   262  // PartitionAssignment represents the starting state of a partition that has
   263  // been assigned to a consumer.
   264  type PartitionAssignment struct {
   265  	// ID is the partition ID.
   266  	ID int
   267  
   268  	// Offset is the initial offset at which this assignment begins.  It will
   269  	// either be an absolute offset if one has previously been committed for
   270  	// the consumer group or a relative offset such as FirstOffset when this
   271  	// is the first time the partition have been assigned to a member of the
    272  	// is the first time the partition has been assigned to a member of the
   273  	Offset int64
   274  }
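
         // When consuming from an assignment, a caller might distinguish the two
         // cases like this (sketch; p is a PartitionAssignment):
         //
         //	if p.Offset == FirstOffset || p.Offset == LastOffset {
         //		// no committed offset yet: seek relative to the start or end of the log
         //	} else {
         //		// resume from the previously committed absolute offset
         //	}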
   275  
   276  // genCtx adapts the done channel of the generation to a context.Context.  This
   277  // is used by Generation.Start so that we can pass a context to go routines
   278  // instead of passing around channels.
   279  type genCtx struct {
   280  	gen *Generation
   281  }
   282  
   283  func (c genCtx) Done() <-chan struct{} {
   284  	return c.gen.done
   285  }
   286  
   287  func (c genCtx) Err() error {
   288  	select {
   289  	case <-c.gen.done:
   290  		return ErrGenerationEnded
   291  	default:
   292  		return nil
   293  	}
   294  }
   295  
   296  func (c genCtx) Deadline() (time.Time, bool) {
   297  	return time.Time{}, false
   298  }
   299  
   300  func (c genCtx) Value(interface{}) interface{} {
   301  	return nil
   302  }
   303  
   304  // Generation represents a single consumer group generation.  The generation
    305  // carries the topic+partition assignments for the given member.  It also provides
   306  // facilities for committing offsets and for running functions whose lifecycles
   307  // are bound to the generation.
   308  type Generation struct {
   309  	// ID is the generation ID as assigned by the consumer group coordinator.
   310  	ID int32
   311  
   312  	// GroupID is the name of the consumer group.
   313  	GroupID string
   314  
   315  	// MemberID is the ID assigned to this consumer by the consumer group
   316  	// coordinator.
   317  	MemberID string
   318  
   319  	// Assignments is the initial state of this Generation.  The partition
   320  	// assignments are grouped by topic.
   321  	Assignments map[string][]PartitionAssignment
   322  
   323  	conn coordinator
   324  
   325  	// the following fields are used for process accounting to synchronize
   326  	// between Start and close.  lock protects all of them.  done is closed
   327  	// when the generation is ending in order to signal that the generation
    328  	// should start self-destructing.  closed protects against double-closing
    329  	// the done chan.  routines is a count of running go routines that have been
   330  	// launched by Start.  joined will be closed by the last go routine to exit.
   331  	lock     sync.Mutex
   332  	done     chan struct{}
   333  	closed   bool
   334  	routines int
   335  	joined   chan struct{}
   336  
   337  	retentionMillis int64
   338  	log             func(func(Logger))
   339  	logError        func(func(Logger))
   340  }
   341  
   342  // close stops the generation and waits for all functions launched via Start to
   343  // terminate.
   344  func (g *Generation) close() {
   345  	g.lock.Lock()
   346  	if !g.closed {
   347  		close(g.done)
   348  		g.closed = true
   349  	}
   350  	// determine whether any go routines are running that we need to wait for.
   351  	// waiting needs to happen outside of the critical section.
   352  	r := g.routines
   353  	g.lock.Unlock()
   354  
   355  	// NOTE: r will be zero if no go routines were ever launched.  no need to
   356  	// wait in that case.
   357  	if r > 0 {
   358  		<-g.joined
   359  	}
   360  }
   361  
   362  // Start launches the provided function in a go routine and adds accounting such
   363  // that when the function exits, it stops the current generation (if not
   364  // already in the process of doing so).
   365  //
   366  // The provided function MUST support cancellation via the ctx argument and exit
   367  // in a timely manner once the ctx is complete.  When the context is closed, the
    368  // context's Err() method will return ErrGenerationEnded.
   369  //
   370  // When closing out a generation, the consumer group will wait for all functions
   371  // launched by Start to exit before the group can move on and join the next
   372  // generation.  If the function does not exit promptly, it will stop forward
   373  // progress for this consumer and potentially cause consumer group membership
   374  // churn.
   375  func (g *Generation) Start(fn func(ctx context.Context)) {
   376  	g.lock.Lock()
   377  	defer g.lock.Unlock()
   378  
   379  	// this is an edge case: if the generation has already closed, then it's
   380  	// possible that the close func has already waited on outstanding go
   381  	// routines and exited.
   382  	//
   383  	// nonetheless, it's important to honor that the fn is invoked in case the
   384  	// calling function is waiting e.g. on a channel send or a WaitGroup.  in
   385  	// such a case, fn should immediately exit because ctx.Err() will return
   386  	// ErrGenerationEnded.
   387  	if g.closed {
   388  		go fn(genCtx{g})
   389  		return
   390  	}
   391  
   392  	// register that there is one more go routine that's part of this gen.
   393  	g.routines++
   394  
   395  	go func() {
   396  		fn(genCtx{g})
   397  		g.lock.Lock()
   398  		// shut down the generation as soon as one function exits.  this is
   399  		// different from close() in that it doesn't wait for all go routines in
   400  		// the generation to exit.
   401  		if !g.closed {
   402  			close(g.done)
   403  			g.closed = true
   404  		}
   405  		g.routines--
   406  		// if this was the last go routine in the generation, close the joined
   407  		// chan so that close() can exit if it's waiting.
   408  		if g.routines == 0 {
   409  			close(g.joined)
   410  		}
   411  		g.lock.Unlock()
   412  	}()
   413  }
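
         // A usage sketch for Start, modeled on the heartbeat loop below; gen is
         // assumed to be a *Generation obtained from ConsumerGroup.Next.  The
         // launched function must watch ctx.Done and return promptly.
         //
         //	gen.Start(func(ctx context.Context) {
         //		ticker := time.NewTicker(time.Second)
         //		defer ticker.Stop()
         //		for {
         //			select {
         //			case <-ctx.Done():
         //				// ctx.Err() reports ErrGenerationEnded at this point.
         //				return
         //			case <-ticker.C:
         //				// do per-generation work here.
         //			}
         //		}
         //	})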
   414  
   415  // CommitOffsets commits the provided topic+partition+offset combos to the
   416  // consumer group coordinator.  This can be used to reset the consumer to
   417  // explicit offsets.
   418  func (g *Generation) CommitOffsets(offsets map[string]map[int]int64) error {
   419  	if len(offsets) == 0 {
   420  		return nil
   421  	}
   422  
   423  	topics := make([]offsetCommitRequestV2Topic, 0, len(offsets))
   424  	for topic, partitions := range offsets {
   425  		t := offsetCommitRequestV2Topic{Topic: topic}
   426  		for partition, offset := range partitions {
   427  			t.Partitions = append(t.Partitions, offsetCommitRequestV2Partition{
   428  				Partition: int32(partition),
   429  				Offset:    offset,
   430  			})
   431  		}
   432  		topics = append(topics, t)
   433  	}
   434  
   435  	request := offsetCommitRequestV2{
   436  		GroupID:       g.GroupID,
   437  		GenerationID:  g.ID,
   438  		MemberID:      g.MemberID,
   439  		RetentionTime: g.retentionMillis,
   440  		Topics:        topics,
   441  	}
   442  
   443  	_, err := g.conn.offsetCommit(request)
   444  	if err == nil {
   445  		// if logging is enabled, print out the partitions that were committed.
   446  		g.log(func(l Logger) {
   447  			var report []string
   448  			for _, t := range request.Topics {
   449  				report = append(report, fmt.Sprintf("\ttopic: %s", t.Topic))
   450  				for _, p := range t.Partitions {
   451  					report = append(report, fmt.Sprintf("\t\tpartition %d: %d", p.Partition, p.Offset))
   452  				}
   453  			}
   454  			l.Printf("committed offsets for group %s: \n%s", g.GroupID, strings.Join(report, "\n"))
   455  		})
   456  	}
   457  
   458  	return err
   459  }
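
         // A sketch of the expected argument shape (topic => partition => offset to
         // record); the topic name and offsets are placeholders.  Callers typically
         // commit the offset of the next message they want to consume.
         //
         //	err := gen.CommitOffsets(map[string]map[int]int64{
         //		"example-topic": {0: 43, 1: 18},
         //	})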
   460  
   461  // heartbeatLoop checks in with the consumer group coordinator at the provided
   462  // interval.  It exits if it ever encounters an error, which would signal the
   463  // end of the generation.
   464  func (g *Generation) heartbeatLoop(interval time.Duration) {
   465  	g.Start(func(ctx context.Context) {
   466  		g.log(func(l Logger) {
   467  			l.Printf("started heartbeat for group, %v [%v]", g.GroupID, interval)
   468  		})
   469  		defer g.log(func(l Logger) {
   470  			l.Printf("stopped heartbeat for group %s\n", g.GroupID)
   471  		})
   472  
   473  		ticker := time.NewTicker(interval)
   474  		defer ticker.Stop()
   475  
   476  		for {
   477  			select {
   478  			case <-ctx.Done():
   479  				return
   480  			case <-ticker.C:
   481  				_, err := g.conn.heartbeat(heartbeatRequestV0{
   482  					GroupID:      g.GroupID,
   483  					GenerationID: g.ID,
   484  					MemberID:     g.MemberID,
   485  				})
   486  				if err != nil {
   487  					return
   488  				}
   489  			}
   490  		}
   491  	})
   492  }
   493  
   494  // partitionWatcher queries kafka and watches for partition changes, triggering
    495  // a rebalance if changes are found. Similar to the heartbeat loop, it's okay
    496  // to return on error here: if you are unable to ask a broker for basic
    497  // metadata, you're in a bad spot and should rebalance. Commonly you will see
    498  // an error here if there is a problem with the connection to the coordinator,
    499  // and a rebalance will establish a new connection to the coordinator.
   500  func (g *Generation) partitionWatcher(interval time.Duration, topic string) {
   501  	g.Start(func(ctx context.Context) {
   502  		g.log(func(l Logger) {
   503  			l.Printf("started partition watcher for group, %v, topic %v [%v]", g.GroupID, topic, interval)
   504  		})
   505  		defer g.log(func(l Logger) {
   506  			l.Printf("stopped partition watcher for group, %v, topic %v", g.GroupID, topic)
   507  		})
   508  
   509  		ticker := time.NewTicker(interval)
   510  		defer ticker.Stop()
   511  
   512  		ops, err := g.conn.readPartitions(topic)
   513  		if err != nil {
   514  			g.logError(func(l Logger) {
    515  				l.Printf("Problem getting partitions during startup, %v. Returning and setting up nextGeneration", err)
   516  			})
   517  			return
   518  		}
   519  		oParts := len(ops)
   520  		for {
   521  			select {
   522  			case <-ctx.Done():
   523  				return
   524  			case <-ticker.C:
   525  				ops, err := g.conn.readPartitions(topic)
   526  				switch err {
   527  				case nil, UnknownTopicOrPartition:
   528  					if len(ops) != oParts {
   529  						g.log(func(l Logger) {
    530  							l.Printf("Partition changes found, rebalancing group: %v.", g.GroupID)
   531  						})
   532  						return
   533  					}
   534  				default:
   535  					g.logError(func(l Logger) {
   536  						l.Printf("Problem getting partitions while checking for changes, %v", err)
   537  					})
   538  					if _, ok := err.(Error); ok {
   539  						continue
   540  					}
   541  					// other errors imply that we lost the connection to the coordinator, so we
   542  					// should abort and reconnect.
   543  					return
   544  				}
   545  			}
   546  		}
   547  	})
   548  }
   549  
   550  // coordinator is a subset of the functionality in Conn in order to facilitate
   551  // testing the consumer group...especially for error conditions that are
   552  // difficult to instigate with a live broker running in docker.
   553  type coordinator interface {
   554  	io.Closer
   555  	findCoordinator(findCoordinatorRequestV0) (findCoordinatorResponseV0, error)
   556  	joinGroup(joinGroupRequestV1) (joinGroupResponseV1, error)
   557  	syncGroup(syncGroupRequestV0) (syncGroupResponseV0, error)
   558  	leaveGroup(leaveGroupRequestV0) (leaveGroupResponseV0, error)
   559  	heartbeat(heartbeatRequestV0) (heartbeatResponseV0, error)
   560  	offsetFetch(offsetFetchRequestV1) (offsetFetchResponseV1, error)
   561  	offsetCommit(offsetCommitRequestV2) (offsetCommitResponseV2, error)
   562  	readPartitions(...string) ([]Partition, error)
   563  }
   564  
   565  // timeoutCoordinator wraps the Conn to ensure that every operation has a
   566  // deadline.  Otherwise, it would be possible for requests to block indefinitely
   567  // if the remote server never responds.  There are many spots where the consumer
   568  // group needs to interact with the broker, so it feels less error prone to
   569  // factor all of the deadline management into this shared location as opposed to
   570  // peppering it all through where the code actually interacts with the broker.
   571  type timeoutCoordinator struct {
   572  	timeout          time.Duration
   573  	sessionTimeout   time.Duration
   574  	rebalanceTimeout time.Duration
   575  	conn             *Conn
   576  }
   577  
   578  func (t *timeoutCoordinator) Close() error {
   579  	return t.conn.Close()
   580  }
   581  
   582  func (t *timeoutCoordinator) findCoordinator(req findCoordinatorRequestV0) (findCoordinatorResponseV0, error) {
   583  	if err := t.conn.SetDeadline(time.Now().Add(t.timeout)); err != nil {
   584  		return findCoordinatorResponseV0{}, err
   585  	}
   586  	return t.conn.findCoordinator(req)
   587  }
   588  
   589  func (t *timeoutCoordinator) joinGroup(req joinGroupRequestV1) (joinGroupResponseV1, error) {
   590  	// in the case of join group, the consumer group coordinator may wait up
    591  	// to the rebalance timeout for all members to join.
   592  	if err := t.conn.SetDeadline(time.Now().Add(t.timeout + t.rebalanceTimeout)); err != nil {
   593  		return joinGroupResponseV1{}, err
   594  	}
   595  	return t.conn.joinGroup(req)
   596  }
   597  
   598  func (t *timeoutCoordinator) syncGroup(req syncGroupRequestV0) (syncGroupResponseV0, error) {
   599  	// in the case of sync group, the consumer group leader is given up to
   600  	// the session timeout to respond before the coordinator will give up.
   601  	if err := t.conn.SetDeadline(time.Now().Add(t.timeout + t.sessionTimeout)); err != nil {
   602  		return syncGroupResponseV0{}, err
   603  	}
   604  	return t.conn.syncGroup(req)
   605  }
   606  
   607  func (t *timeoutCoordinator) leaveGroup(req leaveGroupRequestV0) (leaveGroupResponseV0, error) {
   608  	if err := t.conn.SetDeadline(time.Now().Add(t.timeout)); err != nil {
   609  		return leaveGroupResponseV0{}, err
   610  	}
   611  	return t.conn.leaveGroup(req)
   612  }
   613  
   614  func (t *timeoutCoordinator) heartbeat(req heartbeatRequestV0) (heartbeatResponseV0, error) {
   615  	if err := t.conn.SetDeadline(time.Now().Add(t.timeout)); err != nil {
   616  		return heartbeatResponseV0{}, err
   617  	}
   618  	return t.conn.heartbeat(req)
   619  }
   620  
   621  func (t *timeoutCoordinator) offsetFetch(req offsetFetchRequestV1) (offsetFetchResponseV1, error) {
   622  	if err := t.conn.SetDeadline(time.Now().Add(t.timeout)); err != nil {
   623  		return offsetFetchResponseV1{}, err
   624  	}
   625  	return t.conn.offsetFetch(req)
   626  }
   627  
   628  func (t *timeoutCoordinator) offsetCommit(req offsetCommitRequestV2) (offsetCommitResponseV2, error) {
   629  	if err := t.conn.SetDeadline(time.Now().Add(t.timeout)); err != nil {
   630  		return offsetCommitResponseV2{}, err
   631  	}
   632  	return t.conn.offsetCommit(req)
   633  }
   634  
   635  func (t *timeoutCoordinator) readPartitions(topics ...string) ([]Partition, error) {
   636  	if err := t.conn.SetDeadline(time.Now().Add(t.timeout)); err != nil {
   637  		return nil, err
   638  	}
   639  	return t.conn.ReadPartitions(topics...)
   640  }
   641  
   642  // NewConsumerGroup creates a new ConsumerGroup.  It returns an error if the
   643  // provided configuration is invalid.  It does not attempt to connect to the
   644  // Kafka cluster.  That happens asynchronously, and any errors will be reported
   645  // by Next.
   646  func NewConsumerGroup(config ConsumerGroupConfig) (*ConsumerGroup, error) {
   647  	if err := config.Validate(); err != nil {
   648  		return nil, err
   649  	}
   650  
   651  	cg := &ConsumerGroup{
   652  		config: config,
   653  		next:   make(chan *Generation),
   654  		errs:   make(chan error),
   655  		done:   make(chan struct{}),
   656  	}
   657  	cg.wg.Add(1)
   658  	go func() {
   659  		cg.run()
   660  		cg.wg.Done()
   661  	}()
   662  	return cg, nil
   663  }
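
         // An end-to-end usage sketch; the group ID, brokers, and topic are
         // placeholders, error handling is abbreviated, and consume is a
         // hypothetical helper returning a func(context.Context) for gen.Start.
         //
         //	group, err := NewConsumerGroup(ConsumerGroupConfig{
         //		ID:      "example-group",
         //		Brokers: []string{"localhost:9092"},
         //		Topics:  []string{"example-topic"},
         //	})
         //	if err != nil {
         //		// handle invalid configuration
         //	}
         //	defer group.Close()
         //
         //	for {
         //		gen, err := group.Next(context.Background())
         //		if err != nil {
         //			// ErrGroupClosed after Close; other errors are join/sync failures.
         //			break
         //		}
         //		for topic, assignments := range gen.Assignments {
         //			for _, p := range assignments {
         //				gen.Start(consume(topic, p))
         //			}
         //		}
         //	}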
   664  
   665  // ConsumerGroup models a Kafka consumer group.  A caller doesn't interact with
   666  // the group directly.  Rather, they interact with a Generation.  Every time a
   667  // member enters or exits the group, it results in a new Generation.  The
   668  // Generation is where partition assignments and offset management occur.
   669  // Callers will use Next to get a handle to the Generation.
   670  type ConsumerGroup struct {
   671  	config ConsumerGroupConfig
   672  	next   chan *Generation
   673  	errs   chan error
   674  
   675  	closeOnce sync.Once
   676  	wg        sync.WaitGroup
   677  	done      chan struct{}
   678  }
   679  
    680  // Close releases all local resources used to participate in the consumer
    681  // group.  If a generation is still active, Close also ends it by causing this
    682  // member to leave the group.
   683  func (cg *ConsumerGroup) Close() error {
   684  	cg.closeOnce.Do(func() {
   685  		close(cg.done)
   686  	})
   687  	cg.wg.Wait()
   688  	return nil
   689  }
   690  
   691  // Next waits for the next consumer group generation.  There will never be two
   692  // active generations.  Next will never return a new generation until the
   693  // previous one has completed.
   694  //
   695  // If there are errors setting up the next generation, they will be surfaced
   696  // here.
   697  //
   698  // If the ConsumerGroup has been closed, then Next will return ErrGroupClosed.
   699  func (cg *ConsumerGroup) Next(ctx context.Context) (*Generation, error) {
   700  	select {
   701  	case <-ctx.Done():
   702  		return nil, ctx.Err()
   703  	case <-cg.done:
   704  		return nil, ErrGroupClosed
   705  	case err := <-cg.errs:
   706  		return nil, err
   707  	case next := <-cg.next:
   708  		return next, nil
   709  	}
   710  }
   711  
   712  func (cg *ConsumerGroup) run() {
   713  	// the memberID is the only piece of information that is maintained across
   714  	// generations.  it starts empty and will be assigned on the first nextGeneration
   715  	// when the joinGroup request is processed.  it may change again later if
   716  	// the CG coordinator fails over or if the member is evicted.  otherwise, it
   717  	// will be constant for the lifetime of this group.
   718  	var memberID string
   719  	var err error
   720  	for {
   721  		memberID, err = cg.nextGeneration(memberID)
   722  
   723  		// backoff will be set if this go routine should sleep before continuing
   724  		// to the next generation.  it will be non-nil in the case of an error
   725  		// joining or syncing the group.
   726  		var backoff <-chan time.Time
   727  		switch err {
   728  		case nil:
   729  			// no error...the previous generation finished normally.
   730  			continue
   731  		case ErrGroupClosed:
   732  			// the CG has been closed...leave the group and exit loop.
   733  			_ = cg.leaveGroup(memberID)
   734  			return
   735  		case RebalanceInProgress:
   736  			// in case of a RebalanceInProgress, don't leave the group or
   737  			// change the member ID, but report the error.  the next attempt
   738  			// to join the group will then be subject to the rebalance
   739  			// timeout, so the broker will be responsible for throttling
   740  			// this loop.
   741  		default:
    742  			// leave the group and report the error if we had gotten far
    743  			// enough to have a member ID.  also clear the member ID so we
    744  			// don't attempt to use it again.  in order to avoid a tight
    745  			// error loop, back off before the next attempt to join
   746  			// the group.
   747  			_ = cg.leaveGroup(memberID)
   748  			memberID = ""
   749  			backoff = time.After(cg.config.JoinGroupBackoff)
   750  		}
   751  		// ensure that we exit cleanly in case the CG is done and no one is
   752  		// waiting to receive on the unbuffered error channel.
   753  		select {
   754  		case <-cg.done:
   755  			return
   756  		case cg.errs <- err:
   757  		}
   758  		// backoff if needed, being sure to exit cleanly if the CG is done.
   759  		if backoff != nil {
   760  			select {
   761  			case <-cg.done:
   762  				// exit cleanly if the group is closed.
   763  				return
   764  			case <-backoff:
   765  			}
   766  		}
   767  	}
   768  }
   769  
   770  func (cg *ConsumerGroup) nextGeneration(memberID string) (string, error) {
   771  	// get a new connection to the coordinator on each loop.  the previous
   772  	// generation could have exited due to losing the connection, so this
   773  	// ensures that we always have a clean starting point.  it means we will
   774  	// re-connect in certain cases, but that shouldn't be an issue given that
   775  	// rebalances are relatively infrequent under normal operating
   776  	// conditions.
   777  	conn, err := cg.coordinator()
   778  	if err != nil {
   779  		cg.withErrorLogger(func(log Logger) {
   780  			log.Printf("Unable to establish connection to consumer group coordinator for group %s: %v", cg.config.ID, err)
   781  		})
   782  		return memberID, err // a prior memberID may still be valid, so don't return ""
   783  	}
   784  	defer conn.Close()
   785  
   786  	var generationID int32
   787  	var groupAssignments GroupMemberAssignments
   788  	var assignments map[string][]int32
   789  
   790  	// join group.  this will join the group and prepare assignments if our
   791  	// consumer is elected leader.  it may also change or assign the member ID.
   792  	memberID, generationID, groupAssignments, err = cg.joinGroup(conn, memberID)
   793  	if err != nil {
   794  		cg.withErrorLogger(func(log Logger) {
   795  			log.Printf("Failed to join group %s: %v", cg.config.ID, err)
   796  		})
   797  		return memberID, err
   798  	}
   799  	cg.withLogger(func(log Logger) {
   800  		log.Printf("Joined group %s as member %s in generation %d", cg.config.ID, memberID, generationID)
   801  	})
   802  
   803  	// sync group
   804  	assignments, err = cg.syncGroup(conn, memberID, generationID, groupAssignments)
   805  	if err != nil {
   806  		cg.withErrorLogger(func(log Logger) {
   807  			log.Printf("Failed to sync group %s: %v", cg.config.ID, err)
   808  		})
   809  		return memberID, err
   810  	}
   811  
   812  	// fetch initial offsets.
   813  	var offsets map[string]map[int]int64
   814  	offsets, err = cg.fetchOffsets(conn, assignments)
   815  	if err != nil {
   816  		cg.withErrorLogger(func(log Logger) {
   817  			log.Printf("Failed to fetch offsets for group %s: %v", cg.config.ID, err)
   818  		})
   819  		return memberID, err
   820  	}
   821  
   822  	// create the generation.
   823  	gen := Generation{
   824  		ID:              generationID,
   825  		GroupID:         cg.config.ID,
   826  		MemberID:        memberID,
   827  		Assignments:     cg.makeAssignments(assignments, offsets),
   828  		conn:            conn,
   829  		done:            make(chan struct{}),
   830  		joined:          make(chan struct{}),
   831  		retentionMillis: int64(cg.config.RetentionTime / time.Millisecond),
   832  		log:             cg.withLogger,
   833  		logError:        cg.withErrorLogger,
   834  	}
   835  
   836  	// spawn all of the go routines required to facilitate this generation.  if
   837  	// any of these functions exit, then the generation is determined to be
   838  	// complete.
   839  	gen.heartbeatLoop(cg.config.HeartbeatInterval)
   840  	if cg.config.WatchPartitionChanges {
   841  		for _, topic := range cg.config.Topics {
   842  			gen.partitionWatcher(cg.config.PartitionWatchInterval, topic)
   843  		}
   844  	}
   845  
   846  	// make this generation available for retrieval.  if the CG is closed before
   847  	// we can send it on the channel, exit.  that case is required b/c the next
   848  	// channel is unbuffered.  if the caller to Next has already bailed because
    849  	// its own teardown logic has been invoked, this would deadlock otherwise.
   850  	select {
   851  	case <-cg.done:
   852  		gen.close()
   853  		return memberID, ErrGroupClosed // ErrGroupClosed will trigger leave logic.
   854  	case cg.next <- &gen:
   855  	}
   856  
   857  	// wait for generation to complete.  if the CG is closed before the
   858  	// generation is finished, exit and leave the group.
   859  	select {
   860  	case <-cg.done:
   861  		gen.close()
   862  		return memberID, ErrGroupClosed // ErrGroupClosed will trigger leave logic.
   863  	case <-gen.done:
   864  		// time for next generation!  make sure all the current go routines exit
   865  		// before continuing onward.
   866  		gen.close()
   867  		return memberID, nil
   868  	}
   869  }
   870  
    871  // makeConnect returns a connect function that establishes a connection to any one of the given brokers.
   872  func makeConnect(config ConsumerGroupConfig) func(dialer *Dialer, brokers ...string) (coordinator, error) {
   873  	return func(dialer *Dialer, brokers ...string) (coordinator, error) {
   874  		var err error
   875  		for _, broker := range brokers {
   876  			var conn *Conn
   877  			if conn, err = dialer.Dial("tcp", broker); err == nil {
   878  				return &timeoutCoordinator{
   879  					conn:             conn,
   880  					timeout:          config.Timeout,
   881  					sessionTimeout:   config.SessionTimeout,
   882  					rebalanceTimeout: config.RebalanceTimeout,
   883  				}, nil
   884  			}
   885  		}
   886  		return nil, err // err will be non-nil
   887  	}
   888  }
   889  
   890  // coordinator establishes a connection to the coordinator for this consumer
   891  // group.
   892  func (cg *ConsumerGroup) coordinator() (coordinator, error) {
   893  	// NOTE : could try to cache the coordinator to avoid the double connect
   894  	//        here.  since consumer group balances happen infrequently and are
   895  	//        an expensive operation, we're not currently optimizing that case
   896  	//        in order to keep the code simpler.
   897  	conn, err := cg.config.connect(cg.config.Dialer, cg.config.Brokers...)
   898  	if err != nil {
   899  		return nil, err
   900  	}
   901  	defer conn.Close()
   902  
   903  	out, err := conn.findCoordinator(findCoordinatorRequestV0{
   904  		CoordinatorKey: cg.config.ID,
   905  	})
   906  	if err == nil && out.ErrorCode != 0 {
   907  		err = Error(out.ErrorCode)
   908  	}
   909  	if err != nil {
   910  		return nil, err
   911  	}
   912  
   913  	address := net.JoinHostPort(out.Coordinator.Host, strconv.Itoa(int(out.Coordinator.Port)))
   914  	return cg.config.connect(cg.config.Dialer, address)
   915  }
   916  
   917  // joinGroup attempts to join the reader to the consumer group.
    918  // Returns GroupMemberAssignments if this Reader was selected as
   919  // the leader.  Otherwise, GroupMemberAssignments will be nil.
   920  //
   921  // Possible kafka error codes returned:
   922  //  * GroupLoadInProgress:
   923  //  * GroupCoordinatorNotAvailable:
   924  //  * NotCoordinatorForGroup:
   925  //  * InconsistentGroupProtocol:
   926  //  * InvalidSessionTimeout:
   927  //  * GroupAuthorizationFailed:
   928  func (cg *ConsumerGroup) joinGroup(conn coordinator, memberID string) (string, int32, GroupMemberAssignments, error) {
   929  	request, err := cg.makeJoinGroupRequestV1(memberID)
   930  	if err != nil {
   931  		return "", 0, nil, err
   932  	}
   933  
   934  	response, err := conn.joinGroup(request)
   935  	if err == nil && response.ErrorCode != 0 {
   936  		err = Error(response.ErrorCode)
   937  	}
   938  	if err != nil {
   939  		return "", 0, nil, err
   940  	}
   941  
   942  	memberID = response.MemberID
   943  	generationID := response.GenerationID
   944  
   945  	cg.withLogger(func(l Logger) {
   946  		l.Printf("joined group %s as member %s in generation %d", cg.config.ID, memberID, generationID)
   947  	})
   948  
   949  	var assignments GroupMemberAssignments
   950  	if iAmLeader := response.MemberID == response.LeaderID; iAmLeader {
   951  		v, err := cg.assignTopicPartitions(conn, response)
   952  		if err != nil {
   953  			return memberID, 0, nil, err
   954  		}
   955  		assignments = v
   956  
   957  		cg.withLogger(func(l Logger) {
   958  			for memberID, assignment := range assignments {
   959  				for topic, partitions := range assignment {
   960  					l.Printf("assigned member/topic/partitions %v/%v/%v", memberID, topic, partitions)
   961  				}
   962  			}
   963  		})
   964  	}
   965  
   966  	cg.withLogger(func(l Logger) {
    967  		l.Printf("joinGroup succeeded for group, %v.  generationID=%v, memberID=%v", cg.config.ID, response.GenerationID, response.MemberID)
   968  	})
   969  
   970  	return memberID, generationID, assignments, nil
   971  }
   972  
   973  // makeJoinGroupRequestV1 handles the logic of constructing a joinGroup
   974  // request
   975  func (cg *ConsumerGroup) makeJoinGroupRequestV1(memberID string) (joinGroupRequestV1, error) {
   976  	request := joinGroupRequestV1{
   977  		GroupID:          cg.config.ID,
   978  		MemberID:         memberID,
   979  		SessionTimeout:   int32(cg.config.SessionTimeout / time.Millisecond),
   980  		RebalanceTimeout: int32(cg.config.RebalanceTimeout / time.Millisecond),
   981  		ProtocolType:     defaultProtocolType,
   982  	}
   983  
   984  	for _, balancer := range cg.config.GroupBalancers {
   985  		userData, err := balancer.UserData()
   986  		if err != nil {
   987  			return joinGroupRequestV1{}, fmt.Errorf("unable to construct protocol metadata for member, %v: %v", balancer.ProtocolName(), err)
   988  		}
   989  		request.GroupProtocols = append(request.GroupProtocols, joinGroupRequestGroupProtocolV1{
   990  			ProtocolName: balancer.ProtocolName(),
   991  			ProtocolMetadata: groupMetadata{
   992  				Version:  1,
   993  				Topics:   cg.config.Topics,
   994  				UserData: userData,
   995  			}.bytes(),
   996  		})
   997  	}
   998  
   999  	return request, nil
  1000  }
  1001  
  1002  // assignTopicPartitions uses the selected GroupBalancer to assign members to
  1003  // their various partitions
  1004  func (cg *ConsumerGroup) assignTopicPartitions(conn coordinator, group joinGroupResponseV1) (GroupMemberAssignments, error) {
  1005  	cg.withLogger(func(l Logger) {
  1006  		l.Printf("selected as leader for group, %s\n", cg.config.ID)
  1007  	})
  1008  
  1009  	balancer, ok := findGroupBalancer(group.GroupProtocol, cg.config.GroupBalancers)
  1010  	if !ok {
  1011  		// NOTE : this shouldn't happen in practice...the broker should not
  1012  		//        return successfully from joinGroup unless all members support
  1013  		//        at least one common protocol.
  1014  		return nil, fmt.Errorf("unable to find selected balancer, %v, for group, %v", group.GroupProtocol, cg.config.ID)
  1015  	}
  1016  
  1017  	members, err := cg.makeMemberProtocolMetadata(group.Members)
  1018  	if err != nil {
  1019  		return nil, err
  1020  	}
  1021  
  1022  	topics := extractTopics(members)
  1023  	partitions, err := conn.readPartitions(topics...)
  1024  
  1025  	// it's not a failure if the topic doesn't exist yet.  it results in no
  1026  	// assignments for the topic.  this matches the behavior of the official
  1027  	// clients: java, python, and librdkafka.
  1028  	// a topic watcher can trigger a rebalance when the topic comes into being.
  1029  	if err != nil && err != UnknownTopicOrPartition {
  1030  		return nil, err
  1031  	}
  1032  
  1033  	cg.withLogger(func(l Logger) {
  1034  		l.Printf("using '%v' balancer to assign group, %v", group.GroupProtocol, cg.config.ID)
  1035  		for _, member := range members {
  1036  			l.Printf("found member: %v/%#v", member.ID, member.UserData)
  1037  		}
  1038  		for _, partition := range partitions {
  1039  			l.Printf("found topic/partition: %v/%v", partition.Topic, partition.ID)
  1040  		}
  1041  	})
  1042  
  1043  	return balancer.AssignGroups(members, partitions), nil
  1044  }
  1045  
  1046  // makeMemberProtocolMetadata maps encoded member metadata ([]byte) into []GroupMember
  1047  func (cg *ConsumerGroup) makeMemberProtocolMetadata(in []joinGroupResponseMemberV1) ([]GroupMember, error) {
  1048  	members := make([]GroupMember, 0, len(in))
  1049  	for _, item := range in {
  1050  		metadata := groupMetadata{}
  1051  		reader := bufio.NewReader(bytes.NewReader(item.MemberMetadata))
  1052  		if remain, err := (&metadata).readFrom(reader, len(item.MemberMetadata)); err != nil || remain != 0 {
  1053  			return nil, fmt.Errorf("unable to read metadata for member, %v: %v", item.MemberID, err)
  1054  		}
  1055  
  1056  		members = append(members, GroupMember{
  1057  			ID:       item.MemberID,
  1058  			Topics:   metadata.Topics,
  1059  			UserData: metadata.UserData,
  1060  		})
  1061  	}
  1062  	return members, nil
  1063  }
  1064  
   1065  // syncGroup completes the consumer group's nextGeneration by submitting the
   1066  // memberAssignments (if this Reader is the leader) and returning this
   1067  // Reader's subscriptions as topic => partitions
  1068  //
  1069  // Possible kafka error codes returned:
  1070  //  * GroupCoordinatorNotAvailable:
  1071  //  * NotCoordinatorForGroup:
  1072  //  * IllegalGeneration:
  1073  //  * RebalanceInProgress:
  1074  //  * GroupAuthorizationFailed:
  1075  func (cg *ConsumerGroup) syncGroup(conn coordinator, memberID string, generationID int32, memberAssignments GroupMemberAssignments) (map[string][]int32, error) {
  1076  	request := cg.makeSyncGroupRequestV0(memberID, generationID, memberAssignments)
  1077  	response, err := conn.syncGroup(request)
  1078  	if err == nil && response.ErrorCode != 0 {
  1079  		err = Error(response.ErrorCode)
  1080  	}
  1081  	if err != nil {
  1082  		return nil, err
  1083  	}
  1084  
  1085  	assignments := groupAssignment{}
  1086  	reader := bufio.NewReader(bytes.NewReader(response.MemberAssignments))
  1087  	if _, err := (&assignments).readFrom(reader, len(response.MemberAssignments)); err != nil {
  1088  		return nil, err
  1089  	}
  1090  
  1091  	if len(assignments.Topics) == 0 {
  1092  		cg.withLogger(func(l Logger) {
  1093  			l.Printf("received empty assignments for group, %v as member %s for generation %d", cg.config.ID, memberID, generationID)
  1094  		})
  1095  	}
  1096  
  1097  	cg.withLogger(func(l Logger) {
  1098  		l.Printf("sync group finished for group, %v", cg.config.ID)
  1099  	})
  1100  
  1101  	return assignments.Topics, nil
  1102  }
  1103  
  1104  func (cg *ConsumerGroup) makeSyncGroupRequestV0(memberID string, generationID int32, memberAssignments GroupMemberAssignments) syncGroupRequestV0 {
  1105  	request := syncGroupRequestV0{
  1106  		GroupID:      cg.config.ID,
  1107  		GenerationID: generationID,
  1108  		MemberID:     memberID,
  1109  	}
  1110  
  1111  	if memberAssignments != nil {
  1112  		request.GroupAssignments = make([]syncGroupRequestGroupAssignmentV0, 0, 1)
  1113  
  1114  		for memberID, topics := range memberAssignments {
  1115  			topics32 := make(map[string][]int32)
  1116  			for topic, partitions := range topics {
  1117  				partitions32 := make([]int32, len(partitions))
  1118  				for i := range partitions {
  1119  					partitions32[i] = int32(partitions[i])
  1120  				}
  1121  				topics32[topic] = partitions32
  1122  			}
  1123  			request.GroupAssignments = append(request.GroupAssignments, syncGroupRequestGroupAssignmentV0{
  1124  				MemberID: memberID,
  1125  				MemberAssignments: groupAssignment{
  1126  					Version: 1,
  1127  					Topics:  topics32,
  1128  				}.bytes(),
  1129  			})
  1130  		}
  1131  
  1132  		cg.withLogger(func(logger Logger) {
  1133  			logger.Printf("Syncing %d assignments for generation %d as member %s", len(request.GroupAssignments), generationID, memberID)
  1134  		})
  1135  	}
  1136  
  1137  	return request
  1138  }
  1139  
  1140  func (cg *ConsumerGroup) fetchOffsets(conn coordinator, subs map[string][]int32) (map[string]map[int]int64, error) {
  1141  	req := offsetFetchRequestV1{
  1142  		GroupID: cg.config.ID,
  1143  		Topics:  make([]offsetFetchRequestV1Topic, 0, len(cg.config.Topics)),
  1144  	}
  1145  	for _, topic := range cg.config.Topics {
  1146  		req.Topics = append(req.Topics, offsetFetchRequestV1Topic{
  1147  			Topic:      topic,
  1148  			Partitions: subs[topic],
  1149  		})
  1150  	}
  1151  	offsets, err := conn.offsetFetch(req)
  1152  	if err != nil {
  1153  		return nil, err
  1154  	}
  1155  
  1156  	offsetsByTopic := make(map[string]map[int]int64)
  1157  	for _, res := range offsets.Responses {
  1158  		offsetsByPartition := map[int]int64{}
  1159  		offsetsByTopic[res.Topic] = offsetsByPartition
  1160  		for _, pr := range res.PartitionResponses {
  1161  			for _, partition := range subs[res.Topic] {
  1162  				if partition == pr.Partition {
  1163  					offset := pr.Offset
  1164  					if offset < 0 {
  1165  						offset = cg.config.StartOffset
  1166  					}
  1167  					offsetsByPartition[int(partition)] = offset
  1168  				}
  1169  			}
  1170  		}
  1171  	}
  1172  
  1173  	return offsetsByTopic, nil
  1174  }
  1175  
  1176  func (cg *ConsumerGroup) makeAssignments(assignments map[string][]int32, offsets map[string]map[int]int64) map[string][]PartitionAssignment {
  1177  	topicAssignments := make(map[string][]PartitionAssignment)
  1178  	for _, topic := range cg.config.Topics {
  1179  		topicPartitions := assignments[topic]
  1180  		topicAssignments[topic] = make([]PartitionAssignment, 0, len(topicPartitions))
  1181  		for _, partition := range topicPartitions {
  1182  			var offset int64
  1183  			partitionOffsets, ok := offsets[topic]
  1184  			if ok {
  1185  				offset, ok = partitionOffsets[int(partition)]
  1186  			}
  1187  			if !ok {
  1188  				offset = cg.config.StartOffset
  1189  			}
  1190  			topicAssignments[topic] = append(topicAssignments[topic], PartitionAssignment{
  1191  				ID:     int(partition),
  1192  				Offset: offset,
  1193  			})
  1194  		}
  1195  	}
  1196  	return topicAssignments
  1197  }
  1198  
  1199  func (cg *ConsumerGroup) leaveGroup(memberID string) error {
  1200  	// don't attempt to leave the group if no memberID was ever assigned.
  1201  	if memberID == "" {
  1202  		return nil
  1203  	}
  1204  
  1205  	cg.withLogger(func(log Logger) {
  1206  		log.Printf("Leaving group %s, member %s", cg.config.ID, memberID)
  1207  	})
  1208  
  1209  	// IMPORTANT : leaveGroup establishes its own connection to the coordinator
  1210  	//             because it is often called after some other operation failed.
  1211  	//             said failure could be the result of connection-level issues,
  1212  	//             so we want to re-establish the connection to ensure that we
  1213  	//             are able to process the cleanup step.
  1214  	coordinator, err := cg.coordinator()
  1215  	if err != nil {
  1216  		return err
  1217  	}
  1218  
  1219  	_, err = coordinator.leaveGroup(leaveGroupRequestV0{
  1220  		GroupID:  cg.config.ID,
  1221  		MemberID: memberID,
  1222  	})
  1223  	if err != nil {
  1224  		cg.withErrorLogger(func(log Logger) {
  1225  			log.Printf("leave group failed for group, %v, and member, %v: %v", cg.config.ID, memberID, err)
  1226  		})
  1227  	}
  1228  
  1229  	_ = coordinator.Close()
  1230  
  1231  	return err
  1232  }
  1233  
  1234  func (cg *ConsumerGroup) withLogger(do func(Logger)) {
  1235  	if cg.config.Logger != nil {
  1236  		do(cg.config.Logger)
  1237  	}
  1238  }
  1239  
  1240  func (cg *ConsumerGroup) withErrorLogger(do func(Logger)) {
  1241  	if cg.config.ErrorLogger != nil {
  1242  		do(cg.config.ErrorLogger)
  1243  	} else {
  1244  		cg.withLogger(do)
  1245  	}
  1246  }