github.com/m3db/m3@v1.5.1-0.20231129193456-75a402aa583b/src/dbnode/encoding/proto/round_trip_prop_test.go (about)

     1  // +build big
     2  //
     3  // Copyright (c) 2019 Uber Technologies, Inc.
     4  //
     5  // Permission is hereby granted, free of charge, to any person obtaining a copy
     6  // of this software and associated documentation files (the "Software"), to deal
     7  // in the Software without restriction, including without limitation the rights
     8  // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
     9  // copies of the Software, and to permit persons to whom the Software is
    10  // furnished to do so, subject to the following conditions:
    11  //
    12  // The above copyright notice and this permission notice shall be included in
    13  // all copies or substantial portions of the Software.
    14  //
    15  // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
    16  // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
    17  // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
    18  // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
    19  // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
    20  // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
    21  // THE SOFTWARE.
    22  
    23  package proto
    24  
    25  import (
    26  	"bytes"
    27  	"fmt"
    28  	"os"
    29  	"reflect"
    30  	"runtime/debug"
    31  	"testing"
    32  	"time"
    33  
    34  	"github.com/m3db/m3/src/dbnode/namespace"
    35  	"github.com/m3db/m3/src/dbnode/ts"
    36  	"github.com/m3db/m3/src/dbnode/x/xio"
    37  	"github.com/m3db/m3/src/x/context"
    38  	xtime "github.com/m3db/m3/src/x/time"
    39  
    40  	dpb "github.com/golang/protobuf/protoc-gen-go/descriptor"
    41  	"github.com/jhump/protoreflect/desc"
    42  	"github.com/jhump/protoreflect/desc/builder"
    43  	"github.com/jhump/protoreflect/dynamic"
    44  	"github.com/leanovate/gopter"
    45  	"github.com/leanovate/gopter/gen"
    46  	"github.com/leanovate/gopter/prop"
    47  	"github.com/stretchr/testify/require"
    48  )
    49  
    50  var (
    51  	// Generated from mapProtoTypeToCustomFieldType by init().
    52  	allowedProtoTypesSliceIface = []interface{}{}
    53  
    54  	validMapKeyTypes = []interface{}{
    55  		// https://developers.google.com/protocol-buffers/docs/proto3#maps
    56  		dpb.FieldDescriptorProto_TYPE_INT32,
    57  		dpb.FieldDescriptorProto_TYPE_INT64,
    58  		dpb.FieldDescriptorProto_TYPE_UINT32,
    59  		dpb.FieldDescriptorProto_TYPE_UINT64,
    60  		dpb.FieldDescriptorProto_TYPE_SINT32,
    61  		dpb.FieldDescriptorProto_TYPE_SINT64,
    62  		dpb.FieldDescriptorProto_TYPE_FIXED32,
    63  		dpb.FieldDescriptorProto_TYPE_FIXED64,
    64  		dpb.FieldDescriptorProto_TYPE_SFIXED32,
    65  		dpb.FieldDescriptorProto_TYPE_SFIXED64,
    66  		dpb.FieldDescriptorProto_TYPE_BOOL,
    67  		dpb.FieldDescriptorProto_TYPE_STRING,
    68  	}
    69  )
    70  
    71  func init() {
    72  	for key := range mapProtoTypeToCustomFieldType {
    73  		allowedProtoTypesSliceIface = append(allowedProtoTypesSliceIface, key)
    74  	}
    75  }
    76  
    77  const (
    78  	maxNumFields     = 10
    79  	maxNumMessages   = 100
    80  	maxNumEnumValues = 10
    81  
    82  	debugLogs = false
    83  )
    84  
    85  type fieldModifierProp int
    86  
    87  const (
    88  	fieldModifierRegular fieldModifierProp = iota
    89  	fieldModifierReserved
    90  	// Maps can't be repeated so its ok for these to be mutally exclusive.
    91  	fieldModifierRepeated
    92  	fieldModifierMap
    93  )
    94  
    95  func TestRoundTripProp(t *testing.T) {
    96  	var (
    97  		parameters = gopter.DefaultTestParameters()
    98  		seed       = time.Now().UnixNano()
    99  		props      = gopter.NewProperties(parameters)
   100  		reporter   = gopter.NewFormatedReporter(true, 160, os.Stdout)
   101  	)
   102  	parameters.MinSuccessfulTests = 300
   103  	parameters.Rng.Seed(seed)
   104  
   105  	enc := NewEncoder(0, testEncodingOptions)
   106  	iter := NewIterator(nil, nil, testEncodingOptions).(*iterator)
   107  	props.Property("Encoded data should be readable", prop.ForAll(func(input propTestInput) (bool, error) {
   108  		if debugLogs {
   109  			fmt.Println("---------------------------------------------------")
   110  		}
   111  
   112  		// Make panics debuggable.
   113  		defer func() {
   114  			if r := recover(); r != nil {
   115  				fmt.Printf(
   116  					"recovered with err: %v,schema: %s and messages: %#v",
   117  					r,
   118  					input.schema.String(),
   119  					input.messages)
   120  				debug.PrintStack()
   121  				panic("prop test encountered a panic!")
   122  			}
   123  		}()
   124  
   125  		times := make([]xtime.UnixNano, 0, len(input.messages))
   126  		currTime := xtime.Now()
   127  		for i, m := range input.messages {
   128  			duration, err := m.timeUnit.Value()
   129  			if err != nil {
   130  				return false, fmt.Errorf("error getting duration from xtime.Unit: %v", err)
   131  			}
   132  
   133  			currTime = currTime.Add(time.Duration(i) * duration).Truncate(duration)
   134  			times = append(times, currTime)
   135  		}
   136  
   137  		schemaDescr := namespace.GetTestSchemaDescr(input.schema)
   138  		enc.Reset(currTime, 0, schemaDescr)
   139  
   140  		for i, m := range input.messages {
   141  			// The encoder will mutate the message so make sure we clone it first.
   142  			clone := dynamic.NewMessage(input.schema)
   143  			clone.MergeFrom(m.message)
   144  			cloneBytes, err := clone.Marshal()
   145  			if err != nil {
   146  				return false, fmt.Errorf("error marshalling proto message: %v", err)
   147  			}
   148  
   149  			if debugLogs {
   150  				printMessage(fmt.Sprintf("encoding %d", i), m.message)
   151  			}
   152  			err = enc.Encode(ts.Datapoint{TimestampNanos: times[i]}, xtime.Nanosecond, cloneBytes)
   153  			if err != nil {
   154  				return false, fmt.Errorf(
   155  					"error encoding message: %v, schema: %s", err, input.schema.String())
   156  			}
   157  
   158  			// Ensure that the schema can be set inbetween writes without interfering with the stream.
   159  			// A new deployID is created each time to bypass the quick check in the SetSchema method
   160  			// and force the encoder to perform all of the state updates it has to do when a schema
   161  			// changes but without actually changing the schema (which would make asserting on the
   162  			// correct output difficult).
   163  			setSchemaDescr := namespace.GetTestSchemaDescrWithDeployID(
   164  				input.schema, fmt.Sprintf("deploy_id_%d", i))
   165  			enc.SetSchema(setSchemaDescr)
   166  		}
   167  
   168  		// Ensure that the Len() method always returns the length of the final stream that would
   169  		// be returned by a call to Stream().
   170  		encLen := enc.Len()
   171  
   172  		ctx := context.NewBackground()
   173  		defer ctx.Close()
   174  
   175  		stream, ok := enc.Stream(ctx)
   176  		if !ok {
   177  			if len(input.messages) == 0 {
   178  				return true, nil
   179  			}
   180  			return false, fmt.Errorf("encoder returned empty stream")
   181  		}
   182  		segment, err := stream.Segment()
   183  		if err != nil {
   184  			return false, fmt.Errorf("error getting segment: %v", err)
   185  		}
   186  		if segment.Len() != encLen {
   187  			return false, fmt.Errorf(
   188  				"expected segment len (%d) to match encoder len (%d)",
   189  				segment.Len(), encLen)
   190  		}
   191  
   192  		iter.Reset(stream, schemaDescr)
   193  
   194  		i := 0
   195  		for iter.Next() {
   196  			var (
   197  				m                    = input.messages[i].message
   198  				dp, unit, annotation = iter.Current()
   199  			)
   200  			decodedM := dynamic.NewMessage(input.schema)
   201  			require.NoError(t, decodedM.Unmarshal(annotation))
   202  			if debugLogs {
   203  				printMessage(fmt.Sprintf("decoding %d", i), decodedM)
   204  			}
   205  
   206  			require.Equal(t, unit, xtime.Nanosecond)
   207  			require.True(t,
   208  				times[i].Equal(dp.TimestampNanos),
   209  				"%s does not match %s", times[i], dp.TimestampNanos)
   210  
   211  			if !dynamic.MessagesEqual(m, decodedM) {
   212  				for _, field := range m.GetKnownFields() {
   213  					var (
   214  						fieldNum    = int(field.GetNumber())
   215  						expectedVal = m.GetFieldByNumber(fieldNum)
   216  						actualVal   = decodedM.GetFieldByNumber(fieldNum)
   217  					)
   218  
   219  					if !fieldsEqual(expectedVal, actualVal) {
   220  						return false, fmt.Errorf(
   221  							"expected %v but got %v on iteration number %d and fieldNum %d, schema %s",
   222  							expectedVal, actualVal, i, fieldNum, input.schema)
   223  					}
   224  				}
   225  			}
   226  			i++
   227  		}
   228  
   229  		if iter.Err() != nil {
   230  			return false, fmt.Errorf(
   231  				"iteration error: %v, schema: %s", iter.Err(), input.schema.String())
   232  		}
   233  
   234  		if i != len(input.messages) {
   235  			return false, fmt.Errorf("expected %d messages but got %d", len(input.messages), i)
   236  		}
   237  
   238  		return true, nil
   239  	}, genPropTestInputs()))
   240  
   241  	if !props.Run(reporter) {
   242  		t.Errorf("failed with initial seed: %d", seed)
   243  	}
   244  }
   245  
   246  // TestBijectivityProp ensures that the protobuf encoding format is bijective. I.E if the same messages are
   247  // provided in the same order then the resulting stream should always be the same and similarly that decoding
   248  // and re-encoding should always generate the same stream as the original.
   249  func TestBijectivityProp(t *testing.T) {
   250  	var (
   251  		parameters = gopter.DefaultTestParameters()
   252  		seed       = time.Now().UnixNano()
   253  		props      = gopter.NewProperties(parameters)
   254  		reporter   = gopter.NewFormatedReporter(true, 160, os.Stdout)
   255  	)
   256  	parameters.MinSuccessfulTests = 100
   257  	parameters.Rng.Seed(seed)
   258  
   259  	enc := NewEncoder(0, testEncodingOptions)
   260  	iter := NewIterator(nil, nil, testEncodingOptions).(*iterator)
   261  	props.Property("Encoded data should be readable", prop.ForAll(func(input propTestInput) (bool, error) {
   262  		if len(input.messages) == 0 {
   263  			return true, nil
   264  		}
   265  		if debugLogs {
   266  			fmt.Println("---------------------------------------------------")
   267  		}
   268  
   269  		var (
   270  			start       = xtime.Now()
   271  			schemaDescr = namespace.GetTestSchemaDescr(input.schema)
   272  
   273  			originalStream  xio.SegmentReader
   274  			originalSegment ts.Segment
   275  			messageTimes    []xtime.UnixNano
   276  			messageBytes    [][]byte
   277  		)
   278  
   279  		// Unfortunately the current implementation is only guaranteed to generate the exact stream
   280  		// for the same input Protobuf messages if the marshaled protobuf bytes are the same. The reason
   281  		// for that is that the Protobuf encoding format is not bijective (for example, fields do not have
   282  		// to be encoded in sorted order by field number and map values can appear in arbitrary orders).
   283  		//
   284  		// The protobuf encoder/iterator compensates for some of these limitations (like the lack of sorting
   285  		// on field order by performing the sort itself during "custom unmarshaling") but does not compensate
   286  		// for others (like the fact that maps are not sorted). Because of these limitations the current encoder
   287  		// may generate different streams (even when provided the same messages) if the messages are not first
   288  		// marshaled into the same exact byte streams.
   289  		for i, m := range input.messages {
   290  			if debugLogs {
   291  				printMessage(fmt.Sprintf("encoding %d", i), m.message)
   292  			}
   293  			clone := dynamic.NewMessage(input.schema)
   294  			clone.MergeFrom(m.message)
   295  			mBytes, err := clone.Marshal()
   296  			if err != nil {
   297  				return false, fmt.Errorf("error marshalling proto message: %v", err)
   298  			}
   299  			// Generate times up-front so they're the same for each iteration.
   300  			messageTimes = append(messageTimes, xtime.Now())
   301  			messageBytes = append(messageBytes, mBytes)
   302  		}
   303  
   304  		ctx := context.NewBackground()
   305  		defer ctx.Close()
   306  
   307  		// First verify that if the same input byte slices are passed then the same stream will always
   308  		// be generated.
   309  		for i := 0; i < 10; i++ {
   310  			enc.Reset(start, 0, schemaDescr)
   311  			for j, mBytes := range messageBytes {
   312  				err := enc.Encode(ts.Datapoint{TimestampNanos: messageTimes[j]}, xtime.Nanosecond, mBytes)
   313  				if err != nil {
   314  					return false, fmt.Errorf(
   315  						"error encoding message: %v, schema: %s", err, input.schema.String())
   316  				}
   317  			}
   318  
   319  			currStream, ok := enc.Stream(ctx)
   320  			if !ok {
   321  				return false, fmt.Errorf("encoder returned empty stream")
   322  			}
   323  			currSegment, err := currStream.Segment()
   324  			if err != nil {
   325  				return false, fmt.Errorf("error getting segment: %v", err)
   326  			}
   327  
   328  			if originalStream == nil {
   329  				originalStream = currStream
   330  				originalSegment = currSegment
   331  			} else {
   332  				if err := compareSegments(originalSegment, currSegment); err != nil {
   333  					return false, fmt.Errorf("error comparing segments for re-encoding original stream: %v", err)
   334  				}
   335  			}
   336  		}
   337  
   338  		// Next verify that re-encoding a stream (after decoding/iterating it) will also always generate the
   339  		// same original stream.
   340  		for i := 0; i < 10; i++ {
   341  			originalStream.Reset(originalSegment)
   342  			iter.Reset(originalStream, schemaDescr)
   343  			enc.Reset(start, 0, schemaDescr)
   344  			j := 0
   345  			for iter.Next() {
   346  				dp, unit, annotation := iter.Current()
   347  				if debugLogs {
   348  					fmt.Println("iterating", dp, unit, annotation)
   349  				}
   350  				if err := enc.Encode(dp, unit, annotation); err != nil {
   351  					return false, fmt.Errorf("error encoding current value")
   352  				}
   353  				j++
   354  			}
   355  			if iter.Err() != nil {
   356  				return false, fmt.Errorf(
   357  					"iteration error: %v, schema: %s", iter.Err(), input.schema.String())
   358  			}
   359  
   360  			if j != len(input.messages) {
   361  				return false, fmt.Errorf("expected %d messages but got %d", len(input.messages), j)
   362  			}
   363  
   364  			currStream, ok := enc.Stream(ctx)
   365  			if !ok {
   366  				return false, fmt.Errorf("encoder returned empty stream")
   367  			}
   368  			currSegment, err := currStream.Segment()
   369  			if err != nil {
   370  				return false, fmt.Errorf("error getting segment: %v", err)
   371  			}
   372  
   373  			if err := compareSegments(originalSegment, currSegment); err != nil {
   374  				return false, fmt.Errorf("error comparing segments for re-encoding original stream after iterating: %v", err)
   375  			}
   376  		}
   377  
   378  		return true, nil
   379  	}, genPropTestInputs()))
   380  
   381  	if !props.Run(reporter) {
   382  		t.Errorf("failed with initial seed: %d", seed)
   383  	}
   384  }
   385  
   386  type propTestInput struct {
   387  	schema   *desc.MessageDescriptor
   388  	messages []messageAndTimeUnit
   389  }
   390  
   391  type messageAndTimeUnit struct {
   392  	message  *dynamic.Message
   393  	timeUnit xtime.Unit
   394  }
   395  
   396  // generatedWrite contains numFields values for every type of ProtoBuf
   397  // field. This allows us to generate data independent of the schema itself
   398  // which we may not have seen in the input generation section yet. For example,
   399  // if the maximum number of fields that a message can contain is 10, then this
   400  // struct will generate a slice of size 10 for each of the scalar types and populate
   401  // them with random values.
   402  //
   403  // If we receive a schema where the message has 5 boolean fields and then 5 string
   404  // fields, then we will populate the first 5 booleans fields with generatedWrite.bools[:5]
   405  // and the next 5 string fields with generatedWrite.strings[5:].
   406  type generatedWrite struct {
   407  	timeUnit xtime.Unit
   408  
   409  	// Whether we should use one of the randomly generated values in the slice below,
   410  	// or just the default value for the given type.
   411  	useDefaultValue []bool
   412  
   413  	bools    []bool
   414  	enums    []int32
   415  	strings  []string
   416  	float32s []float32
   417  	float64s []float64
   418  	int8s    []int8
   419  	int16s   []int16
   420  	int32s   []int32
   421  	int64s   []int64
   422  	uint8s   []uint8
   423  	uint16s  []uint16
   424  	uint32s  []uint32
   425  	uint64s  []uint64
   426  }
   427  
   428  func genPropTestInputs() gopter.Gen {
   429  	curriedGenPropTestInput := func(input interface{}) gopter.Gen {
   430  		var (
   431  			inputs      = input.([]interface{})
   432  			numFields   = inputs[0].(int)
   433  			numMessages = inputs[1].(int)
   434  		)
   435  
   436  		return genSchema(numFields).FlatMap(
   437  			func(input interface{}) gopter.Gen {
   438  				schema := input.(*desc.MessageDescriptor)
   439  				return genPropTestInput(schema, numMessages)
   440  			}, reflect.TypeOf(propTestInput{}))
   441  	}
   442  
   443  	return gopter.CombineGens(
   444  		gen.IntRange(0, maxNumFields),
   445  		gen.IntRange(0, maxNumMessages),
   446  	).FlatMap(curriedGenPropTestInput, reflect.TypeOf(propTestInput{}))
   447  }
   448  
   449  func genPropTestInput(schema *desc.MessageDescriptor, numMessages int) gopter.Gen {
   450  	return gopter.CombineGens(
   451  		// Messages to write for the given schema.
   452  		gen.SliceOfN(numMessages, genMessage(schema)),
   453  		// [][]bool that indicates on a field-by-field basis for each message whether the
   454  		// value should be the same as the previous message for that field to ensure we
   455  		// aggressively exercise that codepath.
   456  		gen.SliceOfN(numMessages, gen.SliceOfN(len(schema.GetFields()), gen.Bool())),
   457  	).Map(func(input []interface{}) propTestInput {
   458  
   459  		messages := input[0].([]messageAndTimeUnit)
   460  		perMessageShouldBeSameAsPrevWrite := input[1].([][]bool)
   461  		for i, messageAndUnit := range messages {
   462  			m := messageAndUnit.message
   463  			if i == 0 {
   464  				// Can't make the same as previous if there is no previous.
   465  				continue
   466  			}
   467  
   468  			perFieldShouldBeSameAsPrevWrite := perMessageShouldBeSameAsPrevWrite[i]
   469  			fields := m.GetKnownFields()
   470  			for j, field := range fields {
   471  				if perFieldShouldBeSameAsPrevWrite[j] {
   472  					fieldNumInt := int(field.GetNumber())
   473  					prevFieldVal := messages[i-1].message.GetFieldByNumber(fieldNumInt)
   474  					m.SetFieldByNumber(fieldNumInt, prevFieldVal)
   475  				}
   476  			}
   477  		}
   478  
   479  		return propTestInput{
   480  			schema:   schema,
   481  			messages: messages,
   482  		}
   483  	})
   484  }
   485  
   486  func genMessage(schema *desc.MessageDescriptor) gopter.Gen {
   487  	return genWrite().Map(func(input generatedWrite) messageAndTimeUnit {
   488  		return newMessageWithValues(schema, input)
   489  	})
   490  }
   491  
   492  func newMessageWithValues(schema *desc.MessageDescriptor, input generatedWrite) messageAndTimeUnit {
   493  	message := dynamic.NewMessage(schema)
   494  	for i, field := range message.GetKnownFields() {
   495  		fieldNumber := int(field.GetNumber())
   496  		switch {
   497  		case input.useDefaultValue[i]:
   498  			// Due to the way ProtoBuf encoding works where there is no way to
   499  			// distinguish between an "unset" field and a field set to its default
   500  			// value, we intentionally force some of the values to their default values
   501  			// to exercise those code paths. This is important because the probability of
   502  			// randomly generating a uint64 with the default value of zero is so unlikely
   503  			// that it will basically never happen.
   504  			continue
   505  		case field.IsMap():
   506  			// Maps require special handling because the type will look like a message, they'll
   507  			// have the repeated label, and to construct them properly we need to look at both
   508  			// the key type as well as the value type.
   509  			var (
   510  				mapKeyType   = field.GetMapKeyType()
   511  				mapValueType = field.GetMapValueType()
   512  
   513  				mapKeysForTypeIFace, _   = valuesOfType(nil, i, mapKeyType, input)
   514  				mapValuesForTypeIFace, _ = valuesOfType(nil, i, mapValueType, input)
   515  				mapKeysForType           = interfaceSlice(mapKeysForTypeIFace)
   516  				mapValuesForType         = interfaceSlice(mapValuesForTypeIFace)
   517  			)
   518  			for j, key := range mapKeysForType {
   519  				if messageAndTU, ok := mapValuesForType[j].(messageAndTimeUnit); ok {
   520  					message.PutMapFieldByNumber(fieldNumber, key, messageAndTU.message)
   521  				} else {
   522  					message.PutMapFieldByNumber(fieldNumber, key, mapValuesForType[j])
   523  				}
   524  			}
   525  		default:
   526  			sliceValues, singleValue := valuesOfType(schema, i, field, input)
   527  			if field.IsRepeated() {
   528  				valuesToSet := interfaceSlice(sliceValues)
   529  				if _, ok := singleValue.(messageAndTimeUnit); ok {
   530  					// If its a slice of messageAndTimeUnit (indiciating a field with repeated
   531  					// nested messages) then we need to convert it to a slice of *dynamic.Message.
   532  					valuesToSet = make([]interface{}, 0, len(valuesToSet))
   533  					for _, v := range interfaceSlice(sliceValues) {
   534  						valuesToSet = append(valuesToSet, v.(messageAndTimeUnit).message)
   535  					}
   536  				}
   537  
   538  				message.SetFieldByNumber(fieldNumber, valuesToSet)
   539  			} else {
   540  				if messageAndTU, ok := singleValue.(messageAndTimeUnit); ok {
   541  					message.SetFieldByNumber(fieldNumber, messageAndTU.message)
   542  				} else {
   543  					message.SetFieldByNumber(fieldNumber, singleValue)
   544  				}
   545  			}
   546  		}
   547  	}
   548  
   549  	// Basic sanity test to protect against bugs in the underlying library:
   550  	// https://github.com/jhump/protoreflect/issues/181
   551  	marshalled, err := message.Marshal()
   552  	if err != nil {
   553  		panic(err)
   554  	}
   555  	unmarshalled := dynamic.NewMessage(schema)
   556  	err = unmarshalled.Unmarshal(marshalled)
   557  	if err != nil {
   558  		panic(err)
   559  	}
   560  	if !dynamic.MessagesEqual(message, unmarshalled) {
   561  		panic("generated message that is not equal after being marshalled and unmarshalled")
   562  	}
   563  
   564  	return messageAndTimeUnit{
   565  		message:  message,
   566  		timeUnit: input.timeUnit,
   567  	}
   568  }
   569  
   570  func valuesOfType(
   571  	schema *desc.MessageDescriptor,
   572  	i int,
   573  	field *desc.FieldDescriptor,
   574  	input generatedWrite) (interface{}, interface{}) {
   575  	fieldType := field.GetType()
   576  
   577  	switch fieldType {
   578  	case dpb.FieldDescriptorProto_TYPE_BOOL:
   579  		return input.bools[0 : i+1], input.bools[i]
   580  	case dpb.FieldDescriptorProto_TYPE_ENUM:
   581  		return input.enums[0 : i+1], input.enums[i]
   582  	case dpb.FieldDescriptorProto_TYPE_BYTES:
   583  		bytesSlice := make([][]byte, 0, i)
   584  		for _, s := range input.strings[0 : i+1] {
   585  			bytesSlice = append(bytesSlice, []byte(s))
   586  		}
   587  		return bytesSlice, []byte(input.strings[i])
   588  	case dpb.FieldDescriptorProto_TYPE_STRING:
   589  		return input.strings[0 : i+1], input.strings[i]
   590  	case dpb.FieldDescriptorProto_TYPE_DOUBLE:
   591  		return input.float64s[0 : i+1], input.float64s[i]
   592  	case dpb.FieldDescriptorProto_TYPE_FLOAT:
   593  		return input.float32s[0 : i+1], input.float32s[i]
   594  	case dpb.FieldDescriptorProto_TYPE_SFIXED32:
   595  		fallthrough
   596  	case dpb.FieldDescriptorProto_TYPE_SINT32:
   597  		fallthrough
   598  	case dpb.FieldDescriptorProto_TYPE_INT32:
   599  		return input.int32s[0 : i+1], input.int32s[i]
   600  	case dpb.FieldDescriptorProto_TYPE_SFIXED64:
   601  		fallthrough
   602  	case dpb.FieldDescriptorProto_TYPE_SINT64:
   603  		fallthrough
   604  	case dpb.FieldDescriptorProto_TYPE_INT64:
   605  		return input.int64s[0 : i+1], input.int64s[i]
   606  	case dpb.FieldDescriptorProto_TYPE_FIXED32:
   607  		fallthrough
   608  	case dpb.FieldDescriptorProto_TYPE_UINT32:
   609  		return input.uint32s[0 : i+1], input.uint32s[i]
   610  	case dpb.FieldDescriptorProto_TYPE_FIXED64:
   611  		fallthrough
   612  	case dpb.FieldDescriptorProto_TYPE_UINT64:
   613  		return input.uint64s[0 : i+1], input.uint64s[i]
   614  	case dpb.FieldDescriptorProto_TYPE_MESSAGE:
   615  		// If the field is a nested message, figure out what the nested schema is
   616  		// and then generate another message to use as the value of that field. We
   617  		// reuse the same inputs value for simplicity.
   618  		//
   619  		// If the schema is set to nil, that means that field itself is a message type
   620  		// that we'd like to generate a value for so get the nested message schema
   621  		// from the field itself instead of looking it up.
   622  		var nestedMessageSchema *desc.MessageDescriptor
   623  		if schema != nil {
   624  			nestedMessageSchema = schema.FindFieldByNumber(field.GetNumber()).GetMessageType()
   625  		} else {
   626  			nestedMessageSchema = field.GetMessageType()
   627  		}
   628  		nestedMessages := make([]messageAndTimeUnit, 0, i)
   629  		for j := 0; j <= i; j++ {
   630  			nestedMessages = append(nestedMessages, newMessageWithValues(nestedMessageSchema, input))
   631  		}
   632  		return nestedMessages, newMessageWithValues(nestedMessageSchema, input)
   633  	default:
   634  		panic(fmt.Sprintf("invalid field type in schema: %v", fieldType))
   635  	}
   636  }
   637  
   638  func genWrite() gopter.Gen {
   639  	return gopter.CombineGens(
   640  		genTimeUnit(),
   641  		gen.SliceOfN(maxNumFields, gen.Bool()),
   642  		gen.SliceOfN(maxNumFields, gen.Bool()),
   643  		gen.SliceOfN(maxNumFields, gen.Int32Range(0, int32(maxNumEnumValues)-1)),
   644  		gen.SliceOfN(maxNumFields, gen.Identifier()),
   645  		gen.SliceOfN(maxNumFields, gen.Float32()),
   646  		gen.SliceOfN(maxNumFields, gen.Float64()),
   647  		gen.SliceOfN(maxNumFields, gen.Int8()),
   648  		gen.SliceOfN(maxNumFields, gen.Int16()),
   649  		gen.SliceOfN(maxNumFields, gen.Int32()),
   650  		gen.SliceOfN(maxNumFields, gen.Int64()),
   651  		gen.SliceOfN(maxNumFields, gen.UInt8()),
   652  		gen.SliceOfN(maxNumFields, gen.UInt16()),
   653  		gen.SliceOfN(maxNumFields, gen.UInt32()),
   654  		gen.SliceOfN(maxNumFields, gen.UInt64()),
   655  	).Map(func(input []interface{}) generatedWrite {
   656  		return generatedWrite{
   657  			timeUnit:        input[0].(xtime.Unit),
   658  			useDefaultValue: input[1].([]bool),
   659  			bools:           input[2].([]bool),
   660  			enums:           input[3].([]int32),
   661  			strings:         input[4].([]string),
   662  			float32s:        input[5].([]float32),
   663  			float64s:        input[6].([]float64),
   664  			int8s:           input[7].([]int8),
   665  			int16s:          input[8].([]int16),
   666  			int32s:          input[9].([]int32),
   667  			int64s:          input[10].([]int64),
   668  			uint8s:          input[11].([]uint8),
   669  			uint16s:         input[12].([]uint16),
   670  			uint32s:         input[13].([]uint32),
   671  			uint64s:         input[14].([]uint64),
   672  		}
   673  	})
   674  }
   675  
   676  func genSchema(numFields int) gopter.Gen {
   677  	return gopter.CombineGens(
   678  		gen.SliceOfN(numFields, genFieldModifier()),
   679  		gen.SliceOfN(numFields, genMapKeyType()),
   680  		gen.SliceOfN(numFields, genFieldTypeWithNestedMessage()),
   681  		gen.SliceOfN(numFields, genFieldTypeWithNoNestedMessage()),
   682  	).
   683  		Map(func(input []interface{}) *desc.MessageDescriptor {
   684  			var (
   685  				fieldModifiers = input[0].([]fieldModifierProp)
   686  				mapKeyTypes    = input[1].([]dpb.FieldDescriptorProto_Type)
   687  				// fieldTypes are generated with the possibility of a field being a nested message
   688  				// where nestedFieldTypes are generated without the possibility of a field being
   689  				// a nested message to prevent infinite recursion. This limits the property testing
   690  				// of nested message types to a maximum depth of 1, but in practice it doesn't matter
   691  				// much because nested messages are handled by the ProtoBuf specification not our
   692  				// custom encoding.
   693  				fieldTypes       = input[2].([]dpb.FieldDescriptorProto_Type)
   694  				nestedFieldTypes = input[3].([]dpb.FieldDescriptorProto_Type)
   695  			)
   696  
   697  			schemaBuilder := schemaBuilderFromFieldTypes(fieldModifiers, mapKeyTypes, fieldTypes, nestedFieldTypes)
   698  			schema, err := schemaBuilder.Build()
   699  			if err != nil {
   700  				panic(err)
   701  			}
   702  
   703  			return schema
   704  		})
   705  }
   706  
   707  func schemaBuilderFromFieldTypes(
   708  	fieldModifiers []fieldModifierProp,
   709  	mapKeyTypes []dpb.FieldDescriptorProto_Type,
   710  	fieldTypes []dpb.FieldDescriptorProto_Type,
   711  	nestedMessageFieldTypes []dpb.FieldDescriptorProto_Type,
   712  ) *builder.MessageBuilder {
   713  	var schemaName string
   714  	if nestedMessageFieldTypes != nil {
   715  		schemaName = "schema"
   716  	} else {
   717  		schemaName = "nested_schema"
   718  	}
   719  	schemaBuilder := builder.NewMessage(schemaName)
   720  
   721  	for i, fieldType := range fieldTypes {
   722  		var (
   723  			fieldModifier = fieldModifiers[i]
   724  			fieldNum      = int32(i + 1) // Zero not valid.
   725  			fieldBuilder  *builder.FieldBuilder
   726  		)
   727  
   728  		switch {
   729  		case fieldModifier == fieldModifierReserved:
   730  			// Sprinkle in some reserved fields to make sure that we handle those
   731  			// without issue.
   732  			schemaBuilder.AddReservedRange(fieldNum, fieldNum)
   733  			continue
   734  		case fieldModifier == fieldModifierMap:
   735  			// Map key types can only be scalar types.
   736  			mapKeyType := builder.FieldTypeScalar(mapKeyTypes[i])
   737  			mapValueType := newBuilderFieldType(
   738  				// All map values should be "regular" I.E not repeated, reserved, or another map.
   739  				fieldNum, fieldType, make([]fieldModifierProp, len(nestedMessageFieldTypes)), mapKeyTypes, nestedMessageFieldTypes)
   740  			mapFieldName := fmt.Sprintf("_map_%d", fieldNum)
   741  			fieldBuilder = builder.NewMapField(mapFieldName, mapKeyType, mapValueType).SetNumber(fieldNum)
   742  		default:
   743  			builderFieldType := newBuilderFieldType(fieldNum, fieldType, fieldModifiers, mapKeyTypes, nestedMessageFieldTypes)
   744  			fieldBuilder = builder.NewField(fmt.Sprintf("_%d", fieldNum), builderFieldType).
   745  				SetNumber(fieldNum)
   746  		}
   747  
   748  		if fieldModifier == fieldModifierRepeated {
   749  			// This is safe because a field cant be repeated and a map by design.
   750  			fieldBuilder = fieldBuilder.SetRepeated()
   751  		}
   752  
   753  		schemaBuilder = schemaBuilder.AddField(fieldBuilder)
   754  	}
   755  
   756  	return schemaBuilder
   757  }
   758  
   759  func newBuilderFieldType(
   760  	fieldNum int32,
   761  	fieldType dpb.FieldDescriptorProto_Type,
   762  	fieldModifiers []fieldModifierProp,
   763  	mapKeyTypes []dpb.FieldDescriptorProto_Type,
   764  	nestedMessageFieldTypes []dpb.FieldDescriptorProto_Type,
   765  ) *builder.FieldType {
   766  	if fieldType == dpb.FieldDescriptorProto_TYPE_ENUM {
   767  		var (
   768  			enumFieldName = fmt.Sprintf("_enum_%d", fieldNum)
   769  			enumBuilder   = builder.NewEnum(enumFieldName)
   770  		)
   771  		for j := 0; j < maxNumEnumValues; j++ {
   772  			enumValueName := fmt.Sprintf("_enum_value_%d", j)
   773  			enumBuilder.AddValue(builder.NewEnumValue(enumValueName))
   774  		}
   775  		return builder.FieldTypeEnum(enumBuilder)
   776  	}
   777  
   778  	if fieldType == dpb.FieldDescriptorProto_TYPE_MESSAGE {
   779  		// NestedMessageFieldTypes can't contain nested messages so we're limited to a single level
   780  		// of recursion here.
   781  		nestedMessageBuilder := schemaBuilderFromFieldTypes(fieldModifiers, mapKeyTypes, nestedMessageFieldTypes, nil)
   782  		return builder.FieldTypeMessage(nestedMessageBuilder)
   783  	}
   784  
   785  	return builder.FieldTypeScalar(fieldType)
   786  }
   787  
   788  func genTimeUnit() gopter.Gen {
   789  	return gen.OneConstOf(
   790  		xtime.Second, xtime.Millisecond, xtime.Microsecond, xtime.Nanosecond)
   791  }
   792  
   793  func genFieldModifier() gopter.Gen {
   794  	return gen.OneConstOf(
   795  		fieldModifierRegular,
   796  		fieldModifierReserved,
   797  		fieldModifierRepeated,
   798  		fieldModifierMap)
   799  }
   800  
   801  func genMapKeyType() gopter.Gen {
   802  	return gen.OneConstOf(validMapKeyTypes...)
   803  }
   804  
   805  func genFieldTypeWithNoNestedMessage() gopter.Gen {
   806  	return gen.OneConstOf(allowedProtoTypesSliceIface...)
   807  }
   808  
   809  func genFieldTypeWithNestedMessage() gopter.Gen {
   810  	allowedProtoTypesSliceIfaceWithNestedMessage := allowedProtoTypesSliceIface[:] // Shallow copy.
   811  	allowedProtoTypesSliceIfaceWithNestedMessage = append(
   812  		allowedProtoTypesSliceIfaceWithNestedMessage,
   813  		dpb.FieldDescriptorProto_TYPE_MESSAGE)
   814  	return gen.OneConstOf(allowedProtoTypesSliceIfaceWithNestedMessage...)
   815  }
   816  
   817  func interfaceSlice(slice interface{}) []interface{} {
   818  	// https://stackoverflow.com/questions/12753805/type-converting-slices-of-interfaces-in-go
   819  	s := reflect.ValueOf(slice)
   820  	if s.Kind() != reflect.Slice {
   821  		panic("InterfaceSlice() given a non-slice type")
   822  	}
   823  
   824  	ret := make([]interface{}, s.Len())
   825  
   826  	for i := 0; i < s.Len(); i++ {
   827  		ret[i] = s.Index(i).Interface()
   828  	}
   829  
   830  	return ret
   831  }
   832  
   833  func printMessage(prefix string, m *dynamic.Message) {
   834  	json, err := m.MarshalJSON()
   835  	if err != nil {
   836  		panic(err)
   837  	}
   838  	fmt.Printf("%s: %s\n", prefix, string(json))
   839  }
   840  
   841  func compareSegments(a ts.Segment, b ts.Segment) error {
   842  	var (
   843  		aHead []byte
   844  		bHead []byte
   845  		aTail []byte
   846  		bTail []byte
   847  	)
   848  	if a.Head != nil {
   849  		aHead = a.Head.Bytes()
   850  	}
   851  	if b.Head != nil {
   852  		bHead = b.Head.Bytes()
   853  	}
   854  	if a.Tail != nil {
   855  		aTail = a.Tail.Bytes()
   856  	}
   857  	if b.Tail != nil {
   858  		bTail = b.Tail.Bytes()
   859  	}
   860  	if !bytes.Equal(aHead, bHead) {
   861  		return fmt.Errorf(
   862  			"heads do not match. Expected: %v but got: %v",
   863  			aHead, bHead)
   864  	}
   865  	if !bytes.Equal(aTail, bTail) {
   866  		return fmt.Errorf(
   867  			"tails do not match. Expected: %v but got: %v",
   868  			aTail, bTail)
   869  	}
   870  	return nil
   871  }