github.com/m3db/m3@v1.5.1-0.20231129193456-75a402aa583b/src/cmd/tools/read_commitlog/main/main.go (about)

     1  // Copyright (c) 2021 Uber Technologies, Inc.
     2  //
     3  // Permission is hereby granted, free of charge, to any person obtaining a copy
     4  // of this software and associated documentation files (the "Software"), to deal
     5  // in the Software without restriction, including without limitation the rights
     6  // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
     7  // copies of the Software, and to permit persons to whom the Software is
     8  // furnished to do so, subject to the following conditions:
     9  //
    10  // The above copyright notice and this permission notice shall be included in
    11  // all copies or substantial portions of the Software.
    12  //
    13  // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
    14  // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
    15  // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
    16  // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
    17  // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
    18  // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
    19  // THE SOFTWARE.
    20  
    21  package main
    22  
    23  import (
    24  	"encoding/base64"
    25  	"fmt"
    26  	"log"
    27  	"os"
    28  	"sort"
    29  	"time"
    30  
    31  	"github.com/m3db/m3/src/x/ident"
    32  	xtime "github.com/m3db/m3/src/x/time"
    33  
    34  	"github.com/pborman/getopt"
    35  	"go.uber.org/zap"
    36  )
    37  
    38  func main() {
    39  	var (
    40  		path         = getopt.StringLong("path", 'p', "", "file path [e.g. /var/lib/m3db/commitlogs/commitlog-0-161023.db]")
    41  		idFilter     = getopt.StringLong("id-filter", 'f', "", "ID Contains Filter (optional)")
    42  		idSizeFilter = getopt.IntLong("id-size-filter", 's', 0, "ID Size (bytes) Filter (optional)")
    43  		mode         = getopt.StringLong("mode", 'm', "", "Action [print,summary]. Defaults to 'print'")
    44  		top          = getopt.IntLong("top", 't', 0, "Print out only top N IDs")
    45  	)
    46  	getopt.Parse()
    47  
    48  	rawLogger, err := zap.NewDevelopment()
    49  	if err != nil {
    50  		log.Fatalf("unable to create logger: %+v", err)
    51  	}
    52  	logger := rawLogger.Sugar()
    53  
    54  	if *path == "" {
    55  		getopt.Usage()
    56  		os.Exit(1)
    57  	}
    58  
    59  	reader, err := newFilteringReader(*path, idFilter, idSizeFilter)
    60  	if err != nil {
    61  		logger.Fatalf("unable to open reader: %v", err)
    62  	}
    63  	defer reader.Close()
    64  
    65  	switch *mode {
    66  	case "summary":
    67  		err = printSummary(reader, top)
    68  	default:
    69  		err = printMetrics(reader)
    70  	}
    71  	if err != nil {
    72  		logger.Fatalf("error while reading commitlog: %v", err)
    73  	}
    74  }
    75  
    76  func printMetrics(reader *filteringReader) error {
    77  	var (
    78  		entryCount          uint32
    79  		annotationSizeTotal uint64
    80  		start               = time.Now()
    81  	)
    82  
    83  	for {
    84  		entry, found, err := reader.Read()
    85  		if err != nil {
    86  			return err
    87  		}
    88  		if !found {
    89  			break
    90  		}
    91  
    92  		series := entry.Series
    93  		fmt.Printf("{id: %s, dp: %+v, ns: %s, shard: %d", // nolint: forbidigo
    94  			series.ID, entry.Datapoint, entry.Series.Namespace, entry.Series.Shard)
    95  		if len(entry.Annotation) > 0 {
    96  			fmt.Printf(", annotation: %s", // nolint: forbidigo
    97  				base64.StdEncoding.EncodeToString(entry.Annotation))
    98  			annotationSizeTotal += uint64(len(entry.Annotation))
    99  		}
   100  		fmt.Println("}") // nolint: forbidigo
   101  
   102  		entryCount++
   103  	}
   104  
   105  	runTime := time.Since(start)
   106  
   107  	fmt.Printf("\nRunning time: %s\n", runTime)                          // nolint: forbidigo
   108  	fmt.Printf("%d entries read\n", entryCount)                          // nolint: forbidigo
   109  	fmt.Printf("Total annotation size: %d bytes\n", annotationSizeTotal) // nolint: forbidigo
   110  	return nil
   111  }
   112  
   113  func printSummary(reader *filteringReader, top *int) error {
   114  	var (
   115  		entryCount        uint32
   116  		start             = time.Now()
   117  		datapointCount    = map[ident.ID]uint32{}
   118  		totalIDSize       uint64
   119  		earliestDatapoint xtime.UnixNano
   120  		oldestDatapoint   xtime.UnixNano
   121  	)
   122  
   123  	for {
   124  		entry, found, err := reader.Read()
   125  		if err != nil {
   126  			return err
   127  		}
   128  		if !found {
   129  			break
   130  		}
   131  		dp := entry.Datapoint
   132  
   133  		if earliestDatapoint == 0 || earliestDatapoint > dp.TimestampNanos {
   134  			earliestDatapoint = dp.TimestampNanos
   135  		}
   136  		if oldestDatapoint == 0 || oldestDatapoint < dp.TimestampNanos {
   137  			oldestDatapoint = dp.TimestampNanos
   138  		}
   139  
   140  		datapointCount[entry.Series.ID]++
   141  
   142  		entryCount++
   143  	}
   144  
   145  	runTime := time.Since(start)
   146  
   147  	fmt.Printf("\nRunning time: %s\n", runTime)                                              // nolint: forbidigo
   148  	fmt.Printf("%d entries read\n", entryCount)                                              // nolint: forbidigo
   149  	fmt.Printf("time range [%s:%s]\n", earliestDatapoint.String(), oldestDatapoint.String()) // nolint: forbidigo
   150  
   151  	datapointCountArr := idPairs{}
   152  	sizeArr := idPairs{}
   153  	for ID, count := range datapointCount {
   154  		IDSize := len(ID.Bytes())
   155  		totalIDSize += uint64(IDSize)
   156  		datapointCountArr = append(datapointCountArr, idPair{ID: ID, Value: count})
   157  		sizeArr = append(sizeArr, idPair{ID: ID, Value: uint32(IDSize)})
   158  	}
   159  
   160  	sort.Sort(sort.Reverse(datapointCountArr))
   161  	sort.Sort(sort.Reverse(sizeArr))
   162  
   163  	fmt.Printf("total ID size: %d bytes\n", totalIDSize)                  // nolint: forbidigo
   164  	fmt.Printf("total distinct number of IDs %d \n", len(datapointCount)) // nolint: forbidigo
   165  
   166  	limit := len(datapointCountArr)
   167  	if *top > 0 && *top < limit {
   168  		limit = *top
   169  	}
   170  	fmt.Printf("ID datapoint counts: \n") // nolint: forbidigo
   171  	for i := 0; i < limit; i++ {
   172  		pair := datapointCountArr[i]
   173  		fmt.Printf("%-10d %s\n", pair.Value, pair.ID.String()) // nolint: forbidigo
   174  	}
   175  
   176  	fmt.Printf("ID sizes(bytes): \n") // nolint: forbidigo
   177  	for i := 0; i < limit; i++ {
   178  		pair := sizeArr[i]
   179  		fmt.Printf("%-10d %s\n", pair.Value, pair.ID.String()) // nolint: forbidigo
   180  	}
   181  
   182  	return nil
   183  }
   184  
   185  type idPair struct {
   186  	ID    ident.ID
   187  	Value uint32
   188  }
   189  
   190  type idPairs []idPair
   191  
   192  func (p idPairs) Len() int           { return len(p) }
   193  func (p idPairs) Swap(i, j int)      { p[i], p[j] = p[j], p[i] }
   194  func (p idPairs) Less(i, j int) bool { return p[i].Value < p[j].Value }