github.com/cockroachdb/tools@v0.0.0-20230222021103-a6d27438930d/present/args.go (about) 1 // Copyright 2012 The Go Authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style 3 // license that can be found in the LICENSE file. 4 5 package present 6 7 import ( 8 "errors" 9 "regexp" 10 "strconv" 11 "unicode/utf8" 12 ) 13 14 // This file is stolen from go/src/cmd/godoc/codewalk.go. 15 // It's an evaluator for the file address syntax implemented by acme and sam, 16 // but using Go-native regular expressions. 17 // To keep things reasonably close, this version uses (?m:re) for all user-provided 18 // regular expressions. That is the only change to the code from codewalk.go. 19 // See http://9p.io/sys/doc/sam/sam.html Table II for details on the syntax. 20 21 // addrToByteRange evaluates the given address starting at offset start in data. 22 // It returns the lo and hi byte offset of the matched region within data. 23 func addrToByteRange(addr string, start int, data []byte) (lo, hi int, err error) { 24 if addr == "" { 25 lo, hi = start, len(data) 26 return 27 } 28 var ( 29 dir byte 30 prevc byte 31 charOffset bool 32 ) 33 lo = start 34 hi = start 35 for addr != "" && err == nil { 36 c := addr[0] 37 switch c { 38 default: 39 err = errors.New("invalid address syntax near " + string(c)) 40 case ',': 41 if len(addr) == 1 { 42 hi = len(data) 43 } else { 44 _, hi, err = addrToByteRange(addr[1:], hi, data) 45 } 46 return 47 48 case '+', '-': 49 if prevc == '+' || prevc == '-' { 50 lo, hi, err = addrNumber(data, lo, hi, prevc, 1, charOffset) 51 } 52 dir = c 53 54 case '$': 55 lo = len(data) 56 hi = len(data) 57 if len(addr) > 1 { 58 dir = '+' 59 } 60 61 case '#': 62 charOffset = true 63 64 case '0', '1', '2', '3', '4', '5', '6', '7', '8', '9': 65 var i int 66 for i = 1; i < len(addr); i++ { 67 if addr[i] < '0' || addr[i] > '9' { 68 break 69 } 70 } 71 var n int 72 n, err = strconv.Atoi(addr[0:i]) 73 if err != nil { 74 break 75 } 76 lo, hi, err = addrNumber(data, lo, hi, dir, n, charOffset) 77 dir = 0 78 charOffset = false 79 prevc = c 80 addr = addr[i:] 81 continue 82 83 case '/': 84 var i, j int 85 Regexp: 86 for i = 1; i < len(addr); i++ { 87 switch addr[i] { 88 case '\\': 89 i++ 90 case '/': 91 j = i + 1 92 break Regexp 93 } 94 } 95 if j == 0 { 96 j = i 97 } 98 pattern := addr[1:i] 99 lo, hi, err = addrRegexp(data, lo, hi, dir, pattern) 100 prevc = c 101 addr = addr[j:] 102 continue 103 } 104 prevc = c 105 addr = addr[1:] 106 } 107 108 if err == nil && dir != 0 { 109 lo, hi, err = addrNumber(data, lo, hi, dir, 1, charOffset) 110 } 111 if err != nil { 112 return 0, 0, err 113 } 114 return lo, hi, nil 115 } 116 117 // addrNumber applies the given dir, n, and charOffset to the address lo, hi. 118 // dir is '+' or '-', n is the count, and charOffset is true if the syntax 119 // used was #n. Applying +n (or +#n) means to advance n lines 120 // (or characters) after hi. Applying -n (or -#n) means to back up n lines 121 // (or characters) before lo. 122 // The return value is the new lo, hi. 123 func addrNumber(data []byte, lo, hi int, dir byte, n int, charOffset bool) (int, int, error) { 124 switch dir { 125 case 0: 126 lo = 0 127 hi = 0 128 fallthrough 129 130 case '+': 131 if charOffset { 132 pos := hi 133 for ; n > 0 && pos < len(data); n-- { 134 _, size := utf8.DecodeRune(data[pos:]) 135 pos += size 136 } 137 if n == 0 { 138 return pos, pos, nil 139 } 140 break 141 } 142 // find next beginning of line 143 if hi > 0 { 144 for hi < len(data) && data[hi-1] != '\n' { 145 hi++ 146 } 147 } 148 lo = hi 149 if n == 0 { 150 return lo, hi, nil 151 } 152 for ; hi < len(data); hi++ { 153 if data[hi] != '\n' { 154 continue 155 } 156 switch n--; n { 157 case 1: 158 lo = hi + 1 159 case 0: 160 return lo, hi + 1, nil 161 } 162 } 163 164 case '-': 165 if charOffset { 166 // Scan backward for bytes that are not UTF-8 continuation bytes. 167 pos := lo 168 for ; pos > 0 && n > 0; pos-- { 169 if data[pos]&0xc0 != 0x80 { 170 n-- 171 } 172 } 173 if n == 0 { 174 return pos, pos, nil 175 } 176 break 177 } 178 // find earlier beginning of line 179 for lo > 0 && data[lo-1] != '\n' { 180 lo-- 181 } 182 hi = lo 183 if n == 0 { 184 return lo, hi, nil 185 } 186 for ; lo >= 0; lo-- { 187 if lo > 0 && data[lo-1] != '\n' { 188 continue 189 } 190 switch n--; n { 191 case 1: 192 hi = lo 193 case 0: 194 return lo, hi, nil 195 } 196 } 197 } 198 199 return 0, 0, errors.New("address out of range") 200 } 201 202 // addrRegexp searches for pattern in the given direction starting at lo, hi. 203 // The direction dir is '+' (search forward from hi) or '-' (search backward from lo). 204 // Backward searches are unimplemented. 205 func addrRegexp(data []byte, lo, hi int, dir byte, pattern string) (int, int, error) { 206 // We want ^ and $ to work as in sam/acme, so use ?m. 207 re, err := regexp.Compile("(?m:" + pattern + ")") 208 if err != nil { 209 return 0, 0, err 210 } 211 if dir == '-' { 212 // Could implement reverse search using binary search 213 // through file, but that seems like overkill. 214 return 0, 0, errors.New("reverse search not implemented") 215 } 216 m := re.FindIndex(data[hi:]) 217 if len(m) > 0 { 218 m[0] += hi 219 m[1] += hi 220 } else if hi > 0 { 221 // No match. Wrap to beginning of data. 222 m = re.FindIndex(data) 223 } 224 if len(m) == 0 { 225 return 0, 0, errors.New("no match for " + pattern) 226 } 227 return m[0], m[1], nil 228 }