github.com/m3db/m3@v1.5.0/src/dbnode/digest/reader.go (about) 1 // Copyright (c) 2016 Uber Technologies, Inc. 2 // 3 // Permission is hereby granted, free of charge, to any person obtaining a copy 4 // of this software and associated documentation files (the "Software"), to deal 5 // in the Software without restriction, including without limitation the rights 6 // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 7 // copies of the Software, and to permit persons to whom the Software is 8 // furnished to do so, subject to the following conditions: 9 // 10 // The above copyright notice and this permission notice shall be included in 11 // all copies or substantial portions of the Software. 12 // 13 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 14 // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 15 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 16 // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 17 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 18 // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 19 // THE SOFTWARE. 20 21 package digest 22 23 import ( 24 "bufio" 25 "errors" 26 "hash" 27 "hash/adler32" 28 "io" 29 "os" 30 ) 31 32 var ( 33 // errReadFewerThanExpectedBytes returned when number of bytes read is fewer than expected 34 errReadFewerThanExpectedBytes = errors.New("number of bytes read is fewer than expected") 35 36 // errChecksumMismatch returned when the calculated checksum doesn't match the stored checksum 37 errChecksumMismatch = errors.New("calculated checksum doesn't match stored checksum") 38 39 // errBufferSizeMismatch returned when ReadAllAndValidate called without well sized buffer 40 errBufferSizeMismatch = errors.New("buffer passed is not an exact fit for contents") 41 ) 42 43 // FdWithDigestReader provides a buffered reader for reading from the underlying file. 44 type FdWithDigestReader interface { 45 FdWithDigest 46 io.Reader 47 48 // ReadAllAndValidate reads everything in the underlying file and validates 49 // it against the expected digest, returning an error if they don't match. 50 // Note: the buffer "b" must be an exact match for how long the contents being 51 // read is, the signature is structured this way to allow for buffer reuse. 52 ReadAllAndValidate(b []byte, expectedDigest uint32) (int, error) 53 54 // Validate compares the current digest against the expected digest and returns 55 // an error if they don't match. 56 Validate(expectedDigest uint32) error 57 } 58 59 type fdWithDigestReader struct { 60 fd *os.File 61 bufReader *bufio.Reader 62 readerWithDigest ReaderWithDigest 63 single [1]byte 64 } 65 66 // NewFdWithDigestReader creates a new FdWithDigestReader. 67 func NewFdWithDigestReader(bufferSize int) FdWithDigestReader { 68 bufReader := bufio.NewReaderSize(nil, bufferSize) 69 return &fdWithDigestReader{ 70 bufReader: bufReader, 71 readerWithDigest: NewReaderWithDigest(bufReader), 72 } 73 } 74 75 // Reset resets the underlying file descriptor and the buffered reader. 76 func (r *fdWithDigestReader) Reset(fd *os.File) { 77 r.fd = fd 78 r.bufReader.Reset(fd) 79 r.readerWithDigest.Reset(r.bufReader) 80 } 81 82 func (r *fdWithDigestReader) Read(b []byte) (int, error) { 83 return r.readerWithDigest.Read(b) 84 } 85 86 func (r *fdWithDigestReader) Fd() *os.File { 87 return r.fd 88 } 89 90 func (r *fdWithDigestReader) Digest() hash.Hash32 { 91 return r.readerWithDigest.Digest() 92 } 93 94 func (r *fdWithDigestReader) ReadAllAndValidate(b []byte, expectedDigest uint32) (int, error) { 95 n, err := r.Read(b) 96 if err != nil { 97 return n, err 98 } 99 // NB(r): Attempt next read to prove that the size of the buffer b 100 // was sized correctly to fit all contents into it and that we are 101 // correctly now at the end of input. 102 _, err = r.Read(r.single[:]) 103 if err != io.EOF { 104 return 0, errBufferSizeMismatch 105 } 106 if err := r.Validate(expectedDigest); err != nil { 107 return n, err 108 } 109 return n, nil 110 } 111 112 func (r *fdWithDigestReader) Validate(expectedDigest uint32) error { 113 return r.readerWithDigest.Validate(expectedDigest) 114 } 115 116 func (r *fdWithDigestReader) Close() error { 117 if r.fd == nil { 118 return nil 119 } 120 err := r.fd.Close() 121 r.fd = nil 122 return err 123 } 124 125 // FdWithDigestContentsReader provides additional functionality of reading a digest from the underlying file. 126 type FdWithDigestContentsReader interface { 127 FdWithDigestReader 128 129 // ReadDigest reads a digest from the underlying file. 130 ReadDigest() (uint32, error) 131 } 132 133 type fdWithDigestContentsReader struct { 134 FdWithDigestReader 135 136 digestBuf Buffer 137 } 138 139 // NewFdWithDigestContentsReader creates a new FdWithDigestContentsReader. 140 func NewFdWithDigestContentsReader(bufferSize int) FdWithDigestContentsReader { 141 return &fdWithDigestContentsReader{ 142 FdWithDigestReader: NewFdWithDigestReader(bufferSize), 143 digestBuf: NewBuffer(), 144 } 145 } 146 147 func (r *fdWithDigestContentsReader) ReadDigest() (uint32, error) { 148 n, err := r.Read(r.digestBuf) 149 if err != nil { 150 return 0, err 151 } 152 if n < len(r.digestBuf) { 153 return 0, errReadFewerThanExpectedBytes 154 } 155 return r.digestBuf.ReadDigest(), nil 156 } 157 158 // ReaderWithDigest is a reader that that calculates a digest 159 // as it is read. 160 type ReaderWithDigest interface { 161 io.Reader 162 163 // Reset resets the reader for use with a new reader. 164 Reset(reader io.Reader) 165 166 // Digest returns the digest. 167 Digest() hash.Hash32 168 169 // Validate compares the current digest against the expected digest and returns 170 // an error if they don't match. 171 Validate(expectedDigest uint32) error 172 } 173 174 type readerWithDigest struct { 175 reader io.Reader 176 digest hash.Hash32 177 } 178 179 // NewReaderWithDigest creates a new reader that calculates a digest as it 180 // reads an input. 181 func NewReaderWithDigest(reader io.Reader) ReaderWithDigest { 182 return &readerWithDigest{ 183 reader: reader, 184 digest: adler32.New(), 185 } 186 } 187 188 func (r *readerWithDigest) Reset(reader io.Reader) { 189 r.reader = reader 190 r.digest.Reset() 191 } 192 193 func (r *readerWithDigest) Digest() hash.Hash32 { 194 return r.digest 195 } 196 197 func (r *readerWithDigest) readBytes(b []byte) (int, error) { 198 n, err := r.reader.Read(b) 199 if err != nil { 200 return 0, err 201 } 202 // In case the buffered reader only returns what's remaining in 203 // the buffer, recursively read what's left in the underlying reader. 204 if n < len(b) { 205 b = b[n:] 206 remainder, err := r.readBytes(b) 207 return n + remainder, err 208 } 209 return n, err 210 } 211 212 func (r *readerWithDigest) Read(b []byte) (int, error) { 213 n, err := r.readBytes(b) 214 if err != nil && err != io.EOF { 215 return n, err 216 } 217 // If we encountered an EOF error and didn't read any bytes 218 // given a non-empty slice, we return an EOF error. 219 if err == io.EOF && n == 0 && len(b) > 0 { 220 return 0, err 221 } 222 if _, err := r.digest.Write(b[:n]); err != nil { 223 return 0, err 224 } 225 return n, nil 226 } 227 228 func (r *readerWithDigest) Validate(expectedDigest uint32) error { 229 if r.digest.Sum32() != expectedDigest { 230 return errChecksumMismatch 231 } 232 return nil 233 }