github.com/sean-/go@v0.0.0-20151219100004-97f854cd7bb6/src/compress/zlib/reader.go (about)

     1  // Copyright 2009 The Go Authors. All rights reserved.
     2  // Use of this source code is governed by a BSD-style
     3  // license that can be found in the LICENSE file.
     4  
     5  /*
     6  Package zlib implements reading and writing of zlib format compressed data,
     7  as specified in RFC 1950.
     8  
     9  The implementation provides filters that uncompress during reading
    10  and compress during writing.  For example, to write compressed data
    11  to a buffer:
    12  
    13  	var b bytes.Buffer
    14  	w := zlib.NewWriter(&b)
    15  	w.Write([]byte("hello, world\n"))
    16  	w.Close()
    17  
    18  and to read that data back:
    19  
    20  	r, err := zlib.NewReader(&b)
    21  	io.Copy(os.Stdout, r)
    22  	r.Close()
    23  */
    24  package zlib
    25  
    26  import (
    27  	"bufio"
    28  	"compress/flate"
    29  	"errors"
    30  	"hash"
    31  	"hash/adler32"
    32  	"io"
    33  )
    34  
// zlibDeflate is the value Reset requires in the low four bits of the first
// header byte; a stream carrying any other value there is rejected with
// ErrHeader.
const zlibDeflate = 8
    36  
var (
	// ErrChecksum is returned when reading ZLIB data that has an invalid checksum.
	// Read reports it when the four checksum bytes that follow the compressed
	// data do not match the digest accumulated over the decompressed output.
	ErrChecksum = errors.New("zlib: invalid checksum")
	// ErrDictionary is returned when reading ZLIB data that has an invalid dictionary.
	// Reset reports it when the stream header has its dictionary flag set and
	// the checksum stored in the stream differs from the Adler-32 checksum of
	// the dictionary supplied by the caller.
	ErrDictionary = errors.New("zlib: invalid dictionary")
	// ErrHeader is returned when reading ZLIB data that has an invalid header.
	// Reset reports it when the two-byte stream header fails validation.
	ErrHeader = errors.New("zlib: invalid header")
)
    45  
// reader is the ReadCloser implementation returned by NewReader and
// NewReaderDict. It also provides the Reset method of Resetter.
type reader struct {
	// r is the source of compressed bytes. Reset reads the stream header
	// from it and Read reads the trailing checksum from it directly.
	r flate.Reader
	// decompressor is the flate reader layered on top of r; it is created
	// on the first Reset and reused by later ones.
	decompressor io.ReadCloser
	// digest is the Adler-32 hash that Read updates with every
	// decompressed byte it hands out.
	digest hash.Hash32
	// err is a sticky error: once it is non-nil, Read returns it without
	// doing any further work.
	err error
	// scratch is a small buffer for the header and checksum bytes.
	scratch [4]byte
}
    53  
// Resetter resets a ReadCloser returned by NewReader or NewReaderDict
// to switch to a new underlying Reader. This permits reusing a ReadCloser
// instead of allocating a new one.
type Resetter interface {
	// Reset discards any buffered data and resets the Resetter as if it was
	// newly initialized with the given reader.
	// The dict argument has the same meaning as in NewReaderDict.
	Reset(r io.Reader, dict []byte) error
}
    62  
    63  // NewReader creates a new ReadCloser.
    64  // Reads from the returned ReadCloser read and decompress data from r.
    65  // The implementation buffers input and may read more data than necessary from r.
    66  // It is the caller's responsibility to call Close on the ReadCloser when done.
    67  //
    68  // The ReadCloser returned by NewReader also implements Resetter.
    69  func NewReader(r io.Reader) (io.ReadCloser, error) {
    70  	return NewReaderDict(r, nil)
    71  }
    72  
    73  // NewReaderDict is like NewReader but uses a preset dictionary.
    74  // NewReaderDict ignores the dictionary if the compressed data does not refer to it.
    75  // If the compressed data refers to a different dictionary, NewReaderDict returns ErrDictionary.
    76  //
    77  // The ReadCloser returned by NewReaderDict also implements Resetter.
    78  func NewReaderDict(r io.Reader, dict []byte) (io.ReadCloser, error) {
    79  	z := new(reader)
    80  	err := z.Reset(r, dict)
    81  	if err != nil {
    82  		return nil, err
    83  	}
    84  	return z, nil
    85  }
    86  
    87  func (z *reader) Read(p []byte) (n int, err error) {
    88  	if z.err != nil {
    89  		return 0, z.err
    90  	}
    91  	if len(p) == 0 {
    92  		return 0, nil
    93  	}
    94  
    95  	n, err = z.decompressor.Read(p)
    96  	z.digest.Write(p[0:n])
    97  	if n != 0 || err != io.EOF {
    98  		z.err = err
    99  		return
   100  	}
   101  
   102  	// Finished file; check checksum.
   103  	if _, err := io.ReadFull(z.r, z.scratch[0:4]); err != nil {
   104  		if err == io.EOF {
   105  			err = io.ErrUnexpectedEOF
   106  		}
   107  		z.err = err
   108  		return 0, err
   109  	}
   110  	// ZLIB (RFC 1950) is big-endian, unlike GZIP (RFC 1952).
   111  	checksum := uint32(z.scratch[0])<<24 | uint32(z.scratch[1])<<16 | uint32(z.scratch[2])<<8 | uint32(z.scratch[3])
   112  	if checksum != z.digest.Sum32() {
   113  		z.err = ErrChecksum
   114  		return 0, z.err
   115  	}
   116  	return
   117  }
   118  
   119  // Calling Close does not close the wrapped io.Reader originally passed to NewReader.
   120  func (z *reader) Close() error {
   121  	if z.err != nil {
   122  		return z.err
   123  	}
   124  	z.err = z.decompressor.Close()
   125  	return z.err
   126  }
   127  
   128  func (z *reader) Reset(r io.Reader, dict []byte) error {
   129  	if fr, ok := r.(flate.Reader); ok {
   130  		z.r = fr
   131  	} else {
   132  		z.r = bufio.NewReader(r)
   133  	}
   134  	_, err := io.ReadFull(z.r, z.scratch[0:2])
   135  	if err != nil {
   136  		if err == io.EOF {
   137  			err = io.ErrUnexpectedEOF
   138  		}
   139  		return err
   140  	}
   141  	h := uint(z.scratch[0])<<8 | uint(z.scratch[1])
   142  	if (z.scratch[0]&0x0f != zlibDeflate) || (h%31 != 0) {
   143  		return ErrHeader
   144  	}
   145  	haveDict := z.scratch[1]&0x20 != 0
   146  	if haveDict {
   147  		_, err = io.ReadFull(z.r, z.scratch[0:4])
   148  		if err != nil {
   149  			if err == io.EOF {
   150  				err = io.ErrUnexpectedEOF
   151  			}
   152  			return err
   153  		}
   154  		checksum := uint32(z.scratch[0])<<24 | uint32(z.scratch[1])<<16 | uint32(z.scratch[2])<<8 | uint32(z.scratch[3])
   155  		if checksum != adler32.Checksum(dict) {
   156  			return ErrDictionary
   157  		}
   158  	}
   159  	if z.decompressor == nil {
   160  		if haveDict {
   161  			z.decompressor = flate.NewReaderDict(z.r, dict)
   162  		} else {
   163  			z.decompressor = flate.NewReader(z.r)
   164  		}
   165  	} else {
   166  		z.decompressor.(flate.Resetter).Reset(z.r, dict)
   167  	}
   168  	z.digest = adler32.New()
   169  	return nil
   170  }