github.com/4ad/go@v0.0.0-20161219182952-69a12818b605/src/archive/tar/format.go (about) 1 // Copyright 2016 The Go Authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style 3 // license that can be found in the LICENSE file. 4 5 package tar 6 7 // Constants to identify various tar formats. 8 const ( 9 // The format is unknown. 10 formatUnknown = (1 << iota) / 2 // Sequence of 0, 1, 2, 4, 8, etc... 11 12 // The format of the original Unix V7 tar tool prior to standardization. 13 formatV7 14 15 // The old and new GNU formats, which are incompatible with USTAR. 16 // This does cover the old GNU sparse extension. 17 // This does not cover the GNU sparse extensions using PAX headers, 18 // versions 0.0, 0.1, and 1.0; these fall under the PAX format. 19 formatGNU 20 21 // Schily's tar format, which is incompatible with USTAR. 22 // This does not cover STAR extensions to the PAX format; these fall under 23 // the PAX format. 24 formatSTAR 25 26 // USTAR is the former standardization of tar defined in POSIX.1-1988. 27 // This is incompatible with the GNU and STAR formats. 28 formatUSTAR 29 30 // PAX is the latest standardization of tar defined in POSIX.1-2001. 31 // This is an extension of USTAR and is "backwards compatible" with it. 32 // 33 // Some newer formats add their own extensions to PAX, such as GNU sparse 34 // files and SCHILY extended attributes. Since they are backwards compatible 35 // with PAX, they will be labelled as "PAX". 36 formatPAX 37 ) 38 39 // Magics used to identify various formats. 40 const ( 41 magicGNU, versionGNU = "ustar ", " \x00" 42 magicUSTAR, versionUSTAR = "ustar\x00", "00" 43 trailerSTAR = "tar\x00" 44 ) 45 46 // Size constants from various tar specifications. 47 const ( 48 blockSize = 512 // Size of each block in a tar stream 49 nameSize = 100 // Max length of the name field in USTAR format 50 prefixSize = 155 // Max length of the prefix field in USTAR format 51 ) 52 53 var zeroBlock block 54 55 type block [blockSize]byte 56 57 // Convert block to any number of formats. 58 func (b *block) V7() *headerV7 { return (*headerV7)(b) } 59 func (b *block) GNU() *headerGNU { return (*headerGNU)(b) } 60 func (b *block) STAR() *headerSTAR { return (*headerSTAR)(b) } 61 func (b *block) USTAR() *headerUSTAR { return (*headerUSTAR)(b) } 62 func (b *block) Sparse() sparseArray { return (sparseArray)(b[:]) } 63 64 // GetFormat checks that the block is a valid tar header based on the checksum. 65 // It then attempts to guess the specific format based on magic values. 66 // If the checksum fails, then formatUnknown is returned. 67 func (b *block) GetFormat() (format int) { 68 // Verify checksum. 69 var p parser 70 value := p.parseOctal(b.V7().Chksum()) 71 chksum1, chksum2 := b.ComputeChecksum() 72 if p.err != nil || (value != chksum1 && value != chksum2) { 73 return formatUnknown 74 } 75 76 // Guess the magic values. 77 magic := string(b.USTAR().Magic()) 78 version := string(b.USTAR().Version()) 79 trailer := string(b.STAR().Trailer()) 80 switch { 81 case magic == magicUSTAR && trailer == trailerSTAR: 82 return formatSTAR 83 case magic == magicUSTAR: 84 return formatUSTAR 85 case magic == magicGNU && version == versionGNU: 86 return formatGNU 87 default: 88 return formatV7 89 } 90 } 91 92 // SetFormat writes the magic values necessary for specified format 93 // and then updates the checksum accordingly. 94 func (b *block) SetFormat(format int) { 95 // Set the magic values. 96 switch format { 97 case formatV7: 98 // Do nothing. 99 case formatGNU: 100 copy(b.GNU().Magic(), magicGNU) 101 copy(b.GNU().Version(), versionGNU) 102 case formatSTAR: 103 copy(b.STAR().Magic(), magicUSTAR) 104 copy(b.STAR().Version(), versionUSTAR) 105 copy(b.STAR().Trailer(), trailerSTAR) 106 case formatUSTAR, formatPAX: 107 copy(b.USTAR().Magic(), magicUSTAR) 108 copy(b.USTAR().Version(), versionUSTAR) 109 default: 110 panic("invalid format") 111 } 112 113 // Update checksum. 114 // This field is special in that it is terminated by a NULL then space. 115 var f formatter 116 field := b.V7().Chksum() 117 chksum, _ := b.ComputeChecksum() // Possible values are 256..128776 118 f.formatOctal(field[:7], chksum) // Never fails since 128776 < 262143 119 field[7] = ' ' 120 } 121 122 // ComputeChecksum computes the checksum for the header block. 123 // POSIX specifies a sum of the unsigned byte values, but the Sun tar used 124 // signed byte values. 125 // We compute and return both. 126 func (b *block) ComputeChecksum() (unsigned, signed int64) { 127 for i, c := range b { 128 if 148 <= i && i < 156 { 129 c = ' ' // Treat the checksum field itself as all spaces. 130 } 131 unsigned += int64(uint8(c)) 132 signed += int64(int8(c)) 133 } 134 return unsigned, signed 135 } 136 137 type headerV7 [blockSize]byte 138 139 func (h *headerV7) Name() []byte { return h[000:][:100] } 140 func (h *headerV7) Mode() []byte { return h[100:][:8] } 141 func (h *headerV7) UID() []byte { return h[108:][:8] } 142 func (h *headerV7) GID() []byte { return h[116:][:8] } 143 func (h *headerV7) Size() []byte { return h[124:][:12] } 144 func (h *headerV7) ModTime() []byte { return h[136:][:12] } 145 func (h *headerV7) Chksum() []byte { return h[148:][:8] } 146 func (h *headerV7) TypeFlag() []byte { return h[156:][:1] } 147 func (h *headerV7) LinkName() []byte { return h[157:][:100] } 148 149 type headerGNU [blockSize]byte 150 151 func (h *headerGNU) V7() *headerV7 { return (*headerV7)(h) } 152 func (h *headerGNU) Magic() []byte { return h[257:][:6] } 153 func (h *headerGNU) Version() []byte { return h[263:][:2] } 154 func (h *headerGNU) UserName() []byte { return h[265:][:32] } 155 func (h *headerGNU) GroupName() []byte { return h[297:][:32] } 156 func (h *headerGNU) DevMajor() []byte { return h[329:][:8] } 157 func (h *headerGNU) DevMinor() []byte { return h[337:][:8] } 158 func (h *headerGNU) AccessTime() []byte { return h[345:][:12] } 159 func (h *headerGNU) ChangeTime() []byte { return h[357:][:12] } 160 func (h *headerGNU) Sparse() sparseArray { return (sparseArray)(h[386:][:24*4+1]) } 161 func (h *headerGNU) RealSize() []byte { return h[483:][:12] } 162 163 type headerSTAR [blockSize]byte 164 165 func (h *headerSTAR) V7() *headerV7 { return (*headerV7)(h) } 166 func (h *headerSTAR) Magic() []byte { return h[257:][:6] } 167 func (h *headerSTAR) Version() []byte { return h[263:][:2] } 168 func (h *headerSTAR) UserName() []byte { return h[265:][:32] } 169 func (h *headerSTAR) GroupName() []byte { return h[297:][:32] } 170 func (h *headerSTAR) DevMajor() []byte { return h[329:][:8] } 171 func (h *headerSTAR) DevMinor() []byte { return h[337:][:8] } 172 func (h *headerSTAR) Prefix() []byte { return h[345:][:131] } 173 func (h *headerSTAR) AccessTime() []byte { return h[476:][:12] } 174 func (h *headerSTAR) ChangeTime() []byte { return h[488:][:12] } 175 func (h *headerSTAR) Trailer() []byte { return h[508:][:4] } 176 177 type headerUSTAR [blockSize]byte 178 179 func (h *headerUSTAR) V7() *headerV7 { return (*headerV7)(h) } 180 func (h *headerUSTAR) Magic() []byte { return h[257:][:6] } 181 func (h *headerUSTAR) Version() []byte { return h[263:][:2] } 182 func (h *headerUSTAR) UserName() []byte { return h[265:][:32] } 183 func (h *headerUSTAR) GroupName() []byte { return h[297:][:32] } 184 func (h *headerUSTAR) DevMajor() []byte { return h[329:][:8] } 185 func (h *headerUSTAR) DevMinor() []byte { return h[337:][:8] } 186 func (h *headerUSTAR) Prefix() []byte { return h[345:][:155] } 187 188 type sparseArray []byte 189 190 func (s sparseArray) Entry(i int) sparseNode { return (sparseNode)(s[i*24:]) } 191 func (s sparseArray) IsExtended() []byte { return s[24*s.MaxEntries():][:1] } 192 func (s sparseArray) MaxEntries() int { return len(s) / 24 } 193 194 type sparseNode []byte 195 196 func (s sparseNode) Offset() []byte { return s[00:][:12] } 197 func (s sparseNode) NumBytes() []byte { return s[12:][:12] }