Home | History | Annotate | Download | only in tar
      1 // Copyright 2016 The Go Authors. All rights reserved.
      2 // Use of this source code is governed by a BSD-style
      3 // license that can be found in the LICENSE file.
      4 
      5 package tar
      6 
      7 // Constants to identify various tar formats.
      8 const (
      9 	// The format is unknown.
     10 	formatUnknown = (1 << iota) / 2 // Sequence of 0, 1, 2, 4, 8, etc...
     11 
     12 	// The format of the original Unix V7 tar tool prior to standardization.
     13 	formatV7
     14 
     15 	// The old and new GNU formats, which are incompatible with USTAR.
     16 	// This does cover the old GNU sparse extension.
     17 	// This does not cover the GNU sparse extensions using PAX headers,
     18 	// versions 0.0, 0.1, and 1.0; these fall under the PAX format.
     19 	formatGNU
     20 
     21 	// Schily's tar format, which is incompatible with USTAR.
     22 	// This does not cover STAR extensions to the PAX format; these fall under
     23 	// the PAX format.
     24 	formatSTAR
     25 
     26 	// USTAR is the former standardization of tar defined in POSIX.1-1988.
     27 	// This is incompatible with the GNU and STAR formats.
     28 	formatUSTAR
     29 
     30 	// PAX is the latest standardization of tar defined in POSIX.1-2001.
     31 	// This is an extension of USTAR and is "backwards compatible" with it.
     32 	//
     33 	// Some newer formats add their own extensions to PAX, such as GNU sparse
     34 	// files and SCHILY extended attributes. Since they are backwards compatible
     35 	// with PAX, they will be labelled as "PAX".
     36 	formatPAX
     37 )
     38 
     39 // Magics used to identify various formats.
     40 const (
     41 	magicGNU, versionGNU     = "ustar ", " \x00"
     42 	magicUSTAR, versionUSTAR = "ustar\x00", "00"
     43 	trailerSTAR              = "tar\x00"
     44 )
     45 
     46 // Size constants from various tar specifications.
     47 const (
     48 	blockSize  = 512 // Size of each block in a tar stream
     49 	nameSize   = 100 // Max length of the name field in USTAR format
     50 	prefixSize = 155 // Max length of the prefix field in USTAR format
     51 )
     52 
     53 var zeroBlock block
     54 
     55 type block [blockSize]byte
     56 
     57 // Convert block to any number of formats.
     58 func (b *block) V7() *headerV7       { return (*headerV7)(b) }
     59 func (b *block) GNU() *headerGNU     { return (*headerGNU)(b) }
     60 func (b *block) STAR() *headerSTAR   { return (*headerSTAR)(b) }
     61 func (b *block) USTAR() *headerUSTAR { return (*headerUSTAR)(b) }
     62 func (b *block) Sparse() sparseArray { return (sparseArray)(b[:]) }
     63 
     64 // GetFormat checks that the block is a valid tar header based on the checksum.
     65 // It then attempts to guess the specific format based on magic values.
     66 // If the checksum fails, then formatUnknown is returned.
     67 func (b *block) GetFormat() (format int) {
     68 	// Verify checksum.
     69 	var p parser
     70 	value := p.parseOctal(b.V7().Chksum())
     71 	chksum1, chksum2 := b.ComputeChecksum()
     72 	if p.err != nil || (value != chksum1 && value != chksum2) {
     73 		return formatUnknown
     74 	}
     75 
     76 	// Guess the magic values.
     77 	magic := string(b.USTAR().Magic())
     78 	version := string(b.USTAR().Version())
     79 	trailer := string(b.STAR().Trailer())
     80 	switch {
     81 	case magic == magicUSTAR && trailer == trailerSTAR:
     82 		return formatSTAR
     83 	case magic == magicUSTAR:
     84 		return formatUSTAR
     85 	case magic == magicGNU && version == versionGNU:
     86 		return formatGNU
     87 	default:
     88 		return formatV7
     89 	}
     90 }
     91 
     92 // SetFormat writes the magic values necessary for specified format
     93 // and then updates the checksum accordingly.
     94 func (b *block) SetFormat(format int) {
     95 	// Set the magic values.
     96 	switch format {
     97 	case formatV7:
     98 		// Do nothing.
     99 	case formatGNU:
    100 		copy(b.GNU().Magic(), magicGNU)
    101 		copy(b.GNU().Version(), versionGNU)
    102 	case formatSTAR:
    103 		copy(b.STAR().Magic(), magicUSTAR)
    104 		copy(b.STAR().Version(), versionUSTAR)
    105 		copy(b.STAR().Trailer(), trailerSTAR)
    106 	case formatUSTAR, formatPAX:
    107 		copy(b.USTAR().Magic(), magicUSTAR)
    108 		copy(b.USTAR().Version(), versionUSTAR)
    109 	default:
    110 		panic("invalid format")
    111 	}
    112 
    113 	// Update checksum.
    114 	// This field is special in that it is terminated by a NULL then space.
    115 	var f formatter
    116 	field := b.V7().Chksum()
    117 	chksum, _ := b.ComputeChecksum() // Possible values are 256..128776
    118 	f.formatOctal(field[:7], chksum) // Never fails since 128776 < 262143
    119 	field[7] = ' '
    120 }
    121 
    122 // ComputeChecksum computes the checksum for the header block.
    123 // POSIX specifies a sum of the unsigned byte values, but the Sun tar used
    124 // signed byte values.
    125 // We compute and return both.
    126 func (b *block) ComputeChecksum() (unsigned, signed int64) {
    127 	for i, c := range b {
    128 		if 148 <= i && i < 156 {
    129 			c = ' ' // Treat the checksum field itself as all spaces.
    130 		}
    131 		unsigned += int64(uint8(c))
    132 		signed += int64(int8(c))
    133 	}
    134 	return unsigned, signed
    135 }
    136 
    137 type headerV7 [blockSize]byte
    138 
    139 func (h *headerV7) Name() []byte     { return h[000:][:100] }
    140 func (h *headerV7) Mode() []byte     { return h[100:][:8] }
    141 func (h *headerV7) UID() []byte      { return h[108:][:8] }
    142 func (h *headerV7) GID() []byte      { return h[116:][:8] }
    143 func (h *headerV7) Size() []byte     { return h[124:][:12] }
    144 func (h *headerV7) ModTime() []byte  { return h[136:][:12] }
    145 func (h *headerV7) Chksum() []byte   { return h[148:][:8] }
    146 func (h *headerV7) TypeFlag() []byte { return h[156:][:1] }
    147 func (h *headerV7) LinkName() []byte { return h[157:][:100] }
    148 
    149 type headerGNU [blockSize]byte
    150 
    151 func (h *headerGNU) V7() *headerV7       { return (*headerV7)(h) }
    152 func (h *headerGNU) Magic() []byte       { return h[257:][:6] }
    153 func (h *headerGNU) Version() []byte     { return h[263:][:2] }
    154 func (h *headerGNU) UserName() []byte    { return h[265:][:32] }
    155 func (h *headerGNU) GroupName() []byte   { return h[297:][:32] }
    156 func (h *headerGNU) DevMajor() []byte    { return h[329:][:8] }
    157 func (h *headerGNU) DevMinor() []byte    { return h[337:][:8] }
    158 func (h *headerGNU) AccessTime() []byte  { return h[345:][:12] }
    159 func (h *headerGNU) ChangeTime() []byte  { return h[357:][:12] }
    160 func (h *headerGNU) Sparse() sparseArray { return (sparseArray)(h[386:][:24*4+1]) }
    161 func (h *headerGNU) RealSize() []byte    { return h[483:][:12] }
    162 
    163 type headerSTAR [blockSize]byte
    164 
    165 func (h *headerSTAR) V7() *headerV7      { return (*headerV7)(h) }
    166 func (h *headerSTAR) Magic() []byte      { return h[257:][:6] }
    167 func (h *headerSTAR) Version() []byte    { return h[263:][:2] }
    168 func (h *headerSTAR) UserName() []byte   { return h[265:][:32] }
    169 func (h *headerSTAR) GroupName() []byte  { return h[297:][:32] }
    170 func (h *headerSTAR) DevMajor() []byte   { return h[329:][:8] }
    171 func (h *headerSTAR) DevMinor() []byte   { return h[337:][:8] }
    172 func (h *headerSTAR) Prefix() []byte     { return h[345:][:131] }
    173 func (h *headerSTAR) AccessTime() []byte { return h[476:][:12] }
    174 func (h *headerSTAR) ChangeTime() []byte { return h[488:][:12] }
    175 func (h *headerSTAR) Trailer() []byte    { return h[508:][:4] }
    176 
    177 type headerUSTAR [blockSize]byte
    178 
    179 func (h *headerUSTAR) V7() *headerV7     { return (*headerV7)(h) }
    180 func (h *headerUSTAR) Magic() []byte     { return h[257:][:6] }
    181 func (h *headerUSTAR) Version() []byte   { return h[263:][:2] }
    182 func (h *headerUSTAR) UserName() []byte  { return h[265:][:32] }
    183 func (h *headerUSTAR) GroupName() []byte { return h[297:][:32] }
    184 func (h *headerUSTAR) DevMajor() []byte  { return h[329:][:8] }
    185 func (h *headerUSTAR) DevMinor() []byte  { return h[337:][:8] }
    186 func (h *headerUSTAR) Prefix() []byte    { return h[345:][:155] }
    187 
    188 type sparseArray []byte
    189 
    190 func (s sparseArray) Entry(i int) sparseNode { return (sparseNode)(s[i*24:]) }
    191 func (s sparseArray) IsExtended() []byte     { return s[24*s.MaxEntries():][:1] }
    192 func (s sparseArray) MaxEntries() int        { return len(s) / 24 }
    193 
    194 type sparseNode []byte
    195 
    196 func (s sparseNode) Offset() []byte   { return s[00:][:12] }
    197 func (s sparseNode) NumBytes() []byte { return s[12:][:12] }
    198