Home | History | Annotate | Download | only in gosym
      1 // Copyright 2009 The Go Authors.  All rights reserved.
      2 // Use of this source code is governed by a BSD-style
      3 // license that can be found in the LICENSE file.
      4 
      5 /*
      6  * Line tables
      7  */
      8 
      9 package gosym
     10 
     11 import (
     12 	"encoding/binary"
     13 	"sync"
     14 )
     15 
     16 // A LineTable is a data structure mapping program counters to line numbers.
     17 //
     18 // In Go 1.1 and earlier, each function (represented by a Func) had its own LineTable,
     19 // and the line number corresponded to a numbering of all source lines in the
     20 // program, across all files. That absolute line number would then have to be
     21 // converted separately to a file name and line number within the file.
     22 //
     23 // In Go 1.2, the format of the data changed so that there is a single LineTable
     24 // for the entire program, shared by all Funcs, and there are no absolute line
     25 // numbers, just line numbers within specific files.
     26 //
     27 // For the most part, LineTable's methods should be treated as an internal
     28 // detail of the package; callers should use the methods on Table instead.
     29 type LineTable struct {
     30 	Data []byte
     31 	PC   uint64
     32 	Line int
     33 
     34 	// Go 1.2 state
     35 	mu       sync.Mutex
     36 	go12     int // is this in Go 1.2 format? -1 no, 0 unknown, 1 yes
     37 	binary   binary.ByteOrder
     38 	quantum  uint32
     39 	ptrsize  uint32
     40 	functab  []byte
     41 	nfunctab uint32
     42 	filetab  []byte
     43 	nfiletab uint32
     44 	fileMap  map[string]uint32
     45 }
     46 
// oldQuantum is the PC quantum assumed when decoding the old (pre-Go 1.2)
// line table format: the unit by which parse advances the program counter.
//
// NOTE(rsc): This is wrong for GOARCH=arm, which uses a quantum of 4,
// but we have no idea whether we're using arm or not. This only
// matters in the old (pre-Go 1.2) symbol table format, so it's not worth
// fixing.
const oldQuantum = 1
     52 
     53 func (t *LineTable) parse(targetPC uint64, targetLine int) (b []byte, pc uint64, line int) {
     54 	// The PC/line table can be thought of as a sequence of
     55 	//  <pc update>* <line update>
     56 	// batches.  Each update batch results in a (pc, line) pair,
     57 	// where line applies to every PC from pc up to but not
     58 	// including the pc of the next pair.
     59 	//
     60 	// Here we process each update individually, which simplifies
     61 	// the code, but makes the corner cases more confusing.
     62 	b, pc, line = t.Data, t.PC, t.Line
     63 	for pc <= targetPC && line != targetLine && len(b) > 0 {
     64 		code := b[0]
     65 		b = b[1:]
     66 		switch {
     67 		case code == 0:
     68 			if len(b) < 4 {
     69 				b = b[0:0]
     70 				break
     71 			}
     72 			val := binary.BigEndian.Uint32(b)
     73 			b = b[4:]
     74 			line += int(val)
     75 		case code <= 64:
     76 			line += int(code)
     77 		case code <= 128:
     78 			line -= int(code - 64)
     79 		default:
     80 			pc += oldQuantum * uint64(code-128)
     81 			continue
     82 		}
     83 		pc += oldQuantum
     84 	}
     85 	return b, pc, line
     86 }
     87 
     88 func (t *LineTable) slice(pc uint64) *LineTable {
     89 	data, pc, line := t.parse(pc, -1)
     90 	return &LineTable{Data: data, PC: pc, Line: line}
     91 }
     92 
     93 // PCToLine returns the line number for the given program counter.
     94 // Callers should use Table's PCToLine method instead.
     95 func (t *LineTable) PCToLine(pc uint64) int {
     96 	if t.isGo12() {
     97 		return t.go12PCToLine(pc)
     98 	}
     99 	_, _, line := t.parse(pc, -1)
    100 	return line
    101 }
    102 
    103 // LineToPC returns the program counter for the given line number,
    104 // considering only program counters before maxpc.
    105 // Callers should use Table's LineToPC method instead.
    106 func (t *LineTable) LineToPC(line int, maxpc uint64) uint64 {
    107 	if t.isGo12() {
    108 		return 0
    109 	}
    110 	_, pc, line1 := t.parse(maxpc, line)
    111 	if line1 != line {
    112 		return 0
    113 	}
    114 	// Subtract quantum from PC to account for post-line increment
    115 	return pc - oldQuantum
    116 }
    117 
    118 // NewLineTable returns a new PC/line table
    119 // corresponding to the encoded data.
    120 // Text must be the start address of the
    121 // corresponding text segment.
    122 func NewLineTable(data []byte, text uint64) *LineTable {
    123 	return &LineTable{Data: data, PC: text, Line: 0}
    124 }
    125 
    126 // Go 1.2 symbol table format.
    127 // See golang.org/s/go12symtab.
    128 //
    129 // A general note about the methods here: rather than try to avoid
    130 // index out of bounds errors, we trust Go to detect them, and then
    131 // we recover from the panics and treat them as indicative of a malformed
    132 // or incomplete table.
    133 //
    134 // The methods called by symtab.go, which begin with "go12" prefixes,
    135 // are expected to have that recovery logic.
    136 
    137 // isGo12 reports whether this is a Go 1.2 (or later) symbol table.
    138 func (t *LineTable) isGo12() bool {
    139 	t.go12Init()
    140 	return t.go12 == 1
    141 }
    142 
// go12magic is the 4-byte magic number that go12Init expects at the start
// of a Go 1.2 table, read in either little- or big-endian byte order.
const go12magic = 0xfffffffb
    144 
    145 // uintptr returns the pointer-sized value encoded at b.
    146 // The pointer size is dictated by the table being read.
    147 func (t *LineTable) uintptr(b []byte) uint64 {
    148 	if t.ptrsize == 4 {
    149 		return uint64(t.binary.Uint32(b))
    150 	}
    151 	return t.binary.Uint64(b)
    152 }
    153 
    154 // go12init initializes the Go 1.2 metadata if t is a Go 1.2 symbol table.
    155 func (t *LineTable) go12Init() {
    156 	t.mu.Lock()
    157 	defer t.mu.Unlock()
    158 	if t.go12 != 0 {
    159 		return
    160 	}
    161 
    162 	defer func() {
    163 		// If we panic parsing, assume it's not a Go 1.2 symbol table.
    164 		recover()
    165 	}()
    166 
    167 	// Check header: 4-byte magic, two zeros, pc quantum, pointer size.
    168 	t.go12 = -1 // not Go 1.2 until proven otherwise
    169 	if len(t.Data) < 16 || t.Data[4] != 0 || t.Data[5] != 0 ||
    170 		(t.Data[6] != 1 && t.Data[6] != 4) || // pc quantum
    171 		(t.Data[7] != 4 && t.Data[7] != 8) { // pointer size
    172 		return
    173 	}
    174 
    175 	switch uint32(go12magic) {
    176 	case binary.LittleEndian.Uint32(t.Data):
    177 		t.binary = binary.LittleEndian
    178 	case binary.BigEndian.Uint32(t.Data):
    179 		t.binary = binary.BigEndian
    180 	default:
    181 		return
    182 	}
    183 
    184 	t.quantum = uint32(t.Data[6])
    185 	t.ptrsize = uint32(t.Data[7])
    186 
    187 	t.nfunctab = uint32(t.uintptr(t.Data[8:]))
    188 	t.functab = t.Data[8+t.ptrsize:]
    189 	functabsize := t.nfunctab*2*t.ptrsize + t.ptrsize
    190 	fileoff := t.binary.Uint32(t.functab[functabsize:])
    191 	t.functab = t.functab[:functabsize]
    192 	t.filetab = t.Data[fileoff:]
    193 	t.nfiletab = t.binary.Uint32(t.filetab)
    194 	t.filetab = t.filetab[:t.nfiletab*4]
    195 
    196 	t.go12 = 1 // so far so good
    197 }
    198 
    199 // go12Funcs returns a slice of Funcs derived from the Go 1.2 pcln table.
    200 func (t *LineTable) go12Funcs() []Func {
    201 	// Assume it is malformed and return nil on error.
    202 	defer func() {
    203 		recover()
    204 	}()
    205 
    206 	n := len(t.functab) / int(t.ptrsize) / 2
    207 	funcs := make([]Func, n)
    208 	for i := range funcs {
    209 		f := &funcs[i]
    210 		f.Entry = uint64(t.uintptr(t.functab[2*i*int(t.ptrsize):]))
    211 		f.End = uint64(t.uintptr(t.functab[(2*i+2)*int(t.ptrsize):]))
    212 		info := t.Data[t.uintptr(t.functab[(2*i+1)*int(t.ptrsize):]):]
    213 		f.LineTable = t
    214 		f.FrameSize = int(t.binary.Uint32(info[t.ptrsize+2*4:]))
    215 		f.Sym = &Sym{
    216 			Value:  f.Entry,
    217 			Type:   'T',
    218 			Name:   t.string(t.binary.Uint32(info[t.ptrsize:])),
    219 			GoType: 0,
    220 			Func:   f,
    221 		}
    222 	}
    223 	return funcs
    224 }
    225 
    226 // findFunc returns the func corresponding to the given program counter.
    227 func (t *LineTable) findFunc(pc uint64) []byte {
    228 	if pc < t.uintptr(t.functab) || pc >= t.uintptr(t.functab[len(t.functab)-int(t.ptrsize):]) {
    229 		return nil
    230 	}
    231 
    232 	// The function table is a list of 2*nfunctab+1 uintptrs,
    233 	// alternating program counters and offsets to func structures.
    234 	f := t.functab
    235 	nf := t.nfunctab
    236 	for nf > 0 {
    237 		m := nf / 2
    238 		fm := f[2*t.ptrsize*m:]
    239 		if t.uintptr(fm) <= pc && pc < t.uintptr(fm[2*t.ptrsize:]) {
    240 			return t.Data[t.uintptr(fm[t.ptrsize:]):]
    241 		} else if pc < t.uintptr(fm) {
    242 			nf = m
    243 		} else {
    244 			f = f[(m+1)*2*t.ptrsize:]
    245 			nf -= m + 1
    246 		}
    247 	}
    248 	return nil
    249 }
    250 
    251 // readvarint reads, removes, and returns a varint from *pp.
    252 func (t *LineTable) readvarint(pp *[]byte) uint32 {
    253 	var v, shift uint32
    254 	p := *pp
    255 	for shift = 0; ; shift += 7 {
    256 		b := p[0]
    257 		p = p[1:]
    258 		v |= (uint32(b) & 0x7F) << shift
    259 		if b&0x80 == 0 {
    260 			break
    261 		}
    262 	}
    263 	*pp = p
    264 	return v
    265 }
    266 
    267 // string returns a Go string found at off.
    268 func (t *LineTable) string(off uint32) string {
    269 	for i := off; ; i++ {
    270 		if t.Data[i] == 0 {
    271 			return string(t.Data[off:i])
    272 		}
    273 	}
    274 }
    275 
    276 // step advances to the next pc, value pair in the encoded table.
    277 func (t *LineTable) step(p *[]byte, pc *uint64, val *int32, first bool) bool {
    278 	uvdelta := t.readvarint(p)
    279 	if uvdelta == 0 && !first {
    280 		return false
    281 	}
    282 	if uvdelta&1 != 0 {
    283 		uvdelta = ^(uvdelta >> 1)
    284 	} else {
    285 		uvdelta >>= 1
    286 	}
    287 	vdelta := int32(uvdelta)
    288 	pcdelta := t.readvarint(p) * t.quantum
    289 	*pc += uint64(pcdelta)
    290 	*val += vdelta
    291 	return true
    292 }
    293 
    294 // pcvalue reports the value associated with the target pc.
    295 // off is the offset to the beginning of the pc-value table,
    296 // and entry is the start PC for the corresponding function.
    297 func (t *LineTable) pcvalue(off uint32, entry, targetpc uint64) int32 {
    298 	if off == 0 {
    299 		return -1
    300 	}
    301 	p := t.Data[off:]
    302 
    303 	val := int32(-1)
    304 	pc := entry
    305 	for t.step(&p, &pc, &val, pc == entry) {
    306 		if targetpc < pc {
    307 			return val
    308 		}
    309 	}
    310 	return -1
    311 }
    312 
// findFileLine scans one function in the binary looking for a
// program counter in the given file on the given line.
// It does so by running the pc-value tables mapping program counter
// to file number. Since most functions come from a single file, these
// are usually short and quick to scan. If a file match is found, then the
// code goes to the expense of looking for a simultaneous line number match.
//
// entry is the function's start PC; filetab and linetab are offsets into
// t.Data of the function's pc-to-file and pc-to-line tables. The result is
// the first PC at which both filenum and line are in effect, or 0 if either
// offset is zero or no such PC is found.
func (t *LineTable) findFileLine(entry uint64, filetab, linetab uint32, filenum, line int32) uint64 {
	if filetab == 0 || linetab == 0 {
		return 0
	}

	// Two independent decoders, one per table, both starting at entry
	// with the initial value -1.
	fp := t.Data[filetab:]
	fl := t.Data[linetab:]
	fileVal := int32(-1)
	filePC := entry
	lineVal := int32(-1)
	linePC := entry
	fileStartPC := filePC
	for t.step(&fp, &filePC, &fileVal, filePC == entry) {
		if fileVal == filenum && fileStartPC < filePC {
			// fileVal is in effect starting at fileStartPC up to
			// but not including filePC, and it's the file we want.
			// Run the PC table looking for a matching line number
			// or until we reach filePC.
			lineStartPC := linePC
			for linePC < filePC && t.step(&fl, &linePC, &lineVal, linePC == entry) {
				// lineVal is in effect until linePC, and lineStartPC < filePC.
				if lineVal == line {
					// The line range starts inside the file range:
					// its own start is the answer.
					if fileStartPC <= lineStartPC {
						return lineStartPC
					}
					// The line range began before the file range but
					// overlaps it: the overlap starts at fileStartPC.
					if fileStartPC < linePC {
						return fileStartPC
					}
				}
				lineStartPC = linePC
			}
		}
		// The next file range begins where this one ended. The line decoder
		// is not rewound; it keeps its position across file ranges.
		fileStartPC = filePC
	}
	return 0
}
    355 
    356 // go12PCToLine maps program counter to line number for the Go 1.2 pcln table.
    357 func (t *LineTable) go12PCToLine(pc uint64) (line int) {
    358 	defer func() {
    359 		if recover() != nil {
    360 			line = -1
    361 		}
    362 	}()
    363 
    364 	f := t.findFunc(pc)
    365 	if f == nil {
    366 		return -1
    367 	}
    368 	entry := t.uintptr(f)
    369 	linetab := t.binary.Uint32(f[t.ptrsize+5*4:])
    370 	return int(t.pcvalue(linetab, entry, pc))
    371 }
    372 
    373 // go12PCToFile maps program counter to file name for the Go 1.2 pcln table.
    374 func (t *LineTable) go12PCToFile(pc uint64) (file string) {
    375 	defer func() {
    376 		if recover() != nil {
    377 			file = ""
    378 		}
    379 	}()
    380 
    381 	f := t.findFunc(pc)
    382 	if f == nil {
    383 		return ""
    384 	}
    385 	entry := t.uintptr(f)
    386 	filetab := t.binary.Uint32(f[t.ptrsize+4*4:])
    387 	fno := t.pcvalue(filetab, entry, pc)
    388 	if fno <= 0 {
    389 		return ""
    390 	}
    391 	return t.string(t.binary.Uint32(t.filetab[4*fno:]))
    392 }
    393 
    394 // go12LineToPC maps a (file, line) pair to a program counter for the Go 1.2 pcln table.
    395 func (t *LineTable) go12LineToPC(file string, line int) (pc uint64) {
    396 	defer func() {
    397 		if recover() != nil {
    398 			pc = 0
    399 		}
    400 	}()
    401 
    402 	t.initFileMap()
    403 	filenum := t.fileMap[file]
    404 	if filenum == 0 {
    405 		return 0
    406 	}
    407 
    408 	// Scan all functions.
    409 	// If this turns out to be a bottleneck, we could build a map[int32][]int32
    410 	// mapping file number to a list of functions with code from that file.
    411 	for i := uint32(0); i < t.nfunctab; i++ {
    412 		f := t.Data[t.uintptr(t.functab[2*t.ptrsize*i+t.ptrsize:]):]
    413 		entry := t.uintptr(f)
    414 		filetab := t.binary.Uint32(f[t.ptrsize+4*4:])
    415 		linetab := t.binary.Uint32(f[t.ptrsize+5*4:])
    416 		pc := t.findFileLine(entry, filetab, linetab, int32(filenum), int32(line))
    417 		if pc != 0 {
    418 			return pc
    419 		}
    420 	}
    421 	return 0
    422 }
    423 
    424 // initFileMap initializes the map from file name to file number.
    425 func (t *LineTable) initFileMap() {
    426 	t.mu.Lock()
    427 	defer t.mu.Unlock()
    428 
    429 	if t.fileMap != nil {
    430 		return
    431 	}
    432 	m := make(map[string]uint32)
    433 
    434 	for i := uint32(1); i < t.nfiletab; i++ {
    435 		s := t.string(t.binary.Uint32(t.filetab[4*i:]))
    436 		m[s] = i
    437 	}
    438 	t.fileMap = m
    439 }
    440 
    441 // go12MapFiles adds to m a key for every file in the Go 1.2 LineTable.
    442 // Every key maps to obj. That's not a very interesting map, but it provides
    443 // a way for callers to obtain the list of files in the program.
    444 func (t *LineTable) go12MapFiles(m map[string]*Obj, obj *Obj) {
    445 	defer func() {
    446 		recover()
    447 	}()
    448 
    449 	t.initFileMap()
    450 	for file := range t.fileMap {
    451 		m[file] = obj
    452 	}
    453 }
    454