1  // SPDX-License-Identifier: GPL-2.0-only
2  /*
3   * genelf_debug.c
4   * Copyright (C) 2015, Google, Inc
5   *
6   * Contributed by:
7   * 	Stephane Eranian <eranian@google.com>
8   *
9   * based on GPLv2 source code from Oprofile
10   * @remark Copyright 2007 OProfile authors
11   * @author Philippe Elie
12   */
13  #include <linux/compiler.h>
14  #include <sys/types.h>
15  #include <stdio.h>
16  #include <getopt.h>
17  #include <stddef.h>
18  #include <libelf.h>
19  #include <string.h>
20  #include <stdlib.h>
21  #include <inttypes.h>
22  #include <limits.h>
23  #include <fcntl.h>
24  #include <err.h>
25  #include <dwarf.h>
26  
27  #include "genelf.h"
28  #include "../util/jitdump.h"
29  
30  #define BUFFER_EXT_DFL_SIZE	(4 * 1024)
31  
32  typedef uint32_t uword;
33  typedef uint16_t uhalf;
34  typedef int32_t  sword;
35  typedef int16_t  shalf;
36  typedef uint8_t  ubyte;
37  typedef int8_t   sbyte;
38  
39  struct buffer_ext {
40  	size_t cur_pos;
41  	size_t max_sz;
42  	void *data;
43  };
44  
45  static void
buffer_ext_dump(struct buffer_ext * be,const char * msg)46  buffer_ext_dump(struct buffer_ext *be, const char *msg)
47  {
48  	size_t i;
49  	warnx("DUMP for %s", msg);
50  	for (i = 0 ; i < be->cur_pos; i++)
51  		warnx("%4zu 0x%02x", i, (((char *)be->data)[i]) & 0xff);
52  }
53  
54  static inline int
buffer_ext_add(struct buffer_ext * be,void * addr,size_t sz)55  buffer_ext_add(struct buffer_ext *be, void *addr, size_t sz)
56  {
57  	void *tmp;
58  	size_t be_sz = be->max_sz;
59  
60  retry:
61  	if ((be->cur_pos + sz) < be_sz) {
62  		memcpy(be->data + be->cur_pos, addr, sz);
63  		be->cur_pos += sz;
64  		return 0;
65  	}
66  
67  	if (!be_sz)
68  		be_sz = BUFFER_EXT_DFL_SIZE;
69  	else
70  		be_sz <<= 1;
71  
72  	tmp = realloc(be->data, be_sz);
73  	if (!tmp)
74  		return -1;
75  
76  	be->data   = tmp;
77  	be->max_sz = be_sz;
78  
79  	goto retry;
80  }
81  
82  static void
buffer_ext_init(struct buffer_ext * be)83  buffer_ext_init(struct buffer_ext *be)
84  {
85  	be->data = NULL;
86  	be->cur_pos = 0;
87  	be->max_sz = 0;
88  }
89  
90  static inline size_t
buffer_ext_size(struct buffer_ext * be)91  buffer_ext_size(struct buffer_ext *be)
92  {
93  	return be->cur_pos;
94  }
95  
96  static inline void *
buffer_ext_addr(struct buffer_ext * be)97  buffer_ext_addr(struct buffer_ext *be)
98  {
99  	return be->data;
100  }
101  
102  struct debug_line_header {
103  	// Not counting this field
104  	uword total_length;
105  	// version number (2 currently)
106  	uhalf version;
107  	// relative offset from next field to
108  	// program statement
109  	uword prolog_length;
110  	ubyte minimum_instruction_length;
111  	ubyte default_is_stmt;
112  	// line_base - see DWARF 2 specs
113  	sbyte line_base;
114  	// line_range - see DWARF 2 specs
115  	ubyte line_range;
116  	// number of opcode + 1
117  	ubyte opcode_base;
118  	/* follow the array of opcode args nr: ubytes [nr_opcode_base] */
119  	/* follow the search directories index, zero terminated string
120  	 * terminated by an empty string.
121  	 */
122  	/* follow an array of { filename, LEB128, LEB128, LEB128 }, first is
123  	 * the directory index entry, 0 means current directory, then mtime
124  	 * and filesize, last entry is followed by en empty string.
125  	 */
126  	/* follow the first program statement */
127  } __packed;
128  
129  /* DWARF 2 spec talk only about one possible compilation unit header while
130   * binutils can handle two flavours of dwarf 2, 32 and 64 bits, this is not
131   * related to the used arch, an ELF 32 can hold more than 4 Go of debug
132   * information. For now we handle only DWARF 2 32 bits comp unit. It'll only
133   * become a problem if we generate more than 4GB of debug information.
134   */
135  struct compilation_unit_header {
136  	uword total_length;
137  	uhalf version;
138  	uword debug_abbrev_offset;
139  	ubyte pointer_size;
140  } __packed;
141  
142  #define DW_LNS_num_opcode (DW_LNS_set_isa + 1)
143  
144  /* field filled at run time are marked with -1 */
145  static struct debug_line_header const default_debug_line_header = {
146  	.total_length = -1,
147  	.version = 2,
148  	.prolog_length = -1,
149  	.minimum_instruction_length = 1,	/* could be better when min instruction size != 1 */
150  	.default_is_stmt = 1,	/* we don't take care about basic block */
151  	.line_base = -5,	/* sensible value for line base ... */
152  	.line_range = -14,     /* ... and line range are guessed statically */
153  	.opcode_base = DW_LNS_num_opcode
154  };
155  
156  static ubyte standard_opcode_length[] =
157  {
158  	0, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1
159  };
160  #if 0
161  {
162  	[DW_LNS_advance_pc]   = 1,
163  	[DW_LNS_advance_line] = 1,
164  	[DW_LNS_set_file] =  1,
165  	[DW_LNS_set_column] = 1,
166  	[DW_LNS_fixed_advance_pc] = 1,
167  	[DW_LNS_set_isa] = 1,
168  };
169  #endif
170  
171  /* field filled at run time are marked with -1 */
172  static struct compilation_unit_header default_comp_unit_header = {
173  	.total_length = -1,
174  	.version = 2,
175  	.debug_abbrev_offset = 0,     /* we reuse the same abbrev entries for all comp unit */
176  	.pointer_size = sizeof(void *)
177  };
178  
emit_uword(struct buffer_ext * be,uword data)179  static void emit_uword(struct buffer_ext *be, uword data)
180  {
181  	buffer_ext_add(be, &data, sizeof(uword));
182  }
183  
emit_string(struct buffer_ext * be,const char * s)184  static void emit_string(struct buffer_ext *be, const char *s)
185  {
186  	buffer_ext_add(be, (void *)s, strlen(s) + 1);
187  }
188  
emit_unsigned_LEB128(struct buffer_ext * be,unsigned long data)189  static void emit_unsigned_LEB128(struct buffer_ext *be,
190  				 unsigned long data)
191  {
192  	do {
193  		ubyte cur = data & 0x7F;
194  		data >>= 7;
195  		if (data)
196  			cur |= 0x80;
197  		buffer_ext_add(be, &cur, 1);
198  	} while (data);
199  }
200  
emit_signed_LEB128(struct buffer_ext * be,long data)201  static void emit_signed_LEB128(struct buffer_ext *be, long data)
202  {
203  	int more = 1;
204  	int negative = data < 0;
205  	int size = sizeof(long) * CHAR_BIT;
206  	while (more) {
207  		ubyte cur = data & 0x7F;
208  		data >>= 7;
209  		if (negative)
210  			data |= - (1 << (size - 7));
211  		if ((data == 0 && !(cur & 0x40)) ||
212  		    (data == -1l && (cur & 0x40)))
213  			more = 0;
214  		else
215  			cur |= 0x80;
216  		buffer_ext_add(be, &cur, 1);
217  	}
218  }
219  
emit_extended_opcode(struct buffer_ext * be,ubyte opcode,void * data,size_t data_len)220  static void emit_extended_opcode(struct buffer_ext *be, ubyte opcode,
221  				 void *data, size_t data_len)
222  {
223  	buffer_ext_add(be, (char *)"", 1);
224  
225  	emit_unsigned_LEB128(be, data_len + 1);
226  
227  	buffer_ext_add(be, &opcode, 1);
228  	buffer_ext_add(be, data, data_len);
229  }
230  
emit_opcode(struct buffer_ext * be,ubyte opcode)231  static void emit_opcode(struct buffer_ext *be, ubyte opcode)
232  {
233  	buffer_ext_add(be, &opcode, 1);
234  }
235  
emit_opcode_signed(struct buffer_ext * be,ubyte opcode,long data)236  static void emit_opcode_signed(struct buffer_ext  *be,
237  			       ubyte opcode, long data)
238  {
239  	buffer_ext_add(be, &opcode, 1);
240  	emit_signed_LEB128(be, data);
241  }
242  
emit_opcode_unsigned(struct buffer_ext * be,ubyte opcode,unsigned long data)243  static void emit_opcode_unsigned(struct buffer_ext *be, ubyte opcode,
244  				 unsigned long data)
245  {
246  	buffer_ext_add(be, &opcode, 1);
247  	emit_unsigned_LEB128(be, data);
248  }
249  
emit_advance_pc(struct buffer_ext * be,unsigned long delta_pc)250  static void emit_advance_pc(struct buffer_ext *be, unsigned long delta_pc)
251  {
252  	emit_opcode_unsigned(be, DW_LNS_advance_pc, delta_pc);
253  }
254  
emit_advance_lineno(struct buffer_ext * be,long delta_lineno)255  static void emit_advance_lineno(struct buffer_ext  *be, long delta_lineno)
256  {
257  	emit_opcode_signed(be, DW_LNS_advance_line, delta_lineno);
258  }
259  
emit_lne_end_of_sequence(struct buffer_ext * be)260  static void emit_lne_end_of_sequence(struct buffer_ext *be)
261  {
262  	emit_extended_opcode(be, DW_LNE_end_sequence, NULL, 0);
263  }
264  
emit_set_file(struct buffer_ext * be,unsigned long idx)265  static void emit_set_file(struct buffer_ext *be, unsigned long idx)
266  {
267  	emit_opcode_unsigned(be, DW_LNS_set_file, idx);
268  }
269  
emit_lne_define_filename(struct buffer_ext * be,const char * filename)270  static void emit_lne_define_filename(struct buffer_ext *be,
271  				     const char *filename)
272  {
273  	buffer_ext_add(be, (void *)"", 1);
274  
275  	/* LNE field, strlen(filename) + zero termination, 3 bytes for: the dir entry, timestamp, filesize */
276  	emit_unsigned_LEB128(be, strlen(filename) + 5);
277  	emit_opcode(be, DW_LNE_define_file);
278  	emit_string(be, filename);
279  	/* directory index 0=do not know */
280          emit_unsigned_LEB128(be, 0);
281  	/* last modification date on file 0=do not know */
282          emit_unsigned_LEB128(be, 0);
283  	/* filesize 0=do not know */
284          emit_unsigned_LEB128(be, 0);
285  }
286  
emit_lne_set_address(struct buffer_ext * be,void * address)287  static void emit_lne_set_address(struct buffer_ext *be,
288  				 void *address)
289  {
290  	emit_extended_opcode(be, DW_LNE_set_address, &address, sizeof(unsigned long));
291  }
292  
get_special_opcode(struct debug_entry * ent,unsigned int last_line,unsigned long last_vma)293  static ubyte get_special_opcode(struct debug_entry *ent,
294  				unsigned int last_line,
295  				unsigned long last_vma)
296  {
297  	unsigned int temp;
298  	unsigned long delta_addr;
299  
300  	/*
301  	 * delta from line_base
302  	 */
303  	temp = (ent->lineno - last_line) - default_debug_line_header.line_base;
304  
305  	if (temp >= default_debug_line_header.line_range)
306  		return 0;
307  
308  	/*
309  	 * delta of addresses
310  	 */
311  	delta_addr = (ent->addr - last_vma) / default_debug_line_header.minimum_instruction_length;
312  
313  	/* This is not sufficient to ensure opcode will be in [0-256] but
314  	 * sufficient to ensure when summing with the delta lineno we will
315  	 * not overflow the unsigned long opcode */
316  
317  	if (delta_addr <= 256 / default_debug_line_header.line_range) {
318  		unsigned long opcode = temp +
319  			(delta_addr * default_debug_line_header.line_range) +
320  			default_debug_line_header.opcode_base;
321  
322  		return opcode <= 255 ? opcode : 0;
323  	}
324  	return 0;
325  }
326  
emit_lineno_info(struct buffer_ext * be,struct debug_entry * ent,size_t nr_entry,unsigned long code_addr)327  static void emit_lineno_info(struct buffer_ext *be,
328  			     struct debug_entry *ent, size_t nr_entry,
329  			     unsigned long code_addr)
330  {
331  	size_t i;
332  
333  	/*
334  	 * Machine state at start of a statement program
335  	 * address = 0
336  	 * file    = 1
337  	 * line    = 1
338  	 * column  = 0
339  	 * is_stmt = default_is_stmt as given in the debug_line_header
340  	 * basic block = 0
341  	 * end sequence = 0
342  	 */
343  
344  	/* start state of the state machine we take care of */
345  	unsigned long last_vma = 0;
346  	char const  *cur_filename = NULL;
347  	unsigned long cur_file_idx = 0;
348  	int last_line = 1;
349  
350  	emit_lne_set_address(be, (void *)code_addr);
351  
352  	for (i = 0; i < nr_entry; i++, ent = debug_entry_next(ent)) {
353  		int need_copy = 0;
354  		ubyte special_opcode;
355  
356  		/*
357  		 * check if filename changed, if so add it
358  		 */
359  		if (!cur_filename || strcmp(cur_filename, ent->name)) {
360  			emit_lne_define_filename(be, ent->name);
361  			cur_filename = ent->name;
362  			emit_set_file(be, ++cur_file_idx);
363  			need_copy = 1;
364  		}
365  
366  		special_opcode = get_special_opcode(ent, last_line, last_vma);
367  		if (special_opcode != 0) {
368  			last_line = ent->lineno;
369  			last_vma  = ent->addr;
370  			emit_opcode(be, special_opcode);
371  		} else {
372  			/*
373  			 * lines differ, emit line delta
374  			 */
375  			if (last_line != ent->lineno) {
376  				emit_advance_lineno(be, ent->lineno - last_line);
377  				last_line = ent->lineno;
378  				need_copy = 1;
379  			}
380  			/*
381  			 * addresses differ, emit address delta
382  			 */
383  			if (last_vma != ent->addr) {
384  				emit_advance_pc(be, ent->addr - last_vma);
385  				last_vma = ent->addr;
386  				need_copy = 1;
387  			}
388  			/*
389  			 * add new row to matrix
390  			 */
391  			if (need_copy)
392  				emit_opcode(be, DW_LNS_copy);
393  		}
394  	}
395  }
396  
add_debug_line(struct buffer_ext * be,struct debug_entry * ent,size_t nr_entry,unsigned long code_addr)397  static void add_debug_line(struct buffer_ext *be,
398  	struct debug_entry *ent, size_t nr_entry,
399  	unsigned long code_addr)
400  {
401  	struct debug_line_header * dbg_header;
402  	size_t old_size;
403  
404  	old_size = buffer_ext_size(be);
405  
406  	buffer_ext_add(be, (void *)&default_debug_line_header,
407  		 sizeof(default_debug_line_header));
408  
409  	buffer_ext_add(be, &standard_opcode_length,  sizeof(standard_opcode_length));
410  
411  	// empty directory entry
412  	buffer_ext_add(be, (void *)"", 1);
413  
414  	// empty filename directory
415  	buffer_ext_add(be, (void *)"", 1);
416  
417  	dbg_header = buffer_ext_addr(be) + old_size;
418  	dbg_header->prolog_length = (buffer_ext_size(be) - old_size) -
419  		offsetof(struct debug_line_header, minimum_instruction_length);
420  
421  	emit_lineno_info(be, ent, nr_entry, code_addr);
422  
423  	emit_lne_end_of_sequence(be);
424  
425  	dbg_header = buffer_ext_addr(be) + old_size;
426  	dbg_header->total_length = (buffer_ext_size(be) - old_size) -
427  		offsetof(struct debug_line_header, version);
428  }
429  
430  static void
add_debug_abbrev(struct buffer_ext * be)431  add_debug_abbrev(struct buffer_ext *be)
432  {
433          emit_unsigned_LEB128(be, 1);
434          emit_unsigned_LEB128(be, DW_TAG_compile_unit);
435          emit_unsigned_LEB128(be, DW_CHILDREN_yes);
436          emit_unsigned_LEB128(be, DW_AT_stmt_list);
437          emit_unsigned_LEB128(be, DW_FORM_data4);
438          emit_unsigned_LEB128(be, 0);
439          emit_unsigned_LEB128(be, 0);
440          emit_unsigned_LEB128(be, 0);
441  }
442  
443  static void
add_compilation_unit(struct buffer_ext * be,size_t offset_debug_line)444  add_compilation_unit(struct buffer_ext *be,
445  		     size_t offset_debug_line)
446  {
447  	struct compilation_unit_header *comp_unit_header;
448  	size_t old_size = buffer_ext_size(be);
449  
450  	buffer_ext_add(be, &default_comp_unit_header,
451  		       sizeof(default_comp_unit_header));
452  
453  	emit_unsigned_LEB128(be, 1);
454  	emit_uword(be, offset_debug_line);
455  
456  	comp_unit_header = buffer_ext_addr(be) + old_size;
457  	comp_unit_header->total_length = (buffer_ext_size(be) - old_size) -
458  		offsetof(struct compilation_unit_header, version);
459  }
460  
461  static int
jit_process_debug_info(uint64_t code_addr,void * debug,int nr_debug_entries,struct buffer_ext * dl,struct buffer_ext * da,struct buffer_ext * di)462  jit_process_debug_info(uint64_t code_addr,
463  		       void *debug, int nr_debug_entries,
464  		       struct buffer_ext *dl,
465  		       struct buffer_ext *da,
466  		       struct buffer_ext *di)
467  {
468  	struct debug_entry *ent = debug;
469  	int i;
470  
471  	for (i = 0; i < nr_debug_entries; i++) {
472  		ent->addr = ent->addr - code_addr;
473  		ent = debug_entry_next(ent);
474  	}
475  	add_compilation_unit(di, buffer_ext_size(dl));
476  	add_debug_line(dl, debug, nr_debug_entries, GEN_ELF_TEXT_OFFSET);
477  	add_debug_abbrev(da);
478  	if (0) buffer_ext_dump(da, "abbrev");
479  
480  	return 0;
481  }
482  
483  int
jit_add_debug_info(Elf * e,uint64_t code_addr,void * debug,int nr_debug_entries)484  jit_add_debug_info(Elf *e, uint64_t code_addr, void *debug, int nr_debug_entries)
485  {
486  	Elf_Data *d;
487  	Elf_Scn *scn;
488  	Elf_Shdr *shdr;
489  	struct buffer_ext dl, di, da;
490  	int ret;
491  
492  	buffer_ext_init(&dl);
493  	buffer_ext_init(&di);
494  	buffer_ext_init(&da);
495  
496  	ret = jit_process_debug_info(code_addr, debug, nr_debug_entries, &dl, &da, &di);
497  	if (ret)
498  		return -1;
499  	/*
500  	 * setup .debug_line section
501  	 */
502  	scn = elf_newscn(e);
503  	if (!scn) {
504  		warnx("cannot create section");
505  		return -1;
506  	}
507  
508  	d = elf_newdata(scn);
509  	if (!d) {
510  		warnx("cannot get new data");
511  		return -1;
512  	}
513  
514  	d->d_align = 1;
515  	d->d_off = 0LL;
516  	d->d_buf = buffer_ext_addr(&dl);
517  	d->d_type = ELF_T_BYTE;
518  	d->d_size = buffer_ext_size(&dl);
519  	d->d_version = EV_CURRENT;
520  
521  	shdr = elf_getshdr(scn);
522  	if (!shdr) {
523  		warnx("cannot get section header");
524  		return -1;
525  	}
526  
527  	shdr->sh_name = 52; /* .debug_line */
528  	shdr->sh_type = SHT_PROGBITS;
529  	shdr->sh_addr = 0; /* must be zero or == sh_offset -> dynamic object */
530  	shdr->sh_flags = 0;
531  	shdr->sh_entsize = 0;
532  
533  	/*
534  	 * setup .debug_info section
535  	 */
536  	scn = elf_newscn(e);
537  	if (!scn) {
538  		warnx("cannot create section");
539  		return -1;
540  	}
541  
542  	d = elf_newdata(scn);
543  	if (!d) {
544  		warnx("cannot get new data");
545  		return -1;
546  	}
547  
548  	d->d_align = 1;
549  	d->d_off = 0LL;
550  	d->d_buf = buffer_ext_addr(&di);
551  	d->d_type = ELF_T_BYTE;
552  	d->d_size = buffer_ext_size(&di);
553  	d->d_version = EV_CURRENT;
554  
555  	shdr = elf_getshdr(scn);
556  	if (!shdr) {
557  		warnx("cannot get section header");
558  		return -1;
559  	}
560  
561  	shdr->sh_name = 64; /* .debug_info */
562  	shdr->sh_type = SHT_PROGBITS;
563  	shdr->sh_addr = 0; /* must be zero or == sh_offset -> dynamic object */
564  	shdr->sh_flags = 0;
565  	shdr->sh_entsize = 0;
566  
567  	/*
568  	 * setup .debug_abbrev section
569  	 */
570  	scn = elf_newscn(e);
571  	if (!scn) {
572  		warnx("cannot create section");
573  		return -1;
574  	}
575  
576  	d = elf_newdata(scn);
577  	if (!d) {
578  		warnx("cannot get new data");
579  		return -1;
580  	}
581  
582  	d->d_align = 1;
583  	d->d_off = 0LL;
584  	d->d_buf = buffer_ext_addr(&da);
585  	d->d_type = ELF_T_BYTE;
586  	d->d_size = buffer_ext_size(&da);
587  	d->d_version = EV_CURRENT;
588  
589  	shdr = elf_getshdr(scn);
590  	if (!shdr) {
591  		warnx("cannot get section header");
592  		return -1;
593  	}
594  
595  	shdr->sh_name = 76; /* .debug_info */
596  	shdr->sh_type = SHT_PROGBITS;
597  	shdr->sh_addr = 0; /* must be zero or == sh_offset -> dynamic object */
598  	shdr->sh_flags = 0;
599  	shdr->sh_entsize = 0;
600  
601  	/*
602  	 * now we update the ELF image with all the sections
603  	 */
604  	if (elf_update(e, ELF_C_WRITE) < 0) {
605  		warnx("elf_update debug failed");
606  		return -1;
607  	}
608  	return 0;
609  }
610