recordmcount.c 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509
  1. /*
  2. * recordmcount.c: construct a table of the locations of calls to 'mcount'
  3. * so that ftrace can find them quickly.
  4. * Copyright 2009 John F. Reiser <jreiser@BitWagon.com>. All rights reserved.
  5. * Licensed under the GNU General Public License, version 2 (GPLv2).
  6. *
  7. * Restructured to fit Linux format, as well as other updates:
  8. * Copyright 2010 Steven Rostedt <srostedt@redhat.com>, Red Hat Inc.
  9. */
  10. /*
  11. * Strategy: alter the .o file in-place.
  12. *
  13. * Append a new STRTAB that has the new section names, followed by a new array
  14. * ElfXX_Shdr[] that has the new section headers, followed by the section
  15. * contents for __mcount_loc and its relocations. The old shstrtab strings,
  16. * and the old ElfXX_Shdr[] array, remain as "garbage" (commonly, a couple
  17. * kilobytes.) Subsequent processing by /bin/ld (or the kernel module loader)
  18. * will ignore the garbage regions, because they are not designated by the
  19. * new .e_shoff nor the new ElfXX_Shdr[]. [In order to remove the garbage,
  20. * then use "ld -r" to create a new file that omits the garbage.]
  21. */
  22. #include <sys/types.h>
  23. #include <sys/mman.h>
  24. #include <sys/stat.h>
  25. #include <getopt.h>
  26. #include <elf.h>
  27. #include <fcntl.h>
  28. #include <setjmp.h>
  29. #include <stdio.h>
  30. #include <stdlib.h>
  31. #include <string.h>
  32. #include <unistd.h>
  33. #ifndef EM_METAG
  34. /* Remove this when these make it to the standard system elf.h. */
  35. #define EM_METAG 174
  36. #define R_METAG_ADDR32 2
  37. #define R_METAG_NONE 3
  38. #endif
  39. #ifndef EM_AARCH64
  40. #define EM_AARCH64 183
  41. #define R_AARCH64_NONE 0
  42. #define R_AARCH64_ABS64 257
  43. #endif
  44. static int fd_map; /* File descriptor for file being modified. */
  45. static int mmap_failed; /* Boolean flag. */
  46. static void *ehdr_curr; /* current ElfXX_Ehdr * for resource cleanup */
  47. static char gpfx; /* prefix for global symbol name (sometimes '_') */
  48. static struct stat sb; /* Remember .st_size, etc. */
  49. static jmp_buf jmpenv; /* setjmp/longjmp per-file error escape */
  50. static const char *altmcount; /* alternate mcount symbol name */
  51. static int warn_on_notrace_sect; /* warn when section has mcount not being recorded */
  52. /* setjmp() return values */
  53. enum {
  54. SJ_SETJMP = 0, /* hardwired first return */
  55. SJ_FAIL,
  56. SJ_SUCCEED
  57. };
  58. /* Per-file resource cleanup when multiple files. */
  59. static void
  60. cleanup(void)
  61. {
  62. if (!mmap_failed)
  63. munmap(ehdr_curr, sb.st_size);
  64. else
  65. free(ehdr_curr);
  66. close(fd_map);
  67. }
  68. static void __attribute__((noreturn))
  69. fail_file(void)
  70. {
  71. cleanup();
  72. longjmp(jmpenv, SJ_FAIL);
  73. }
  74. static void __attribute__((noreturn))
  75. succeed_file(void)
  76. {
  77. cleanup();
  78. longjmp(jmpenv, SJ_SUCCEED);
  79. }
  80. /* ulseek, uread, ...: Check return value for errors. */
  81. static off_t
  82. ulseek(int const fd, off_t const offset, int const whence)
  83. {
  84. off_t const w = lseek(fd, offset, whence);
  85. if (w == (off_t)-1) {
  86. perror("lseek");
  87. fail_file();
  88. }
  89. return w;
  90. }
  91. static size_t
  92. uread(int const fd, void *const buf, size_t const count)
  93. {
  94. size_t const n = read(fd, buf, count);
  95. if (n != count) {
  96. perror("read");
  97. fail_file();
  98. }
  99. return n;
  100. }
  101. static size_t
  102. uwrite(int const fd, void const *const buf, size_t const count)
  103. {
  104. size_t const n = write(fd, buf, count);
  105. if (n != count) {
  106. perror("write");
  107. fail_file();
  108. }
  109. return n;
  110. }
  111. static void *
  112. umalloc(size_t size)
  113. {
  114. void *const addr = malloc(size);
  115. if (addr == 0) {
  116. fprintf(stderr, "malloc failed: %zu bytes\n", size);
  117. fail_file();
  118. }
  119. return addr;
  120. }
  121. static unsigned char ideal_nop5_x86_64[5] = { 0x0f, 0x1f, 0x44, 0x00, 0x00 };
  122. static unsigned char ideal_nop5_x86_32[5] = { 0x3e, 0x8d, 0x74, 0x26, 0x00 };
  123. static unsigned char *ideal_nop;
  124. static char rel_type_nop;
  125. static int (*make_nop)(void *map, size_t const offset);
  126. static int make_nop_x86(void *map, size_t const offset)
  127. {
  128. uint32_t *ptr;
  129. unsigned char *op;
  130. /* Confirm we have 0xe8 0x0 0x0 0x0 0x0 */
  131. ptr = map + offset;
  132. if (*ptr != 0)
  133. return -1;
  134. op = map + offset - 1;
  135. if (*op != 0xe8)
  136. return -1;
  137. /* convert to nop */
  138. ulseek(fd_map, offset - 1, SEEK_SET);
  139. uwrite(fd_map, ideal_nop, 5);
  140. return 0;
  141. }
  142. static unsigned char ideal_nop4_arm64[4] = {0x1f, 0x20, 0x03, 0xd5};
  143. static int make_nop_arm64(void *map, size_t const offset)
  144. {
  145. uint32_t *ptr;
  146. ptr = map + offset;
  147. /* bl <_mcount> is 0x94000000 before relocation */
  148. if (*ptr != 0x94000000)
  149. return -1;
  150. /* Convert to nop */
  151. ulseek(fd_map, offset, SEEK_SET);
  152. uwrite(fd_map, ideal_nop, 4);
  153. return 0;
  154. }
  155. /*
  156. * Get the whole file as a programming convenience in order to avoid
  157. * malloc+lseek+read+free of many pieces. If successful, then mmap
  158. * avoids copying unused pieces; else just read the whole file.
  159. * Open for both read and write; new info will be appended to the file.
  160. * Use MAP_PRIVATE so that a few changes to the in-memory ElfXX_Ehdr
  161. * do not propagate to the file until an explicit overwrite at the last.
  162. * This preserves most aspects of consistency (all except .st_size)
  163. * for simultaneous readers of the file while we are appending to it.
  164. * However, multiple writers still are bad. We choose not to use
  165. * locking because it is expensive and the use case of kernel build
  166. * makes multiple writers unlikely.
  167. */
  168. static void *mmap_file(char const *fname)
  169. {
  170. void *addr;
  171. fd_map = open(fname, O_RDWR);
  172. if (fd_map < 0 || fstat(fd_map, &sb) < 0) {
  173. perror(fname);
  174. fail_file();
  175. }
  176. if (!S_ISREG(sb.st_mode)) {
  177. fprintf(stderr, "not a regular file: %s\n", fname);
  178. fail_file();
  179. }
  180. addr = mmap(0, sb.st_size, PROT_READ|PROT_WRITE, MAP_PRIVATE,
  181. fd_map, 0);
  182. mmap_failed = 0;
  183. if (addr == MAP_FAILED) {
  184. mmap_failed = 1;
  185. addr = umalloc(sb.st_size);
  186. uread(fd_map, addr, sb.st_size);
  187. }
  188. return addr;
  189. }
  190. /* w8rev, w8nat, ...: Handle endianness. */
  191. static uint64_t w8rev(uint64_t const x)
  192. {
  193. return ((0xff & (x >> (0 * 8))) << (7 * 8))
  194. | ((0xff & (x >> (1 * 8))) << (6 * 8))
  195. | ((0xff & (x >> (2 * 8))) << (5 * 8))
  196. | ((0xff & (x >> (3 * 8))) << (4 * 8))
  197. | ((0xff & (x >> (4 * 8))) << (3 * 8))
  198. | ((0xff & (x >> (5 * 8))) << (2 * 8))
  199. | ((0xff & (x >> (6 * 8))) << (1 * 8))
  200. | ((0xff & (x >> (7 * 8))) << (0 * 8));
  201. }
  202. static uint32_t w4rev(uint32_t const x)
  203. {
  204. return ((0xff & (x >> (0 * 8))) << (3 * 8))
  205. | ((0xff & (x >> (1 * 8))) << (2 * 8))
  206. | ((0xff & (x >> (2 * 8))) << (1 * 8))
  207. | ((0xff & (x >> (3 * 8))) << (0 * 8));
  208. }
  209. static uint32_t w2rev(uint16_t const x)
  210. {
  211. return ((0xff & (x >> (0 * 8))) << (1 * 8))
  212. | ((0xff & (x >> (1 * 8))) << (0 * 8));
  213. }
  214. static uint64_t w8nat(uint64_t const x)
  215. {
  216. return x;
  217. }
  218. static uint32_t w4nat(uint32_t const x)
  219. {
  220. return x;
  221. }
  222. static uint32_t w2nat(uint16_t const x)
  223. {
  224. return x;
  225. }
  226. static uint64_t (*w8)(uint64_t);
  227. static uint32_t (*w)(uint32_t);
  228. static uint32_t (*w2)(uint16_t);
  229. /* Names of the sections that could contain calls to mcount. */
  230. static int
  231. is_mcounted_section_name(char const *const txtname)
  232. {
  233. return strcmp(".text", txtname) == 0 ||
  234. strcmp(".ref.text", txtname) == 0 ||
  235. strcmp(".sched.text", txtname) == 0 ||
  236. strcmp(".spinlock.text", txtname) == 0 ||
  237. strcmp(".irqentry.text", txtname) == 0 ||
  238. strcmp(".kprobes.text", txtname) == 0 ||
  239. strcmp(".text.unlikely", txtname) == 0;
  240. }
  241. /* 32 bit and 64 bit are very similar */
  242. #include "recordmcount.h"
  243. #define RECORD_MCOUNT_64
  244. #include "recordmcount.h"
  245. /* 64-bit EM_MIPS has weird ELF64_Rela.r_info.
  246. * http://techpubs.sgi.com/library/manuals/4000/007-4658-001/pdf/007-4658-001.pdf
  247. * We interpret Table 29 Relocation Operation (Elf64_Rel, Elf64_Rela) [p.40]
  248. * to imply the order of the members; the spec does not say so.
  249. * typedef unsigned char Elf64_Byte;
  250. * fails on MIPS64 because their <elf.h> already has it!
  251. */
  252. typedef uint8_t myElf64_Byte; /* Type for a 8-bit quantity. */
  253. union mips_r_info {
  254. Elf64_Xword r_info;
  255. struct {
  256. Elf64_Word r_sym; /* Symbol index. */
  257. myElf64_Byte r_ssym; /* Special symbol. */
  258. myElf64_Byte r_type3; /* Third relocation. */
  259. myElf64_Byte r_type2; /* Second relocation. */
  260. myElf64_Byte r_type; /* First relocation. */
  261. } r_mips;
  262. };
  263. static uint64_t MIPS64_r_sym(Elf64_Rel const *rp)
  264. {
  265. return w(((union mips_r_info){ .r_info = rp->r_info }).r_mips.r_sym);
  266. }
  267. static void MIPS64_r_info(Elf64_Rel *const rp, unsigned sym, unsigned type)
  268. {
  269. rp->r_info = ((union mips_r_info){
  270. .r_mips = { .r_sym = w(sym), .r_type = type }
  271. }).r_info;
  272. }
  273. static void
  274. do_file(char const *const fname)
  275. {
  276. Elf32_Ehdr *const ehdr = mmap_file(fname);
  277. unsigned int reltype = 0;
  278. ehdr_curr = ehdr;
  279. w = w4nat;
  280. w2 = w2nat;
  281. w8 = w8nat;
  282. switch (ehdr->e_ident[EI_DATA]) {
  283. static unsigned int const endian = 1;
  284. default:
  285. fprintf(stderr, "unrecognized ELF data encoding %d: %s\n",
  286. ehdr->e_ident[EI_DATA], fname);
  287. fail_file();
  288. break;
  289. case ELFDATA2LSB:
  290. if (*(unsigned char const *)&endian != 1) {
  291. /* main() is big endian, file.o is little endian. */
  292. w = w4rev;
  293. w2 = w2rev;
  294. w8 = w8rev;
  295. }
  296. break;
  297. case ELFDATA2MSB:
  298. if (*(unsigned char const *)&endian != 0) {
  299. /* main() is little endian, file.o is big endian. */
  300. w = w4rev;
  301. w2 = w2rev;
  302. w8 = w8rev;
  303. }
  304. break;
  305. } /* end switch */
  306. if (memcmp(ELFMAG, ehdr->e_ident, SELFMAG) != 0
  307. || w2(ehdr->e_type) != ET_REL
  308. || ehdr->e_ident[EI_VERSION] != EV_CURRENT) {
  309. fprintf(stderr, "unrecognized ET_REL file %s\n", fname);
  310. fail_file();
  311. }
  312. gpfx = 0;
  313. switch (w2(ehdr->e_machine)) {
  314. default:
  315. fprintf(stderr, "unrecognized e_machine %d %s\n",
  316. w2(ehdr->e_machine), fname);
  317. fail_file();
  318. break;
  319. case EM_386:
  320. reltype = R_386_32;
  321. rel_type_nop = R_386_NONE;
  322. make_nop = make_nop_x86;
  323. ideal_nop = ideal_nop5_x86_32;
  324. mcount_adjust_32 = -1;
  325. break;
  326. case EM_ARM: reltype = R_ARM_ABS32;
  327. altmcount = "__gnu_mcount_nc";
  328. break;
  329. case EM_AARCH64:
  330. reltype = R_AARCH64_ABS64;
  331. make_nop = make_nop_arm64;
  332. rel_type_nop = R_AARCH64_NONE;
  333. ideal_nop = ideal_nop4_arm64;
  334. gpfx = '_';
  335. break;
  336. case EM_IA_64: reltype = R_IA64_IMM64; gpfx = '_'; break;
  337. case EM_METAG: reltype = R_METAG_ADDR32;
  338. altmcount = "_mcount_wrapper";
  339. rel_type_nop = R_METAG_NONE;
  340. /* We happen to have the same requirement as MIPS */
  341. is_fake_mcount32 = MIPS32_is_fake_mcount;
  342. break;
  343. case EM_MIPS: /* reltype: e_class */ gpfx = '_'; break;
  344. case EM_PPC: reltype = R_PPC_ADDR32; gpfx = '_'; break;
  345. case EM_PPC64: reltype = R_PPC64_ADDR64; gpfx = '_'; break;
  346. case EM_S390: /* reltype: e_class */ gpfx = '_'; break;
  347. case EM_SH: reltype = R_SH_DIR32; break;
  348. case EM_SPARCV9: reltype = R_SPARC_64; gpfx = '_'; break;
  349. case EM_X86_64:
  350. make_nop = make_nop_x86;
  351. ideal_nop = ideal_nop5_x86_64;
  352. reltype = R_X86_64_64;
  353. rel_type_nop = R_X86_64_NONE;
  354. mcount_adjust_64 = -1;
  355. break;
  356. } /* end switch */
  357. switch (ehdr->e_ident[EI_CLASS]) {
  358. default:
  359. fprintf(stderr, "unrecognized ELF class %d %s\n",
  360. ehdr->e_ident[EI_CLASS], fname);
  361. fail_file();
  362. break;
  363. case ELFCLASS32:
  364. if (w2(ehdr->e_ehsize) != sizeof(Elf32_Ehdr)
  365. || w2(ehdr->e_shentsize) != sizeof(Elf32_Shdr)) {
  366. fprintf(stderr,
  367. "unrecognized ET_REL file: %s\n", fname);
  368. fail_file();
  369. }
  370. if (w2(ehdr->e_machine) == EM_MIPS) {
  371. reltype = R_MIPS_32;
  372. is_fake_mcount32 = MIPS32_is_fake_mcount;
  373. }
  374. do32(ehdr, fname, reltype);
  375. break;
  376. case ELFCLASS64: {
  377. Elf64_Ehdr *const ghdr = (Elf64_Ehdr *)ehdr;
  378. if (w2(ghdr->e_ehsize) != sizeof(Elf64_Ehdr)
  379. || w2(ghdr->e_shentsize) != sizeof(Elf64_Shdr)) {
  380. fprintf(stderr,
  381. "unrecognized ET_REL file: %s\n", fname);
  382. fail_file();
  383. }
  384. if (w2(ghdr->e_machine) == EM_S390) {
  385. reltype = R_390_64;
  386. mcount_adjust_64 = -14;
  387. }
  388. if (w2(ghdr->e_machine) == EM_MIPS) {
  389. reltype = R_MIPS_64;
  390. Elf64_r_sym = MIPS64_r_sym;
  391. Elf64_r_info = MIPS64_r_info;
  392. is_fake_mcount64 = MIPS64_is_fake_mcount;
  393. }
  394. do64(ghdr, fname, reltype);
  395. break;
  396. }
  397. } /* end switch */
  398. cleanup();
  399. }
  400. int
  401. main(int argc, char *argv[])
  402. {
  403. const char ftrace[] = "/ftrace.o";
  404. int ftrace_size = sizeof(ftrace) - 1;
  405. int n_error = 0; /* gcc-4.3.0 false positive complaint */
  406. int c;
  407. int i;
  408. while ((c = getopt(argc, argv, "w")) >= 0) {
  409. switch (c) {
  410. case 'w':
  411. warn_on_notrace_sect = 1;
  412. break;
  413. default:
  414. fprintf(stderr, "usage: recordmcount [-w] file.o...\n");
  415. return 0;
  416. }
  417. }
  418. if ((argc - optind) < 1) {
  419. fprintf(stderr, "usage: recordmcount [-w] file.o...\n");
  420. return 0;
  421. }
  422. /* Process each file in turn, allowing deep failure. */
  423. for (i = optind; i < argc; i++) {
  424. char *file = argv[i];
  425. int const sjval = setjmp(jmpenv);
  426. int len;
  427. /*
  428. * The file kernel/trace/ftrace.o references the mcount
  429. * function but does not call it. Since ftrace.o should
  430. * not be traced anyway, we just skip it.
  431. */
  432. len = strlen(file);
  433. if (len >= ftrace_size &&
  434. strcmp(file + (len - ftrace_size), ftrace) == 0)
  435. continue;
  436. switch (sjval) {
  437. default:
  438. fprintf(stderr, "internal error: %s\n", file);
  439. exit(1);
  440. break;
  441. case SJ_SETJMP: /* normal sequence */
  442. /* Avoid problems if early cleanup() */
  443. fd_map = -1;
  444. ehdr_curr = NULL;
  445. mmap_failed = 1;
  446. do_file(file);
  447. break;
  448. case SJ_FAIL: /* error in do_file or below */
  449. ++n_error;
  450. break;
  451. case SJ_SUCCEED: /* premature success */
  452. /* do nothing */
  453. break;
  454. } /* end switch */
  455. }
  456. return !!n_error;
  457. }