libbpf.c 44 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
7177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987
  1. // SPDX-License-Identifier: LGPL-2.1
  2. /*
  3. * Common eBPF ELF object loading operations.
  4. *
  5. * Copyright (C) 2013-2015 Alexei Starovoitov <ast@kernel.org>
  6. * Copyright (C) 2015 Wang Nan <wangnan0@huawei.com>
  7. * Copyright (C) 2015 Huawei Inc.
  8. * Copyright (C) 2017 Nicira, Inc.
  9. *
  10. * This program is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU Lesser General Public
  12. * License as published by the Free Software Foundation;
  13. * version 2.1 of the License (not later!)
  14. *
  15. * This program is distributed in the hope that it will be useful,
  16. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  17. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  18. * GNU Lesser General Public License for more details.
  19. *
  20. * You should have received a copy of the GNU Lesser General Public
  21. * License along with this program; if not, see <http://www.gnu.org/licenses>
  22. */
  23. #include <stdlib.h>
  24. #include <stdio.h>
  25. #include <stdarg.h>
  26. #include <libgen.h>
  27. #include <inttypes.h>
  28. #include <string.h>
  29. #include <unistd.h>
  30. #include <fcntl.h>
  31. #include <errno.h>
  32. #include <asm/unistd.h>
  33. #include <linux/err.h>
  34. #include <linux/kernel.h>
  35. #include <linux/bpf.h>
  36. #include <linux/list.h>
  37. #include <linux/limits.h>
  38. #include <sys/stat.h>
  39. #include <sys/types.h>
  40. #include <sys/vfs.h>
  41. #include <libelf.h>
  42. #include <gelf.h>
  43. #include "libbpf.h"
  44. #include "bpf.h"
  45. #ifndef EM_BPF
  46. #define EM_BPF 247
  47. #endif
  48. #ifndef BPF_FS_MAGIC
  49. #define BPF_FS_MAGIC 0xcafe4a11
  50. #endif
  #define __printf(a, b) __attribute__((format(printf, a, b)))

  /*
   * Default print callback: format the message and write it to stderr.
   *
   * Returns the value of vfprintf(): the number of characters written,
   * or a negative value on output error.
   */
  __printf(1, 2)
  static int __base_pr(const char *format, ...)
  {
      va_list ap;
      int written;

      va_start(ap, format);
      written = vfprintf(stderr, format, ap);
      va_end(ap);

      return written;
  }
  62. static __printf(1, 2) libbpf_print_fn_t __pr_warning = __base_pr;
  63. static __printf(1, 2) libbpf_print_fn_t __pr_info = __base_pr;
  64. static __printf(1, 2) libbpf_print_fn_t __pr_debug;
  65. #define __pr(func, fmt, ...) \
  66. do { \
  67. if ((func)) \
  68. (func)("libbpf: " fmt, ##__VA_ARGS__); \
  69. } while (0)
  70. #define pr_warning(fmt, ...) __pr(__pr_warning, fmt, ##__VA_ARGS__)
  71. #define pr_info(fmt, ...) __pr(__pr_info, fmt, ##__VA_ARGS__)
  72. #define pr_debug(fmt, ...) __pr(__pr_debug, fmt, ##__VA_ARGS__)
  73. void libbpf_set_print(libbpf_print_fn_t warn,
  74. libbpf_print_fn_t info,
  75. libbpf_print_fn_t debug)
  76. {
  77. __pr_warning = warn;
  78. __pr_info = info;
  79. __pr_debug = debug;
  80. }
  81. #define STRERR_BUFSIZE 128
  82. #define ERRNO_OFFSET(e) ((e) - __LIBBPF_ERRNO__START)
  83. #define ERRCODE_OFFSET(c) ERRNO_OFFSET(LIBBPF_ERRNO__##c)
  84. #define NR_ERRNO (__LIBBPF_ERRNO__END - __LIBBPF_ERRNO__START)
  85. static const char *libbpf_strerror_table[NR_ERRNO] = {
  86. [ERRCODE_OFFSET(LIBELF)] = "Something wrong in libelf",
  87. [ERRCODE_OFFSET(FORMAT)] = "BPF object format invalid",
  88. [ERRCODE_OFFSET(KVERSION)] = "'version' section incorrect or lost",
  89. [ERRCODE_OFFSET(ENDIAN)] = "Endian mismatch",
  90. [ERRCODE_OFFSET(INTERNAL)] = "Internal error in libbpf",
  91. [ERRCODE_OFFSET(RELOC)] = "Relocation failed",
  92. [ERRCODE_OFFSET(VERIFY)] = "Kernel verifier blocks program loading",
  93. [ERRCODE_OFFSET(PROG2BIG)] = "Program too big",
  94. [ERRCODE_OFFSET(KVER)] = "Incorrect kernel version",
  95. [ERRCODE_OFFSET(PROGTYPE)] = "Kernel doesn't support this program type",
  96. [ERRCODE_OFFSET(WRNGPID)] = "Wrong pid in netlink message",
  97. [ERRCODE_OFFSET(INVSEQ)] = "Invalid netlink sequence",
  98. };
  99. int libbpf_strerror(int err, char *buf, size_t size)
  100. {
  101. if (!buf || !size)
  102. return -1;
  103. err = err > 0 ? err : -err;
  104. if (err < __LIBBPF_ERRNO__START) {
  105. int ret;
  106. ret = strerror_r(err, buf, size);
  107. buf[size - 1] = '\0';
  108. return ret;
  109. }
  110. if (err < __LIBBPF_ERRNO__END) {
  111. const char *msg;
  112. msg = libbpf_strerror_table[ERRNO_OFFSET(err)];
  113. snprintf(buf, size, "%s", msg);
  114. buf[size - 1] = '\0';
  115. return 0;
  116. }
  117. snprintf(buf, size, "Unknown libbpf error %d", err);
  118. buf[size - 1] = '\0';
  119. return -1;
  120. }
  /* Evaluate @action into @err and jump to label @out if it is non-zero. */
  #define CHECK_ERR(action, err, out) do { \
      err = action; \
      if (err) \
          goto out; \
  } while(0)

  /* Copied from tools/perf/util/util.h */
  #ifndef zfree
  /* Free the pointer stored at @ptr, then reset it to NULL. */
  # define zfree(ptr) ({ free(*ptr); *ptr = NULL; })
  #endif

  #ifndef zclose
  /*
   * Close @fd if it is non-negative, then set it to -1. Evaluates to the
   * result of close(), or 0 when nothing was closed.
   */
  # define zclose(fd) ({ \
      int ___err = 0; \
      if ((fd) >= 0) \
          ___err = close((fd)); \
      fd = -1; \
      ___err; })
  #endif

  /* Use the mmap-based libelf read command when the build says it exists. */
  #ifdef HAVE_LIBELF_MMAP_SUPPORT
  # define LIBBPF_ELF_C_READ_MMAP ELF_C_READ_MMAP
  #else
  # define LIBBPF_ELF_C_READ_MMAP ELF_C_READ
  #endif
  143. /*
  144. * bpf_prog should be a better name but it has been used in
  145. * linux/filter.h.
  146. */
  147. struct bpf_program {
  148. /* Index in elf obj file, for relocation use. */
  149. int idx;
  150. char *name;
  151. char *section_name;
  152. struct bpf_insn *insns;
  153. size_t insns_cnt, main_prog_cnt;
  154. enum bpf_prog_type type;
  155. struct reloc_desc {
  156. enum {
  157. RELO_LD64,
  158. RELO_CALL,
  159. } type;
  160. int insn_idx;
  161. union {
  162. int map_idx;
  163. int text_off;
  164. };
  165. } *reloc_desc;
  166. int nr_reloc;
  167. struct {
  168. int nr;
  169. int *fds;
  170. } instances;
  171. bpf_program_prep_t preprocessor;
  172. struct bpf_object *obj;
  173. void *priv;
  174. bpf_program_clear_priv_t clear_priv;
  175. };
  176. struct bpf_map {
  177. int fd;
  178. char *name;
  179. size_t offset;
  180. struct bpf_map_def def;
  181. void *priv;
  182. bpf_map_clear_priv_t clear_priv;
  183. };
  184. static LIST_HEAD(bpf_objects_list);
  185. struct bpf_object {
  186. char license[64];
  187. u32 kern_version;
  188. struct bpf_program *programs;
  189. size_t nr_programs;
  190. struct bpf_map *maps;
  191. size_t nr_maps;
  192. bool loaded;
  193. /*
  194. * Information when doing elf related work. Only valid if fd
  195. * is valid.
  196. */
  197. struct {
  198. int fd;
  199. void *obj_buf;
  200. size_t obj_buf_sz;
  201. Elf *elf;
  202. GElf_Ehdr ehdr;
  203. Elf_Data *symbols;
  204. size_t strtabidx;
  205. struct {
  206. GElf_Shdr shdr;
  207. Elf_Data *data;
  208. } *reloc;
  209. int nr_reloc;
  210. int maps_shndx;
  211. int text_shndx;
  212. } efile;
  213. /*
  214. * All loaded bpf_object is linked in a list, which is
  215. * hidden to caller. bpf_objects__<func> handlers deal with
  216. * all objects.
  217. */
  218. struct list_head list;
  219. void *priv;
  220. bpf_object_clear_priv_t clear_priv;
  221. char path[];
  222. };
  223. #define obj_elf_valid(o) ((o)->efile.elf)
  224. static void bpf_program__unload(struct bpf_program *prog)
  225. {
  226. int i;
  227. if (!prog)
  228. return;
  229. /*
  230. * If the object is opened but the program was never loaded,
  231. * it is possible that prog->instances.nr == -1.
  232. */
  233. if (prog->instances.nr > 0) {
  234. for (i = 0; i < prog->instances.nr; i++)
  235. zclose(prog->instances.fds[i]);
  236. } else if (prog->instances.nr != -1) {
  237. pr_warning("Internal error: instances.nr is %d\n",
  238. prog->instances.nr);
  239. }
  240. prog->instances.nr = -1;
  241. zfree(&prog->instances.fds);
  242. }
  243. static void bpf_program__exit(struct bpf_program *prog)
  244. {
  245. if (!prog)
  246. return;
  247. if (prog->clear_priv)
  248. prog->clear_priv(prog, prog->priv);
  249. prog->priv = NULL;
  250. prog->clear_priv = NULL;
  251. bpf_program__unload(prog);
  252. zfree(&prog->name);
  253. zfree(&prog->section_name);
  254. zfree(&prog->insns);
  255. zfree(&prog->reloc_desc);
  256. prog->nr_reloc = 0;
  257. prog->insns_cnt = 0;
  258. prog->idx = -1;
  259. }
  260. static int
  261. bpf_program__init(void *data, size_t size, char *section_name, int idx,
  262. struct bpf_program *prog)
  263. {
  264. if (size < sizeof(struct bpf_insn)) {
  265. pr_warning("corrupted section '%s'\n", section_name);
  266. return -EINVAL;
  267. }
  268. bzero(prog, sizeof(*prog));
  269. prog->section_name = strdup(section_name);
  270. if (!prog->section_name) {
  271. pr_warning("failed to alloc name for prog under section %s\n",
  272. section_name);
  273. goto errout;
  274. }
  275. prog->insns = malloc(size);
  276. if (!prog->insns) {
  277. pr_warning("failed to alloc insns for prog under section %s\n",
  278. section_name);
  279. goto errout;
  280. }
  281. prog->insns_cnt = size / sizeof(struct bpf_insn);
  282. memcpy(prog->insns, data,
  283. prog->insns_cnt * sizeof(struct bpf_insn));
  284. prog->idx = idx;
  285. prog->instances.fds = NULL;
  286. prog->instances.nr = -1;
  287. prog->type = BPF_PROG_TYPE_KPROBE;
  288. return 0;
  289. errout:
  290. bpf_program__exit(prog);
  291. return -ENOMEM;
  292. }
  293. static int
  294. bpf_object__add_program(struct bpf_object *obj, void *data, size_t size,
  295. char *section_name, int idx)
  296. {
  297. struct bpf_program prog, *progs;
  298. int nr_progs, err;
  299. err = bpf_program__init(data, size, section_name, idx, &prog);
  300. if (err)
  301. return err;
  302. progs = obj->programs;
  303. nr_progs = obj->nr_programs;
  304. progs = realloc(progs, sizeof(progs[0]) * (nr_progs + 1));
  305. if (!progs) {
  306. /*
  307. * In this case the original obj->programs
  308. * is still valid, so don't need special treat for
  309. * bpf_close_object().
  310. */
  311. pr_warning("failed to alloc a new program under section '%s'\n",
  312. section_name);
  313. bpf_program__exit(&prog);
  314. return -ENOMEM;
  315. }
  316. pr_debug("found program %s\n", prog.section_name);
  317. obj->programs = progs;
  318. obj->nr_programs = nr_progs + 1;
  319. prog.obj = obj;
  320. progs[nr_progs] = prog;
  321. return 0;
  322. }
  323. static int
  324. bpf_object__init_prog_names(struct bpf_object *obj)
  325. {
  326. Elf_Data *symbols = obj->efile.symbols;
  327. struct bpf_program *prog;
  328. size_t pi, si;
  329. for (pi = 0; pi < obj->nr_programs; pi++) {
  330. const char *name = NULL;
  331. prog = &obj->programs[pi];
  332. if (prog->idx == obj->efile.text_shndx) {
  333. name = ".text";
  334. goto skip_search;
  335. }
  336. for (si = 0; si < symbols->d_size / sizeof(GElf_Sym) && !name;
  337. si++) {
  338. GElf_Sym sym;
  339. if (!gelf_getsym(symbols, si, &sym))
  340. continue;
  341. if (sym.st_shndx != prog->idx)
  342. continue;
  343. if (GELF_ST_BIND(sym.st_info) != STB_GLOBAL)
  344. continue;
  345. name = elf_strptr(obj->efile.elf,
  346. obj->efile.strtabidx,
  347. sym.st_name);
  348. if (!name) {
  349. pr_warning("failed to get sym name string for prog %s\n",
  350. prog->section_name);
  351. return -LIBBPF_ERRNO__LIBELF;
  352. }
  353. }
  354. if (!name) {
  355. pr_warning("failed to find sym for prog %s\n",
  356. prog->section_name);
  357. return -EINVAL;
  358. }
  359. skip_search:
  360. prog->name = strdup(name);
  361. if (!prog->name) {
  362. pr_warning("failed to allocate memory for prog sym %s\n",
  363. name);
  364. return -ENOMEM;
  365. }
  366. }
  367. return 0;
  368. }
  369. static struct bpf_object *bpf_object__new(const char *path,
  370. void *obj_buf,
  371. size_t obj_buf_sz)
  372. {
  373. struct bpf_object *obj;
  374. obj = calloc(1, sizeof(struct bpf_object) + strlen(path) + 1);
  375. if (!obj) {
  376. pr_warning("alloc memory failed for %s\n", path);
  377. return ERR_PTR(-ENOMEM);
  378. }
  379. strcpy(obj->path, path);
  380. obj->efile.fd = -1;
  381. /*
  382. * Caller of this function should also calls
  383. * bpf_object__elf_finish() after data collection to return
  384. * obj_buf to user. If not, we should duplicate the buffer to
  385. * avoid user freeing them before elf finish.
  386. */
  387. obj->efile.obj_buf = obj_buf;
  388. obj->efile.obj_buf_sz = obj_buf_sz;
  389. obj->efile.maps_shndx = -1;
  390. obj->loaded = false;
  391. INIT_LIST_HEAD(&obj->list);
  392. list_add(&obj->list, &bpf_objects_list);
  393. return obj;
  394. }
  395. static void bpf_object__elf_finish(struct bpf_object *obj)
  396. {
  397. if (!obj_elf_valid(obj))
  398. return;
  399. if (obj->efile.elf) {
  400. elf_end(obj->efile.elf);
  401. obj->efile.elf = NULL;
  402. }
  403. obj->efile.symbols = NULL;
  404. zfree(&obj->efile.reloc);
  405. obj->efile.nr_reloc = 0;
  406. zclose(obj->efile.fd);
  407. obj->efile.obj_buf = NULL;
  408. obj->efile.obj_buf_sz = 0;
  409. }
  410. static int bpf_object__elf_init(struct bpf_object *obj)
  411. {
  412. int err = 0;
  413. GElf_Ehdr *ep;
  414. if (obj_elf_valid(obj)) {
  415. pr_warning("elf init: internal error\n");
  416. return -LIBBPF_ERRNO__LIBELF;
  417. }
  418. if (obj->efile.obj_buf_sz > 0) {
  419. /*
  420. * obj_buf should have been validated by
  421. * bpf_object__open_buffer().
  422. */
  423. obj->efile.elf = elf_memory(obj->efile.obj_buf,
  424. obj->efile.obj_buf_sz);
  425. } else {
  426. obj->efile.fd = open(obj->path, O_RDONLY);
  427. if (obj->efile.fd < 0) {
  428. pr_warning("failed to open %s: %s\n", obj->path,
  429. strerror(errno));
  430. return -errno;
  431. }
  432. obj->efile.elf = elf_begin(obj->efile.fd,
  433. LIBBPF_ELF_C_READ_MMAP,
  434. NULL);
  435. }
  436. if (!obj->efile.elf) {
  437. pr_warning("failed to open %s as ELF file\n",
  438. obj->path);
  439. err = -LIBBPF_ERRNO__LIBELF;
  440. goto errout;
  441. }
  442. if (!gelf_getehdr(obj->efile.elf, &obj->efile.ehdr)) {
  443. pr_warning("failed to get EHDR from %s\n",
  444. obj->path);
  445. err = -LIBBPF_ERRNO__FORMAT;
  446. goto errout;
  447. }
  448. ep = &obj->efile.ehdr;
  449. /* Old LLVM set e_machine to EM_NONE */
  450. if ((ep->e_type != ET_REL) || (ep->e_machine && (ep->e_machine != EM_BPF))) {
  451. pr_warning("%s is not an eBPF object file\n",
  452. obj->path);
  453. err = -LIBBPF_ERRNO__FORMAT;
  454. goto errout;
  455. }
  456. return 0;
  457. errout:
  458. bpf_object__elf_finish(obj);
  459. return err;
  460. }
  461. static int
  462. bpf_object__check_endianness(struct bpf_object *obj)
  463. {
  464. static unsigned int const endian = 1;
  465. switch (obj->efile.ehdr.e_ident[EI_DATA]) {
  466. case ELFDATA2LSB:
  467. /* We are big endian, BPF obj is little endian. */
  468. if (*(unsigned char const *)&endian != 1)
  469. goto mismatch;
  470. break;
  471. case ELFDATA2MSB:
  472. /* We are little endian, BPF obj is big endian. */
  473. if (*(unsigned char const *)&endian != 0)
  474. goto mismatch;
  475. break;
  476. default:
  477. return -LIBBPF_ERRNO__ENDIAN;
  478. }
  479. return 0;
  480. mismatch:
  481. pr_warning("Error: endianness mismatch.\n");
  482. return -LIBBPF_ERRNO__ENDIAN;
  483. }
  484. static int
  485. bpf_object__init_license(struct bpf_object *obj,
  486. void *data, size_t size)
  487. {
  488. memcpy(obj->license, data,
  489. min(size, sizeof(obj->license) - 1));
  490. pr_debug("license of %s is %s\n", obj->path, obj->license);
  491. return 0;
  492. }
  493. static int
  494. bpf_object__init_kversion(struct bpf_object *obj,
  495. void *data, size_t size)
  496. {
  497. u32 kver;
  498. if (size != sizeof(kver)) {
  499. pr_warning("invalid kver section in %s\n", obj->path);
  500. return -LIBBPF_ERRNO__FORMAT;
  501. }
  502. memcpy(&kver, data, sizeof(kver));
  503. obj->kern_version = kver;
  504. pr_debug("kernel version of %s is %x\n", obj->path,
  505. obj->kern_version);
  506. return 0;
  507. }
  508. static int compare_bpf_map(const void *_a, const void *_b)
  509. {
  510. const struct bpf_map *a = _a;
  511. const struct bpf_map *b = _b;
  512. return a->offset - b->offset;
  513. }
  514. static int
  515. bpf_object__init_maps(struct bpf_object *obj)
  516. {
  517. int i, map_idx, map_def_sz, nr_maps = 0;
  518. Elf_Scn *scn;
  519. Elf_Data *data;
  520. Elf_Data *symbols = obj->efile.symbols;
  521. if (obj->efile.maps_shndx < 0)
  522. return -EINVAL;
  523. if (!symbols)
  524. return -EINVAL;
  525. scn = elf_getscn(obj->efile.elf, obj->efile.maps_shndx);
  526. if (scn)
  527. data = elf_getdata(scn, NULL);
  528. if (!scn || !data) {
  529. pr_warning("failed to get Elf_Data from map section %d\n",
  530. obj->efile.maps_shndx);
  531. return -EINVAL;
  532. }
  533. /*
  534. * Count number of maps. Each map has a name.
  535. * Array of maps is not supported: only the first element is
  536. * considered.
  537. *
  538. * TODO: Detect array of map and report error.
  539. */
  540. for (i = 0; i < symbols->d_size / sizeof(GElf_Sym); i++) {
  541. GElf_Sym sym;
  542. if (!gelf_getsym(symbols, i, &sym))
  543. continue;
  544. if (sym.st_shndx != obj->efile.maps_shndx)
  545. continue;
  546. nr_maps++;
  547. }
  548. /* Alloc obj->maps and fill nr_maps. */
  549. pr_debug("maps in %s: %d maps in %zd bytes\n", obj->path,
  550. nr_maps, data->d_size);
  551. if (!nr_maps)
  552. return 0;
  553. /* Assume equally sized map definitions */
  554. map_def_sz = data->d_size / nr_maps;
  555. if (!data->d_size || (data->d_size % nr_maps) != 0) {
  556. pr_warning("unable to determine map definition size "
  557. "section %s, %d maps in %zd bytes\n",
  558. obj->path, nr_maps, data->d_size);
  559. return -EINVAL;
  560. }
  561. obj->maps = calloc(nr_maps, sizeof(obj->maps[0]));
  562. if (!obj->maps) {
  563. pr_warning("alloc maps for object failed\n");
  564. return -ENOMEM;
  565. }
  566. obj->nr_maps = nr_maps;
  567. /*
  568. * fill all fd with -1 so won't close incorrect
  569. * fd (fd=0 is stdin) when failure (zclose won't close
  570. * negative fd)).
  571. */
  572. for (i = 0; i < nr_maps; i++)
  573. obj->maps[i].fd = -1;
  574. /*
  575. * Fill obj->maps using data in "maps" section.
  576. */
  577. for (i = 0, map_idx = 0; i < symbols->d_size / sizeof(GElf_Sym); i++) {
  578. GElf_Sym sym;
  579. const char *map_name;
  580. struct bpf_map_def *def;
  581. if (!gelf_getsym(symbols, i, &sym))
  582. continue;
  583. if (sym.st_shndx != obj->efile.maps_shndx)
  584. continue;
  585. map_name = elf_strptr(obj->efile.elf,
  586. obj->efile.strtabidx,
  587. sym.st_name);
  588. obj->maps[map_idx].offset = sym.st_value;
  589. if (sym.st_value + map_def_sz > data->d_size) {
  590. pr_warning("corrupted maps section in %s: last map \"%s\" too small\n",
  591. obj->path, map_name);
  592. return -EINVAL;
  593. }
  594. obj->maps[map_idx].name = strdup(map_name);
  595. if (!obj->maps[map_idx].name) {
  596. pr_warning("failed to alloc map name\n");
  597. return -ENOMEM;
  598. }
  599. pr_debug("map %d is \"%s\"\n", map_idx,
  600. obj->maps[map_idx].name);
  601. def = (struct bpf_map_def *)(data->d_buf + sym.st_value);
  602. /*
  603. * If the definition of the map in the object file fits in
  604. * bpf_map_def, copy it. Any extra fields in our version
  605. * of bpf_map_def will default to zero as a result of the
  606. * calloc above.
  607. */
  608. if (map_def_sz <= sizeof(struct bpf_map_def)) {
  609. memcpy(&obj->maps[map_idx].def, def, map_def_sz);
  610. } else {
  611. /*
  612. * Here the map structure being read is bigger than what
  613. * we expect, truncate if the excess bits are all zero.
  614. * If they are not zero, reject this map as
  615. * incompatible.
  616. */
  617. char *b;
  618. for (b = ((char *)def) + sizeof(struct bpf_map_def);
  619. b < ((char *)def) + map_def_sz; b++) {
  620. if (*b != 0) {
  621. pr_warning("maps section in %s: \"%s\" "
  622. "has unrecognized, non-zero "
  623. "options\n",
  624. obj->path, map_name);
  625. return -EINVAL;
  626. }
  627. }
  628. memcpy(&obj->maps[map_idx].def, def,
  629. sizeof(struct bpf_map_def));
  630. }
  631. map_idx++;
  632. }
  633. qsort(obj->maps, obj->nr_maps, sizeof(obj->maps[0]), compare_bpf_map);
  634. return 0;
  635. }
  636. static int bpf_object__elf_collect(struct bpf_object *obj)
  637. {
  638. Elf *elf = obj->efile.elf;
  639. GElf_Ehdr *ep = &obj->efile.ehdr;
  640. Elf_Scn *scn = NULL;
  641. int idx = 0, err = 0;
  642. /* Elf is corrupted/truncated, avoid calling elf_strptr. */
  643. if (!elf_rawdata(elf_getscn(elf, ep->e_shstrndx), NULL)) {
  644. pr_warning("failed to get e_shstrndx from %s\n",
  645. obj->path);
  646. return -LIBBPF_ERRNO__FORMAT;
  647. }
  648. while ((scn = elf_nextscn(elf, scn)) != NULL) {
  649. char *name;
  650. GElf_Shdr sh;
  651. Elf_Data *data;
  652. idx++;
  653. if (gelf_getshdr(scn, &sh) != &sh) {
  654. pr_warning("failed to get section header from %s\n",
  655. obj->path);
  656. err = -LIBBPF_ERRNO__FORMAT;
  657. goto out;
  658. }
  659. name = elf_strptr(elf, ep->e_shstrndx, sh.sh_name);
  660. if (!name) {
  661. pr_warning("failed to get section name from %s\n",
  662. obj->path);
  663. err = -LIBBPF_ERRNO__FORMAT;
  664. goto out;
  665. }
  666. data = elf_getdata(scn, 0);
  667. if (!data) {
  668. pr_warning("failed to get section data from %s(%s)\n",
  669. name, obj->path);
  670. err = -LIBBPF_ERRNO__FORMAT;
  671. goto out;
  672. }
  673. pr_debug("section %s, size %ld, link %d, flags %lx, type=%d\n",
  674. name, (unsigned long)data->d_size,
  675. (int)sh.sh_link, (unsigned long)sh.sh_flags,
  676. (int)sh.sh_type);
  677. if (strcmp(name, "license") == 0)
  678. err = bpf_object__init_license(obj,
  679. data->d_buf,
  680. data->d_size);
  681. else if (strcmp(name, "version") == 0)
  682. err = bpf_object__init_kversion(obj,
  683. data->d_buf,
  684. data->d_size);
  685. else if (strcmp(name, "maps") == 0)
  686. obj->efile.maps_shndx = idx;
  687. else if (sh.sh_type == SHT_SYMTAB) {
  688. if (obj->efile.symbols) {
  689. pr_warning("bpf: multiple SYMTAB in %s\n",
  690. obj->path);
  691. err = -LIBBPF_ERRNO__FORMAT;
  692. } else {
  693. obj->efile.symbols = data;
  694. obj->efile.strtabidx = sh.sh_link;
  695. }
  696. } else if ((sh.sh_type == SHT_PROGBITS) &&
  697. (sh.sh_flags & SHF_EXECINSTR) &&
  698. (data->d_size > 0)) {
  699. if (strcmp(name, ".text") == 0)
  700. obj->efile.text_shndx = idx;
  701. err = bpf_object__add_program(obj, data->d_buf,
  702. data->d_size, name, idx);
  703. if (err) {
  704. char errmsg[STRERR_BUFSIZE];
  705. strerror_r(-err, errmsg, sizeof(errmsg));
  706. pr_warning("failed to alloc program %s (%s): %s",
  707. name, obj->path, errmsg);
  708. }
  709. } else if (sh.sh_type == SHT_REL) {
  710. void *reloc = obj->efile.reloc;
  711. int nr_reloc = obj->efile.nr_reloc + 1;
  712. reloc = realloc(reloc,
  713. sizeof(*obj->efile.reloc) * nr_reloc);
  714. if (!reloc) {
  715. pr_warning("realloc failed\n");
  716. err = -ENOMEM;
  717. } else {
  718. int n = nr_reloc - 1;
  719. obj->efile.reloc = reloc;
  720. obj->efile.nr_reloc = nr_reloc;
  721. obj->efile.reloc[n].shdr = sh;
  722. obj->efile.reloc[n].data = data;
  723. }
  724. }
  725. if (err)
  726. goto out;
  727. }
  728. if (!obj->efile.strtabidx || obj->efile.strtabidx >= idx) {
  729. pr_warning("Corrupted ELF file: index of strtab invalid\n");
  730. return LIBBPF_ERRNO__FORMAT;
  731. }
  732. if (obj->efile.maps_shndx >= 0) {
  733. err = bpf_object__init_maps(obj);
  734. if (err)
  735. goto out;
  736. }
  737. err = bpf_object__init_prog_names(obj);
  738. out:
  739. return err;
  740. }
  741. static struct bpf_program *
  742. bpf_object__find_prog_by_idx(struct bpf_object *obj, int idx)
  743. {
  744. struct bpf_program *prog;
  745. size_t i;
  746. for (i = 0; i < obj->nr_programs; i++) {
  747. prog = &obj->programs[i];
  748. if (prog->idx == idx)
  749. return prog;
  750. }
  751. return NULL;
  752. }
  753. static int
  754. bpf_program__collect_reloc(struct bpf_program *prog, GElf_Shdr *shdr,
  755. Elf_Data *data, struct bpf_object *obj)
  756. {
  757. Elf_Data *symbols = obj->efile.symbols;
  758. int text_shndx = obj->efile.text_shndx;
  759. int maps_shndx = obj->efile.maps_shndx;
  760. struct bpf_map *maps = obj->maps;
  761. size_t nr_maps = obj->nr_maps;
  762. int i, nrels;
  763. pr_debug("collecting relocating info for: '%s'\n",
  764. prog->section_name);
  765. nrels = shdr->sh_size / shdr->sh_entsize;
  766. prog->reloc_desc = malloc(sizeof(*prog->reloc_desc) * nrels);
  767. if (!prog->reloc_desc) {
  768. pr_warning("failed to alloc memory in relocation\n");
  769. return -ENOMEM;
  770. }
  771. prog->nr_reloc = nrels;
  772. for (i = 0; i < nrels; i++) {
  773. GElf_Sym sym;
  774. GElf_Rel rel;
  775. unsigned int insn_idx;
  776. struct bpf_insn *insns = prog->insns;
  777. size_t map_idx;
  778. if (!gelf_getrel(data, i, &rel)) {
  779. pr_warning("relocation: failed to get %d reloc\n", i);
  780. return -LIBBPF_ERRNO__FORMAT;
  781. }
  782. if (!gelf_getsym(symbols,
  783. GELF_R_SYM(rel.r_info),
  784. &sym)) {
  785. pr_warning("relocation: symbol %"PRIx64" not found\n",
  786. GELF_R_SYM(rel.r_info));
  787. return -LIBBPF_ERRNO__FORMAT;
  788. }
  789. pr_debug("relo for %lld value %lld name %d\n",
  790. (long long) (rel.r_info >> 32),
  791. (long long) sym.st_value, sym.st_name);
  792. if (sym.st_shndx != maps_shndx && sym.st_shndx != text_shndx) {
  793. pr_warning("Program '%s' contains non-map related relo data pointing to section %u\n",
  794. prog->section_name, sym.st_shndx);
  795. return -LIBBPF_ERRNO__RELOC;
  796. }
  797. insn_idx = rel.r_offset / sizeof(struct bpf_insn);
  798. pr_debug("relocation: insn_idx=%u\n", insn_idx);
  799. if (insns[insn_idx].code == (BPF_JMP | BPF_CALL)) {
  800. if (insns[insn_idx].src_reg != BPF_PSEUDO_CALL) {
  801. pr_warning("incorrect bpf_call opcode\n");
  802. return -LIBBPF_ERRNO__RELOC;
  803. }
  804. prog->reloc_desc[i].type = RELO_CALL;
  805. prog->reloc_desc[i].insn_idx = insn_idx;
  806. prog->reloc_desc[i].text_off = sym.st_value;
  807. continue;
  808. }
  809. if (insns[insn_idx].code != (BPF_LD | BPF_IMM | BPF_DW)) {
  810. pr_warning("bpf: relocation: invalid relo for insns[%d].code 0x%x\n",
  811. insn_idx, insns[insn_idx].code);
  812. return -LIBBPF_ERRNO__RELOC;
  813. }
  814. /* TODO: 'maps' is sorted. We can use bsearch to make it faster. */
  815. for (map_idx = 0; map_idx < nr_maps; map_idx++) {
  816. if (maps[map_idx].offset == sym.st_value) {
  817. pr_debug("relocation: find map %zd (%s) for insn %u\n",
  818. map_idx, maps[map_idx].name, insn_idx);
  819. break;
  820. }
  821. }
  822. if (map_idx >= nr_maps) {
  823. pr_warning("bpf relocation: map_idx %d large than %d\n",
  824. (int)map_idx, (int)nr_maps - 1);
  825. return -LIBBPF_ERRNO__RELOC;
  826. }
  827. prog->reloc_desc[i].type = RELO_LD64;
  828. prog->reloc_desc[i].insn_idx = insn_idx;
  829. prog->reloc_desc[i].map_idx = map_idx;
  830. }
  831. return 0;
  832. }
  833. static int
  834. bpf_object__create_maps(struct bpf_object *obj)
  835. {
  836. unsigned int i;
  837. for (i = 0; i < obj->nr_maps; i++) {
  838. struct bpf_map_def *def = &obj->maps[i].def;
  839. int *pfd = &obj->maps[i].fd;
  840. *pfd = bpf_create_map_name(def->type,
  841. obj->maps[i].name,
  842. def->key_size,
  843. def->value_size,
  844. def->max_entries,
  845. def->map_flags);
  846. if (*pfd < 0) {
  847. size_t j;
  848. int err = *pfd;
  849. pr_warning("failed to create map (name: '%s'): %s\n",
  850. obj->maps[i].name,
  851. strerror(errno));
  852. for (j = 0; j < i; j++)
  853. zclose(obj->maps[j].fd);
  854. return err;
  855. }
  856. pr_debug("create map %s: fd=%d\n", obj->maps[i].name, *pfd);
  857. }
  858. return 0;
  859. }
  860. static int
  861. bpf_program__reloc_text(struct bpf_program *prog, struct bpf_object *obj,
  862. struct reloc_desc *relo)
  863. {
  864. struct bpf_insn *insn, *new_insn;
  865. struct bpf_program *text;
  866. size_t new_cnt;
  867. if (relo->type != RELO_CALL)
  868. return -LIBBPF_ERRNO__RELOC;
  869. if (prog->idx == obj->efile.text_shndx) {
  870. pr_warning("relo in .text insn %d into off %d\n",
  871. relo->insn_idx, relo->text_off);
  872. return -LIBBPF_ERRNO__RELOC;
  873. }
  874. if (prog->main_prog_cnt == 0) {
  875. text = bpf_object__find_prog_by_idx(obj, obj->efile.text_shndx);
  876. if (!text) {
  877. pr_warning("no .text section found yet relo into text exist\n");
  878. return -LIBBPF_ERRNO__RELOC;
  879. }
  880. new_cnt = prog->insns_cnt + text->insns_cnt;
  881. new_insn = realloc(prog->insns, new_cnt * sizeof(*insn));
  882. if (!new_insn) {
  883. pr_warning("oom in prog realloc\n");
  884. return -ENOMEM;
  885. }
  886. memcpy(new_insn + prog->insns_cnt, text->insns,
  887. text->insns_cnt * sizeof(*insn));
  888. prog->insns = new_insn;
  889. prog->main_prog_cnt = prog->insns_cnt;
  890. prog->insns_cnt = new_cnt;
  891. }
  892. insn = &prog->insns[relo->insn_idx];
  893. insn->imm += prog->main_prog_cnt - relo->insn_idx;
  894. pr_debug("added %zd insn from %s to prog %s\n",
  895. text->insns_cnt, text->section_name, prog->section_name);
  896. return 0;
  897. }
  898. static int
  899. bpf_program__relocate(struct bpf_program *prog, struct bpf_object *obj)
  900. {
  901. int i, err;
  902. if (!prog || !prog->reloc_desc)
  903. return 0;
  904. for (i = 0; i < prog->nr_reloc; i++) {
  905. if (prog->reloc_desc[i].type == RELO_LD64) {
  906. struct bpf_insn *insns = prog->insns;
  907. int insn_idx, map_idx;
  908. insn_idx = prog->reloc_desc[i].insn_idx;
  909. map_idx = prog->reloc_desc[i].map_idx;
  910. if (insn_idx >= (int)prog->insns_cnt) {
  911. pr_warning("relocation out of range: '%s'\n",
  912. prog->section_name);
  913. return -LIBBPF_ERRNO__RELOC;
  914. }
  915. insns[insn_idx].src_reg = BPF_PSEUDO_MAP_FD;
  916. insns[insn_idx].imm = obj->maps[map_idx].fd;
  917. } else {
  918. err = bpf_program__reloc_text(prog, obj,
  919. &prog->reloc_desc[i]);
  920. if (err)
  921. return err;
  922. }
  923. }
  924. zfree(&prog->reloc_desc);
  925. prog->nr_reloc = 0;
  926. return 0;
  927. }
  928. static int
  929. bpf_object__relocate(struct bpf_object *obj)
  930. {
  931. struct bpf_program *prog;
  932. size_t i;
  933. int err;
  934. for (i = 0; i < obj->nr_programs; i++) {
  935. prog = &obj->programs[i];
  936. err = bpf_program__relocate(prog, obj);
  937. if (err) {
  938. pr_warning("failed to relocate '%s'\n",
  939. prog->section_name);
  940. return err;
  941. }
  942. }
  943. return 0;
  944. }
  945. static int bpf_object__collect_reloc(struct bpf_object *obj)
  946. {
  947. int i, err;
  948. if (!obj_elf_valid(obj)) {
  949. pr_warning("Internal error: elf object is closed\n");
  950. return -LIBBPF_ERRNO__INTERNAL;
  951. }
  952. for (i = 0; i < obj->efile.nr_reloc; i++) {
  953. GElf_Shdr *shdr = &obj->efile.reloc[i].shdr;
  954. Elf_Data *data = obj->efile.reloc[i].data;
  955. int idx = shdr->sh_info;
  956. struct bpf_program *prog;
  957. if (shdr->sh_type != SHT_REL) {
  958. pr_warning("internal error at %d\n", __LINE__);
  959. return -LIBBPF_ERRNO__INTERNAL;
  960. }
  961. prog = bpf_object__find_prog_by_idx(obj, idx);
  962. if (!prog) {
  963. pr_warning("relocation failed: no %d section\n",
  964. idx);
  965. return -LIBBPF_ERRNO__RELOC;
  966. }
  967. err = bpf_program__collect_reloc(prog,
  968. shdr, data,
  969. obj);
  970. if (err)
  971. return err;
  972. }
  973. return 0;
  974. }
  975. static int
  976. load_program(enum bpf_prog_type type, const char *name, struct bpf_insn *insns,
  977. int insns_cnt, char *license, u32 kern_version, int *pfd)
  978. {
  979. int ret;
  980. char *log_buf;
  981. if (!insns || !insns_cnt)
  982. return -EINVAL;
  983. log_buf = malloc(BPF_LOG_BUF_SIZE);
  984. if (!log_buf)
  985. pr_warning("Alloc log buffer for bpf loader error, continue without log\n");
  986. ret = bpf_load_program_name(type, name, insns, insns_cnt, license,
  987. kern_version, log_buf, BPF_LOG_BUF_SIZE);
  988. if (ret >= 0) {
  989. *pfd = ret;
  990. ret = 0;
  991. goto out;
  992. }
  993. ret = -LIBBPF_ERRNO__LOAD;
  994. pr_warning("load bpf program failed: %s\n", strerror(errno));
  995. if (log_buf && log_buf[0] != '\0') {
  996. ret = -LIBBPF_ERRNO__VERIFY;
  997. pr_warning("-- BEGIN DUMP LOG ---\n");
  998. pr_warning("\n%s\n", log_buf);
  999. pr_warning("-- END LOG --\n");
  1000. } else if (insns_cnt >= BPF_MAXINSNS) {
  1001. pr_warning("Program too large (%d insns), at most %d insns\n",
  1002. insns_cnt, BPF_MAXINSNS);
  1003. ret = -LIBBPF_ERRNO__PROG2BIG;
  1004. } else {
  1005. /* Wrong program type? */
  1006. if (type != BPF_PROG_TYPE_KPROBE) {
  1007. int fd;
  1008. fd = bpf_load_program_name(BPF_PROG_TYPE_KPROBE, name,
  1009. insns, insns_cnt, license,
  1010. kern_version, NULL, 0);
  1011. if (fd >= 0) {
  1012. close(fd);
  1013. ret = -LIBBPF_ERRNO__PROGTYPE;
  1014. goto out;
  1015. }
  1016. }
  1017. if (log_buf)
  1018. ret = -LIBBPF_ERRNO__KVER;
  1019. }
  1020. out:
  1021. free(log_buf);
  1022. return ret;
  1023. }
  1024. static int
  1025. bpf_program__load(struct bpf_program *prog,
  1026. char *license, u32 kern_version)
  1027. {
  1028. int err = 0, fd, i;
  1029. if (prog->instances.nr < 0 || !prog->instances.fds) {
  1030. if (prog->preprocessor) {
  1031. pr_warning("Internal error: can't load program '%s'\n",
  1032. prog->section_name);
  1033. return -LIBBPF_ERRNO__INTERNAL;
  1034. }
  1035. prog->instances.fds = malloc(sizeof(int));
  1036. if (!prog->instances.fds) {
  1037. pr_warning("Not enough memory for BPF fds\n");
  1038. return -ENOMEM;
  1039. }
  1040. prog->instances.nr = 1;
  1041. prog->instances.fds[0] = -1;
  1042. }
  1043. if (!prog->preprocessor) {
  1044. if (prog->instances.nr != 1) {
  1045. pr_warning("Program '%s' is inconsistent: nr(%d) != 1\n",
  1046. prog->section_name, prog->instances.nr);
  1047. }
  1048. err = load_program(prog->type, prog->name, prog->insns,
  1049. prog->insns_cnt, license, kern_version, &fd);
  1050. if (!err)
  1051. prog->instances.fds[0] = fd;
  1052. goto out;
  1053. }
  1054. for (i = 0; i < prog->instances.nr; i++) {
  1055. struct bpf_prog_prep_result result;
  1056. bpf_program_prep_t preprocessor = prog->preprocessor;
  1057. bzero(&result, sizeof(result));
  1058. err = preprocessor(prog, i, prog->insns,
  1059. prog->insns_cnt, &result);
  1060. if (err) {
  1061. pr_warning("Preprocessing the %dth instance of program '%s' failed\n",
  1062. i, prog->section_name);
  1063. goto out;
  1064. }
  1065. if (!result.new_insn_ptr || !result.new_insn_cnt) {
  1066. pr_debug("Skip loading the %dth instance of program '%s'\n",
  1067. i, prog->section_name);
  1068. prog->instances.fds[i] = -1;
  1069. if (result.pfd)
  1070. *result.pfd = -1;
  1071. continue;
  1072. }
  1073. err = load_program(prog->type, prog->name,
  1074. result.new_insn_ptr,
  1075. result.new_insn_cnt,
  1076. license, kern_version, &fd);
  1077. if (err) {
  1078. pr_warning("Loading the %dth instance of program '%s' failed\n",
  1079. i, prog->section_name);
  1080. goto out;
  1081. }
  1082. if (result.pfd)
  1083. *result.pfd = fd;
  1084. prog->instances.fds[i] = fd;
  1085. }
  1086. out:
  1087. if (err)
  1088. pr_warning("failed to load program '%s'\n",
  1089. prog->section_name);
  1090. zfree(&prog->insns);
  1091. prog->insns_cnt = 0;
  1092. return err;
  1093. }
  1094. static int
  1095. bpf_object__load_progs(struct bpf_object *obj)
  1096. {
  1097. size_t i;
  1098. int err;
  1099. for (i = 0; i < obj->nr_programs; i++) {
  1100. if (obj->programs[i].idx == obj->efile.text_shndx)
  1101. continue;
  1102. err = bpf_program__load(&obj->programs[i],
  1103. obj->license,
  1104. obj->kern_version);
  1105. if (err)
  1106. return err;
  1107. }
  1108. return 0;
  1109. }
  1110. static int bpf_object__validate(struct bpf_object *obj)
  1111. {
  1112. if (obj->kern_version == 0) {
  1113. pr_warning("%s doesn't provide kernel version\n",
  1114. obj->path);
  1115. return -LIBBPF_ERRNO__KVERSION;
  1116. }
  1117. return 0;
  1118. }
  1119. static struct bpf_object *
  1120. __bpf_object__open(const char *path, void *obj_buf, size_t obj_buf_sz)
  1121. {
  1122. struct bpf_object *obj;
  1123. int err;
  1124. if (elf_version(EV_CURRENT) == EV_NONE) {
  1125. pr_warning("failed to init libelf for %s\n", path);
  1126. return ERR_PTR(-LIBBPF_ERRNO__LIBELF);
  1127. }
  1128. obj = bpf_object__new(path, obj_buf, obj_buf_sz);
  1129. if (IS_ERR(obj))
  1130. return obj;
  1131. CHECK_ERR(bpf_object__elf_init(obj), err, out);
  1132. CHECK_ERR(bpf_object__check_endianness(obj), err, out);
  1133. CHECK_ERR(bpf_object__elf_collect(obj), err, out);
  1134. CHECK_ERR(bpf_object__collect_reloc(obj), err, out);
  1135. CHECK_ERR(bpf_object__validate(obj), err, out);
  1136. bpf_object__elf_finish(obj);
  1137. return obj;
  1138. out:
  1139. bpf_object__close(obj);
  1140. return ERR_PTR(err);
  1141. }
  1142. struct bpf_object *bpf_object__open(const char *path)
  1143. {
  1144. /* param validation */
  1145. if (!path)
  1146. return NULL;
  1147. pr_debug("loading %s\n", path);
  1148. return __bpf_object__open(path, NULL, 0);
  1149. }
  1150. struct bpf_object *bpf_object__open_buffer(void *obj_buf,
  1151. size_t obj_buf_sz,
  1152. const char *name)
  1153. {
  1154. char tmp_name[64];
  1155. /* param validation */
  1156. if (!obj_buf || obj_buf_sz <= 0)
  1157. return NULL;
  1158. if (!name) {
  1159. snprintf(tmp_name, sizeof(tmp_name), "%lx-%lx",
  1160. (unsigned long)obj_buf,
  1161. (unsigned long)obj_buf_sz);
  1162. tmp_name[sizeof(tmp_name) - 1] = '\0';
  1163. name = tmp_name;
  1164. }
  1165. pr_debug("loading object '%s' from buffer\n",
  1166. name);
  1167. return __bpf_object__open(name, obj_buf, obj_buf_sz);
  1168. }
  1169. int bpf_object__unload(struct bpf_object *obj)
  1170. {
  1171. size_t i;
  1172. if (!obj)
  1173. return -EINVAL;
  1174. for (i = 0; i < obj->nr_maps; i++)
  1175. zclose(obj->maps[i].fd);
  1176. for (i = 0; i < obj->nr_programs; i++)
  1177. bpf_program__unload(&obj->programs[i]);
  1178. return 0;
  1179. }
  1180. int bpf_object__load(struct bpf_object *obj)
  1181. {
  1182. int err;
  1183. if (!obj)
  1184. return -EINVAL;
  1185. if (obj->loaded) {
  1186. pr_warning("object should not be loaded twice\n");
  1187. return -EINVAL;
  1188. }
  1189. obj->loaded = true;
  1190. CHECK_ERR(bpf_object__create_maps(obj), err, out);
  1191. CHECK_ERR(bpf_object__relocate(obj), err, out);
  1192. CHECK_ERR(bpf_object__load_progs(obj), err, out);
  1193. return 0;
  1194. out:
  1195. bpf_object__unload(obj);
  1196. pr_warning("failed to load object '%s'\n", obj->path);
  1197. return err;
  1198. }
  1199. static int check_path(const char *path)
  1200. {
  1201. struct statfs st_fs;
  1202. char *dname, *dir;
  1203. int err = 0;
  1204. if (path == NULL)
  1205. return -EINVAL;
  1206. dname = strdup(path);
  1207. if (dname == NULL)
  1208. return -ENOMEM;
  1209. dir = dirname(dname);
  1210. if (statfs(dir, &st_fs)) {
  1211. pr_warning("failed to statfs %s: %s\n", dir, strerror(errno));
  1212. err = -errno;
  1213. }
  1214. free(dname);
  1215. if (!err && st_fs.f_type != BPF_FS_MAGIC) {
  1216. pr_warning("specified path %s is not on BPF FS\n", path);
  1217. err = -EINVAL;
  1218. }
  1219. return err;
  1220. }
  1221. int bpf_program__pin_instance(struct bpf_program *prog, const char *path,
  1222. int instance)
  1223. {
  1224. int err;
  1225. err = check_path(path);
  1226. if (err)
  1227. return err;
  1228. if (prog == NULL) {
  1229. pr_warning("invalid program pointer\n");
  1230. return -EINVAL;
  1231. }
  1232. if (instance < 0 || instance >= prog->instances.nr) {
  1233. pr_warning("invalid prog instance %d of prog %s (max %d)\n",
  1234. instance, prog->section_name, prog->instances.nr);
  1235. return -EINVAL;
  1236. }
  1237. if (bpf_obj_pin(prog->instances.fds[instance], path)) {
  1238. pr_warning("failed to pin program: %s\n", strerror(errno));
  1239. return -errno;
  1240. }
  1241. pr_debug("pinned program '%s'\n", path);
  1242. return 0;
  1243. }
  1244. static int make_dir(const char *path)
  1245. {
  1246. int err = 0;
  1247. if (mkdir(path, 0700) && errno != EEXIST)
  1248. err = -errno;
  1249. if (err)
  1250. pr_warning("failed to mkdir %s: %s\n", path, strerror(-err));
  1251. return err;
  1252. }
  1253. int bpf_program__pin(struct bpf_program *prog, const char *path)
  1254. {
  1255. int i, err;
  1256. err = check_path(path);
  1257. if (err)
  1258. return err;
  1259. if (prog == NULL) {
  1260. pr_warning("invalid program pointer\n");
  1261. return -EINVAL;
  1262. }
  1263. if (prog->instances.nr <= 0) {
  1264. pr_warning("no instances of prog %s to pin\n",
  1265. prog->section_name);
  1266. return -EINVAL;
  1267. }
  1268. err = make_dir(path);
  1269. if (err)
  1270. return err;
  1271. for (i = 0; i < prog->instances.nr; i++) {
  1272. char buf[PATH_MAX];
  1273. int len;
  1274. len = snprintf(buf, PATH_MAX, "%s/%d", path, i);
  1275. if (len < 0)
  1276. return -EINVAL;
  1277. else if (len >= PATH_MAX)
  1278. return -ENAMETOOLONG;
  1279. err = bpf_program__pin_instance(prog, buf, i);
  1280. if (err)
  1281. return err;
  1282. }
  1283. return 0;
  1284. }
  1285. int bpf_map__pin(struct bpf_map *map, const char *path)
  1286. {
  1287. int err;
  1288. err = check_path(path);
  1289. if (err)
  1290. return err;
  1291. if (map == NULL) {
  1292. pr_warning("invalid map pointer\n");
  1293. return -EINVAL;
  1294. }
  1295. if (bpf_obj_pin(map->fd, path)) {
  1296. pr_warning("failed to pin map: %s\n", strerror(errno));
  1297. return -errno;
  1298. }
  1299. pr_debug("pinned map '%s'\n", path);
  1300. return 0;
  1301. }
  1302. int bpf_object__pin(struct bpf_object *obj, const char *path)
  1303. {
  1304. struct bpf_program *prog;
  1305. struct bpf_map *map;
  1306. int err;
  1307. if (!obj)
  1308. return -ENOENT;
  1309. if (!obj->loaded) {
  1310. pr_warning("object not yet loaded; load it first\n");
  1311. return -ENOENT;
  1312. }
  1313. err = make_dir(path);
  1314. if (err)
  1315. return err;
  1316. bpf_map__for_each(map, obj) {
  1317. char buf[PATH_MAX];
  1318. int len;
  1319. len = snprintf(buf, PATH_MAX, "%s/%s", path,
  1320. bpf_map__name(map));
  1321. if (len < 0)
  1322. return -EINVAL;
  1323. else if (len >= PATH_MAX)
  1324. return -ENAMETOOLONG;
  1325. err = bpf_map__pin(map, buf);
  1326. if (err)
  1327. return err;
  1328. }
  1329. bpf_object__for_each_program(prog, obj) {
  1330. char buf[PATH_MAX];
  1331. int len;
  1332. len = snprintf(buf, PATH_MAX, "%s/%s", path,
  1333. prog->section_name);
  1334. if (len < 0)
  1335. return -EINVAL;
  1336. else if (len >= PATH_MAX)
  1337. return -ENAMETOOLONG;
  1338. err = bpf_program__pin(prog, buf);
  1339. if (err)
  1340. return err;
  1341. }
  1342. return 0;
  1343. }
  1344. void bpf_object__close(struct bpf_object *obj)
  1345. {
  1346. size_t i;
  1347. if (!obj)
  1348. return;
  1349. if (obj->clear_priv)
  1350. obj->clear_priv(obj, obj->priv);
  1351. bpf_object__elf_finish(obj);
  1352. bpf_object__unload(obj);
  1353. for (i = 0; i < obj->nr_maps; i++) {
  1354. zfree(&obj->maps[i].name);
  1355. if (obj->maps[i].clear_priv)
  1356. obj->maps[i].clear_priv(&obj->maps[i],
  1357. obj->maps[i].priv);
  1358. obj->maps[i].priv = NULL;
  1359. obj->maps[i].clear_priv = NULL;
  1360. }
  1361. zfree(&obj->maps);
  1362. obj->nr_maps = 0;
  1363. if (obj->programs && obj->nr_programs) {
  1364. for (i = 0; i < obj->nr_programs; i++)
  1365. bpf_program__exit(&obj->programs[i]);
  1366. }
  1367. zfree(&obj->programs);
  1368. list_del(&obj->list);
  1369. free(obj);
  1370. }
  1371. struct bpf_object *
  1372. bpf_object__next(struct bpf_object *prev)
  1373. {
  1374. struct bpf_object *next;
  1375. if (!prev)
  1376. next = list_first_entry(&bpf_objects_list,
  1377. struct bpf_object,
  1378. list);
  1379. else
  1380. next = list_next_entry(prev, list);
  1381. /* Empty list is noticed here so don't need checking on entry. */
  1382. if (&next->list == &bpf_objects_list)
  1383. return NULL;
  1384. return next;
  1385. }
  1386. const char *bpf_object__name(struct bpf_object *obj)
  1387. {
  1388. return obj ? obj->path : ERR_PTR(-EINVAL);
  1389. }
  1390. unsigned int bpf_object__kversion(struct bpf_object *obj)
  1391. {
  1392. return obj ? obj->kern_version : 0;
  1393. }
  1394. int bpf_object__set_priv(struct bpf_object *obj, void *priv,
  1395. bpf_object_clear_priv_t clear_priv)
  1396. {
  1397. if (obj->priv && obj->clear_priv)
  1398. obj->clear_priv(obj, obj->priv);
  1399. obj->priv = priv;
  1400. obj->clear_priv = clear_priv;
  1401. return 0;
  1402. }
  1403. void *bpf_object__priv(struct bpf_object *obj)
  1404. {
  1405. return obj ? obj->priv : ERR_PTR(-EINVAL);
  1406. }
  1407. struct bpf_program *
  1408. bpf_program__next(struct bpf_program *prev, struct bpf_object *obj)
  1409. {
  1410. size_t idx;
  1411. if (!obj->programs)
  1412. return NULL;
  1413. /* First handler */
  1414. if (prev == NULL)
  1415. return &obj->programs[0];
  1416. if (prev->obj != obj) {
  1417. pr_warning("error: program handler doesn't match object\n");
  1418. return NULL;
  1419. }
  1420. idx = (prev - obj->programs) + 1;
  1421. if (idx >= obj->nr_programs)
  1422. return NULL;
  1423. return &obj->programs[idx];
  1424. }
  1425. int bpf_program__set_priv(struct bpf_program *prog, void *priv,
  1426. bpf_program_clear_priv_t clear_priv)
  1427. {
  1428. if (prog->priv && prog->clear_priv)
  1429. prog->clear_priv(prog, prog->priv);
  1430. prog->priv = priv;
  1431. prog->clear_priv = clear_priv;
  1432. return 0;
  1433. }
  1434. void *bpf_program__priv(struct bpf_program *prog)
  1435. {
  1436. return prog ? prog->priv : ERR_PTR(-EINVAL);
  1437. }
  1438. const char *bpf_program__title(struct bpf_program *prog, bool needs_copy)
  1439. {
  1440. const char *title;
  1441. title = prog->section_name;
  1442. if (needs_copy) {
  1443. title = strdup(title);
  1444. if (!title) {
  1445. pr_warning("failed to strdup program title\n");
  1446. return ERR_PTR(-ENOMEM);
  1447. }
  1448. }
  1449. return title;
  1450. }
  1451. int bpf_program__fd(struct bpf_program *prog)
  1452. {
  1453. return bpf_program__nth_fd(prog, 0);
  1454. }
  1455. int bpf_program__set_prep(struct bpf_program *prog, int nr_instances,
  1456. bpf_program_prep_t prep)
  1457. {
  1458. int *instances_fds;
  1459. if (nr_instances <= 0 || !prep)
  1460. return -EINVAL;
  1461. if (prog->instances.nr > 0 || prog->instances.fds) {
  1462. pr_warning("Can't set pre-processor after loading\n");
  1463. return -EINVAL;
  1464. }
  1465. instances_fds = malloc(sizeof(int) * nr_instances);
  1466. if (!instances_fds) {
  1467. pr_warning("alloc memory failed for fds\n");
  1468. return -ENOMEM;
  1469. }
  1470. /* fill all fd with -1 */
  1471. memset(instances_fds, -1, sizeof(int) * nr_instances);
  1472. prog->instances.nr = nr_instances;
  1473. prog->instances.fds = instances_fds;
  1474. prog->preprocessor = prep;
  1475. return 0;
  1476. }
  1477. int bpf_program__nth_fd(struct bpf_program *prog, int n)
  1478. {
  1479. int fd;
  1480. if (n >= prog->instances.nr || n < 0) {
  1481. pr_warning("Can't get the %dth fd from program %s: only %d instances\n",
  1482. n, prog->section_name, prog->instances.nr);
  1483. return -EINVAL;
  1484. }
  1485. fd = prog->instances.fds[n];
  1486. if (fd < 0) {
  1487. pr_warning("%dth instance of program '%s' is invalid\n",
  1488. n, prog->section_name);
  1489. return -ENOENT;
  1490. }
  1491. return fd;
  1492. }
  1493. void bpf_program__set_type(struct bpf_program *prog, enum bpf_prog_type type)
  1494. {
  1495. prog->type = type;
  1496. }
  1497. static bool bpf_program__is_type(struct bpf_program *prog,
  1498. enum bpf_prog_type type)
  1499. {
  1500. return prog ? (prog->type == type) : false;
  1501. }
  1502. #define BPF_PROG_TYPE_FNS(NAME, TYPE) \
  1503. int bpf_program__set_##NAME(struct bpf_program *prog) \
  1504. { \
  1505. if (!prog) \
  1506. return -EINVAL; \
  1507. bpf_program__set_type(prog, TYPE); \
  1508. return 0; \
  1509. } \
  1510. \
  1511. bool bpf_program__is_##NAME(struct bpf_program *prog) \
  1512. { \
  1513. return bpf_program__is_type(prog, TYPE); \
  1514. } \
  1515. BPF_PROG_TYPE_FNS(socket_filter, BPF_PROG_TYPE_SOCKET_FILTER);
  1516. BPF_PROG_TYPE_FNS(kprobe, BPF_PROG_TYPE_KPROBE);
  1517. BPF_PROG_TYPE_FNS(sched_cls, BPF_PROG_TYPE_SCHED_CLS);
  1518. BPF_PROG_TYPE_FNS(sched_act, BPF_PROG_TYPE_SCHED_ACT);
  1519. BPF_PROG_TYPE_FNS(tracepoint, BPF_PROG_TYPE_TRACEPOINT);
  1520. BPF_PROG_TYPE_FNS(xdp, BPF_PROG_TYPE_XDP);
  1521. BPF_PROG_TYPE_FNS(perf_event, BPF_PROG_TYPE_PERF_EVENT);
  1522. #define BPF_PROG_SEC(string, type) { string, sizeof(string) - 1, type }
  1523. static const struct {
  1524. const char *sec;
  1525. size_t len;
  1526. enum bpf_prog_type prog_type;
  1527. } section_names[] = {
  1528. BPF_PROG_SEC("socket", BPF_PROG_TYPE_SOCKET_FILTER),
  1529. BPF_PROG_SEC("kprobe/", BPF_PROG_TYPE_KPROBE),
  1530. BPF_PROG_SEC("kretprobe/", BPF_PROG_TYPE_KPROBE),
  1531. BPF_PROG_SEC("tracepoint/", BPF_PROG_TYPE_TRACEPOINT),
  1532. BPF_PROG_SEC("xdp", BPF_PROG_TYPE_XDP),
  1533. BPF_PROG_SEC("perf_event", BPF_PROG_TYPE_PERF_EVENT),
  1534. BPF_PROG_SEC("cgroup/skb", BPF_PROG_TYPE_CGROUP_SKB),
  1535. BPF_PROG_SEC("cgroup/sock", BPF_PROG_TYPE_CGROUP_SOCK),
  1536. BPF_PROG_SEC("cgroup/dev", BPF_PROG_TYPE_CGROUP_DEVICE),
  1537. BPF_PROG_SEC("sockops", BPF_PROG_TYPE_SOCK_OPS),
  1538. BPF_PROG_SEC("sk_skb", BPF_PROG_TYPE_SK_SKB),
  1539. };
  1540. #undef BPF_PROG_SEC
  1541. static enum bpf_prog_type bpf_program__guess_type(struct bpf_program *prog)
  1542. {
  1543. int i;
  1544. if (!prog->section_name)
  1545. goto err;
  1546. for (i = 0; i < ARRAY_SIZE(section_names); i++)
  1547. if (strncmp(prog->section_name, section_names[i].sec,
  1548. section_names[i].len) == 0)
  1549. return section_names[i].prog_type;
  1550. err:
  1551. pr_warning("failed to guess program type based on section name %s\n",
  1552. prog->section_name);
  1553. return BPF_PROG_TYPE_UNSPEC;
  1554. }
  1555. int bpf_map__fd(struct bpf_map *map)
  1556. {
  1557. return map ? map->fd : -EINVAL;
  1558. }
  1559. const struct bpf_map_def *bpf_map__def(struct bpf_map *map)
  1560. {
  1561. return map ? &map->def : ERR_PTR(-EINVAL);
  1562. }
  1563. const char *bpf_map__name(struct bpf_map *map)
  1564. {
  1565. return map ? map->name : NULL;
  1566. }
  1567. int bpf_map__set_priv(struct bpf_map *map, void *priv,
  1568. bpf_map_clear_priv_t clear_priv)
  1569. {
  1570. if (!map)
  1571. return -EINVAL;
  1572. if (map->priv) {
  1573. if (map->clear_priv)
  1574. map->clear_priv(map, map->priv);
  1575. }
  1576. map->priv = priv;
  1577. map->clear_priv = clear_priv;
  1578. return 0;
  1579. }
  1580. void *bpf_map__priv(struct bpf_map *map)
  1581. {
  1582. return map ? map->priv : ERR_PTR(-EINVAL);
  1583. }
  1584. struct bpf_map *
  1585. bpf_map__next(struct bpf_map *prev, struct bpf_object *obj)
  1586. {
  1587. size_t idx;
  1588. struct bpf_map *s, *e;
  1589. if (!obj || !obj->maps)
  1590. return NULL;
  1591. s = obj->maps;
  1592. e = obj->maps + obj->nr_maps;
  1593. if (prev == NULL)
  1594. return s;
  1595. if ((prev < s) || (prev >= e)) {
  1596. pr_warning("error in %s: map handler doesn't belong to object\n",
  1597. __func__);
  1598. return NULL;
  1599. }
  1600. idx = (prev - obj->maps) + 1;
  1601. if (idx >= obj->nr_maps)
  1602. return NULL;
  1603. return &obj->maps[idx];
  1604. }
  1605. struct bpf_map *
  1606. bpf_object__find_map_by_name(struct bpf_object *obj, const char *name)
  1607. {
  1608. struct bpf_map *pos;
  1609. bpf_map__for_each(pos, obj) {
  1610. if (pos->name && !strcmp(pos->name, name))
  1611. return pos;
  1612. }
  1613. return NULL;
  1614. }
  1615. struct bpf_map *
  1616. bpf_object__find_map_by_offset(struct bpf_object *obj, size_t offset)
  1617. {
  1618. int i;
  1619. for (i = 0; i < obj->nr_maps; i++) {
  1620. if (obj->maps[i].offset == offset)
  1621. return &obj->maps[i];
  1622. }
  1623. return ERR_PTR(-ENOENT);
  1624. }
  1625. long libbpf_get_error(const void *ptr)
  1626. {
  1627. if (IS_ERR(ptr))
  1628. return PTR_ERR(ptr);
  1629. return 0;
  1630. }
  1631. int bpf_prog_load(const char *file, enum bpf_prog_type type,
  1632. struct bpf_object **pobj, int *prog_fd)
  1633. {
  1634. struct bpf_program *prog, *first_prog = NULL;
  1635. struct bpf_object *obj;
  1636. int err;
  1637. obj = bpf_object__open(file);
  1638. if (IS_ERR(obj))
  1639. return -ENOENT;
  1640. bpf_object__for_each_program(prog, obj) {
  1641. /*
  1642. * If type is not specified, try to guess it based on
  1643. * section name.
  1644. */
  1645. if (type == BPF_PROG_TYPE_UNSPEC) {
  1646. type = bpf_program__guess_type(prog);
  1647. if (type == BPF_PROG_TYPE_UNSPEC) {
  1648. bpf_object__close(obj);
  1649. return -EINVAL;
  1650. }
  1651. }
  1652. bpf_program__set_type(prog, type);
  1653. if (prog->idx != obj->efile.text_shndx && !first_prog)
  1654. first_prog = prog;
  1655. }
  1656. if (!first_prog) {
  1657. pr_warning("object file doesn't contain bpf program\n");
  1658. bpf_object__close(obj);
  1659. return -ENOENT;
  1660. }
  1661. err = bpf_object__load(obj);
  1662. if (err) {
  1663. bpf_object__close(obj);
  1664. return -EINVAL;
  1665. }
  1666. *pobj = obj;
  1667. *prog_fd = bpf_program__fd(first_prog);
  1668. return 0;
  1669. }