libbpf.c 44 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985
  1. /*
  2. * Common eBPF ELF object loading operations.
  3. *
  4. * Copyright (C) 2013-2015 Alexei Starovoitov <ast@kernel.org>
  5. * Copyright (C) 2015 Wang Nan <wangnan0@huawei.com>
  6. * Copyright (C) 2015 Huawei Inc.
  7. * Copyright (C) 2017 Nicira, Inc.
  8. *
  9. * This program is free software; you can redistribute it and/or
  10. * modify it under the terms of the GNU Lesser General Public
  11. * License as published by the Free Software Foundation;
  12. * version 2.1 of the License (not later!)
  13. *
  14. * This program is distributed in the hope that it will be useful,
  15. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  16. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  17. * GNU Lesser General Public License for more details.
  18. *
  19. * You should have received a copy of the GNU Lesser General Public
  20. * License along with this program; if not, see <http://www.gnu.org/licenses>
  21. */
  22. #include <stdlib.h>
  23. #include <stdio.h>
  24. #include <stdarg.h>
  25. #include <libgen.h>
  26. #include <inttypes.h>
  27. #include <string.h>
  28. #include <unistd.h>
  29. #include <fcntl.h>
  30. #include <errno.h>
  31. #include <asm/unistd.h>
  32. #include <linux/err.h>
  33. #include <linux/kernel.h>
  34. #include <linux/bpf.h>
  35. #include <linux/list.h>
  36. #include <linux/limits.h>
  37. #include <sys/stat.h>
  38. #include <sys/types.h>
  39. #include <sys/vfs.h>
  40. #include <libelf.h>
  41. #include <gelf.h>
  42. #include "libbpf.h"
  43. #include "bpf.h"
  44. #ifndef EM_BPF
  45. #define EM_BPF 247
  46. #endif
  47. #ifndef BPF_FS_MAGIC
  48. #define BPF_FS_MAGIC 0xcafe4a11
  49. #endif
  50. #define __printf(a, b) __attribute__((format(printf, a, b)))
  51. __printf(1, 2)
  52. static int __base_pr(const char *format, ...)
  53. {
  54. va_list args;
  55. int err;
  56. va_start(args, format);
  57. err = vfprintf(stderr, format, args);
  58. va_end(args);
  59. return err;
  60. }
  61. static __printf(1, 2) libbpf_print_fn_t __pr_warning = __base_pr;
  62. static __printf(1, 2) libbpf_print_fn_t __pr_info = __base_pr;
  63. static __printf(1, 2) libbpf_print_fn_t __pr_debug;
  64. #define __pr(func, fmt, ...) \
  65. do { \
  66. if ((func)) \
  67. (func)("libbpf: " fmt, ##__VA_ARGS__); \
  68. } while (0)
  69. #define pr_warning(fmt, ...) __pr(__pr_warning, fmt, ##__VA_ARGS__)
  70. #define pr_info(fmt, ...) __pr(__pr_info, fmt, ##__VA_ARGS__)
  71. #define pr_debug(fmt, ...) __pr(__pr_debug, fmt, ##__VA_ARGS__)
  72. void libbpf_set_print(libbpf_print_fn_t warn,
  73. libbpf_print_fn_t info,
  74. libbpf_print_fn_t debug)
  75. {
  76. __pr_warning = warn;
  77. __pr_info = info;
  78. __pr_debug = debug;
  79. }
  80. #define STRERR_BUFSIZE 128
  81. #define ERRNO_OFFSET(e) ((e) - __LIBBPF_ERRNO__START)
  82. #define ERRCODE_OFFSET(c) ERRNO_OFFSET(LIBBPF_ERRNO__##c)
  83. #define NR_ERRNO (__LIBBPF_ERRNO__END - __LIBBPF_ERRNO__START)
  84. static const char *libbpf_strerror_table[NR_ERRNO] = {
  85. [ERRCODE_OFFSET(LIBELF)] = "Something wrong in libelf",
  86. [ERRCODE_OFFSET(FORMAT)] = "BPF object format invalid",
  87. [ERRCODE_OFFSET(KVERSION)] = "'version' section incorrect or lost",
  88. [ERRCODE_OFFSET(ENDIAN)] = "Endian mismatch",
  89. [ERRCODE_OFFSET(INTERNAL)] = "Internal error in libbpf",
  90. [ERRCODE_OFFSET(RELOC)] = "Relocation failed",
  91. [ERRCODE_OFFSET(VERIFY)] = "Kernel verifier blocks program loading",
  92. [ERRCODE_OFFSET(PROG2BIG)] = "Program too big",
  93. [ERRCODE_OFFSET(KVER)] = "Incorrect kernel version",
  94. [ERRCODE_OFFSET(PROGTYPE)] = "Kernel doesn't support this program type",
  95. [ERRCODE_OFFSET(WRNGPID)] = "Wrong pid in netlink message",
  96. [ERRCODE_OFFSET(INVSEQ)] = "Invalid netlink sequence",
  97. };
  98. int libbpf_strerror(int err, char *buf, size_t size)
  99. {
  100. if (!buf || !size)
  101. return -1;
  102. err = err > 0 ? err : -err;
  103. if (err < __LIBBPF_ERRNO__START) {
  104. int ret;
  105. ret = strerror_r(err, buf, size);
  106. buf[size - 1] = '\0';
  107. return ret;
  108. }
  109. if (err < __LIBBPF_ERRNO__END) {
  110. const char *msg;
  111. msg = libbpf_strerror_table[ERRNO_OFFSET(err)];
  112. snprintf(buf, size, "%s", msg);
  113. buf[size - 1] = '\0';
  114. return 0;
  115. }
  116. snprintf(buf, size, "Unknown libbpf error %d", err);
  117. buf[size - 1] = '\0';
  118. return -1;
  119. }
  120. #define CHECK_ERR(action, err, out) do { \
  121. err = action; \
  122. if (err) \
  123. goto out; \
  124. } while(0)
  125. /* Copied from tools/perf/util/util.h */
  126. #ifndef zfree
  127. # define zfree(ptr) ({ free(*ptr); *ptr = NULL; })
  128. #endif
  129. #ifndef zclose
  130. # define zclose(fd) ({ \
  131. int ___err = 0; \
  132. if ((fd) >= 0) \
  133. ___err = close((fd)); \
  134. fd = -1; \
  135. ___err; })
  136. #endif
  137. #ifdef HAVE_LIBELF_MMAP_SUPPORT
  138. # define LIBBPF_ELF_C_READ_MMAP ELF_C_READ_MMAP
  139. #else
  140. # define LIBBPF_ELF_C_READ_MMAP ELF_C_READ
  141. #endif
  142. /*
  143. * bpf_prog should be a better name but it has been used in
  144. * linux/filter.h.
  145. */
  146. struct bpf_program {
  147. /* Index in elf obj file, for relocation use. */
  148. int idx;
  149. char *name;
  150. char *section_name;
  151. struct bpf_insn *insns;
  152. size_t insns_cnt, main_prog_cnt;
  153. enum bpf_prog_type type;
  154. struct reloc_desc {
  155. enum {
  156. RELO_LD64,
  157. RELO_CALL,
  158. } type;
  159. int insn_idx;
  160. union {
  161. int map_idx;
  162. int text_off;
  163. };
  164. } *reloc_desc;
  165. int nr_reloc;
  166. struct {
  167. int nr;
  168. int *fds;
  169. } instances;
  170. bpf_program_prep_t preprocessor;
  171. struct bpf_object *obj;
  172. void *priv;
  173. bpf_program_clear_priv_t clear_priv;
  174. };
  175. struct bpf_map {
  176. int fd;
  177. char *name;
  178. size_t offset;
  179. struct bpf_map_def def;
  180. void *priv;
  181. bpf_map_clear_priv_t clear_priv;
  182. };
  183. static LIST_HEAD(bpf_objects_list);
  184. struct bpf_object {
  185. char license[64];
  186. u32 kern_version;
  187. struct bpf_program *programs;
  188. size_t nr_programs;
  189. struct bpf_map *maps;
  190. size_t nr_maps;
  191. bool loaded;
  192. /*
  193. * Information when doing elf related work. Only valid if fd
  194. * is valid.
  195. */
  196. struct {
  197. int fd;
  198. void *obj_buf;
  199. size_t obj_buf_sz;
  200. Elf *elf;
  201. GElf_Ehdr ehdr;
  202. Elf_Data *symbols;
  203. size_t strtabidx;
  204. struct {
  205. GElf_Shdr shdr;
  206. Elf_Data *data;
  207. } *reloc;
  208. int nr_reloc;
  209. int maps_shndx;
  210. int text_shndx;
  211. } efile;
  212. /*
  213. * All loaded bpf_object is linked in a list, which is
  214. * hidden to caller. bpf_objects__<func> handlers deal with
  215. * all objects.
  216. */
  217. struct list_head list;
  218. void *priv;
  219. bpf_object_clear_priv_t clear_priv;
  220. char path[];
  221. };
  222. #define obj_elf_valid(o) ((o)->efile.elf)
  223. static void bpf_program__unload(struct bpf_program *prog)
  224. {
  225. int i;
  226. if (!prog)
  227. return;
  228. /*
  229. * If the object is opened but the program was never loaded,
  230. * it is possible that prog->instances.nr == -1.
  231. */
  232. if (prog->instances.nr > 0) {
  233. for (i = 0; i < prog->instances.nr; i++)
  234. zclose(prog->instances.fds[i]);
  235. } else if (prog->instances.nr != -1) {
  236. pr_warning("Internal error: instances.nr is %d\n",
  237. prog->instances.nr);
  238. }
  239. prog->instances.nr = -1;
  240. zfree(&prog->instances.fds);
  241. }
  242. static void bpf_program__exit(struct bpf_program *prog)
  243. {
  244. if (!prog)
  245. return;
  246. if (prog->clear_priv)
  247. prog->clear_priv(prog, prog->priv);
  248. prog->priv = NULL;
  249. prog->clear_priv = NULL;
  250. bpf_program__unload(prog);
  251. zfree(&prog->name);
  252. zfree(&prog->section_name);
  253. zfree(&prog->insns);
  254. zfree(&prog->reloc_desc);
  255. prog->nr_reloc = 0;
  256. prog->insns_cnt = 0;
  257. prog->idx = -1;
  258. }
  259. static int
  260. bpf_program__init(void *data, size_t size, char *section_name, int idx,
  261. struct bpf_program *prog)
  262. {
  263. if (size < sizeof(struct bpf_insn)) {
  264. pr_warning("corrupted section '%s'\n", section_name);
  265. return -EINVAL;
  266. }
  267. bzero(prog, sizeof(*prog));
  268. prog->section_name = strdup(section_name);
  269. if (!prog->section_name) {
  270. pr_warning("failed to alloc name for prog under section %s\n",
  271. section_name);
  272. goto errout;
  273. }
  274. prog->insns = malloc(size);
  275. if (!prog->insns) {
  276. pr_warning("failed to alloc insns for prog under section %s\n",
  277. section_name);
  278. goto errout;
  279. }
  280. prog->insns_cnt = size / sizeof(struct bpf_insn);
  281. memcpy(prog->insns, data,
  282. prog->insns_cnt * sizeof(struct bpf_insn));
  283. prog->idx = idx;
  284. prog->instances.fds = NULL;
  285. prog->instances.nr = -1;
  286. prog->type = BPF_PROG_TYPE_KPROBE;
  287. return 0;
  288. errout:
  289. bpf_program__exit(prog);
  290. return -ENOMEM;
  291. }
  292. static int
  293. bpf_object__add_program(struct bpf_object *obj, void *data, size_t size,
  294. char *section_name, int idx)
  295. {
  296. struct bpf_program prog, *progs;
  297. int nr_progs, err;
  298. err = bpf_program__init(data, size, section_name, idx, &prog);
  299. if (err)
  300. return err;
  301. progs = obj->programs;
  302. nr_progs = obj->nr_programs;
  303. progs = realloc(progs, sizeof(progs[0]) * (nr_progs + 1));
  304. if (!progs) {
  305. /*
  306. * In this case the original obj->programs
  307. * is still valid, so don't need special treat for
  308. * bpf_close_object().
  309. */
  310. pr_warning("failed to alloc a new program under section '%s'\n",
  311. section_name);
  312. bpf_program__exit(&prog);
  313. return -ENOMEM;
  314. }
  315. pr_debug("found program %s\n", prog.section_name);
  316. obj->programs = progs;
  317. obj->nr_programs = nr_progs + 1;
  318. prog.obj = obj;
  319. progs[nr_progs] = prog;
  320. return 0;
  321. }
  322. static int
  323. bpf_object__init_prog_names(struct bpf_object *obj)
  324. {
  325. Elf_Data *symbols = obj->efile.symbols;
  326. struct bpf_program *prog;
  327. size_t pi, si;
  328. for (pi = 0; pi < obj->nr_programs; pi++) {
  329. const char *name = NULL;
  330. prog = &obj->programs[pi];
  331. if (prog->idx == obj->efile.text_shndx) {
  332. name = ".text";
  333. goto skip_search;
  334. }
  335. for (si = 0; si < symbols->d_size / sizeof(GElf_Sym) && !name;
  336. si++) {
  337. GElf_Sym sym;
  338. if (!gelf_getsym(symbols, si, &sym))
  339. continue;
  340. if (sym.st_shndx != prog->idx)
  341. continue;
  342. if (GELF_ST_BIND(sym.st_info) != STB_GLOBAL)
  343. continue;
  344. name = elf_strptr(obj->efile.elf,
  345. obj->efile.strtabidx,
  346. sym.st_name);
  347. if (!name) {
  348. pr_warning("failed to get sym name string for prog %s\n",
  349. prog->section_name);
  350. return -LIBBPF_ERRNO__LIBELF;
  351. }
  352. }
  353. if (!name) {
  354. pr_warning("failed to find sym for prog %s\n",
  355. prog->section_name);
  356. return -EINVAL;
  357. }
  358. skip_search:
  359. prog->name = strdup(name);
  360. if (!prog->name) {
  361. pr_warning("failed to allocate memory for prog sym %s\n",
  362. name);
  363. return -ENOMEM;
  364. }
  365. }
  366. return 0;
  367. }
  368. static struct bpf_object *bpf_object__new(const char *path,
  369. void *obj_buf,
  370. size_t obj_buf_sz)
  371. {
  372. struct bpf_object *obj;
  373. obj = calloc(1, sizeof(struct bpf_object) + strlen(path) + 1);
  374. if (!obj) {
  375. pr_warning("alloc memory failed for %s\n", path);
  376. return ERR_PTR(-ENOMEM);
  377. }
  378. strcpy(obj->path, path);
  379. obj->efile.fd = -1;
  380. /*
  381. * Caller of this function should also calls
  382. * bpf_object__elf_finish() after data collection to return
  383. * obj_buf to user. If not, we should duplicate the buffer to
  384. * avoid user freeing them before elf finish.
  385. */
  386. obj->efile.obj_buf = obj_buf;
  387. obj->efile.obj_buf_sz = obj_buf_sz;
  388. obj->efile.maps_shndx = -1;
  389. obj->loaded = false;
  390. INIT_LIST_HEAD(&obj->list);
  391. list_add(&obj->list, &bpf_objects_list);
  392. return obj;
  393. }
  394. static void bpf_object__elf_finish(struct bpf_object *obj)
  395. {
  396. if (!obj_elf_valid(obj))
  397. return;
  398. if (obj->efile.elf) {
  399. elf_end(obj->efile.elf);
  400. obj->efile.elf = NULL;
  401. }
  402. obj->efile.symbols = NULL;
  403. zfree(&obj->efile.reloc);
  404. obj->efile.nr_reloc = 0;
  405. zclose(obj->efile.fd);
  406. obj->efile.obj_buf = NULL;
  407. obj->efile.obj_buf_sz = 0;
  408. }
  409. static int bpf_object__elf_init(struct bpf_object *obj)
  410. {
  411. int err = 0;
  412. GElf_Ehdr *ep;
  413. if (obj_elf_valid(obj)) {
  414. pr_warning("elf init: internal error\n");
  415. return -LIBBPF_ERRNO__LIBELF;
  416. }
  417. if (obj->efile.obj_buf_sz > 0) {
  418. /*
  419. * obj_buf should have been validated by
  420. * bpf_object__open_buffer().
  421. */
  422. obj->efile.elf = elf_memory(obj->efile.obj_buf,
  423. obj->efile.obj_buf_sz);
  424. } else {
  425. obj->efile.fd = open(obj->path, O_RDONLY);
  426. if (obj->efile.fd < 0) {
  427. pr_warning("failed to open %s: %s\n", obj->path,
  428. strerror(errno));
  429. return -errno;
  430. }
  431. obj->efile.elf = elf_begin(obj->efile.fd,
  432. LIBBPF_ELF_C_READ_MMAP,
  433. NULL);
  434. }
  435. if (!obj->efile.elf) {
  436. pr_warning("failed to open %s as ELF file\n",
  437. obj->path);
  438. err = -LIBBPF_ERRNO__LIBELF;
  439. goto errout;
  440. }
  441. if (!gelf_getehdr(obj->efile.elf, &obj->efile.ehdr)) {
  442. pr_warning("failed to get EHDR from %s\n",
  443. obj->path);
  444. err = -LIBBPF_ERRNO__FORMAT;
  445. goto errout;
  446. }
  447. ep = &obj->efile.ehdr;
  448. /* Old LLVM set e_machine to EM_NONE */
  449. if ((ep->e_type != ET_REL) || (ep->e_machine && (ep->e_machine != EM_BPF))) {
  450. pr_warning("%s is not an eBPF object file\n",
  451. obj->path);
  452. err = -LIBBPF_ERRNO__FORMAT;
  453. goto errout;
  454. }
  455. return 0;
  456. errout:
  457. bpf_object__elf_finish(obj);
  458. return err;
  459. }
  460. static int
  461. bpf_object__check_endianness(struct bpf_object *obj)
  462. {
  463. static unsigned int const endian = 1;
  464. switch (obj->efile.ehdr.e_ident[EI_DATA]) {
  465. case ELFDATA2LSB:
  466. /* We are big endian, BPF obj is little endian. */
  467. if (*(unsigned char const *)&endian != 1)
  468. goto mismatch;
  469. break;
  470. case ELFDATA2MSB:
  471. /* We are little endian, BPF obj is big endian. */
  472. if (*(unsigned char const *)&endian != 0)
  473. goto mismatch;
  474. break;
  475. default:
  476. return -LIBBPF_ERRNO__ENDIAN;
  477. }
  478. return 0;
  479. mismatch:
  480. pr_warning("Error: endianness mismatch.\n");
  481. return -LIBBPF_ERRNO__ENDIAN;
  482. }
  483. static int
  484. bpf_object__init_license(struct bpf_object *obj,
  485. void *data, size_t size)
  486. {
  487. memcpy(obj->license, data,
  488. min(size, sizeof(obj->license) - 1));
  489. pr_debug("license of %s is %s\n", obj->path, obj->license);
  490. return 0;
  491. }
  492. static int
  493. bpf_object__init_kversion(struct bpf_object *obj,
  494. void *data, size_t size)
  495. {
  496. u32 kver;
  497. if (size != sizeof(kver)) {
  498. pr_warning("invalid kver section in %s\n", obj->path);
  499. return -LIBBPF_ERRNO__FORMAT;
  500. }
  501. memcpy(&kver, data, sizeof(kver));
  502. obj->kern_version = kver;
  503. pr_debug("kernel version of %s is %x\n", obj->path,
  504. obj->kern_version);
  505. return 0;
  506. }
  507. static int compare_bpf_map(const void *_a, const void *_b)
  508. {
  509. const struct bpf_map *a = _a;
  510. const struct bpf_map *b = _b;
  511. return a->offset - b->offset;
  512. }
  513. static int
  514. bpf_object__init_maps(struct bpf_object *obj)
  515. {
  516. int i, map_idx, map_def_sz, nr_maps = 0;
  517. Elf_Scn *scn;
  518. Elf_Data *data;
  519. Elf_Data *symbols = obj->efile.symbols;
  520. if (obj->efile.maps_shndx < 0)
  521. return -EINVAL;
  522. if (!symbols)
  523. return -EINVAL;
  524. scn = elf_getscn(obj->efile.elf, obj->efile.maps_shndx);
  525. if (scn)
  526. data = elf_getdata(scn, NULL);
  527. if (!scn || !data) {
  528. pr_warning("failed to get Elf_Data from map section %d\n",
  529. obj->efile.maps_shndx);
  530. return -EINVAL;
  531. }
  532. /*
  533. * Count number of maps. Each map has a name.
  534. * Array of maps is not supported: only the first element is
  535. * considered.
  536. *
  537. * TODO: Detect array of map and report error.
  538. */
  539. for (i = 0; i < symbols->d_size / sizeof(GElf_Sym); i++) {
  540. GElf_Sym sym;
  541. if (!gelf_getsym(symbols, i, &sym))
  542. continue;
  543. if (sym.st_shndx != obj->efile.maps_shndx)
  544. continue;
  545. nr_maps++;
  546. }
  547. /* Alloc obj->maps and fill nr_maps. */
  548. pr_debug("maps in %s: %d maps in %zd bytes\n", obj->path,
  549. nr_maps, data->d_size);
  550. if (!nr_maps)
  551. return 0;
  552. /* Assume equally sized map definitions */
  553. map_def_sz = data->d_size / nr_maps;
  554. if (!data->d_size || (data->d_size % nr_maps) != 0) {
  555. pr_warning("unable to determine map definition size "
  556. "section %s, %d maps in %zd bytes\n",
  557. obj->path, nr_maps, data->d_size);
  558. return -EINVAL;
  559. }
  560. obj->maps = calloc(nr_maps, sizeof(obj->maps[0]));
  561. if (!obj->maps) {
  562. pr_warning("alloc maps for object failed\n");
  563. return -ENOMEM;
  564. }
  565. obj->nr_maps = nr_maps;
  566. /*
  567. * fill all fd with -1 so won't close incorrect
  568. * fd (fd=0 is stdin) when failure (zclose won't close
  569. * negative fd)).
  570. */
  571. for (i = 0; i < nr_maps; i++)
  572. obj->maps[i].fd = -1;
  573. /*
  574. * Fill obj->maps using data in "maps" section.
  575. */
  576. for (i = 0, map_idx = 0; i < symbols->d_size / sizeof(GElf_Sym); i++) {
  577. GElf_Sym sym;
  578. const char *map_name;
  579. struct bpf_map_def *def;
  580. if (!gelf_getsym(symbols, i, &sym))
  581. continue;
  582. if (sym.st_shndx != obj->efile.maps_shndx)
  583. continue;
  584. map_name = elf_strptr(obj->efile.elf,
  585. obj->efile.strtabidx,
  586. sym.st_name);
  587. obj->maps[map_idx].offset = sym.st_value;
  588. if (sym.st_value + map_def_sz > data->d_size) {
  589. pr_warning("corrupted maps section in %s: last map \"%s\" too small\n",
  590. obj->path, map_name);
  591. return -EINVAL;
  592. }
  593. obj->maps[map_idx].name = strdup(map_name);
  594. if (!obj->maps[map_idx].name) {
  595. pr_warning("failed to alloc map name\n");
  596. return -ENOMEM;
  597. }
  598. pr_debug("map %d is \"%s\"\n", map_idx,
  599. obj->maps[map_idx].name);
  600. def = (struct bpf_map_def *)(data->d_buf + sym.st_value);
  601. /*
  602. * If the definition of the map in the object file fits in
  603. * bpf_map_def, copy it. Any extra fields in our version
  604. * of bpf_map_def will default to zero as a result of the
  605. * calloc above.
  606. */
  607. if (map_def_sz <= sizeof(struct bpf_map_def)) {
  608. memcpy(&obj->maps[map_idx].def, def, map_def_sz);
  609. } else {
  610. /*
  611. * Here the map structure being read is bigger than what
  612. * we expect, truncate if the excess bits are all zero.
  613. * If they are not zero, reject this map as
  614. * incompatible.
  615. */
  616. char *b;
  617. for (b = ((char *)def) + sizeof(struct bpf_map_def);
  618. b < ((char *)def) + map_def_sz; b++) {
  619. if (*b != 0) {
  620. pr_warning("maps section in %s: \"%s\" "
  621. "has unrecognized, non-zero "
  622. "options\n",
  623. obj->path, map_name);
  624. return -EINVAL;
  625. }
  626. }
  627. memcpy(&obj->maps[map_idx].def, def,
  628. sizeof(struct bpf_map_def));
  629. }
  630. map_idx++;
  631. }
  632. qsort(obj->maps, obj->nr_maps, sizeof(obj->maps[0]), compare_bpf_map);
  633. return 0;
  634. }
  635. static int bpf_object__elf_collect(struct bpf_object *obj)
  636. {
  637. Elf *elf = obj->efile.elf;
  638. GElf_Ehdr *ep = &obj->efile.ehdr;
  639. Elf_Scn *scn = NULL;
  640. int idx = 0, err = 0;
  641. /* Elf is corrupted/truncated, avoid calling elf_strptr. */
  642. if (!elf_rawdata(elf_getscn(elf, ep->e_shstrndx), NULL)) {
  643. pr_warning("failed to get e_shstrndx from %s\n",
  644. obj->path);
  645. return -LIBBPF_ERRNO__FORMAT;
  646. }
  647. while ((scn = elf_nextscn(elf, scn)) != NULL) {
  648. char *name;
  649. GElf_Shdr sh;
  650. Elf_Data *data;
  651. idx++;
  652. if (gelf_getshdr(scn, &sh) != &sh) {
  653. pr_warning("failed to get section header from %s\n",
  654. obj->path);
  655. err = -LIBBPF_ERRNO__FORMAT;
  656. goto out;
  657. }
  658. name = elf_strptr(elf, ep->e_shstrndx, sh.sh_name);
  659. if (!name) {
  660. pr_warning("failed to get section name from %s\n",
  661. obj->path);
  662. err = -LIBBPF_ERRNO__FORMAT;
  663. goto out;
  664. }
  665. data = elf_getdata(scn, 0);
  666. if (!data) {
  667. pr_warning("failed to get section data from %s(%s)\n",
  668. name, obj->path);
  669. err = -LIBBPF_ERRNO__FORMAT;
  670. goto out;
  671. }
  672. pr_debug("section %s, size %ld, link %d, flags %lx, type=%d\n",
  673. name, (unsigned long)data->d_size,
  674. (int)sh.sh_link, (unsigned long)sh.sh_flags,
  675. (int)sh.sh_type);
  676. if (strcmp(name, "license") == 0)
  677. err = bpf_object__init_license(obj,
  678. data->d_buf,
  679. data->d_size);
  680. else if (strcmp(name, "version") == 0)
  681. err = bpf_object__init_kversion(obj,
  682. data->d_buf,
  683. data->d_size);
  684. else if (strcmp(name, "maps") == 0)
  685. obj->efile.maps_shndx = idx;
  686. else if (sh.sh_type == SHT_SYMTAB) {
  687. if (obj->efile.symbols) {
  688. pr_warning("bpf: multiple SYMTAB in %s\n",
  689. obj->path);
  690. err = -LIBBPF_ERRNO__FORMAT;
  691. } else {
  692. obj->efile.symbols = data;
  693. obj->efile.strtabidx = sh.sh_link;
  694. }
  695. } else if ((sh.sh_type == SHT_PROGBITS) &&
  696. (sh.sh_flags & SHF_EXECINSTR) &&
  697. (data->d_size > 0)) {
  698. if (strcmp(name, ".text") == 0)
  699. obj->efile.text_shndx = idx;
  700. err = bpf_object__add_program(obj, data->d_buf,
  701. data->d_size, name, idx);
  702. if (err) {
  703. char errmsg[STRERR_BUFSIZE];
  704. strerror_r(-err, errmsg, sizeof(errmsg));
  705. pr_warning("failed to alloc program %s (%s): %s",
  706. name, obj->path, errmsg);
  707. }
  708. } else if (sh.sh_type == SHT_REL) {
  709. void *reloc = obj->efile.reloc;
  710. int nr_reloc = obj->efile.nr_reloc + 1;
  711. reloc = realloc(reloc,
  712. sizeof(*obj->efile.reloc) * nr_reloc);
  713. if (!reloc) {
  714. pr_warning("realloc failed\n");
  715. err = -ENOMEM;
  716. } else {
  717. int n = nr_reloc - 1;
  718. obj->efile.reloc = reloc;
  719. obj->efile.nr_reloc = nr_reloc;
  720. obj->efile.reloc[n].shdr = sh;
  721. obj->efile.reloc[n].data = data;
  722. }
  723. }
  724. if (err)
  725. goto out;
  726. }
  727. if (!obj->efile.strtabidx || obj->efile.strtabidx >= idx) {
  728. pr_warning("Corrupted ELF file: index of strtab invalid\n");
  729. return LIBBPF_ERRNO__FORMAT;
  730. }
  731. if (obj->efile.maps_shndx >= 0) {
  732. err = bpf_object__init_maps(obj);
  733. if (err)
  734. goto out;
  735. }
  736. err = bpf_object__init_prog_names(obj);
  737. out:
  738. return err;
  739. }
  740. static struct bpf_program *
  741. bpf_object__find_prog_by_idx(struct bpf_object *obj, int idx)
  742. {
  743. struct bpf_program *prog;
  744. size_t i;
  745. for (i = 0; i < obj->nr_programs; i++) {
  746. prog = &obj->programs[i];
  747. if (prog->idx == idx)
  748. return prog;
  749. }
  750. return NULL;
  751. }
  752. static int
  753. bpf_program__collect_reloc(struct bpf_program *prog, GElf_Shdr *shdr,
  754. Elf_Data *data, struct bpf_object *obj)
  755. {
  756. Elf_Data *symbols = obj->efile.symbols;
  757. int text_shndx = obj->efile.text_shndx;
  758. int maps_shndx = obj->efile.maps_shndx;
  759. struct bpf_map *maps = obj->maps;
  760. size_t nr_maps = obj->nr_maps;
  761. int i, nrels;
  762. pr_debug("collecting relocating info for: '%s'\n",
  763. prog->section_name);
  764. nrels = shdr->sh_size / shdr->sh_entsize;
  765. prog->reloc_desc = malloc(sizeof(*prog->reloc_desc) * nrels);
  766. if (!prog->reloc_desc) {
  767. pr_warning("failed to alloc memory in relocation\n");
  768. return -ENOMEM;
  769. }
  770. prog->nr_reloc = nrels;
  771. for (i = 0; i < nrels; i++) {
  772. GElf_Sym sym;
  773. GElf_Rel rel;
  774. unsigned int insn_idx;
  775. struct bpf_insn *insns = prog->insns;
  776. size_t map_idx;
  777. if (!gelf_getrel(data, i, &rel)) {
  778. pr_warning("relocation: failed to get %d reloc\n", i);
  779. return -LIBBPF_ERRNO__FORMAT;
  780. }
  781. if (!gelf_getsym(symbols,
  782. GELF_R_SYM(rel.r_info),
  783. &sym)) {
  784. pr_warning("relocation: symbol %"PRIx64" not found\n",
  785. GELF_R_SYM(rel.r_info));
  786. return -LIBBPF_ERRNO__FORMAT;
  787. }
  788. pr_debug("relo for %lld value %lld name %d\n",
  789. (long long) (rel.r_info >> 32),
  790. (long long) sym.st_value, sym.st_name);
  791. if (sym.st_shndx != maps_shndx && sym.st_shndx != text_shndx) {
  792. pr_warning("Program '%s' contains non-map related relo data pointing to section %u\n",
  793. prog->section_name, sym.st_shndx);
  794. return -LIBBPF_ERRNO__RELOC;
  795. }
  796. insn_idx = rel.r_offset / sizeof(struct bpf_insn);
  797. pr_debug("relocation: insn_idx=%u\n", insn_idx);
  798. if (insns[insn_idx].code == (BPF_JMP | BPF_CALL)) {
  799. if (insns[insn_idx].src_reg != BPF_PSEUDO_CALL) {
  800. pr_warning("incorrect bpf_call opcode\n");
  801. return -LIBBPF_ERRNO__RELOC;
  802. }
  803. prog->reloc_desc[i].type = RELO_CALL;
  804. prog->reloc_desc[i].insn_idx = insn_idx;
  805. prog->reloc_desc[i].text_off = sym.st_value;
  806. continue;
  807. }
  808. if (insns[insn_idx].code != (BPF_LD | BPF_IMM | BPF_DW)) {
  809. pr_warning("bpf: relocation: invalid relo for insns[%d].code 0x%x\n",
  810. insn_idx, insns[insn_idx].code);
  811. return -LIBBPF_ERRNO__RELOC;
  812. }
  813. /* TODO: 'maps' is sorted. We can use bsearch to make it faster. */
  814. for (map_idx = 0; map_idx < nr_maps; map_idx++) {
  815. if (maps[map_idx].offset == sym.st_value) {
  816. pr_debug("relocation: find map %zd (%s) for insn %u\n",
  817. map_idx, maps[map_idx].name, insn_idx);
  818. break;
  819. }
  820. }
  821. if (map_idx >= nr_maps) {
  822. pr_warning("bpf relocation: map_idx %d large than %d\n",
  823. (int)map_idx, (int)nr_maps - 1);
  824. return -LIBBPF_ERRNO__RELOC;
  825. }
  826. prog->reloc_desc[i].type = RELO_LD64;
  827. prog->reloc_desc[i].insn_idx = insn_idx;
  828. prog->reloc_desc[i].map_idx = map_idx;
  829. }
  830. return 0;
  831. }
  832. static int
  833. bpf_object__create_maps(struct bpf_object *obj)
  834. {
  835. unsigned int i;
  836. for (i = 0; i < obj->nr_maps; i++) {
  837. struct bpf_map_def *def = &obj->maps[i].def;
  838. int *pfd = &obj->maps[i].fd;
  839. *pfd = bpf_create_map_name(def->type,
  840. obj->maps[i].name,
  841. def->key_size,
  842. def->value_size,
  843. def->max_entries,
  844. def->map_flags);
  845. if (*pfd < 0) {
  846. size_t j;
  847. int err = *pfd;
  848. pr_warning("failed to create map (name: '%s'): %s\n",
  849. obj->maps[i].name,
  850. strerror(errno));
  851. for (j = 0; j < i; j++)
  852. zclose(obj->maps[j].fd);
  853. return err;
  854. }
  855. pr_debug("create map %s: fd=%d\n", obj->maps[i].name, *pfd);
  856. }
  857. return 0;
  858. }
  859. static int
  860. bpf_program__reloc_text(struct bpf_program *prog, struct bpf_object *obj,
  861. struct reloc_desc *relo)
  862. {
  863. struct bpf_insn *insn, *new_insn;
  864. struct bpf_program *text;
  865. size_t new_cnt;
  866. if (relo->type != RELO_CALL)
  867. return -LIBBPF_ERRNO__RELOC;
  868. if (prog->idx == obj->efile.text_shndx) {
  869. pr_warning("relo in .text insn %d into off %d\n",
  870. relo->insn_idx, relo->text_off);
  871. return -LIBBPF_ERRNO__RELOC;
  872. }
  873. if (prog->main_prog_cnt == 0) {
  874. text = bpf_object__find_prog_by_idx(obj, obj->efile.text_shndx);
  875. if (!text) {
  876. pr_warning("no .text section found yet relo into text exist\n");
  877. return -LIBBPF_ERRNO__RELOC;
  878. }
  879. new_cnt = prog->insns_cnt + text->insns_cnt;
  880. new_insn = realloc(prog->insns, new_cnt * sizeof(*insn));
  881. if (!new_insn) {
  882. pr_warning("oom in prog realloc\n");
  883. return -ENOMEM;
  884. }
  885. memcpy(new_insn + prog->insns_cnt, text->insns,
  886. text->insns_cnt * sizeof(*insn));
  887. prog->insns = new_insn;
  888. prog->main_prog_cnt = prog->insns_cnt;
  889. prog->insns_cnt = new_cnt;
  890. }
  891. insn = &prog->insns[relo->insn_idx];
  892. insn->imm += prog->main_prog_cnt - relo->insn_idx;
  893. pr_debug("added %zd insn from %s to prog %s\n",
  894. text->insns_cnt, text->section_name, prog->section_name);
  895. return 0;
  896. }
  897. static int
  898. bpf_program__relocate(struct bpf_program *prog, struct bpf_object *obj)
  899. {
  900. int i, err;
  901. if (!prog || !prog->reloc_desc)
  902. return 0;
  903. for (i = 0; i < prog->nr_reloc; i++) {
  904. if (prog->reloc_desc[i].type == RELO_LD64) {
  905. struct bpf_insn *insns = prog->insns;
  906. int insn_idx, map_idx;
  907. insn_idx = prog->reloc_desc[i].insn_idx;
  908. map_idx = prog->reloc_desc[i].map_idx;
  909. if (insn_idx >= (int)prog->insns_cnt) {
  910. pr_warning("relocation out of range: '%s'\n",
  911. prog->section_name);
  912. return -LIBBPF_ERRNO__RELOC;
  913. }
  914. insns[insn_idx].src_reg = BPF_PSEUDO_MAP_FD;
  915. insns[insn_idx].imm = obj->maps[map_idx].fd;
  916. } else {
  917. err = bpf_program__reloc_text(prog, obj,
  918. &prog->reloc_desc[i]);
  919. if (err)
  920. return err;
  921. }
  922. }
  923. zfree(&prog->reloc_desc);
  924. prog->nr_reloc = 0;
  925. return 0;
  926. }
  927. static int
  928. bpf_object__relocate(struct bpf_object *obj)
  929. {
  930. struct bpf_program *prog;
  931. size_t i;
  932. int err;
  933. for (i = 0; i < obj->nr_programs; i++) {
  934. prog = &obj->programs[i];
  935. err = bpf_program__relocate(prog, obj);
  936. if (err) {
  937. pr_warning("failed to relocate '%s'\n",
  938. prog->section_name);
  939. return err;
  940. }
  941. }
  942. return 0;
  943. }
  944. static int bpf_object__collect_reloc(struct bpf_object *obj)
  945. {
  946. int i, err;
  947. if (!obj_elf_valid(obj)) {
  948. pr_warning("Internal error: elf object is closed\n");
  949. return -LIBBPF_ERRNO__INTERNAL;
  950. }
  951. for (i = 0; i < obj->efile.nr_reloc; i++) {
  952. GElf_Shdr *shdr = &obj->efile.reloc[i].shdr;
  953. Elf_Data *data = obj->efile.reloc[i].data;
  954. int idx = shdr->sh_info;
  955. struct bpf_program *prog;
  956. if (shdr->sh_type != SHT_REL) {
  957. pr_warning("internal error at %d\n", __LINE__);
  958. return -LIBBPF_ERRNO__INTERNAL;
  959. }
  960. prog = bpf_object__find_prog_by_idx(obj, idx);
  961. if (!prog) {
  962. pr_warning("relocation failed: no %d section\n",
  963. idx);
  964. return -LIBBPF_ERRNO__RELOC;
  965. }
  966. err = bpf_program__collect_reloc(prog,
  967. shdr, data,
  968. obj);
  969. if (err)
  970. return err;
  971. }
  972. return 0;
  973. }
  974. static int
  975. load_program(enum bpf_prog_type type, const char *name, struct bpf_insn *insns,
  976. int insns_cnt, char *license, u32 kern_version, int *pfd)
  977. {
  978. int ret;
  979. char *log_buf;
  980. if (!insns || !insns_cnt)
  981. return -EINVAL;
  982. log_buf = malloc(BPF_LOG_BUF_SIZE);
  983. if (!log_buf)
  984. pr_warning("Alloc log buffer for bpf loader error, continue without log\n");
  985. ret = bpf_load_program_name(type, name, insns, insns_cnt, license,
  986. kern_version, log_buf, BPF_LOG_BUF_SIZE);
  987. if (ret >= 0) {
  988. *pfd = ret;
  989. ret = 0;
  990. goto out;
  991. }
  992. ret = -LIBBPF_ERRNO__LOAD;
  993. pr_warning("load bpf program failed: %s\n", strerror(errno));
  994. if (log_buf && log_buf[0] != '\0') {
  995. ret = -LIBBPF_ERRNO__VERIFY;
  996. pr_warning("-- BEGIN DUMP LOG ---\n");
  997. pr_warning("\n%s\n", log_buf);
  998. pr_warning("-- END LOG --\n");
  999. } else if (insns_cnt >= BPF_MAXINSNS) {
  1000. pr_warning("Program too large (%d insns), at most %d insns\n",
  1001. insns_cnt, BPF_MAXINSNS);
  1002. ret = -LIBBPF_ERRNO__PROG2BIG;
  1003. } else {
  1004. /* Wrong program type? */
  1005. if (type != BPF_PROG_TYPE_KPROBE) {
  1006. int fd;
  1007. fd = bpf_load_program_name(BPF_PROG_TYPE_KPROBE, name,
  1008. insns, insns_cnt, license,
  1009. kern_version, NULL, 0);
  1010. if (fd >= 0) {
  1011. close(fd);
  1012. ret = -LIBBPF_ERRNO__PROGTYPE;
  1013. goto out;
  1014. }
  1015. }
  1016. if (log_buf)
  1017. ret = -LIBBPF_ERRNO__KVER;
  1018. }
  1019. out:
  1020. free(log_buf);
  1021. return ret;
  1022. }
  1023. static int
  1024. bpf_program__load(struct bpf_program *prog,
  1025. char *license, u32 kern_version)
  1026. {
  1027. int err = 0, fd, i;
  1028. if (prog->instances.nr < 0 || !prog->instances.fds) {
  1029. if (prog->preprocessor) {
  1030. pr_warning("Internal error: can't load program '%s'\n",
  1031. prog->section_name);
  1032. return -LIBBPF_ERRNO__INTERNAL;
  1033. }
  1034. prog->instances.fds = malloc(sizeof(int));
  1035. if (!prog->instances.fds) {
  1036. pr_warning("Not enough memory for BPF fds\n");
  1037. return -ENOMEM;
  1038. }
  1039. prog->instances.nr = 1;
  1040. prog->instances.fds[0] = -1;
  1041. }
  1042. if (!prog->preprocessor) {
  1043. if (prog->instances.nr != 1) {
  1044. pr_warning("Program '%s' is inconsistent: nr(%d) != 1\n",
  1045. prog->section_name, prog->instances.nr);
  1046. }
  1047. err = load_program(prog->type, prog->name, prog->insns,
  1048. prog->insns_cnt, license, kern_version, &fd);
  1049. if (!err)
  1050. prog->instances.fds[0] = fd;
  1051. goto out;
  1052. }
  1053. for (i = 0; i < prog->instances.nr; i++) {
  1054. struct bpf_prog_prep_result result;
  1055. bpf_program_prep_t preprocessor = prog->preprocessor;
  1056. bzero(&result, sizeof(result));
  1057. err = preprocessor(prog, i, prog->insns,
  1058. prog->insns_cnt, &result);
  1059. if (err) {
  1060. pr_warning("Preprocessing the %dth instance of program '%s' failed\n",
  1061. i, prog->section_name);
  1062. goto out;
  1063. }
  1064. if (!result.new_insn_ptr || !result.new_insn_cnt) {
  1065. pr_debug("Skip loading the %dth instance of program '%s'\n",
  1066. i, prog->section_name);
  1067. prog->instances.fds[i] = -1;
  1068. if (result.pfd)
  1069. *result.pfd = -1;
  1070. continue;
  1071. }
  1072. err = load_program(prog->type, prog->name,
  1073. result.new_insn_ptr,
  1074. result.new_insn_cnt,
  1075. license, kern_version, &fd);
  1076. if (err) {
  1077. pr_warning("Loading the %dth instance of program '%s' failed\n",
  1078. i, prog->section_name);
  1079. goto out;
  1080. }
  1081. if (result.pfd)
  1082. *result.pfd = fd;
  1083. prog->instances.fds[i] = fd;
  1084. }
  1085. out:
  1086. if (err)
  1087. pr_warning("failed to load program '%s'\n",
  1088. prog->section_name);
  1089. zfree(&prog->insns);
  1090. prog->insns_cnt = 0;
  1091. return err;
  1092. }
  1093. static int
  1094. bpf_object__load_progs(struct bpf_object *obj)
  1095. {
  1096. size_t i;
  1097. int err;
  1098. for (i = 0; i < obj->nr_programs; i++) {
  1099. if (obj->programs[i].idx == obj->efile.text_shndx)
  1100. continue;
  1101. err = bpf_program__load(&obj->programs[i],
  1102. obj->license,
  1103. obj->kern_version);
  1104. if (err)
  1105. return err;
  1106. }
  1107. return 0;
  1108. }
  1109. static int bpf_object__validate(struct bpf_object *obj)
  1110. {
  1111. if (obj->kern_version == 0) {
  1112. pr_warning("%s doesn't provide kernel version\n",
  1113. obj->path);
  1114. return -LIBBPF_ERRNO__KVERSION;
  1115. }
  1116. return 0;
  1117. }
  1118. static struct bpf_object *
  1119. __bpf_object__open(const char *path, void *obj_buf, size_t obj_buf_sz)
  1120. {
  1121. struct bpf_object *obj;
  1122. int err;
  1123. if (elf_version(EV_CURRENT) == EV_NONE) {
  1124. pr_warning("failed to init libelf for %s\n", path);
  1125. return ERR_PTR(-LIBBPF_ERRNO__LIBELF);
  1126. }
  1127. obj = bpf_object__new(path, obj_buf, obj_buf_sz);
  1128. if (IS_ERR(obj))
  1129. return obj;
  1130. CHECK_ERR(bpf_object__elf_init(obj), err, out);
  1131. CHECK_ERR(bpf_object__check_endianness(obj), err, out);
  1132. CHECK_ERR(bpf_object__elf_collect(obj), err, out);
  1133. CHECK_ERR(bpf_object__collect_reloc(obj), err, out);
  1134. CHECK_ERR(bpf_object__validate(obj), err, out);
  1135. bpf_object__elf_finish(obj);
  1136. return obj;
  1137. out:
  1138. bpf_object__close(obj);
  1139. return ERR_PTR(err);
  1140. }
  1141. struct bpf_object *bpf_object__open(const char *path)
  1142. {
  1143. /* param validation */
  1144. if (!path)
  1145. return NULL;
  1146. pr_debug("loading %s\n", path);
  1147. return __bpf_object__open(path, NULL, 0);
  1148. }
  1149. struct bpf_object *bpf_object__open_buffer(void *obj_buf,
  1150. size_t obj_buf_sz,
  1151. const char *name)
  1152. {
  1153. char tmp_name[64];
  1154. /* param validation */
  1155. if (!obj_buf || obj_buf_sz <= 0)
  1156. return NULL;
  1157. if (!name) {
  1158. snprintf(tmp_name, sizeof(tmp_name), "%lx-%lx",
  1159. (unsigned long)obj_buf,
  1160. (unsigned long)obj_buf_sz);
  1161. tmp_name[sizeof(tmp_name) - 1] = '\0';
  1162. name = tmp_name;
  1163. }
  1164. pr_debug("loading object '%s' from buffer\n",
  1165. name);
  1166. return __bpf_object__open(name, obj_buf, obj_buf_sz);
  1167. }
  1168. int bpf_object__unload(struct bpf_object *obj)
  1169. {
  1170. size_t i;
  1171. if (!obj)
  1172. return -EINVAL;
  1173. for (i = 0; i < obj->nr_maps; i++)
  1174. zclose(obj->maps[i].fd);
  1175. for (i = 0; i < obj->nr_programs; i++)
  1176. bpf_program__unload(&obj->programs[i]);
  1177. return 0;
  1178. }
  1179. int bpf_object__load(struct bpf_object *obj)
  1180. {
  1181. int err;
  1182. if (!obj)
  1183. return -EINVAL;
  1184. if (obj->loaded) {
  1185. pr_warning("object should not be loaded twice\n");
  1186. return -EINVAL;
  1187. }
  1188. obj->loaded = true;
  1189. CHECK_ERR(bpf_object__create_maps(obj), err, out);
  1190. CHECK_ERR(bpf_object__relocate(obj), err, out);
  1191. CHECK_ERR(bpf_object__load_progs(obj), err, out);
  1192. return 0;
  1193. out:
  1194. bpf_object__unload(obj);
  1195. pr_warning("failed to load object '%s'\n", obj->path);
  1196. return err;
  1197. }
  1198. static int check_path(const char *path)
  1199. {
  1200. struct statfs st_fs;
  1201. char *dname, *dir;
  1202. int err = 0;
  1203. if (path == NULL)
  1204. return -EINVAL;
  1205. dname = strdup(path);
  1206. if (dname == NULL)
  1207. return -ENOMEM;
  1208. dir = dirname(dname);
  1209. if (statfs(dir, &st_fs)) {
  1210. pr_warning("failed to statfs %s: %s\n", dir, strerror(errno));
  1211. err = -errno;
  1212. }
  1213. free(dname);
  1214. if (!err && st_fs.f_type != BPF_FS_MAGIC) {
  1215. pr_warning("specified path %s is not on BPF FS\n", path);
  1216. err = -EINVAL;
  1217. }
  1218. return err;
  1219. }
  1220. int bpf_program__pin_instance(struct bpf_program *prog, const char *path,
  1221. int instance)
  1222. {
  1223. int err;
  1224. err = check_path(path);
  1225. if (err)
  1226. return err;
  1227. if (prog == NULL) {
  1228. pr_warning("invalid program pointer\n");
  1229. return -EINVAL;
  1230. }
  1231. if (instance < 0 || instance >= prog->instances.nr) {
  1232. pr_warning("invalid prog instance %d of prog %s (max %d)\n",
  1233. instance, prog->section_name, prog->instances.nr);
  1234. return -EINVAL;
  1235. }
  1236. if (bpf_obj_pin(prog->instances.fds[instance], path)) {
  1237. pr_warning("failed to pin program: %s\n", strerror(errno));
  1238. return -errno;
  1239. }
  1240. pr_debug("pinned program '%s'\n", path);
  1241. return 0;
  1242. }
  1243. static int make_dir(const char *path)
  1244. {
  1245. int err = 0;
  1246. if (mkdir(path, 0700) && errno != EEXIST)
  1247. err = -errno;
  1248. if (err)
  1249. pr_warning("failed to mkdir %s: %s\n", path, strerror(-err));
  1250. return err;
  1251. }
  1252. int bpf_program__pin(struct bpf_program *prog, const char *path)
  1253. {
  1254. int i, err;
  1255. err = check_path(path);
  1256. if (err)
  1257. return err;
  1258. if (prog == NULL) {
  1259. pr_warning("invalid program pointer\n");
  1260. return -EINVAL;
  1261. }
  1262. if (prog->instances.nr <= 0) {
  1263. pr_warning("no instances of prog %s to pin\n",
  1264. prog->section_name);
  1265. return -EINVAL;
  1266. }
  1267. err = make_dir(path);
  1268. if (err)
  1269. return err;
  1270. for (i = 0; i < prog->instances.nr; i++) {
  1271. char buf[PATH_MAX];
  1272. int len;
  1273. len = snprintf(buf, PATH_MAX, "%s/%d", path, i);
  1274. if (len < 0)
  1275. return -EINVAL;
  1276. else if (len >= PATH_MAX)
  1277. return -ENAMETOOLONG;
  1278. err = bpf_program__pin_instance(prog, buf, i);
  1279. if (err)
  1280. return err;
  1281. }
  1282. return 0;
  1283. }
  1284. int bpf_map__pin(struct bpf_map *map, const char *path)
  1285. {
  1286. int err;
  1287. err = check_path(path);
  1288. if (err)
  1289. return err;
  1290. if (map == NULL) {
  1291. pr_warning("invalid map pointer\n");
  1292. return -EINVAL;
  1293. }
  1294. if (bpf_obj_pin(map->fd, path)) {
  1295. pr_warning("failed to pin map: %s\n", strerror(errno));
  1296. return -errno;
  1297. }
  1298. pr_debug("pinned map '%s'\n", path);
  1299. return 0;
  1300. }
  1301. int bpf_object__pin(struct bpf_object *obj, const char *path)
  1302. {
  1303. struct bpf_program *prog;
  1304. struct bpf_map *map;
  1305. int err;
  1306. if (!obj)
  1307. return -ENOENT;
  1308. if (!obj->loaded) {
  1309. pr_warning("object not yet loaded; load it first\n");
  1310. return -ENOENT;
  1311. }
  1312. err = make_dir(path);
  1313. if (err)
  1314. return err;
  1315. bpf_map__for_each(map, obj) {
  1316. char buf[PATH_MAX];
  1317. int len;
  1318. len = snprintf(buf, PATH_MAX, "%s/%s", path,
  1319. bpf_map__name(map));
  1320. if (len < 0)
  1321. return -EINVAL;
  1322. else if (len >= PATH_MAX)
  1323. return -ENAMETOOLONG;
  1324. err = bpf_map__pin(map, buf);
  1325. if (err)
  1326. return err;
  1327. }
  1328. bpf_object__for_each_program(prog, obj) {
  1329. char buf[PATH_MAX];
  1330. int len;
  1331. len = snprintf(buf, PATH_MAX, "%s/%s", path,
  1332. prog->section_name);
  1333. if (len < 0)
  1334. return -EINVAL;
  1335. else if (len >= PATH_MAX)
  1336. return -ENAMETOOLONG;
  1337. err = bpf_program__pin(prog, buf);
  1338. if (err)
  1339. return err;
  1340. }
  1341. return 0;
  1342. }
  1343. void bpf_object__close(struct bpf_object *obj)
  1344. {
  1345. size_t i;
  1346. if (!obj)
  1347. return;
  1348. if (obj->clear_priv)
  1349. obj->clear_priv(obj, obj->priv);
  1350. bpf_object__elf_finish(obj);
  1351. bpf_object__unload(obj);
  1352. for (i = 0; i < obj->nr_maps; i++) {
  1353. zfree(&obj->maps[i].name);
  1354. if (obj->maps[i].clear_priv)
  1355. obj->maps[i].clear_priv(&obj->maps[i],
  1356. obj->maps[i].priv);
  1357. obj->maps[i].priv = NULL;
  1358. obj->maps[i].clear_priv = NULL;
  1359. }
  1360. zfree(&obj->maps);
  1361. obj->nr_maps = 0;
  1362. if (obj->programs && obj->nr_programs) {
  1363. for (i = 0; i < obj->nr_programs; i++)
  1364. bpf_program__exit(&obj->programs[i]);
  1365. }
  1366. zfree(&obj->programs);
  1367. list_del(&obj->list);
  1368. free(obj);
  1369. }
  1370. struct bpf_object *
  1371. bpf_object__next(struct bpf_object *prev)
  1372. {
  1373. struct bpf_object *next;
  1374. if (!prev)
  1375. next = list_first_entry(&bpf_objects_list,
  1376. struct bpf_object,
  1377. list);
  1378. else
  1379. next = list_next_entry(prev, list);
  1380. /* Empty list is noticed here so don't need checking on entry. */
  1381. if (&next->list == &bpf_objects_list)
  1382. return NULL;
  1383. return next;
  1384. }
  1385. const char *bpf_object__name(struct bpf_object *obj)
  1386. {
  1387. return obj ? obj->path : ERR_PTR(-EINVAL);
  1388. }
  1389. unsigned int bpf_object__kversion(struct bpf_object *obj)
  1390. {
  1391. return obj ? obj->kern_version : 0;
  1392. }
  1393. int bpf_object__set_priv(struct bpf_object *obj, void *priv,
  1394. bpf_object_clear_priv_t clear_priv)
  1395. {
  1396. if (obj->priv && obj->clear_priv)
  1397. obj->clear_priv(obj, obj->priv);
  1398. obj->priv = priv;
  1399. obj->clear_priv = clear_priv;
  1400. return 0;
  1401. }
  1402. void *bpf_object__priv(struct bpf_object *obj)
  1403. {
  1404. return obj ? obj->priv : ERR_PTR(-EINVAL);
  1405. }
  1406. struct bpf_program *
  1407. bpf_program__next(struct bpf_program *prev, struct bpf_object *obj)
  1408. {
  1409. size_t idx;
  1410. if (!obj->programs)
  1411. return NULL;
  1412. /* First handler */
  1413. if (prev == NULL)
  1414. return &obj->programs[0];
  1415. if (prev->obj != obj) {
  1416. pr_warning("error: program handler doesn't match object\n");
  1417. return NULL;
  1418. }
  1419. idx = (prev - obj->programs) + 1;
  1420. if (idx >= obj->nr_programs)
  1421. return NULL;
  1422. return &obj->programs[idx];
  1423. }
  1424. int bpf_program__set_priv(struct bpf_program *prog, void *priv,
  1425. bpf_program_clear_priv_t clear_priv)
  1426. {
  1427. if (prog->priv && prog->clear_priv)
  1428. prog->clear_priv(prog, prog->priv);
  1429. prog->priv = priv;
  1430. prog->clear_priv = clear_priv;
  1431. return 0;
  1432. }
  1433. void *bpf_program__priv(struct bpf_program *prog)
  1434. {
  1435. return prog ? prog->priv : ERR_PTR(-EINVAL);
  1436. }
  1437. const char *bpf_program__title(struct bpf_program *prog, bool needs_copy)
  1438. {
  1439. const char *title;
  1440. title = prog->section_name;
  1441. if (needs_copy) {
  1442. title = strdup(title);
  1443. if (!title) {
  1444. pr_warning("failed to strdup program title\n");
  1445. return ERR_PTR(-ENOMEM);
  1446. }
  1447. }
  1448. return title;
  1449. }
  1450. int bpf_program__fd(struct bpf_program *prog)
  1451. {
  1452. return bpf_program__nth_fd(prog, 0);
  1453. }
  1454. int bpf_program__set_prep(struct bpf_program *prog, int nr_instances,
  1455. bpf_program_prep_t prep)
  1456. {
  1457. int *instances_fds;
  1458. if (nr_instances <= 0 || !prep)
  1459. return -EINVAL;
  1460. if (prog->instances.nr > 0 || prog->instances.fds) {
  1461. pr_warning("Can't set pre-processor after loading\n");
  1462. return -EINVAL;
  1463. }
  1464. instances_fds = malloc(sizeof(int) * nr_instances);
  1465. if (!instances_fds) {
  1466. pr_warning("alloc memory failed for fds\n");
  1467. return -ENOMEM;
  1468. }
  1469. /* fill all fd with -1 */
  1470. memset(instances_fds, -1, sizeof(int) * nr_instances);
  1471. prog->instances.nr = nr_instances;
  1472. prog->instances.fds = instances_fds;
  1473. prog->preprocessor = prep;
  1474. return 0;
  1475. }
  1476. int bpf_program__nth_fd(struct bpf_program *prog, int n)
  1477. {
  1478. int fd;
  1479. if (n >= prog->instances.nr || n < 0) {
  1480. pr_warning("Can't get the %dth fd from program %s: only %d instances\n",
  1481. n, prog->section_name, prog->instances.nr);
  1482. return -EINVAL;
  1483. }
  1484. fd = prog->instances.fds[n];
  1485. if (fd < 0) {
  1486. pr_warning("%dth instance of program '%s' is invalid\n",
  1487. n, prog->section_name);
  1488. return -ENOENT;
  1489. }
  1490. return fd;
  1491. }
  1492. void bpf_program__set_type(struct bpf_program *prog, enum bpf_prog_type type)
  1493. {
  1494. prog->type = type;
  1495. }
  1496. static bool bpf_program__is_type(struct bpf_program *prog,
  1497. enum bpf_prog_type type)
  1498. {
  1499. return prog ? (prog->type == type) : false;
  1500. }
  1501. #define BPF_PROG_TYPE_FNS(NAME, TYPE) \
  1502. int bpf_program__set_##NAME(struct bpf_program *prog) \
  1503. { \
  1504. if (!prog) \
  1505. return -EINVAL; \
  1506. bpf_program__set_type(prog, TYPE); \
  1507. return 0; \
  1508. } \
  1509. \
  1510. bool bpf_program__is_##NAME(struct bpf_program *prog) \
  1511. { \
  1512. return bpf_program__is_type(prog, TYPE); \
  1513. } \
  1514. BPF_PROG_TYPE_FNS(socket_filter, BPF_PROG_TYPE_SOCKET_FILTER);
  1515. BPF_PROG_TYPE_FNS(kprobe, BPF_PROG_TYPE_KPROBE);
  1516. BPF_PROG_TYPE_FNS(sched_cls, BPF_PROG_TYPE_SCHED_CLS);
  1517. BPF_PROG_TYPE_FNS(sched_act, BPF_PROG_TYPE_SCHED_ACT);
  1518. BPF_PROG_TYPE_FNS(tracepoint, BPF_PROG_TYPE_TRACEPOINT);
  1519. BPF_PROG_TYPE_FNS(xdp, BPF_PROG_TYPE_XDP);
  1520. BPF_PROG_TYPE_FNS(perf_event, BPF_PROG_TYPE_PERF_EVENT);
  1521. #define BPF_PROG_SEC(string, type) { string, sizeof(string) - 1, type }
  1522. static const struct {
  1523. const char *sec;
  1524. size_t len;
  1525. enum bpf_prog_type prog_type;
  1526. } section_names[] = {
  1527. BPF_PROG_SEC("socket", BPF_PROG_TYPE_SOCKET_FILTER),
  1528. BPF_PROG_SEC("kprobe/", BPF_PROG_TYPE_KPROBE),
  1529. BPF_PROG_SEC("kretprobe/", BPF_PROG_TYPE_KPROBE),
  1530. BPF_PROG_SEC("tracepoint/", BPF_PROG_TYPE_TRACEPOINT),
  1531. BPF_PROG_SEC("xdp", BPF_PROG_TYPE_XDP),
  1532. BPF_PROG_SEC("perf_event", BPF_PROG_TYPE_PERF_EVENT),
  1533. BPF_PROG_SEC("cgroup/skb", BPF_PROG_TYPE_CGROUP_SKB),
  1534. BPF_PROG_SEC("cgroup/sock", BPF_PROG_TYPE_CGROUP_SOCK),
  1535. BPF_PROG_SEC("cgroup/dev", BPF_PROG_TYPE_CGROUP_DEVICE),
  1536. BPF_PROG_SEC("sockops", BPF_PROG_TYPE_SOCK_OPS),
  1537. BPF_PROG_SEC("sk_skb", BPF_PROG_TYPE_SK_SKB),
  1538. };
  1539. #undef BPF_PROG_SEC
  1540. static enum bpf_prog_type bpf_program__guess_type(struct bpf_program *prog)
  1541. {
  1542. int i;
  1543. if (!prog->section_name)
  1544. goto err;
  1545. for (i = 0; i < ARRAY_SIZE(section_names); i++)
  1546. if (strncmp(prog->section_name, section_names[i].sec,
  1547. section_names[i].len) == 0)
  1548. return section_names[i].prog_type;
  1549. err:
  1550. pr_warning("failed to guess program type based on section name %s\n",
  1551. prog->section_name);
  1552. return BPF_PROG_TYPE_UNSPEC;
  1553. }
  1554. int bpf_map__fd(struct bpf_map *map)
  1555. {
  1556. return map ? map->fd : -EINVAL;
  1557. }
  1558. const struct bpf_map_def *bpf_map__def(struct bpf_map *map)
  1559. {
  1560. return map ? &map->def : ERR_PTR(-EINVAL);
  1561. }
  1562. const char *bpf_map__name(struct bpf_map *map)
  1563. {
  1564. return map ? map->name : NULL;
  1565. }
  1566. int bpf_map__set_priv(struct bpf_map *map, void *priv,
  1567. bpf_map_clear_priv_t clear_priv)
  1568. {
  1569. if (!map)
  1570. return -EINVAL;
  1571. if (map->priv) {
  1572. if (map->clear_priv)
  1573. map->clear_priv(map, map->priv);
  1574. }
  1575. map->priv = priv;
  1576. map->clear_priv = clear_priv;
  1577. return 0;
  1578. }
  1579. void *bpf_map__priv(struct bpf_map *map)
  1580. {
  1581. return map ? map->priv : ERR_PTR(-EINVAL);
  1582. }
  1583. struct bpf_map *
  1584. bpf_map__next(struct bpf_map *prev, struct bpf_object *obj)
  1585. {
  1586. size_t idx;
  1587. struct bpf_map *s, *e;
  1588. if (!obj || !obj->maps)
  1589. return NULL;
  1590. s = obj->maps;
  1591. e = obj->maps + obj->nr_maps;
  1592. if (prev == NULL)
  1593. return s;
  1594. if ((prev < s) || (prev >= e)) {
  1595. pr_warning("error in %s: map handler doesn't belong to object\n",
  1596. __func__);
  1597. return NULL;
  1598. }
  1599. idx = (prev - obj->maps) + 1;
  1600. if (idx >= obj->nr_maps)
  1601. return NULL;
  1602. return &obj->maps[idx];
  1603. }
  1604. struct bpf_map *
  1605. bpf_object__find_map_by_name(struct bpf_object *obj, const char *name)
  1606. {
  1607. struct bpf_map *pos;
  1608. bpf_map__for_each(pos, obj) {
  1609. if (pos->name && !strcmp(pos->name, name))
  1610. return pos;
  1611. }
  1612. return NULL;
  1613. }
  1614. struct bpf_map *
  1615. bpf_object__find_map_by_offset(struct bpf_object *obj, size_t offset)
  1616. {
  1617. int i;
  1618. for (i = 0; i < obj->nr_maps; i++) {
  1619. if (obj->maps[i].offset == offset)
  1620. return &obj->maps[i];
  1621. }
  1622. return ERR_PTR(-ENOENT);
  1623. }
  1624. long libbpf_get_error(const void *ptr)
  1625. {
  1626. if (IS_ERR(ptr))
  1627. return PTR_ERR(ptr);
  1628. return 0;
  1629. }
  1630. int bpf_prog_load(const char *file, enum bpf_prog_type type,
  1631. struct bpf_object **pobj, int *prog_fd)
  1632. {
  1633. struct bpf_program *prog, *first_prog = NULL;
  1634. struct bpf_object *obj;
  1635. int err;
  1636. obj = bpf_object__open(file);
  1637. if (IS_ERR(obj))
  1638. return -ENOENT;
  1639. bpf_object__for_each_program(prog, obj) {
  1640. /*
  1641. * If type is not specified, try to guess it based on
  1642. * section name.
  1643. */
  1644. if (type == BPF_PROG_TYPE_UNSPEC) {
  1645. type = bpf_program__guess_type(prog);
  1646. if (type == BPF_PROG_TYPE_UNSPEC) {
  1647. bpf_object__close(obj);
  1648. return -EINVAL;
  1649. }
  1650. }
  1651. bpf_program__set_type(prog, type);
  1652. if (prog->idx != obj->efile.text_shndx && !first_prog)
  1653. first_prog = prog;
  1654. }
  1655. if (!first_prog) {
  1656. pr_warning("object file doesn't contain bpf program\n");
  1657. bpf_object__close(obj);
  1658. return -ENOENT;
  1659. }
  1660. err = bpf_object__load(obj);
  1661. if (err) {
  1662. bpf_object__close(obj);
  1663. return -EINVAL;
  1664. }
  1665. *pobj = obj;
  1666. *prog_fd = bpf_program__fd(first_prog);
  1667. return 0;
  1668. }