bpf.h 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513
  1. /* Copyright (c) 2011-2014 PLUMgrid, http://plumgrid.com
  2. *
  3. * This program is free software; you can redistribute it and/or
  4. * modify it under the terms of version 2 of the GNU General Public
  5. * License as published by the Free Software Foundation.
  6. */
  7. #ifndef _LINUX_BPF_H
  8. #define _LINUX_BPF_H 1
  9. #include <uapi/linux/bpf.h>
  10. #include <linux/workqueue.h>
  11. #include <linux/file.h>
  12. #include <linux/percpu.h>
  13. #include <linux/err.h>
  14. #include <linux/rbtree_latch.h>
  15. #include <linux/numa.h>
  16. struct perf_event;
  17. struct bpf_prog;
  18. struct bpf_map;
  19. /* map is generic key/value storage optionally accesible by eBPF programs */
  20. struct bpf_map_ops {
  21. /* funcs callable from userspace (via syscall) */
  22. struct bpf_map *(*map_alloc)(union bpf_attr *attr);
  23. void (*map_release)(struct bpf_map *map, struct file *map_file);
  24. void (*map_free)(struct bpf_map *map);
  25. int (*map_get_next_key)(struct bpf_map *map, void *key, void *next_key);
  26. /* funcs callable from userspace and from eBPF programs */
  27. void *(*map_lookup_elem)(struct bpf_map *map, void *key);
  28. int (*map_update_elem)(struct bpf_map *map, void *key, void *value, u64 flags);
  29. int (*map_delete_elem)(struct bpf_map *map, void *key);
  30. /* funcs called by prog_array and perf_event_array map */
  31. void *(*map_fd_get_ptr)(struct bpf_map *map, struct file *map_file,
  32. int fd);
  33. void (*map_fd_put_ptr)(void *ptr);
  34. u32 (*map_gen_lookup)(struct bpf_map *map, struct bpf_insn *insn_buf);
  35. u32 (*map_fd_sys_lookup_elem)(void *ptr);
  36. };
  37. struct bpf_map {
  38. atomic_t refcnt;
  39. enum bpf_map_type map_type;
  40. u32 key_size;
  41. u32 value_size;
  42. u32 max_entries;
  43. u32 map_flags;
  44. u32 pages;
  45. u32 id;
  46. int numa_node;
  47. struct user_struct *user;
  48. const struct bpf_map_ops *ops;
  49. struct work_struct work;
  50. atomic_t usercnt;
  51. struct bpf_map *inner_map_meta;
  52. char name[BPF_OBJ_NAME_LEN];
  53. #ifdef CONFIG_SECURITY
  54. void *security;
  55. #endif
  56. };
  57. /* function argument constraints */
  58. enum bpf_arg_type {
  59. ARG_DONTCARE = 0, /* unused argument in helper function */
  60. /* the following constraints used to prototype
  61. * bpf_map_lookup/update/delete_elem() functions
  62. */
  63. ARG_CONST_MAP_PTR, /* const argument used as pointer to bpf_map */
  64. ARG_PTR_TO_MAP_KEY, /* pointer to stack used as map key */
  65. ARG_PTR_TO_MAP_VALUE, /* pointer to stack used as map value */
  66. /* the following constraints used to prototype bpf_memcmp() and other
  67. * functions that access data on eBPF program stack
  68. */
  69. ARG_PTR_TO_MEM, /* pointer to valid memory (stack, packet, map value) */
  70. ARG_PTR_TO_UNINIT_MEM, /* pointer to memory does not need to be initialized,
  71. * helper function must fill all bytes or clear
  72. * them in error case.
  73. */
  74. ARG_CONST_SIZE, /* number of bytes accessed from memory */
  75. ARG_CONST_SIZE_OR_ZERO, /* number of bytes accessed from memory or 0 */
  76. ARG_PTR_TO_CTX, /* pointer to context */
  77. ARG_ANYTHING, /* any (initialized) argument is ok */
  78. };
  79. /* type of values returned from helper functions */
  80. enum bpf_return_type {
  81. RET_INTEGER, /* function returns integer */
  82. RET_VOID, /* function doesn't return anything */
  83. RET_PTR_TO_MAP_VALUE_OR_NULL, /* returns a pointer to map elem value or NULL */
  84. };
  85. /* eBPF function prototype used by verifier to allow BPF_CALLs from eBPF programs
  86. * to in-kernel helper functions and for adjusting imm32 field in BPF_CALL
  87. * instructions after verifying
  88. */
  89. struct bpf_func_proto {
  90. u64 (*func)(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
  91. bool gpl_only;
  92. bool pkt_access;
  93. enum bpf_return_type ret_type;
  94. enum bpf_arg_type arg1_type;
  95. enum bpf_arg_type arg2_type;
  96. enum bpf_arg_type arg3_type;
  97. enum bpf_arg_type arg4_type;
  98. enum bpf_arg_type arg5_type;
  99. };
  100. /* bpf_context is intentionally undefined structure. Pointer to bpf_context is
  101. * the first argument to eBPF programs.
  102. * For socket filters: 'struct bpf_context *' == 'struct sk_buff *'
  103. */
  104. struct bpf_context;
  105. enum bpf_access_type {
  106. BPF_READ = 1,
  107. BPF_WRITE = 2
  108. };
  109. /* types of values stored in eBPF registers */
  110. /* Pointer types represent:
  111. * pointer
  112. * pointer + imm
  113. * pointer + (u16) var
  114. * pointer + (u16) var + imm
  115. * if (range > 0) then [ptr, ptr + range - off) is safe to access
  116. * if (id > 0) means that some 'var' was added
  117. * if (off > 0) means that 'imm' was added
  118. */
  119. enum bpf_reg_type {
  120. NOT_INIT = 0, /* nothing was written into register */
  121. SCALAR_VALUE, /* reg doesn't contain a valid pointer */
  122. PTR_TO_CTX, /* reg points to bpf_context */
  123. CONST_PTR_TO_MAP, /* reg points to struct bpf_map */
  124. PTR_TO_MAP_VALUE, /* reg points to map element value */
  125. PTR_TO_MAP_VALUE_OR_NULL,/* points to map elem value or NULL */
  126. PTR_TO_STACK, /* reg == frame_pointer + offset */
  127. PTR_TO_PACKET_META, /* skb->data - meta_len */
  128. PTR_TO_PACKET, /* reg points to skb->data */
  129. PTR_TO_PACKET_END, /* skb->data + headlen */
  130. };
  131. /* The information passed from prog-specific *_is_valid_access
  132. * back to the verifier.
  133. */
  134. struct bpf_insn_access_aux {
  135. enum bpf_reg_type reg_type;
  136. int ctx_field_size;
  137. };
  138. static inline void
  139. bpf_ctx_record_field_size(struct bpf_insn_access_aux *aux, u32 size)
  140. {
  141. aux->ctx_field_size = size;
  142. }
  143. struct bpf_prog_ops {
  144. int (*test_run)(struct bpf_prog *prog, const union bpf_attr *kattr,
  145. union bpf_attr __user *uattr);
  146. };
  147. struct bpf_verifier_ops {
  148. /* return eBPF function prototype for verification */
  149. const struct bpf_func_proto *(*get_func_proto)(enum bpf_func_id func_id);
  150. /* return true if 'size' wide access at offset 'off' within bpf_context
  151. * with 'type' (read or write) is allowed
  152. */
  153. bool (*is_valid_access)(int off, int size, enum bpf_access_type type,
  154. struct bpf_insn_access_aux *info);
  155. int (*gen_prologue)(struct bpf_insn *insn, bool direct_write,
  156. const struct bpf_prog *prog);
  157. u32 (*convert_ctx_access)(enum bpf_access_type type,
  158. const struct bpf_insn *src,
  159. struct bpf_insn *dst,
  160. struct bpf_prog *prog, u32 *target_size);
  161. };
  162. struct bpf_prog_aux {
  163. atomic_t refcnt;
  164. u32 used_map_cnt;
  165. u32 max_ctx_offset;
  166. u32 stack_depth;
  167. u32 id;
  168. struct latch_tree_node ksym_tnode;
  169. struct list_head ksym_lnode;
  170. const struct bpf_prog_ops *ops;
  171. struct bpf_map **used_maps;
  172. struct bpf_prog *prog;
  173. struct user_struct *user;
  174. u64 load_time; /* ns since boottime */
  175. char name[BPF_OBJ_NAME_LEN];
  176. #ifdef CONFIG_SECURITY
  177. void *security;
  178. #endif
  179. union {
  180. struct work_struct work;
  181. struct rcu_head rcu;
  182. };
  183. };
  184. struct bpf_array {
  185. struct bpf_map map;
  186. u32 elem_size;
  187. /* 'ownership' of prog_array is claimed by the first program that
  188. * is going to use this map or by the first program which FD is stored
  189. * in the map to make sure that all callers and callees have the same
  190. * prog_type and JITed flag
  191. */
  192. enum bpf_prog_type owner_prog_type;
  193. bool owner_jited;
  194. union {
  195. char value[0] __aligned(8);
  196. void *ptrs[0] __aligned(8);
  197. void __percpu *pptrs[0] __aligned(8);
  198. };
  199. };
  200. #define MAX_TAIL_CALL_CNT 32
  201. struct bpf_event_entry {
  202. struct perf_event *event;
  203. struct file *perf_file;
  204. struct file *map_file;
  205. struct rcu_head rcu;
  206. };
  207. u64 bpf_tail_call(u64 ctx, u64 r2, u64 index, u64 r4, u64 r5);
  208. u64 bpf_get_stackid(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
  209. bool bpf_prog_array_compatible(struct bpf_array *array, const struct bpf_prog *fp);
  210. int bpf_prog_calc_tag(struct bpf_prog *fp);
  211. const struct bpf_func_proto *bpf_get_trace_printk_proto(void);
  212. typedef unsigned long (*bpf_ctx_copy_t)(void *dst, const void *src,
  213. unsigned long off, unsigned long len);
  214. u64 bpf_event_output(struct bpf_map *map, u64 flags, void *meta, u64 meta_size,
  215. void *ctx, u64 ctx_size, bpf_ctx_copy_t ctx_copy);
  216. int bpf_prog_test_run_xdp(struct bpf_prog *prog, const union bpf_attr *kattr,
  217. union bpf_attr __user *uattr);
  218. int bpf_prog_test_run_skb(struct bpf_prog *prog, const union bpf_attr *kattr,
  219. union bpf_attr __user *uattr);
  220. /* an array of programs to be executed under rcu_lock.
  221. *
  222. * Typical usage:
  223. * ret = BPF_PROG_RUN_ARRAY(&bpf_prog_array, ctx, BPF_PROG_RUN);
  224. *
  225. * the structure returned by bpf_prog_array_alloc() should be populated
  226. * with program pointers and the last pointer must be NULL.
  227. * The user has to keep refcnt on the program and make sure the program
  228. * is removed from the array before bpf_prog_put().
  229. * The 'struct bpf_prog_array *' should only be replaced with xchg()
  230. * since other cpus are walking the array of pointers in parallel.
  231. */
  232. struct bpf_prog_array {
  233. struct rcu_head rcu;
  234. struct bpf_prog *progs[0];
  235. };
  236. struct bpf_prog_array __rcu *bpf_prog_array_alloc(u32 prog_cnt, gfp_t flags);
  237. void bpf_prog_array_free(struct bpf_prog_array __rcu *progs);
  238. int bpf_prog_array_length(struct bpf_prog_array __rcu *progs);
  239. int bpf_prog_array_copy_to_user(struct bpf_prog_array __rcu *progs,
  240. __u32 __user *prog_ids, u32 cnt);
  241. #define BPF_PROG_RUN_ARRAY(array, ctx, func) \
  242. ({ \
  243. struct bpf_prog **_prog; \
  244. u32 _ret = 1; \
  245. rcu_read_lock(); \
  246. _prog = rcu_dereference(array)->progs; \
  247. for (; *_prog; _prog++) \
  248. _ret &= func(*_prog, ctx); \
  249. rcu_read_unlock(); \
  250. _ret; \
  251. })
  252. #ifdef CONFIG_BPF_SYSCALL
  253. DECLARE_PER_CPU(int, bpf_prog_active);
  254. #define BPF_PROG_TYPE(_id, _name) \
  255. extern const struct bpf_prog_ops _name ## _prog_ops; \
  256. extern const struct bpf_verifier_ops _name ## _verifier_ops;
  257. #define BPF_MAP_TYPE(_id, _ops) \
  258. extern const struct bpf_map_ops _ops;
  259. #include <linux/bpf_types.h>
  260. #undef BPF_PROG_TYPE
  261. #undef BPF_MAP_TYPE
  262. extern const struct bpf_verifier_ops tc_cls_act_analyzer_ops;
  263. extern const struct bpf_verifier_ops xdp_analyzer_ops;
  264. struct bpf_prog *bpf_prog_get(u32 ufd);
  265. struct bpf_prog *bpf_prog_get_type(u32 ufd, enum bpf_prog_type type);
  266. struct bpf_prog * __must_check bpf_prog_add(struct bpf_prog *prog, int i);
  267. void bpf_prog_sub(struct bpf_prog *prog, int i);
  268. struct bpf_prog * __must_check bpf_prog_inc(struct bpf_prog *prog);
  269. struct bpf_prog * __must_check bpf_prog_inc_not_zero(struct bpf_prog *prog);
  270. void bpf_prog_put(struct bpf_prog *prog);
  271. int __bpf_prog_charge(struct user_struct *user, u32 pages);
  272. void __bpf_prog_uncharge(struct user_struct *user, u32 pages);
  273. struct bpf_map *bpf_map_get_with_uref(u32 ufd);
  274. struct bpf_map *__bpf_map_get(struct fd f);
  275. struct bpf_map * __must_check bpf_map_inc(struct bpf_map *map, bool uref);
  276. void bpf_map_put_with_uref(struct bpf_map *map);
  277. void bpf_map_put(struct bpf_map *map);
  278. int bpf_map_precharge_memlock(u32 pages);
  279. void *bpf_map_area_alloc(size_t size, int numa_node);
  280. void bpf_map_area_free(void *base);
  281. extern int sysctl_unprivileged_bpf_disabled;
  282. int bpf_map_new_fd(struct bpf_map *map, int flags);
  283. int bpf_prog_new_fd(struct bpf_prog *prog);
  284. int bpf_obj_pin_user(u32 ufd, const char __user *pathname);
  285. int bpf_obj_get_user(const char __user *pathname, int flags);
  286. int bpf_percpu_hash_copy(struct bpf_map *map, void *key, void *value);
  287. int bpf_percpu_array_copy(struct bpf_map *map, void *key, void *value);
  288. int bpf_percpu_hash_update(struct bpf_map *map, void *key, void *value,
  289. u64 flags);
  290. int bpf_percpu_array_update(struct bpf_map *map, void *key, void *value,
  291. u64 flags);
  292. int bpf_stackmap_copy(struct bpf_map *map, void *key, void *value);
  293. int bpf_fd_array_map_update_elem(struct bpf_map *map, struct file *map_file,
  294. void *key, void *value, u64 map_flags);
  295. int bpf_fd_array_map_lookup_elem(struct bpf_map *map, void *key, u32 *value);
  296. void bpf_fd_array_map_clear(struct bpf_map *map);
  297. int bpf_fd_htab_map_update_elem(struct bpf_map *map, struct file *map_file,
  298. void *key, void *value, u64 map_flags);
  299. int bpf_fd_htab_map_lookup_elem(struct bpf_map *map, void *key, u32 *value);
  300. int bpf_get_file_flag(int flags);
  301. /* memcpy that is used with 8-byte aligned pointers, power-of-8 size and
  302. * forced to use 'long' read/writes to try to atomically copy long counters.
  303. * Best-effort only. No barriers here, since it _will_ race with concurrent
  304. * updates from BPF programs. Called from bpf syscall and mostly used with
  305. * size 8 or 16 bytes, so ask compiler to inline it.
  306. */
  307. static inline void bpf_long_memcpy(void *dst, const void *src, u32 size)
  308. {
  309. const long *lsrc = src;
  310. long *ldst = dst;
  311. size /= sizeof(long);
  312. while (size--)
  313. *ldst++ = *lsrc++;
  314. }
  315. /* verify correctness of eBPF program */
  316. int bpf_check(struct bpf_prog **fp, union bpf_attr *attr);
  317. /* Map specifics */
  318. struct net_device *__dev_map_lookup_elem(struct bpf_map *map, u32 key);
  319. void __dev_map_insert_ctx(struct bpf_map *map, u32 index);
  320. void __dev_map_flush(struct bpf_map *map);
  321. struct bpf_cpu_map_entry *__cpu_map_lookup_elem(struct bpf_map *map, u32 key);
  322. void __cpu_map_insert_ctx(struct bpf_map *map, u32 index);
  323. void __cpu_map_flush(struct bpf_map *map);
  324. struct xdp_buff;
  325. int cpu_map_enqueue(struct bpf_cpu_map_entry *rcpu, struct xdp_buff *xdp,
  326. struct net_device *dev_rx);
  327. /* Return map's numa specified by userspace */
  328. static inline int bpf_map_attr_numa_node(const union bpf_attr *attr)
  329. {
  330. return (attr->map_flags & BPF_F_NUMA_NODE) ?
  331. attr->numa_node : NUMA_NO_NODE;
  332. }
  333. #else /* !CONFIG_BPF_SYSCALL */
  334. static inline struct bpf_prog *bpf_prog_get(u32 ufd)
  335. {
  336. return ERR_PTR(-EOPNOTSUPP);
  337. }
  338. static inline struct bpf_prog *bpf_prog_get_type(u32 ufd,
  339. enum bpf_prog_type type)
  340. {
  341. return ERR_PTR(-EOPNOTSUPP);
  342. }
  343. static inline struct bpf_prog * __must_check bpf_prog_add(struct bpf_prog *prog,
  344. int i)
  345. {
  346. return ERR_PTR(-EOPNOTSUPP);
  347. }
  348. static inline void bpf_prog_sub(struct bpf_prog *prog, int i)
  349. {
  350. }
  351. static inline void bpf_prog_put(struct bpf_prog *prog)
  352. {
  353. }
  354. static inline struct bpf_prog * __must_check bpf_prog_inc(struct bpf_prog *prog)
  355. {
  356. return ERR_PTR(-EOPNOTSUPP);
  357. }
  358. static inline struct bpf_prog *__must_check
  359. bpf_prog_inc_not_zero(struct bpf_prog *prog)
  360. {
  361. return ERR_PTR(-EOPNOTSUPP);
  362. }
  363. static inline int __bpf_prog_charge(struct user_struct *user, u32 pages)
  364. {
  365. return 0;
  366. }
  367. static inline void __bpf_prog_uncharge(struct user_struct *user, u32 pages)
  368. {
  369. }
  370. static inline int bpf_obj_get_user(const char __user *pathname, int flags)
  371. {
  372. return -EOPNOTSUPP;
  373. }
  374. static inline struct net_device *__dev_map_lookup_elem(struct bpf_map *map,
  375. u32 key)
  376. {
  377. return NULL;
  378. }
  379. static inline void __dev_map_insert_ctx(struct bpf_map *map, u32 index)
  380. {
  381. }
  382. static inline void __dev_map_flush(struct bpf_map *map)
  383. {
  384. }
  385. static inline
  386. struct bpf_cpu_map_entry *__cpu_map_lookup_elem(struct bpf_map *map, u32 key)
  387. {
  388. return NULL;
  389. }
  390. static inline void __cpu_map_insert_ctx(struct bpf_map *map, u32 index)
  391. {
  392. }
  393. static inline void __cpu_map_flush(struct bpf_map *map)
  394. {
  395. }
  396. struct xdp_buff;
  397. static inline int cpu_map_enqueue(struct bpf_cpu_map_entry *rcpu,
  398. struct xdp_buff *xdp,
  399. struct net_device *dev_rx)
  400. {
  401. return 0;
  402. }
  403. #endif /* CONFIG_BPF_SYSCALL */
  404. #if defined(CONFIG_STREAM_PARSER) && defined(CONFIG_BPF_SYSCALL)
  405. struct sock *__sock_map_lookup_elem(struct bpf_map *map, u32 key);
  406. int sock_map_prog(struct bpf_map *map, struct bpf_prog *prog, u32 type);
  407. #else
  408. static inline struct sock *__sock_map_lookup_elem(struct bpf_map *map, u32 key)
  409. {
  410. return NULL;
  411. }
  412. static inline int sock_map_prog(struct bpf_map *map,
  413. struct bpf_prog *prog,
  414. u32 type)
  415. {
  416. return -EOPNOTSUPP;
  417. }
  418. #endif
  419. /* verifier prototypes for helper functions called from eBPF programs */
  420. extern const struct bpf_func_proto bpf_map_lookup_elem_proto;
  421. extern const struct bpf_func_proto bpf_map_update_elem_proto;
  422. extern const struct bpf_func_proto bpf_map_delete_elem_proto;
  423. extern const struct bpf_func_proto bpf_get_prandom_u32_proto;
  424. extern const struct bpf_func_proto bpf_get_smp_processor_id_proto;
  425. extern const struct bpf_func_proto bpf_get_numa_node_id_proto;
  426. extern const struct bpf_func_proto bpf_tail_call_proto;
  427. extern const struct bpf_func_proto bpf_ktime_get_ns_proto;
  428. extern const struct bpf_func_proto bpf_get_current_pid_tgid_proto;
  429. extern const struct bpf_func_proto bpf_get_current_uid_gid_proto;
  430. extern const struct bpf_func_proto bpf_get_current_comm_proto;
  431. extern const struct bpf_func_proto bpf_skb_vlan_push_proto;
  432. extern const struct bpf_func_proto bpf_skb_vlan_pop_proto;
  433. extern const struct bpf_func_proto bpf_get_stackid_proto;
  434. extern const struct bpf_func_proto bpf_sock_map_update_proto;
  435. /* Shared helpers among cBPF and eBPF. */
  436. void bpf_user_rnd_init_once(void);
  437. u64 bpf_user_rnd_u32(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
  438. #endif /* _LINUX_BPF_H */