bpf.h 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348
  1. /* Copyright (c) 2011-2014 PLUMgrid, http://plumgrid.com
  2. *
  3. * This program is free software; you can redistribute it and/or
  4. * modify it under the terms of version 2 of the GNU General Public
  5. * License as published by the Free Software Foundation.
  6. */
  7. #ifndef _LINUX_BPF_H
  8. #define _LINUX_BPF_H 1
  9. #include <uapi/linux/bpf.h>
  10. #include <linux/workqueue.h>
  11. #include <linux/file.h>
  12. #include <linux/percpu.h>
  13. #include <linux/err.h>
  14. struct perf_event;
  15. struct bpf_map;
  16. /* map is generic key/value storage optionally accesible by eBPF programs */
  17. struct bpf_map_ops {
  18. /* funcs callable from userspace (via syscall) */
  19. struct bpf_map *(*map_alloc)(union bpf_attr *attr);
  20. void (*map_release)(struct bpf_map *map, struct file *map_file);
  21. void (*map_free)(struct bpf_map *map);
  22. int (*map_get_next_key)(struct bpf_map *map, void *key, void *next_key);
  23. /* funcs callable from userspace and from eBPF programs */
  24. void *(*map_lookup_elem)(struct bpf_map *map, void *key);
  25. int (*map_update_elem)(struct bpf_map *map, void *key, void *value, u64 flags);
  26. int (*map_delete_elem)(struct bpf_map *map, void *key);
  27. /* funcs called by prog_array and perf_event_array map */
  28. void *(*map_fd_get_ptr)(struct bpf_map *map, struct file *map_file,
  29. int fd);
  30. void (*map_fd_put_ptr)(void *ptr);
  31. };
  32. struct bpf_map {
  33. /* 1st cacheline with read-mostly members of which some
  34. * are also accessed in fast-path (e.g. ops, max_entries).
  35. */
  36. const struct bpf_map_ops *ops ____cacheline_aligned;
  37. enum bpf_map_type map_type;
  38. u32 key_size;
  39. u32 value_size;
  40. u32 max_entries;
  41. u32 map_flags;
  42. u32 pages;
  43. bool unpriv_array;
  44. /* 7 bytes hole */
  45. /* 2nd cacheline with misc members to avoid false sharing
  46. * particularly with refcounting.
  47. */
  48. struct user_struct *user ____cacheline_aligned;
  49. atomic_t refcnt;
  50. atomic_t usercnt;
  51. struct work_struct work;
  52. };
  53. struct bpf_map_type_list {
  54. struct list_head list_node;
  55. const struct bpf_map_ops *ops;
  56. enum bpf_map_type type;
  57. };
  58. /* function argument constraints */
  59. enum bpf_arg_type {
  60. ARG_DONTCARE = 0, /* unused argument in helper function */
  61. /* the following constraints used to prototype
  62. * bpf_map_lookup/update/delete_elem() functions
  63. */
  64. ARG_CONST_MAP_PTR, /* const argument used as pointer to bpf_map */
  65. ARG_PTR_TO_MAP_KEY, /* pointer to stack used as map key */
  66. ARG_PTR_TO_MAP_VALUE, /* pointer to stack used as map value */
  67. /* the following constraints used to prototype bpf_memcmp() and other
  68. * functions that access data on eBPF program stack
  69. */
  70. ARG_PTR_TO_STACK, /* any pointer to eBPF program stack */
  71. ARG_PTR_TO_RAW_STACK, /* any pointer to eBPF program stack, area does not
  72. * need to be initialized, helper function must fill
  73. * all bytes or clear them in error case.
  74. */
  75. ARG_CONST_STACK_SIZE, /* number of bytes accessed from stack */
  76. ARG_CONST_STACK_SIZE_OR_ZERO, /* number of bytes accessed from stack or 0 */
  77. ARG_PTR_TO_CTX, /* pointer to context */
  78. ARG_ANYTHING, /* any (initialized) argument is ok */
  79. };
  80. /* type of values returned from helper functions */
  81. enum bpf_return_type {
  82. RET_INTEGER, /* function returns integer */
  83. RET_VOID, /* function doesn't return anything */
  84. RET_PTR_TO_MAP_VALUE_OR_NULL, /* returns a pointer to map elem value or NULL */
  85. };
  86. /* eBPF function prototype used by verifier to allow BPF_CALLs from eBPF programs
  87. * to in-kernel helper functions and for adjusting imm32 field in BPF_CALL
  88. * instructions after verifying
  89. */
  90. struct bpf_func_proto {
  91. u64 (*func)(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
  92. bool gpl_only;
  93. bool pkt_access;
  94. enum bpf_return_type ret_type;
  95. enum bpf_arg_type arg1_type;
  96. enum bpf_arg_type arg2_type;
  97. enum bpf_arg_type arg3_type;
  98. enum bpf_arg_type arg4_type;
  99. enum bpf_arg_type arg5_type;
  100. };
  101. /* bpf_context is intentionally undefined structure. Pointer to bpf_context is
  102. * the first argument to eBPF programs.
  103. * For socket filters: 'struct bpf_context *' == 'struct sk_buff *'
  104. */
  105. struct bpf_context;
  106. enum bpf_access_type {
  107. BPF_READ = 1,
  108. BPF_WRITE = 2
  109. };
  110. /* types of values stored in eBPF registers */
  111. enum bpf_reg_type {
  112. NOT_INIT = 0, /* nothing was written into register */
  113. UNKNOWN_VALUE, /* reg doesn't contain a valid pointer */
  114. PTR_TO_CTX, /* reg points to bpf_context */
  115. CONST_PTR_TO_MAP, /* reg points to struct bpf_map */
  116. PTR_TO_MAP_VALUE, /* reg points to map element value */
  117. PTR_TO_MAP_VALUE_OR_NULL,/* points to map elem value or NULL */
  118. FRAME_PTR, /* reg == frame_pointer */
  119. PTR_TO_STACK, /* reg == frame_pointer + imm */
  120. CONST_IMM, /* constant integer value */
  121. /* PTR_TO_PACKET represents:
  122. * skb->data
  123. * skb->data + imm
  124. * skb->data + (u16) var
  125. * skb->data + (u16) var + imm
  126. * if (range > 0) then [ptr, ptr + range - off) is safe to access
  127. * if (id > 0) means that some 'var' was added
  128. * if (off > 0) menas that 'imm' was added
  129. */
  130. PTR_TO_PACKET,
  131. PTR_TO_PACKET_END, /* skb->data + headlen */
  132. /* PTR_TO_MAP_VALUE_ADJ is used for doing pointer math inside of a map
  133. * elem value. We only allow this if we can statically verify that
  134. * access from this register are going to fall within the size of the
  135. * map element.
  136. */
  137. PTR_TO_MAP_VALUE_ADJ,
  138. };
  139. struct bpf_prog;
  140. struct bpf_verifier_ops {
  141. /* return eBPF function prototype for verification */
  142. const struct bpf_func_proto *(*get_func_proto)(enum bpf_func_id func_id);
  143. /* return true if 'size' wide access at offset 'off' within bpf_context
  144. * with 'type' (read or write) is allowed
  145. */
  146. bool (*is_valid_access)(int off, int size, enum bpf_access_type type,
  147. enum bpf_reg_type *reg_type);
  148. int (*gen_prologue)(struct bpf_insn *insn, bool direct_write,
  149. const struct bpf_prog *prog);
  150. u32 (*convert_ctx_access)(enum bpf_access_type type, int dst_reg,
  151. int src_reg, int ctx_off,
  152. struct bpf_insn *insn, struct bpf_prog *prog);
  153. };
  154. struct bpf_prog_type_list {
  155. struct list_head list_node;
  156. const struct bpf_verifier_ops *ops;
  157. enum bpf_prog_type type;
  158. };
  159. struct bpf_prog_aux {
  160. atomic_t refcnt;
  161. u32 used_map_cnt;
  162. u32 max_ctx_offset;
  163. const struct bpf_verifier_ops *ops;
  164. struct bpf_map **used_maps;
  165. struct bpf_prog *prog;
  166. struct user_struct *user;
  167. union {
  168. struct work_struct work;
  169. struct rcu_head rcu;
  170. };
  171. };
  172. struct bpf_array {
  173. struct bpf_map map;
  174. u32 elem_size;
  175. u32 index_mask;
  176. /* 'ownership' of prog_array is claimed by the first program that
  177. * is going to use this map or by the first program which FD is stored
  178. * in the map to make sure that all callers and callees have the same
  179. * prog_type and JITed flag
  180. */
  181. enum bpf_prog_type owner_prog_type;
  182. bool owner_jited;
  183. union {
  184. char value[0] __aligned(8);
  185. void *ptrs[0] __aligned(8);
  186. void __percpu *pptrs[0] __aligned(8);
  187. };
  188. };
  189. #define MAX_TAIL_CALL_CNT 32
  190. struct bpf_event_entry {
  191. struct perf_event *event;
  192. struct file *perf_file;
  193. struct file *map_file;
  194. struct rcu_head rcu;
  195. };
  196. u64 bpf_tail_call(u64 ctx, u64 r2, u64 index, u64 r4, u64 r5);
  197. u64 bpf_get_stackid(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
  198. bool bpf_prog_array_compatible(struct bpf_array *array, const struct bpf_prog *fp);
  199. const struct bpf_func_proto *bpf_get_trace_printk_proto(void);
  200. typedef unsigned long (*bpf_ctx_copy_t)(void *dst, const void *src,
  201. unsigned long off, unsigned long len);
  202. u64 bpf_event_output(struct bpf_map *map, u64 flags, void *meta, u64 meta_size,
  203. void *ctx, u64 ctx_size, bpf_ctx_copy_t ctx_copy);
  204. #ifdef CONFIG_BPF_SYSCALL
  205. DECLARE_PER_CPU(int, bpf_prog_active);
  206. void bpf_register_prog_type(struct bpf_prog_type_list *tl);
  207. void bpf_register_map_type(struct bpf_map_type_list *tl);
  208. struct bpf_prog *bpf_prog_get(u32 ufd);
  209. struct bpf_prog *bpf_prog_get_type(u32 ufd, enum bpf_prog_type type);
  210. struct bpf_prog *bpf_prog_add(struct bpf_prog *prog, int i);
  211. struct bpf_prog *bpf_prog_inc(struct bpf_prog *prog);
  212. void bpf_prog_put(struct bpf_prog *prog);
  213. struct bpf_map *bpf_map_get_with_uref(u32 ufd);
  214. struct bpf_map *__bpf_map_get(struct fd f);
  215. struct bpf_map *bpf_map_inc(struct bpf_map *map, bool uref);
  216. void bpf_map_put_with_uref(struct bpf_map *map);
  217. void bpf_map_put(struct bpf_map *map);
  218. int bpf_map_precharge_memlock(u32 pages);
  219. void *bpf_map_area_alloc(size_t size);
  220. void bpf_map_area_free(void *base);
  221. extern int sysctl_unprivileged_bpf_disabled;
  222. int bpf_map_new_fd(struct bpf_map *map);
  223. int bpf_prog_new_fd(struct bpf_prog *prog);
  224. int bpf_obj_pin_user(u32 ufd, const char __user *pathname);
  225. int bpf_obj_get_user(const char __user *pathname);
  226. int bpf_percpu_hash_copy(struct bpf_map *map, void *key, void *value);
  227. int bpf_percpu_array_copy(struct bpf_map *map, void *key, void *value);
  228. int bpf_percpu_hash_update(struct bpf_map *map, void *key, void *value,
  229. u64 flags);
  230. int bpf_percpu_array_update(struct bpf_map *map, void *key, void *value,
  231. u64 flags);
  232. int bpf_stackmap_copy(struct bpf_map *map, void *key, void *value);
  233. int bpf_fd_array_map_update_elem(struct bpf_map *map, struct file *map_file,
  234. void *key, void *value, u64 map_flags);
  235. void bpf_fd_array_map_clear(struct bpf_map *map);
  236. /* memcpy that is used with 8-byte aligned pointers, power-of-8 size and
  237. * forced to use 'long' read/writes to try to atomically copy long counters.
  238. * Best-effort only. No barriers here, since it _will_ race with concurrent
  239. * updates from BPF programs. Called from bpf syscall and mostly used with
  240. * size 8 or 16 bytes, so ask compiler to inline it.
  241. */
  242. static inline void bpf_long_memcpy(void *dst, const void *src, u32 size)
  243. {
  244. const long *lsrc = src;
  245. long *ldst = dst;
  246. size /= sizeof(long);
  247. while (size--)
  248. *ldst++ = *lsrc++;
  249. }
  250. /* verify correctness of eBPF program */
  251. int bpf_check(struct bpf_prog **fp, union bpf_attr *attr);
  252. #else
  253. static inline void bpf_register_prog_type(struct bpf_prog_type_list *tl)
  254. {
  255. }
  256. static inline struct bpf_prog *bpf_prog_get(u32 ufd)
  257. {
  258. return ERR_PTR(-EOPNOTSUPP);
  259. }
  260. static inline struct bpf_prog *bpf_prog_get_type(u32 ufd,
  261. enum bpf_prog_type type)
  262. {
  263. return ERR_PTR(-EOPNOTSUPP);
  264. }
  265. static inline struct bpf_prog *bpf_prog_add(struct bpf_prog *prog, int i)
  266. {
  267. return ERR_PTR(-EOPNOTSUPP);
  268. }
  269. static inline void bpf_prog_put(struct bpf_prog *prog)
  270. {
  271. }
  272. static inline struct bpf_prog *bpf_prog_inc(struct bpf_prog *prog)
  273. {
  274. return ERR_PTR(-EOPNOTSUPP);
  275. }
  276. #endif /* CONFIG_BPF_SYSCALL */
  277. /* verifier prototypes for helper functions called from eBPF programs */
  278. extern const struct bpf_func_proto bpf_map_lookup_elem_proto;
  279. extern const struct bpf_func_proto bpf_map_update_elem_proto;
  280. extern const struct bpf_func_proto bpf_map_delete_elem_proto;
  281. extern const struct bpf_func_proto bpf_get_prandom_u32_proto;
  282. extern const struct bpf_func_proto bpf_get_smp_processor_id_proto;
  283. extern const struct bpf_func_proto bpf_tail_call_proto;
  284. extern const struct bpf_func_proto bpf_ktime_get_ns_proto;
  285. extern const struct bpf_func_proto bpf_get_current_pid_tgid_proto;
  286. extern const struct bpf_func_proto bpf_get_current_uid_gid_proto;
  287. extern const struct bpf_func_proto bpf_get_current_comm_proto;
  288. extern const struct bpf_func_proto bpf_skb_vlan_push_proto;
  289. extern const struct bpf_func_proto bpf_skb_vlan_pop_proto;
  290. extern const struct bpf_func_proto bpf_get_stackid_proto;
  291. /* Shared helpers among cBPF and eBPF. */
  292. void bpf_user_rnd_init_once(void);
  293. u64 bpf_user_rnd_u32(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
  294. #endif /* _LINUX_BPF_H */