/* Copyright (c) 2011-2014 PLUMgrid, http://plumgrid.com
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of version 2 of the GNU General Public
 * License as published by the Free Software Foundation.
 */
7#ifndef _LINUX_BPF_H
8#define _LINUX_BPF_H 1
9
10#include <uapi/linux/bpf.h>
11#include <linux/workqueue.h>
Alexei Starovoitovdb20fd22014-09-26 00:16:59 -070012#include <linux/file.h>
Alexei Starovoitovb121d1e2016-03-07 21:57:13 -080013#include <linux/percpu.h>
Zi Shen Lim002245c2016-06-08 21:18:47 -070014#include <linux/err.h>
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070015
Daniel Borkmann3b1efb12016-06-15 22:47:14 +020016struct perf_event;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070017struct bpf_map;
18
19/* map is generic key/value storage optionally accesible by eBPF programs */
20struct bpf_map_ops {
21 /* funcs callable from userspace (via syscall) */
22 struct bpf_map *(*map_alloc)(union bpf_attr *attr);
Daniel Borkmann61d1b6a2016-06-15 22:47:12 +020023 void (*map_release)(struct bpf_map *map, struct file *map_file);
24 void (*map_free)(struct bpf_map *map);
Alexei Starovoitovdb20fd22014-09-26 00:16:59 -070025 int (*map_get_next_key)(struct bpf_map *map, void *key, void *next_key);
26
27 /* funcs callable from userspace and from eBPF programs */
28 void *(*map_lookup_elem)(struct bpf_map *map, void *key);
Alexei Starovoitov3274f522014-11-13 17:36:44 -080029 int (*map_update_elem)(struct bpf_map *map, void *key, void *value, u64 flags);
Alexei Starovoitovdb20fd22014-09-26 00:16:59 -070030 int (*map_delete_elem)(struct bpf_map *map, void *key);
Wang Nan2a36f0b2015-08-06 07:02:33 +000031
32 /* funcs called by prog_array and perf_event_array map */
Daniel Borkmannd056a782016-06-15 22:47:13 +020033 void *(*map_fd_get_ptr)(struct bpf_map *map, struct file *map_file,
34 int fd);
35 void (*map_fd_put_ptr)(void *ptr);
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070036};
37
38struct bpf_map {
39 atomic_t refcnt;
40 enum bpf_map_type map_type;
41 u32 key_size;
42 u32 value_size;
43 u32 max_entries;
Alexei Starovoitov6c905982016-03-07 21:57:15 -080044 u32 map_flags;
Alexei Starovoitovaaac3ba2015-10-07 22:23:22 -070045 u32 pages;
46 struct user_struct *user;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +010047 const struct bpf_map_ops *ops;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070048 struct work_struct work;
Daniel Borkmannc9da1612015-11-24 21:28:15 +010049 atomic_t usercnt;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070050};
51
52struct bpf_map_type_list {
53 struct list_head list_node;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +010054 const struct bpf_map_ops *ops;
Alexei Starovoitov99c55f72014-09-26 00:16:57 -070055 enum bpf_map_type type;
56};
57
/* function argument constraints; used for the argN_type fields of
 * struct bpf_func_proto
 */
enum bpf_arg_type {
	ARG_DONTCARE = 0,	/* unused argument in helper function */

	/* the following constraints used to prototype
	 * bpf_map_lookup/update/delete_elem() functions
	 */
	ARG_CONST_MAP_PTR,	/* const argument used as pointer to bpf_map */
	ARG_PTR_TO_MAP_KEY,	/* pointer to stack used as map key */
	ARG_PTR_TO_MAP_VALUE,	/* pointer to stack used as map value */

	/* the following constraints used to prototype bpf_memcmp() and other
	 * functions that access data on eBPF program stack
	 */
	ARG_PTR_TO_STACK,	/* any pointer to eBPF program stack */
	ARG_PTR_TO_RAW_STACK,	/* any pointer to eBPF program stack, area does not
				 * need to be initialized, helper function must fill
				 * all bytes or clear them in error case.
				 */

	ARG_CONST_STACK_SIZE,	/* number of bytes accessed from stack */
	ARG_CONST_STACK_SIZE_OR_ZERO, /* number of bytes accessed from stack or 0 */

	ARG_PTR_TO_CTX,		/* pointer to context */
	ARG_ANYTHING,		/* any (initialized) argument is ok */
};
84
/* type of values returned from helper functions; used for the ret_type
 * field of struct bpf_func_proto
 */
enum bpf_return_type {
	RET_INTEGER,			/* function returns integer */
	RET_VOID,			/* function doesn't return anything */
	RET_PTR_TO_MAP_VALUE_OR_NULL,	/* returns a pointer to map elem value or NULL */
};
91
Alexei Starovoitov09756af2014-09-26 00:17:00 -070092/* eBPF function prototype used by verifier to allow BPF_CALLs from eBPF programs
93 * to in-kernel helper functions and for adjusting imm32 field in BPF_CALL
94 * instructions after verifying
95 */
96struct bpf_func_proto {
97 u64 (*func)(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
98 bool gpl_only;
Daniel Borkmann36bbef52016-09-20 00:26:13 +020099 bool pkt_access;
Alexei Starovoitov17a52672014-09-26 00:17:06 -0700100 enum bpf_return_type ret_type;
101 enum bpf_arg_type arg1_type;
102 enum bpf_arg_type arg2_type;
103 enum bpf_arg_type arg3_type;
104 enum bpf_arg_type arg4_type;
105 enum bpf_arg_type arg5_type;
106};
107
/* bpf_context is intentionally undefined structure. Pointer to bpf_context is
 * the first argument to eBPF programs.
 * For socket filters: 'struct bpf_context *' == 'struct sk_buff *'
 */
struct bpf_context;
113
/* Kind of memory access; passed to the is_valid_access() and
 * convert_ctx_access() callbacks of struct bpf_verifier_ops.
 */
enum bpf_access_type {
	BPF_READ = 1,
	BPF_WRITE = 2
};
118
/* types of values stored in eBPF registers */
enum bpf_reg_type {
	NOT_INIT = 0,		 /* nothing was written into register */
	UNKNOWN_VALUE,		 /* reg doesn't contain a valid pointer */
	PTR_TO_CTX,		 /* reg points to bpf_context */
	CONST_PTR_TO_MAP,	 /* reg points to struct bpf_map */
	PTR_TO_MAP_VALUE,	 /* reg points to map element value */
	PTR_TO_MAP_VALUE_OR_NULL,/* points to map elem value or NULL */
	FRAME_PTR,		 /* reg == frame_pointer */
	PTR_TO_STACK,		 /* reg == frame_pointer + imm */
	CONST_IMM,		 /* constant integer value */

	/* PTR_TO_PACKET represents:
	 * skb->data
	 * skb->data + imm
	 * skb->data + (u16) var
	 * skb->data + (u16) var + imm
	 * if (range > 0) then [ptr, ptr + range - off) is safe to access
	 * if (id > 0) means that some 'var' was added
	 * if (off > 0) means that 'imm' was added
	 */
	PTR_TO_PACKET,
	PTR_TO_PACKET_END,	 /* skb->data + headlen */

	/* PTR_TO_MAP_VALUE_ADJ is used for doing pointer math inside of a map
	 * elem value.  We only allow this if we can statically verify that
	 * accesses from this register are going to fall within the size of the
	 * map element.
	 */
	PTR_TO_MAP_VALUE_ADJ,
};
150
Alexei Starovoitovff936a02015-10-07 10:55:41 -0700151struct bpf_prog;
152
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700153struct bpf_verifier_ops {
154 /* return eBPF function prototype for verification */
155 const struct bpf_func_proto *(*get_func_proto)(enum bpf_func_id func_id);
Alexei Starovoitov17a52672014-09-26 00:17:06 -0700156
157 /* return true if 'size' wide access at offset 'off' within bpf_context
158 * with 'type' (read or write) is allowed
159 */
Alexei Starovoitov19de99f2016-06-15 18:25:38 -0700160 bool (*is_valid_access)(int off, int size, enum bpf_access_type type,
161 enum bpf_reg_type *reg_type);
Daniel Borkmann36bbef52016-09-20 00:26:13 +0200162 int (*gen_prologue)(struct bpf_insn *insn, bool direct_write,
163 const struct bpf_prog *prog);
Alexei Starovoitovd691f9e2015-06-04 10:11:54 -0700164 u32 (*convert_ctx_access)(enum bpf_access_type type, int dst_reg,
165 int src_reg, int ctx_off,
Alexei Starovoitovff936a02015-10-07 10:55:41 -0700166 struct bpf_insn *insn, struct bpf_prog *prog);
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700167};
168
169struct bpf_prog_type_list {
170 struct list_head list_node;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +0100171 const struct bpf_verifier_ops *ops;
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700172 enum bpf_prog_type type;
173};
174
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700175struct bpf_prog_aux {
176 atomic_t refcnt;
Daniel Borkmann24701ec2015-03-01 12:31:47 +0100177 u32 used_map_cnt;
Alexei Starovoitov32bbe002016-04-06 18:43:28 -0700178 u32 max_ctx_offset;
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +0100179 const struct bpf_verifier_ops *ops;
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700180 struct bpf_map **used_maps;
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700181 struct bpf_prog *prog;
Alexei Starovoitovaaac3ba2015-10-07 22:23:22 -0700182 struct user_struct *user;
Alexei Starovoitovabf2e7d2015-05-28 19:26:02 -0700183 union {
184 struct work_struct work;
185 struct rcu_head rcu;
186 };
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700187};
188
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700189struct bpf_array {
190 struct bpf_map map;
191 u32 elem_size;
192 /* 'ownership' of prog_array is claimed by the first program that
193 * is going to use this map or by the first program which FD is stored
194 * in the map to make sure that all callers and callees have the same
195 * prog_type and JITed flag
196 */
197 enum bpf_prog_type owner_prog_type;
198 bool owner_jited;
199 union {
200 char value[0] __aligned(8);
Wang Nan2a36f0b2015-08-06 07:02:33 +0000201 void *ptrs[0] __aligned(8);
Alexei Starovoitova10423b2016-02-01 22:39:54 -0800202 void __percpu *pptrs[0] __aligned(8);
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700203 };
204};
Daniel Borkmann3b1efb12016-06-15 22:47:14 +0200205
#define MAX_TAIL_CALL_CNT 32
207
Daniel Borkmann3b1efb12016-06-15 22:47:14 +0200208struct bpf_event_entry {
209 struct perf_event *event;
210 struct file *perf_file;
211 struct file *map_file;
212 struct rcu_head rcu;
213};
214
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700215u64 bpf_tail_call(u64 ctx, u64 r2, u64 index, u64 r4, u64 r5);
Alexei Starovoitov9940d672016-04-06 18:43:27 -0700216u64 bpf_get_stackid(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
Daniel Borkmannd056a782016-06-15 22:47:13 +0200217
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700218bool bpf_prog_array_compatible(struct bpf_array *array, const struct bpf_prog *fp);
Daniel Borkmannf1f77142017-01-13 23:38:15 +0100219int bpf_prog_calc_tag(struct bpf_prog *fp);
Daniel Borkmannbd570ff2016-04-18 21:01:24 +0200220
Alexei Starovoitov0756ea32015-06-12 19:39:13 -0700221const struct bpf_func_proto *bpf_get_trace_printk_proto(void);
Daniel Borkmann555c8a82016-07-14 18:08:05 +0200222
223typedef unsigned long (*bpf_ctx_copy_t)(void *dst, const void *src,
Daniel Borkmannaa7145c2016-07-22 01:19:42 +0200224 unsigned long off, unsigned long len);
Daniel Borkmann555c8a82016-07-14 18:08:05 +0200225
226u64 bpf_event_output(struct bpf_map *map, u64 flags, void *meta, u64 meta_size,
227 void *ctx, u64 ctx_size, bpf_ctx_copy_t ctx_copy);
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700228
Alexei Starovoitov89aa0752014-12-01 15:06:35 -0800229#ifdef CONFIG_BPF_SYSCALL
Alexei Starovoitovb121d1e2016-03-07 21:57:13 -0800230DECLARE_PER_CPU(int, bpf_prog_active);
231
Daniel Borkmann0fc174d2015-03-01 12:31:44 +0100232void bpf_register_prog_type(struct bpf_prog_type_list *tl);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100233void bpf_register_map_type(struct bpf_map_type_list *tl);
Daniel Borkmann0fc174d2015-03-01 12:31:44 +0100234
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700235struct bpf_prog *bpf_prog_get(u32 ufd);
Daniel Borkmann113214b2016-06-30 17:24:44 +0200236struct bpf_prog *bpf_prog_get_type(u32 ufd, enum bpf_prog_type type);
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100237struct bpf_prog * __must_check bpf_prog_add(struct bpf_prog *prog, int i);
Daniel Borkmannc5405942016-11-09 22:02:34 +0100238void bpf_prog_sub(struct bpf_prog *prog, int i);
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100239struct bpf_prog * __must_check bpf_prog_inc(struct bpf_prog *prog);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100240void bpf_prog_put(struct bpf_prog *prog);
Daniel Borkmann5ccb0712016-12-18 01:52:58 +0100241int __bpf_prog_charge(struct user_struct *user, u32 pages);
242void __bpf_prog_uncharge(struct user_struct *user, u32 pages);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100243
Daniel Borkmannc9da1612015-11-24 21:28:15 +0100244struct bpf_map *bpf_map_get_with_uref(u32 ufd);
Daniel Borkmannc2101292015-10-29 14:58:07 +0100245struct bpf_map *__bpf_map_get(struct fd f);
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100246struct bpf_map * __must_check bpf_map_inc(struct bpf_map *map, bool uref);
Daniel Borkmannc9da1612015-11-24 21:28:15 +0100247void bpf_map_put_with_uref(struct bpf_map *map);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100248void bpf_map_put(struct bpf_map *map);
Alexei Starovoitov6c905982016-03-07 21:57:15 -0800249int bpf_map_precharge_memlock(u32 pages);
Daniel Borkmannd407bd22017-01-18 15:14:17 +0100250void *bpf_map_area_alloc(size_t size);
251void bpf_map_area_free(void *base);
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100252
Alexei Starovoitov1be7f752015-10-07 22:23:21 -0700253extern int sysctl_unprivileged_bpf_disabled;
254
Daniel Borkmannb2197752015-10-29 14:58:09 +0100255int bpf_map_new_fd(struct bpf_map *map);
256int bpf_prog_new_fd(struct bpf_prog *prog);
257
258int bpf_obj_pin_user(u32 ufd, const char __user *pathname);
259int bpf_obj_get_user(const char __user *pathname);
260
Alexei Starovoitov15a07b32016-02-01 22:39:55 -0800261int bpf_percpu_hash_copy(struct bpf_map *map, void *key, void *value);
262int bpf_percpu_array_copy(struct bpf_map *map, void *key, void *value);
263int bpf_percpu_hash_update(struct bpf_map *map, void *key, void *value,
264 u64 flags);
265int bpf_percpu_array_update(struct bpf_map *map, void *key, void *value,
266 u64 flags);
Daniel Borkmannd056a782016-06-15 22:47:13 +0200267
Alexei Starovoitov557c0c62016-03-07 21:57:17 -0800268int bpf_stackmap_copy(struct bpf_map *map, void *key, void *value);
Alexei Starovoitov15a07b32016-02-01 22:39:55 -0800269
Daniel Borkmannd056a782016-06-15 22:47:13 +0200270int bpf_fd_array_map_update_elem(struct bpf_map *map, struct file *map_file,
271 void *key, void *value, u64 map_flags);
272void bpf_fd_array_map_clear(struct bpf_map *map);
273
/* memcpy that is used with 8-byte aligned pointers, a size that is a
 * multiple of 8, and forced to use 'long' read/writes to try to atomically
 * copy long counters.
 * Best-effort only.  No barriers here, since it _will_ race with concurrent
 * updates from BPF programs. Called from bpf syscall and mostly used with
 * size 8 or 16 bytes, so ask compiler to inline it.
 *
 * @dst:  destination buffer, written one 'long' at a time
 * @src:  source buffer, read one 'long' at a time
 * @size: number of bytes to copy; it is divided by sizeof(long) with
 *        truncation, so any trailing bytes that do not make up a whole
 *        'long' are not copied
 */
static inline void bpf_long_memcpy(void *dst, const void *src, u32 size)
{
	const long *lsrc = src;
	long *ldst = dst;

	/* convert the byte count into a count of whole longs */
	size /= sizeof(long);
	while (size--)
		*ldst++ = *lsrc++;
}
289
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100290/* verify correctness of eBPF program */
Alexei Starovoitov9bac3d62015-03-13 11:57:42 -0700291int bpf_check(struct bpf_prog **fp, union bpf_attr *attr);
Daniel Borkmann0fc174d2015-03-01 12:31:44 +0100292#else
/* !CONFIG_BPF_SYSCALL stub: does nothing */
static inline void bpf_register_prog_type(struct bpf_prog_type_list *tl)
{
}
296
297static inline struct bpf_prog *bpf_prog_get(u32 ufd)
298{
299 return ERR_PTR(-EOPNOTSUPP);
300}
301
Daniel Borkmann113214b2016-06-30 17:24:44 +0200302static inline struct bpf_prog *bpf_prog_get_type(u32 ufd,
303 enum bpf_prog_type type)
304{
305 return ERR_PTR(-EOPNOTSUPP);
306}
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100307static inline struct bpf_prog * __must_check bpf_prog_add(struct bpf_prog *prog,
308 int i)
Brenden Blancocc2e0b32016-07-20 07:55:52 -0700309{
310 return ERR_PTR(-EOPNOTSUPP);
311}
Daniel Borkmann113214b2016-06-30 17:24:44 +0200312
/* !CONFIG_BPF_SYSCALL stub: does nothing */
static inline void bpf_prog_sub(struct bpf_prog *prog, int i)
{
}
316
/* !CONFIG_BPF_SYSCALL stub: does nothing */
static inline void bpf_prog_put(struct bpf_prog *prog)
{
}
Daniel Borkmann6d67942dd2016-11-19 01:45:03 +0100320
321static inline struct bpf_prog * __must_check bpf_prog_inc(struct bpf_prog *prog)
Alexei Starovoitovaa6a5f32016-09-01 18:37:24 -0700322{
323 return ERR_PTR(-EOPNOTSUPP);
324}
Daniel Borkmann5ccb0712016-12-18 01:52:58 +0100325
/* !CONFIG_BPF_SYSCALL stub: ignores its arguments and always returns 0 */
static inline int __bpf_prog_charge(struct user_struct *user, u32 pages)
{
	return 0;
}
330
331static inline void __bpf_prog_uncharge(struct user_struct *user, u32 pages)
332{
333}
Daniel Borkmann61e021f2015-03-02 15:21:55 +0100334#endif /* CONFIG_BPF_SYSCALL */
Alexei Starovoitov09756af2014-09-26 00:17:00 -0700335
Alexei Starovoitovd0003ec2014-11-13 17:36:49 -0800336/* verifier prototypes for helper functions called from eBPF programs */
Daniel Borkmanna2c83ff2015-03-01 12:31:42 +0100337extern const struct bpf_func_proto bpf_map_lookup_elem_proto;
338extern const struct bpf_func_proto bpf_map_update_elem_proto;
339extern const struct bpf_func_proto bpf_map_delete_elem_proto;
Alexei Starovoitovd0003ec2014-11-13 17:36:49 -0800340
Daniel Borkmann03e69b52015-03-14 02:27:16 +0100341extern const struct bpf_func_proto bpf_get_prandom_u32_proto;
Daniel Borkmannc04167c2015-03-14 02:27:17 +0100342extern const struct bpf_func_proto bpf_get_smp_processor_id_proto;
Daniel Borkmann2d0e30c2016-10-21 12:46:33 +0200343extern const struct bpf_func_proto bpf_get_numa_node_id_proto;
Alexei Starovoitov04fd61a2015-05-19 16:59:03 -0700344extern const struct bpf_func_proto bpf_tail_call_proto;
Daniel Borkmann17ca8cb2015-05-29 23:23:06 +0200345extern const struct bpf_func_proto bpf_ktime_get_ns_proto;
Alexei Starovoitovffeedaf2015-06-12 19:39:12 -0700346extern const struct bpf_func_proto bpf_get_current_pid_tgid_proto;
347extern const struct bpf_func_proto bpf_get_current_uid_gid_proto;
348extern const struct bpf_func_proto bpf_get_current_comm_proto;
Alexei Starovoitov4e10df92015-07-20 20:34:18 -0700349extern const struct bpf_func_proto bpf_skb_vlan_push_proto;
350extern const struct bpf_func_proto bpf_skb_vlan_pop_proto;
Alexei Starovoitovd5a3b1f2016-02-17 19:58:58 -0800351extern const struct bpf_func_proto bpf_get_stackid_proto;
Daniel Borkmann03e69b52015-03-14 02:27:16 +0100352
Daniel Borkmann3ad00402015-10-08 01:20:39 +0200353/* Shared helpers among cBPF and eBPF. */
354void bpf_user_rnd_init_once(void);
355u64 bpf_user_rnd_u32(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
356
Alexei Starovoitov99c55f72014-09-26 00:16:57 -0700357#endif /* _LINUX_BPF_H */