/* Copyright (c) 2011-2014 PLUMgrid, http://plumgrid.com
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of version 2 of the GNU General Public
 * License as published by the Free Software Foundation.
 */
#ifndef _LINUX_BPF_H
#define _LINUX_BPF_H 1

#include <uapi/linux/bpf.h>
#include <linux/workqueue.h>
#include <linux/file.h>
#include <linux/percpu.h>
#include <linux/err.h>

struct perf_event;
struct bpf_map;

/* map is generic key/value storage optionally accessible by eBPF programs */
struct bpf_map_ops {
	/* funcs callable from userspace (via syscall) */
	struct bpf_map *(*map_alloc)(union bpf_attr *attr);
	void (*map_release)(struct bpf_map *map, struct file *map_file);
	void (*map_free)(struct bpf_map *map);
	int (*map_get_next_key)(struct bpf_map *map, void *key, void *next_key);

	/* funcs callable from userspace and from eBPF programs */
	void *(*map_lookup_elem)(struct bpf_map *map, void *key);
	int (*map_update_elem)(struct bpf_map *map, void *key, void *value, u64 flags);
	int (*map_delete_elem)(struct bpf_map *map, void *key);

	/* funcs called by prog_array and perf_event_array map */
	void *(*map_fd_get_ptr)(struct bpf_map *map, struct file *map_file,
				int fd);
	void (*map_fd_put_ptr)(void *ptr);
};
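
/* Illustrative sketch (not part of this header): a map implementation fills
 * in bpf_map_ops so the core can dispatch syscall and program-side operations
 * through it.  All "example_*" names below are hypothetical placeholders,
 * not functions from the kernel tree:
 *
 *	static const struct bpf_map_ops example_map_ops = {
 *		.map_alloc		= example_map_alloc,
 *		.map_free		= example_map_free,
 *		.map_get_next_key	= example_map_get_next_key,
 *		.map_lookup_elem	= example_map_lookup_elem,
 *		.map_update_elem	= example_map_update_elem,
 *		.map_delete_elem	= example_map_delete_elem,
 *	};
 */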

struct bpf_map {
	/* 1st cacheline with read-mostly members of which some
	 * are also accessed in fast-path (e.g. ops, max_entries).
	 */
	const struct bpf_map_ops *ops ____cacheline_aligned;
	enum bpf_map_type map_type;
	u32 key_size;
	u32 value_size;
	u32 max_entries;
	u32 map_flags;
	u32 pages;
	bool unpriv_array;
	/* 7 bytes hole */

	/* 2nd cacheline with misc members to avoid false sharing,
	 * particularly with refcounting.
	 */
	struct user_struct *user ____cacheline_aligned;
	atomic_t refcnt;
	atomic_t usercnt;
	struct work_struct work;
};

struct bpf_map_type_list {
	struct list_head list_node;
	const struct bpf_map_ops *ops;
	enum bpf_map_type type;
};

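/* Illustrative sketch (hypothetical code, not copied from the kernel tree):
 * a map implementation registers its ops for a given map type from an
 * initcall, so map creation can find them by attr->map_type.
 * "example_map_ops" is the placeholder from the sketch above:
 *
 *	static struct bpf_map_type_list example_map_type __read_mostly = {
 *		.ops	= &example_map_ops,
 *		.type	= BPF_MAP_TYPE_ARRAY,
 *	};
 *
 *	static int __init register_example_map(void)
 *	{
 *		bpf_register_map_type(&example_map_type);
 *		return 0;
 *	}
 *	late_initcall(register_example_map);
 */
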
/* function argument constraints */
enum bpf_arg_type {
	ARG_DONTCARE = 0,	/* unused argument in helper function */

	/* the following constraints are used to prototype
	 * bpf_map_lookup/update/delete_elem() functions
	 */
	ARG_CONST_MAP_PTR,	/* const argument used as pointer to bpf_map */
	ARG_PTR_TO_MAP_KEY,	/* pointer to stack used as map key */
	ARG_PTR_TO_MAP_VALUE,	/* pointer to stack used as map value */

	/* the following constraints are used to prototype bpf_memcmp() and
	 * other functions that access data on the eBPF program stack
	 */
	ARG_PTR_TO_STACK,	/* any pointer to eBPF program stack */
	ARG_PTR_TO_RAW_STACK,	/* any pointer to eBPF program stack, area does not
				 * need to be initialized, helper function must fill
				 * all bytes or clear them in error case.
				 */

	ARG_CONST_STACK_SIZE,	/* number of bytes accessed from stack */
	ARG_CONST_STACK_SIZE_OR_ZERO, /* number of bytes accessed from stack or 0 */

	ARG_PTR_TO_CTX,		/* pointer to context */
	ARG_ANYTHING,		/* any (initialized) argument is ok */
};

/* type of values returned from helper functions */
enum bpf_return_type {
	RET_INTEGER,			/* function returns integer */
	RET_VOID,			/* function doesn't return anything */
	RET_PTR_TO_MAP_VALUE_OR_NULL,	/* returns a pointer to map elem value or NULL */
};

/* eBPF function prototype used by the verifier to allow BPF_CALLs from eBPF
 * programs to in-kernel helper functions and for adjusting the imm32 field
 * in BPF_CALL instructions after verification
 */
struct bpf_func_proto {
	u64 (*func)(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);
	bool gpl_only;
	bool pkt_access;
	enum bpf_return_type ret_type;
	enum bpf_arg_type arg1_type;
	enum bpf_arg_type arg2_type;
	enum bpf_arg_type arg3_type;
	enum bpf_arg_type arg4_type;
	enum bpf_arg_type arg5_type;
};

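/* Illustrative sketch: a helper prototype as the verifier consumes it.  This
 * mirrors how the in-tree bpf_map_lookup_elem() helper is described (a map
 * pointer plus a stack pointer used as key, returning a map value pointer or
 * NULL), but treat the exact field values as an example only:
 *
 *	const struct bpf_func_proto bpf_map_lookup_elem_proto = {
 *		.func		= bpf_map_lookup_elem,
 *		.gpl_only	= false,
 *		.ret_type	= RET_PTR_TO_MAP_VALUE_OR_NULL,
 *		.arg1_type	= ARG_CONST_MAP_PTR,
 *		.arg2_type	= ARG_PTR_TO_MAP_KEY,
 *	};
 */
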
/* bpf_context is an intentionally undefined structure. A pointer to
 * bpf_context is the first argument to eBPF programs.
 * For socket filters: 'struct bpf_context *' == 'struct sk_buff *'
 */
struct bpf_context;

enum bpf_access_type {
	BPF_READ = 1,
	BPF_WRITE = 2
};

/* types of values stored in eBPF registers */
enum bpf_reg_type {
	NOT_INIT = 0,		 /* nothing was written into register */
	UNKNOWN_VALUE,		 /* reg doesn't contain a valid pointer */
	PTR_TO_CTX,		 /* reg points to bpf_context */
	CONST_PTR_TO_MAP,	 /* reg points to struct bpf_map */
	PTR_TO_MAP_VALUE,	 /* reg points to map element value */
	PTR_TO_MAP_VALUE_OR_NULL,/* points to map elem value or NULL */
	FRAME_PTR,		 /* reg == frame_pointer */
	PTR_TO_STACK,		 /* reg == frame_pointer + imm */
	CONST_IMM,		 /* constant integer value */

	/* PTR_TO_PACKET represents:
	 * skb->data
	 * skb->data + imm
	 * skb->data + (u16) var
	 * skb->data + (u16) var + imm
	 * if (range > 0) then [ptr, ptr + range - off) is safe to access
	 * if (id > 0) means that some 'var' was added
	 * if (off > 0) means that 'imm' was added
	 */
	PTR_TO_PACKET,
	PTR_TO_PACKET_END,	 /* skb->data + headlen */

	/* PTR_TO_MAP_VALUE_ADJ is used for doing pointer math inside of a map
	 * elem value. We only allow this if we can statically verify that
	 * accesses from this register are going to fall within the size of
	 * the map element.
	 */
	PTR_TO_MAP_VALUE_ADJ,
};

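/* Illustrative sketch: the PTR_TO_PACKET/PTR_TO_PACKET_END pair is what lets
 * the verifier accept direct packet access written like the following in a
 * program (program author's point of view; the data/data_end context fields
 * assume the TC/XDP-style contexts of this era):
 *
 *	void *data     = (void *)(long)skb->data;
 *	void *data_end = (void *)(long)skb->data_end;
 *	struct ethhdr *eth = data;
 *
 *	if (data + sizeof(*eth) > data_end)
 *		return TC_ACT_OK;	// not provably in range, bail out
 *	// after the check, eth->h_proto may be read directly
 */
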
struct bpf_prog;

struct bpf_verifier_ops {
	/* return eBPF function prototype for verification */
	const struct bpf_func_proto *(*get_func_proto)(enum bpf_func_id func_id);

	/* return true if 'size' wide access at offset 'off' within bpf_context
	 * with 'type' (read or write) is allowed
	 */
	bool (*is_valid_access)(int off, int size, enum bpf_access_type type,
				enum bpf_reg_type *reg_type);
	int (*gen_prologue)(struct bpf_insn *insn, bool direct_write,
			    const struct bpf_prog *prog);
	u32 (*convert_ctx_access)(enum bpf_access_type type, int dst_reg,
				  int src_reg, int ctx_off,
				  struct bpf_insn *insn, struct bpf_prog *prog);
};

struct bpf_prog_type_list {
	struct list_head list_node;
	const struct bpf_verifier_ops *ops;
	enum bpf_prog_type type;
};

struct bpf_prog_aux {
	atomic_t refcnt;
	u32 used_map_cnt;
	u32 max_ctx_offset;
	const struct bpf_verifier_ops *ops;
	struct bpf_map **used_maps;
	struct bpf_prog *prog;
	struct user_struct *user;
	union {
		struct work_struct work;
		struct rcu_head rcu;
	};
};

struct bpf_array {
	struct bpf_map map;
	u32 elem_size;
	u32 index_mask;
	/* 'ownership' of prog_array is claimed by the first program that
	 * is going to use this map or by the first program whose FD is
	 * stored in the map, to make sure that all callers and callees
	 * have the same prog_type and JITed flag
	 */
	enum bpf_prog_type owner_prog_type;
	bool owner_jited;
	union {
		char value[0] __aligned(8);
		void *ptrs[0] __aligned(8);
		void __percpu *pptrs[0] __aligned(8);
	};
};

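/* Illustrative sketch (an assumption about how the fields above fit together,
 * not code copied from the kernel): an array map derives an element address
 * from value[], elem_size and index_mask; the mask bounds the index for maps
 * created by unprivileged users to blunt speculative out-of-bounds access:
 *
 *	static void *example_array_elem(struct bpf_array *array, u32 index)
 *	{
 *		if (index >= array->map.max_entries)
 *			return NULL;
 *		return array->value +
 *		       array->elem_size * (index & array->index_mask);
 *	}
 */
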
#define MAX_TAIL_CALL_CNT 32

struct bpf_event_entry {
	struct perf_event *event;
	struct file *perf_file;
	struct file *map_file;
	struct rcu_head rcu;
};

u64 bpf_tail_call(u64 ctx, u64 r2, u64 index, u64 r4, u64 r5);
u64 bpf_get_stackid(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);

bool bpf_prog_array_compatible(struct bpf_array *array, const struct bpf_prog *fp);

const struct bpf_func_proto *bpf_get_trace_printk_proto(void);

typedef unsigned long (*bpf_ctx_copy_t)(void *dst, const void *src,
					unsigned long off, unsigned long len);

u64 bpf_event_output(struct bpf_map *map, u64 flags, void *meta, u64 meta_size,
		     void *ctx, u64 ctx_size, bpf_ctx_copy_t ctx_copy);

#ifdef CONFIG_BPF_SYSCALL
DECLARE_PER_CPU(int, bpf_prog_active);

void bpf_register_prog_type(struct bpf_prog_type_list *tl);
void bpf_register_map_type(struct bpf_map_type_list *tl);

struct bpf_prog *bpf_prog_get(u32 ufd);
struct bpf_prog *bpf_prog_get_type(u32 ufd, enum bpf_prog_type type);
struct bpf_prog *bpf_prog_add(struct bpf_prog *prog, int i);
struct bpf_prog *bpf_prog_inc(struct bpf_prog *prog);
void bpf_prog_put(struct bpf_prog *prog);

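/* Illustrative usage sketch (an assumption about typical callers, not a
 * kernel code excerpt): a subsystem attaching a program takes a reference
 * through one of the getters above and drops it with bpf_prog_put():
 *
 *	struct bpf_prog *prog;
 *
 *	prog = bpf_prog_get_type(ufd, BPF_PROG_TYPE_SOCKET_FILTER);
 *	if (IS_ERR(prog))
 *		return PTR_ERR(prog);
 *	// ... attach prog somewhere, keeping the reference ...
 *	bpf_prog_put(prog);	// on detach or error path
 */
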
struct bpf_map *bpf_map_get_with_uref(u32 ufd);
struct bpf_map *__bpf_map_get(struct fd f);
struct bpf_map *bpf_map_inc(struct bpf_map *map, bool uref);
void bpf_map_put_with_uref(struct bpf_map *map);
void bpf_map_put(struct bpf_map *map);
int bpf_map_precharge_memlock(u32 pages);
void *bpf_map_area_alloc(size_t size);
void bpf_map_area_free(void *base);

extern int sysctl_unprivileged_bpf_disabled;

int bpf_map_new_fd(struct bpf_map *map);
int bpf_prog_new_fd(struct bpf_prog *prog);

int bpf_obj_pin_user(u32 ufd, const char __user *pathname);
int bpf_obj_get_user(const char __user *pathname);

int bpf_percpu_hash_copy(struct bpf_map *map, void *key, void *value);
int bpf_percpu_array_copy(struct bpf_map *map, void *key, void *value);
int bpf_percpu_hash_update(struct bpf_map *map, void *key, void *value,
			   u64 flags);
int bpf_percpu_array_update(struct bpf_map *map, void *key, void *value,
			    u64 flags);

int bpf_stackmap_copy(struct bpf_map *map, void *key, void *value);

int bpf_fd_array_map_update_elem(struct bpf_map *map, struct file *map_file,
				 void *key, void *value, u64 map_flags);
void bpf_fd_array_map_clear(struct bpf_map *map);

/* memcpy that is used with 8-byte aligned pointers, a size that is a multiple
 * of 8 and forced to use 'long' read/writes to try to atomically copy long
 * counters. Best-effort only. No barriers here, since it _will_ race with
 * concurrent updates from BPF programs. Called from bpf syscall and mostly
 * used with size 8 or 16 bytes, so ask compiler to inline it.
 */
static inline void bpf_long_memcpy(void *dst, const void *src, u32 size)
{
	const long *lsrc = src;
	long *ldst = dst;

	size /= sizeof(long);
	while (size--)
		*ldst++ = *lsrc++;
}

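/* Illustrative usage sketch (an assumption, mirroring what the per-cpu map
 * copy helpers declared above need to do): gathering a per-cpu value into a
 * flat user-visible buffer, one 8-byte-rounded chunk per possible CPU:
 *
 *	u32 size = round_up(map->value_size, 8);
 *	void __percpu *pptr = ...;	// per-cpu storage of the element
 *	int cpu, off = 0;
 *
 *	for_each_possible_cpu(cpu) {
 *		bpf_long_memcpy(value + off, per_cpu_ptr(pptr, cpu), size);
 *		off += size;
 *	}
 */
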
/* verify correctness of eBPF program */
int bpf_check(struct bpf_prog **fp, union bpf_attr *attr);
#else
static inline void bpf_register_prog_type(struct bpf_prog_type_list *tl)
{
}

static inline struct bpf_prog *bpf_prog_get(u32 ufd)
{
	return ERR_PTR(-EOPNOTSUPP);
}

static inline struct bpf_prog *bpf_prog_get_type(u32 ufd,
						 enum bpf_prog_type type)
{
	return ERR_PTR(-EOPNOTSUPP);
}

static inline struct bpf_prog *bpf_prog_add(struct bpf_prog *prog, int i)
{
	return ERR_PTR(-EOPNOTSUPP);
}

static inline void bpf_prog_put(struct bpf_prog *prog)
{
}

static inline struct bpf_prog *bpf_prog_inc(struct bpf_prog *prog)
{
	return ERR_PTR(-EOPNOTSUPP);
}
#endif /* CONFIG_BPF_SYSCALL */

/* verifier prototypes for helper functions called from eBPF programs */
extern const struct bpf_func_proto bpf_map_lookup_elem_proto;
extern const struct bpf_func_proto bpf_map_update_elem_proto;
extern const struct bpf_func_proto bpf_map_delete_elem_proto;

extern const struct bpf_func_proto bpf_get_prandom_u32_proto;
extern const struct bpf_func_proto bpf_get_smp_processor_id_proto;
extern const struct bpf_func_proto bpf_tail_call_proto;
extern const struct bpf_func_proto bpf_ktime_get_ns_proto;
extern const struct bpf_func_proto bpf_get_current_pid_tgid_proto;
extern const struct bpf_func_proto bpf_get_current_uid_gid_proto;
extern const struct bpf_func_proto bpf_get_current_comm_proto;
extern const struct bpf_func_proto bpf_skb_vlan_push_proto;
extern const struct bpf_func_proto bpf_skb_vlan_pop_proto;
extern const struct bpf_func_proto bpf_get_stackid_proto;

/* Shared helpers among cBPF and eBPF. */
void bpf_user_rnd_init_once(void);
u64 bpf_user_rnd_u32(u64 r1, u64 r2, u64 r3, u64 r4, u64 r5);

#endif /* _LINUX_BPF_H */