at v5.11 462 lines 16 kB view raw
1/* SPDX-License-Identifier: GPL-2.0 */ 2#ifndef _BPF_CGROUP_H 3#define _BPF_CGROUP_H 4 5#include <linux/bpf.h> 6#include <linux/errno.h> 7#include <linux/jump_label.h> 8#include <linux/percpu.h> 9#include <linux/percpu-refcount.h> 10#include <linux/rbtree.h> 11#include <uapi/linux/bpf.h> 12 13struct sock; 14struct sockaddr; 15struct cgroup; 16struct sk_buff; 17struct bpf_map; 18struct bpf_prog; 19struct bpf_sock_ops_kern; 20struct bpf_cgroup_storage; 21struct ctl_table; 22struct ctl_table_header; 23 24#ifdef CONFIG_CGROUP_BPF 25 26extern struct static_key_false cgroup_bpf_enabled_key; 27#define cgroup_bpf_enabled static_branch_unlikely(&cgroup_bpf_enabled_key) 28 29DECLARE_PER_CPU(struct bpf_cgroup_storage*, 30 bpf_cgroup_storage[MAX_BPF_CGROUP_STORAGE_TYPE]); 31 32#define for_each_cgroup_storage_type(stype) \ 33 for (stype = 0; stype < MAX_BPF_CGROUP_STORAGE_TYPE; stype++) 34 35struct bpf_cgroup_storage_map; 36 37struct bpf_storage_buffer { 38 struct rcu_head rcu; 39 char data[]; 40}; 41 42struct bpf_cgroup_storage { 43 union { 44 struct bpf_storage_buffer *buf; 45 void __percpu *percpu_buf; 46 }; 47 struct bpf_cgroup_storage_map *map; 48 struct bpf_cgroup_storage_key key; 49 struct list_head list_map; 50 struct list_head list_cg; 51 struct rb_node node; 52 struct rcu_head rcu; 53}; 54 55struct bpf_cgroup_link { 56 struct bpf_link link; 57 struct cgroup *cgroup; 58 enum bpf_attach_type type; 59}; 60 61struct bpf_prog_list { 62 struct list_head node; 63 struct bpf_prog *prog; 64 struct bpf_cgroup_link *link; 65 struct bpf_cgroup_storage *storage[MAX_BPF_CGROUP_STORAGE_TYPE]; 66}; 67 68struct bpf_prog_array; 69 70struct cgroup_bpf { 71 /* array of effective progs in this cgroup */ 72 struct bpf_prog_array __rcu *effective[MAX_BPF_ATTACH_TYPE]; 73 74 /* attached progs to this cgroup and attach flags 75 * when flags == 0 or BPF_F_ALLOW_OVERRIDE the progs list will 76 * have either zero or one element 77 * when BPF_F_ALLOW_MULTI the list can have up to BPF_CGROUP_MAX_PROGS 78 */ 79 struct list_head progs[MAX_BPF_ATTACH_TYPE]; 80 u32 flags[MAX_BPF_ATTACH_TYPE]; 81 82 /* list of cgroup shared storages */ 83 struct list_head storages; 84 85 /* temp storage for effective prog array used by prog_attach/detach */ 86 struct bpf_prog_array *inactive; 87 88 /* reference counter used to detach bpf programs after cgroup removal */ 89 struct percpu_ref refcnt; 90 91 /* cgroup_bpf is released using a work queue */ 92 struct work_struct release_work; 93}; 94 95int cgroup_bpf_inherit(struct cgroup *cgrp); 96void cgroup_bpf_offline(struct cgroup *cgrp); 97 98int __cgroup_bpf_attach(struct cgroup *cgrp, 99 struct bpf_prog *prog, struct bpf_prog *replace_prog, 100 struct bpf_cgroup_link *link, 101 enum bpf_attach_type type, u32 flags); 102int __cgroup_bpf_detach(struct cgroup *cgrp, struct bpf_prog *prog, 103 struct bpf_cgroup_link *link, 104 enum bpf_attach_type type); 105int __cgroup_bpf_query(struct cgroup *cgrp, const union bpf_attr *attr, 106 union bpf_attr __user *uattr); 107 108/* Wrapper for __cgroup_bpf_*() protected by cgroup_mutex */ 109int cgroup_bpf_attach(struct cgroup *cgrp, 110 struct bpf_prog *prog, struct bpf_prog *replace_prog, 111 struct bpf_cgroup_link *link, enum bpf_attach_type type, 112 u32 flags); 113int cgroup_bpf_detach(struct cgroup *cgrp, struct bpf_prog *prog, 114 enum bpf_attach_type type); 115int cgroup_bpf_query(struct cgroup *cgrp, const union bpf_attr *attr, 116 union bpf_attr __user *uattr); 117 118int __cgroup_bpf_run_filter_skb(struct sock *sk, 119 struct sk_buff *skb, 120 enum bpf_attach_type type); 121 122int __cgroup_bpf_run_filter_sk(struct sock *sk, 123 enum bpf_attach_type type); 124 125int __cgroup_bpf_run_filter_sock_addr(struct sock *sk, 126 struct sockaddr *uaddr, 127 enum bpf_attach_type type, 128 void *t_ctx); 129 130int __cgroup_bpf_run_filter_sock_ops(struct sock *sk, 131 struct bpf_sock_ops_kern *sock_ops, 132 enum bpf_attach_type type); 133 134int __cgroup_bpf_check_dev_permission(short dev_type, u32 major, u32 minor, 135 short access, enum bpf_attach_type type); 136 137int __cgroup_bpf_run_filter_sysctl(struct ctl_table_header *head, 138 struct ctl_table *table, int write, 139 char **buf, size_t *pcount, loff_t *ppos, 140 enum bpf_attach_type type); 141 142int __cgroup_bpf_run_filter_setsockopt(struct sock *sock, int *level, 143 int *optname, char __user *optval, 144 int *optlen, char **kernel_optval); 145int __cgroup_bpf_run_filter_getsockopt(struct sock *sk, int level, 146 int optname, char __user *optval, 147 int __user *optlen, int max_optlen, 148 int retval); 149 150static inline enum bpf_cgroup_storage_type cgroup_storage_type( 151 struct bpf_map *map) 152{ 153 if (map->map_type == BPF_MAP_TYPE_PERCPU_CGROUP_STORAGE) 154 return BPF_CGROUP_STORAGE_PERCPU; 155 156 return BPF_CGROUP_STORAGE_SHARED; 157} 158 159static inline void bpf_cgroup_storage_set(struct bpf_cgroup_storage 160 *storage[MAX_BPF_CGROUP_STORAGE_TYPE]) 161{ 162 enum bpf_cgroup_storage_type stype; 163 164 for_each_cgroup_storage_type(stype) 165 this_cpu_write(bpf_cgroup_storage[stype], storage[stype]); 166} 167 168struct bpf_cgroup_storage * 169cgroup_storage_lookup(struct bpf_cgroup_storage_map *map, 170 void *key, bool locked); 171struct bpf_cgroup_storage *bpf_cgroup_storage_alloc(struct bpf_prog *prog, 172 enum bpf_cgroup_storage_type stype); 173void bpf_cgroup_storage_free(struct bpf_cgroup_storage *storage); 174void bpf_cgroup_storage_link(struct bpf_cgroup_storage *storage, 175 struct cgroup *cgroup, 176 enum bpf_attach_type type); 177void bpf_cgroup_storage_unlink(struct bpf_cgroup_storage *storage); 178int bpf_cgroup_storage_assign(struct bpf_prog_aux *aux, struct bpf_map *map); 179 180int bpf_percpu_cgroup_storage_copy(struct bpf_map *map, void *key, void *value); 181int bpf_percpu_cgroup_storage_update(struct bpf_map *map, void *key, 182 void *value, u64 flags); 183 184/* Wrappers for __cgroup_bpf_run_filter_skb() guarded by cgroup_bpf_enabled. */ 185#define BPF_CGROUP_RUN_PROG_INET_INGRESS(sk, skb) \ 186({ \ 187 int __ret = 0; \ 188 if (cgroup_bpf_enabled) \ 189 __ret = __cgroup_bpf_run_filter_skb(sk, skb, \ 190 BPF_CGROUP_INET_INGRESS); \ 191 \ 192 __ret; \ 193}) 194 195#define BPF_CGROUP_RUN_PROG_INET_EGRESS(sk, skb) \ 196({ \ 197 int __ret = 0; \ 198 if (cgroup_bpf_enabled && sk && sk == skb->sk) { \ 199 typeof(sk) __sk = sk_to_full_sk(sk); \ 200 if (sk_fullsock(__sk)) \ 201 __ret = __cgroup_bpf_run_filter_skb(__sk, skb, \ 202 BPF_CGROUP_INET_EGRESS); \ 203 } \ 204 __ret; \ 205}) 206 207#define BPF_CGROUP_RUN_SK_PROG(sk, type) \ 208({ \ 209 int __ret = 0; \ 210 if (cgroup_bpf_enabled) { \ 211 __ret = __cgroup_bpf_run_filter_sk(sk, type); \ 212 } \ 213 __ret; \ 214}) 215 216#define BPF_CGROUP_RUN_PROG_INET_SOCK(sk) \ 217 BPF_CGROUP_RUN_SK_PROG(sk, BPF_CGROUP_INET_SOCK_CREATE) 218 219#define BPF_CGROUP_RUN_PROG_INET_SOCK_RELEASE(sk) \ 220 BPF_CGROUP_RUN_SK_PROG(sk, BPF_CGROUP_INET_SOCK_RELEASE) 221 222#define BPF_CGROUP_RUN_PROG_INET4_POST_BIND(sk) \ 223 BPF_CGROUP_RUN_SK_PROG(sk, BPF_CGROUP_INET4_POST_BIND) 224 225#define BPF_CGROUP_RUN_PROG_INET6_POST_BIND(sk) \ 226 BPF_CGROUP_RUN_SK_PROG(sk, BPF_CGROUP_INET6_POST_BIND) 227 228#define BPF_CGROUP_RUN_SA_PROG(sk, uaddr, type) \ 229({ \ 230 int __ret = 0; \ 231 if (cgroup_bpf_enabled) \ 232 __ret = __cgroup_bpf_run_filter_sock_addr(sk, uaddr, type, \ 233 NULL); \ 234 __ret; \ 235}) 236 237#define BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, type, t_ctx) \ 238({ \ 239 int __ret = 0; \ 240 if (cgroup_bpf_enabled) { \ 241 lock_sock(sk); \ 242 __ret = __cgroup_bpf_run_filter_sock_addr(sk, uaddr, type, \ 243 t_ctx); \ 244 release_sock(sk); \ 245 } \ 246 __ret; \ 247}) 248 249#define BPF_CGROUP_RUN_PROG_INET4_BIND_LOCK(sk, uaddr) \ 250 BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, BPF_CGROUP_INET4_BIND, NULL) 251 252#define BPF_CGROUP_RUN_PROG_INET6_BIND_LOCK(sk, uaddr) \ 253 BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, BPF_CGROUP_INET6_BIND, NULL) 254 255#define BPF_CGROUP_PRE_CONNECT_ENABLED(sk) (cgroup_bpf_enabled && \ 256 sk->sk_prot->pre_connect) 257 258#define BPF_CGROUP_RUN_PROG_INET4_CONNECT(sk, uaddr) \ 259 BPF_CGROUP_RUN_SA_PROG(sk, uaddr, BPF_CGROUP_INET4_CONNECT) 260 261#define BPF_CGROUP_RUN_PROG_INET6_CONNECT(sk, uaddr) \ 262 BPF_CGROUP_RUN_SA_PROG(sk, uaddr, BPF_CGROUP_INET6_CONNECT) 263 264#define BPF_CGROUP_RUN_PROG_INET4_CONNECT_LOCK(sk, uaddr) \ 265 BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, BPF_CGROUP_INET4_CONNECT, NULL) 266 267#define BPF_CGROUP_RUN_PROG_INET6_CONNECT_LOCK(sk, uaddr) \ 268 BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, BPF_CGROUP_INET6_CONNECT, NULL) 269 270#define BPF_CGROUP_RUN_PROG_UDP4_SENDMSG_LOCK(sk, uaddr, t_ctx) \ 271 BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, BPF_CGROUP_UDP4_SENDMSG, t_ctx) 272 273#define BPF_CGROUP_RUN_PROG_UDP6_SENDMSG_LOCK(sk, uaddr, t_ctx) \ 274 BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, BPF_CGROUP_UDP6_SENDMSG, t_ctx) 275 276#define BPF_CGROUP_RUN_PROG_UDP4_RECVMSG_LOCK(sk, uaddr) \ 277 BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, BPF_CGROUP_UDP4_RECVMSG, NULL) 278 279#define BPF_CGROUP_RUN_PROG_UDP6_RECVMSG_LOCK(sk, uaddr) \ 280 BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, BPF_CGROUP_UDP6_RECVMSG, NULL) 281 282/* The SOCK_OPS"_SK" macro should be used when sock_ops->sk is not a 283 * fullsock and its parent fullsock cannot be traced by 284 * sk_to_full_sk(). 285 * 286 * e.g. sock_ops->sk is a request_sock and it is under syncookie mode. 287 * Its listener-sk is not attached to the rsk_listener. 288 * In this case, the caller holds the listener-sk (unlocked), 289 * set its sock_ops->sk to req_sk, and call this SOCK_OPS"_SK" with 290 * the listener-sk such that the cgroup-bpf-progs of the 291 * listener-sk will be run. 292 * 293 * Regardless of syncookie mode or not, 294 * calling bpf_setsockopt on listener-sk will not make sense anyway, 295 * so passing 'sock_ops->sk == req_sk' to the bpf prog is appropriate here. 296 */ 297#define BPF_CGROUP_RUN_PROG_SOCK_OPS_SK(sock_ops, sk) \ 298({ \ 299 int __ret = 0; \ 300 if (cgroup_bpf_enabled) \ 301 __ret = __cgroup_bpf_run_filter_sock_ops(sk, \ 302 sock_ops, \ 303 BPF_CGROUP_SOCK_OPS); \ 304 __ret; \ 305}) 306 307#define BPF_CGROUP_RUN_PROG_SOCK_OPS(sock_ops) \ 308({ \ 309 int __ret = 0; \ 310 if (cgroup_bpf_enabled && (sock_ops)->sk) { \ 311 typeof(sk) __sk = sk_to_full_sk((sock_ops)->sk); \ 312 if (__sk && sk_fullsock(__sk)) \ 313 __ret = __cgroup_bpf_run_filter_sock_ops(__sk, \ 314 sock_ops, \ 315 BPF_CGROUP_SOCK_OPS); \ 316 } \ 317 __ret; \ 318}) 319 320#define BPF_CGROUP_RUN_PROG_DEVICE_CGROUP(type, major, minor, access) \ 321({ \ 322 int __ret = 0; \ 323 if (cgroup_bpf_enabled) \ 324 __ret = __cgroup_bpf_check_dev_permission(type, major, minor, \ 325 access, \ 326 BPF_CGROUP_DEVICE); \ 327 \ 328 __ret; \ 329}) 330 331 332#define BPF_CGROUP_RUN_PROG_SYSCTL(head, table, write, buf, count, pos) \ 333({ \ 334 int __ret = 0; \ 335 if (cgroup_bpf_enabled) \ 336 __ret = __cgroup_bpf_run_filter_sysctl(head, table, write, \ 337 buf, count, pos, \ 338 BPF_CGROUP_SYSCTL); \ 339 __ret; \ 340}) 341 342#define BPF_CGROUP_RUN_PROG_SETSOCKOPT(sock, level, optname, optval, optlen, \ 343 kernel_optval) \ 344({ \ 345 int __ret = 0; \ 346 if (cgroup_bpf_enabled) \ 347 __ret = __cgroup_bpf_run_filter_setsockopt(sock, level, \ 348 optname, optval, \ 349 optlen, \ 350 kernel_optval); \ 351 __ret; \ 352}) 353 354#define BPF_CGROUP_GETSOCKOPT_MAX_OPTLEN(optlen) \ 355({ \ 356 int __ret = 0; \ 357 if (cgroup_bpf_enabled) \ 358 get_user(__ret, optlen); \ 359 __ret; \ 360}) 361 362#define BPF_CGROUP_RUN_PROG_GETSOCKOPT(sock, level, optname, optval, optlen, \ 363 max_optlen, retval) \ 364({ \ 365 int __ret = retval; \ 366 if (cgroup_bpf_enabled) \ 367 __ret = __cgroup_bpf_run_filter_getsockopt(sock, level, \ 368 optname, optval, \ 369 optlen, max_optlen, \ 370 retval); \ 371 __ret; \ 372}) 373 374int cgroup_bpf_prog_attach(const union bpf_attr *attr, 375 enum bpf_prog_type ptype, struct bpf_prog *prog); 376int cgroup_bpf_prog_detach(const union bpf_attr *attr, 377 enum bpf_prog_type ptype); 378int cgroup_bpf_link_attach(const union bpf_attr *attr, struct bpf_prog *prog); 379int cgroup_bpf_prog_query(const union bpf_attr *attr, 380 union bpf_attr __user *uattr); 381#else 382 383struct bpf_prog; 384struct cgroup_bpf {}; 385static inline int cgroup_bpf_inherit(struct cgroup *cgrp) { return 0; } 386static inline void cgroup_bpf_offline(struct cgroup *cgrp) {} 387 388static inline int cgroup_bpf_prog_attach(const union bpf_attr *attr, 389 enum bpf_prog_type ptype, 390 struct bpf_prog *prog) 391{ 392 return -EINVAL; 393} 394 395static inline int cgroup_bpf_prog_detach(const union bpf_attr *attr, 396 enum bpf_prog_type ptype) 397{ 398 return -EINVAL; 399} 400 401static inline int cgroup_bpf_link_attach(const union bpf_attr *attr, 402 struct bpf_prog *prog) 403{ 404 return -EINVAL; 405} 406 407static inline int cgroup_bpf_prog_query(const union bpf_attr *attr, 408 union bpf_attr __user *uattr) 409{ 410 return -EINVAL; 411} 412 413static inline void bpf_cgroup_storage_set( 414 struct bpf_cgroup_storage *storage[MAX_BPF_CGROUP_STORAGE_TYPE]) {} 415static inline int bpf_cgroup_storage_assign(struct bpf_prog_aux *aux, 416 struct bpf_map *map) { return 0; } 417static inline struct bpf_cgroup_storage *bpf_cgroup_storage_alloc( 418 struct bpf_prog *prog, enum bpf_cgroup_storage_type stype) { return NULL; } 419static inline void bpf_cgroup_storage_free( 420 struct bpf_cgroup_storage *storage) {} 421static inline int bpf_percpu_cgroup_storage_copy(struct bpf_map *map, void *key, 422 void *value) { 423 return 0; 424} 425static inline int bpf_percpu_cgroup_storage_update(struct bpf_map *map, 426 void *key, void *value, u64 flags) { 427 return 0; 428} 429 430#define cgroup_bpf_enabled (0) 431#define BPF_CGROUP_RUN_SA_PROG_LOCK(sk, uaddr, type, t_ctx) ({ 0; }) 432#define BPF_CGROUP_PRE_CONNECT_ENABLED(sk) (0) 433#define BPF_CGROUP_RUN_PROG_INET_INGRESS(sk,skb) ({ 0; }) 434#define BPF_CGROUP_RUN_PROG_INET_EGRESS(sk,skb) ({ 0; }) 435#define BPF_CGROUP_RUN_PROG_INET_SOCK(sk) ({ 0; }) 436#define BPF_CGROUP_RUN_PROG_INET_SOCK_RELEASE(sk) ({ 0; }) 437#define BPF_CGROUP_RUN_PROG_INET4_BIND_LOCK(sk, uaddr) ({ 0; }) 438#define BPF_CGROUP_RUN_PROG_INET6_BIND_LOCK(sk, uaddr) ({ 0; }) 439#define BPF_CGROUP_RUN_PROG_INET4_POST_BIND(sk) ({ 0; }) 440#define BPF_CGROUP_RUN_PROG_INET6_POST_BIND(sk) ({ 0; }) 441#define BPF_CGROUP_RUN_PROG_INET4_CONNECT(sk, uaddr) ({ 0; }) 442#define BPF_CGROUP_RUN_PROG_INET4_CONNECT_LOCK(sk, uaddr) ({ 0; }) 443#define BPF_CGROUP_RUN_PROG_INET6_CONNECT(sk, uaddr) ({ 0; }) 444#define BPF_CGROUP_RUN_PROG_INET6_CONNECT_LOCK(sk, uaddr) ({ 0; }) 445#define BPF_CGROUP_RUN_PROG_UDP4_SENDMSG_LOCK(sk, uaddr, t_ctx) ({ 0; }) 446#define BPF_CGROUP_RUN_PROG_UDP6_SENDMSG_LOCK(sk, uaddr, t_ctx) ({ 0; }) 447#define BPF_CGROUP_RUN_PROG_UDP4_RECVMSG_LOCK(sk, uaddr) ({ 0; }) 448#define BPF_CGROUP_RUN_PROG_UDP6_RECVMSG_LOCK(sk, uaddr) ({ 0; }) 449#define BPF_CGROUP_RUN_PROG_SOCK_OPS(sock_ops) ({ 0; }) 450#define BPF_CGROUP_RUN_PROG_DEVICE_CGROUP(type,major,minor,access) ({ 0; }) 451#define BPF_CGROUP_RUN_PROG_SYSCTL(head,table,write,buf,count,pos) ({ 0; }) 452#define BPF_CGROUP_GETSOCKOPT_MAX_OPTLEN(optlen) ({ 0; }) 453#define BPF_CGROUP_RUN_PROG_GETSOCKOPT(sock, level, optname, optval, \ 454 optlen, max_optlen, retval) ({ retval; }) 455#define BPF_CGROUP_RUN_PROG_SETSOCKOPT(sock, level, optname, optval, optlen, \ 456 kernel_optval) ({ 0; }) 457 458#define for_each_cgroup_storage_type(stype) for (; false; ) 459 460#endif /* CONFIG_CGROUP_BPF */ 461 462#endif /* _BPF_CGROUP_H */