/* SPDX-License-Identifier: GPL-2.0 */
#ifndef __LINUX_UACCESS_H__
#define __LINUX_UACCESS_H__

#include <linux/fault-inject-usercopy.h>
#include <linux/instrumented.h>
#include <linux/minmax.h>
#include <linux/nospec.h>
#include <linux/sched.h>
#include <linux/ucopysize.h>

#include <asm/uaccess.h>

/*
 * Architectures that support memory tagging (assigning tags to memory regions,
 * embedding these tags into addresses that point to these memory regions, and
 * checking that the memory and the pointer tags match on memory accesses)
 * redefine this macro to strip tags from pointers.
 *
 * Passing down mm_struct allows untagging rules to be defined on a
 * per-process basis.
 *
 * It's defined as a no-op for architectures that don't support memory tagging.
 */
#ifndef untagged_addr
#define untagged_addr(addr) (addr)
#endif

#ifndef untagged_addr_remote
#define untagged_addr_remote(mm, addr)	({	\
	mmap_assert_locked(mm);			\
	untagged_addr(addr);			\
})
#endif

#ifdef masked_user_access_begin
 #define can_do_masked_user_access() 1
#else
 #define can_do_masked_user_access() 0
 #define masked_user_access_begin(src) NULL
 #define mask_user_address(src) (src)
#endif

/*
 * Architectures should provide two primitives (raw_copy_{to,from}_user())
 * and get rid of their private instances of copy_{to,from}_user() and
 * __copy_{to,from}_user{,_inatomic}().
 *
 * raw_copy_{to,from}_user(to, from, size) should copy up to size bytes and
 * return the amount left to copy.  They should assume that access_ok() has
 * already been checked (and succeeded); they should *not* zero-pad anything.
 * No KASAN or object size checks either - those belong here.
 *
 * Both of these functions should attempt to copy size bytes starting at from
 * into the area starting at to.  They must not fetch or store anything
 * outside of those areas.  The return value must be between 0 (everything
 * copied successfully) and size (nothing copied).
 *
 * If raw_copy_{to,from}_user(to, from, size) returns N, size - N bytes starting
 * at to must become equal to the bytes fetched from the corresponding area
 * starting at from.  All data past to + size - N must be left unmodified.
 *
 * If copying succeeds, the return value must be 0.  If some data cannot be
 * fetched, it is permitted to copy less than had been fetched; the only
 * hard requirement is that not storing anything at all (i.e. returning size)
 * should happen only when nothing could be copied.  In other words, you don't
 * have to squeeze as much as possible - it is allowed, but not necessary.
 *
 * For raw_copy_from_user(), to always points to kernel memory and stores to
 * it must not fault.  For raw_copy_to_user() it's the other way round.
 *
 * Both can be inlined - it's up to architectures whether they want to bother
 * with that.  They should not be used directly; they are used to implement
 * the 6 functions (copy_{to,from}_user(), __copy_{to,from}_user{,_inatomic}())
 * that are used instead.  Out of those, the __... ones are inlined.  Plain
 * copy_{to,from}_user() might or might not be inlined.  If you want them
 * inlined, have asm/uaccess.h define INLINE_COPY_{TO,FROM}_USER.
 *
 * NOTE: only copy_from_user() zero-pads the destination in case of a short
 * copy.  Neither __copy_from_user() nor __copy_from_user_inatomic() zero
 * anything at all; their callers absolutely must check the return value.
 *
 * Biarch architectures should also provide raw_copy_in_user() - similar to
 * the above, but with both source and destination being __user pointers,
 * so both source and destination can trigger faults.
 */
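/*
 * Illustrative sketch (hypothetical caller) of the short-copy contract
 * described above: if raw_copy_from_user() returns N, exactly size - N
 * leading bytes of the destination are valid:
 *
 *	unsigned long left = raw_copy_from_user(buf, uptr, len);
 *	size_t copied = len - left;	// buf[0 .. copied-1] is now valid
 *	if (left)
 *		// short copy: buf[copied .. len-1] was left unmodified,
 *		// it was *not* zero-padded
 */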
static __always_inline __must_check unsigned long
__copy_from_user_inatomic(void *to, const void __user *from, unsigned long n)
{
	unsigned long res;

	instrument_copy_from_user_before(to, from, n);
	check_object_size(to, n, false);
	res = raw_copy_from_user(to, from, n);
	instrument_copy_from_user_after(to, from, n, res);
	return res;
}

static __always_inline __must_check unsigned long
__copy_from_user(void *to, const void __user *from, unsigned long n)
{
	unsigned long res;

	might_fault();
	instrument_copy_from_user_before(to, from, n);
	if (should_fail_usercopy())
		return n;
	check_object_size(to, n, false);
	res = raw_copy_from_user(to, from, n);
	instrument_copy_from_user_after(to, from, n, res);
	return res;
}

/**
 * __copy_to_user_inatomic: - Copy a block of data into user space, with less checking.
 * @to:   Destination address, in user space.
 * @from: Source address, in kernel space.
 * @n:    Number of bytes to copy.
 *
 * Context: User context only.
 *
 * Copy data from kernel space to user space.  The caller must check the
 * specified block with access_ok() before calling this function, and
 * should also make sure the user pages are pinned so that the access
 * neither faults nor sleeps.
 */
static __always_inline __must_check unsigned long
__copy_to_user_inatomic(void __user *to, const void *from, unsigned long n)
{
	if (should_fail_usercopy())
		return n;
	instrument_copy_to_user(to, from, n);
	check_object_size(from, n, true);
	return raw_copy_to_user(to, from, n);
}

static __always_inline __must_check unsigned long
__copy_to_user(void __user *to, const void *from, unsigned long n)
{
	might_fault();
	if (should_fail_usercopy())
		return n;
	instrument_copy_to_user(to, from, n);
	check_object_size(from, n, true);
	return raw_copy_to_user(to, from, n);
}
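/*
 * Illustrative sketch (hypothetical caller): the double-underscore
 * variants above skip the access_ok() check, so the caller must have
 * performed it already:
 *
 *	if (!access_ok(uptr, len))
 *		return -EFAULT;
 *	if (__copy_to_user(uptr, kbuf, len))
 *		return -EFAULT;	// short copy, report a fault
 */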
/*
 * Architectures that #define INLINE_COPY_TO_USER use this function
 * directly in the normal copy_to/from_user(); the other ones go
 * through an extern _copy_to/from_user(), which expands the same code
 * here.
 *
 * Rust code always uses the extern definition.
 */
static inline __must_check unsigned long
_inline_copy_from_user(void *to, const void __user *from, unsigned long n)
{
	unsigned long res = n;
	might_fault();
	if (should_fail_usercopy())
		goto fail;
	if (can_do_masked_user_access())
		from = mask_user_address(from);
	else {
		if (!access_ok(from, n))
			goto fail;
		/*
		 * Ensure that bad access_ok() speculation will not
		 * lead to nasty side effects *after* the copy is
		 * finished:
		 */
		barrier_nospec();
	}
	instrument_copy_from_user_before(to, from, n);
	res = raw_copy_from_user(to, from, n);
	instrument_copy_from_user_after(to, from, n, res);
	if (likely(!res))
		return 0;
fail:
	memset(to + (n - res), 0, res);
	return res;
}
extern __must_check unsigned long
_copy_from_user(void *, const void __user *, unsigned long);

static inline __must_check unsigned long
_inline_copy_to_user(void __user *to, const void *from, unsigned long n)
{
	might_fault();
	if (should_fail_usercopy())
		return n;
	if (access_ok(to, n)) {
		instrument_copy_to_user(to, from, n);
		n = raw_copy_to_user(to, from, n);
	}
	return n;
}
extern __must_check unsigned long
_copy_to_user(void __user *, const void *, unsigned long);

static __always_inline unsigned long __must_check
copy_from_user(void *to, const void __user *from, unsigned long n)
{
	if (!check_copy_size(to, n, false))
		return n;
#ifdef INLINE_COPY_FROM_USER
	return _inline_copy_from_user(to, from, n);
#else
	return _copy_from_user(to, from, n);
#endif
}

static __always_inline unsigned long __must_check
copy_to_user(void __user *to, const void *from, unsigned long n)
{
	if (!check_copy_size(from, n, true))
		return n;

#ifdef INLINE_COPY_TO_USER
	return _inline_copy_to_user(to, from, n);
#else
	return _copy_to_user(to, from, n);
#endif
}

#ifndef copy_mc_to_kernel
/*
 * Without arch opt-in, this generic copy_mc_to_kernel() will not handle
 * #MC (or the arch equivalent) raised during the source read.
 */
static inline unsigned long __must_check
copy_mc_to_kernel(void *dst, const void *src, size_t cnt)
{
	memcpy(dst, src, cnt);
	return 0;
}
#endif

static __always_inline void pagefault_disabled_inc(void)
{
	current->pagefault_disabled++;
}

static __always_inline void pagefault_disabled_dec(void)
{
	current->pagefault_disabled--;
}

/*
 * These routines enable/disable the pagefault handler.  If disabled, it will
 * not take any locks and go straight to the fixup table.
 *
 * User access methods will not sleep when called from a pagefault_disabled()
 * environment.
 */
static inline void pagefault_disable(void)
{
	pagefault_disabled_inc();
	/*
	 * Make sure the store has been issued before a pagefault
	 * can hit.
	 */
	barrier();
}

static inline void pagefault_enable(void)
{
	/*
	 * Make sure any pending loads/stores are issued before
	 * enabling the pagefault handler again.
	 */
	barrier();
	pagefault_disabled_dec();
}

/*
 * Is the pagefault handler disabled?  If so, user access methods will not
 * sleep.
 */
static inline bool pagefault_disabled(void)
{
	return current->pagefault_disabled != 0;
}
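/*
 * Illustrative sketch (hypothetical caller): a common pattern pairs
 * pagefault_disable() with an _inatomic copy and falls back to a
 * sleeping copy when the page is not resident:
 *
 *	unsigned long ret;
 *
 *	pagefault_disable();
 *	ret = __copy_from_user_inatomic(dst, uptr, len);
 *	pagefault_enable();
 *	if (ret)
 *		// fault: retry with copy_from_user() from a context
 *		// that is allowed to sleep
 */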
/*
 * The pagefault handler is in general disabled by pagefault_disable() or
 * when in irq context (via in_atomic()).
 *
 * This function should only be used by the fault handlers.  Other users
 * should stick to pagefault_disabled().
 * Please NEVER use preempt_disable() to disable the fault handler: with
 * !CONFIG_PREEMPT_COUNT it is a NOP, so the handler would not actually be
 * disabled, and in_atomic() will report different values depending on
 * CONFIG_PREEMPT_COUNT.
 */
#define faulthandler_disabled() (pagefault_disabled() || in_atomic())

#ifndef CONFIG_ARCH_HAS_SUBPAGE_FAULTS

/**
 * probe_subpage_writeable: probe the user range for write faults at sub-page
 *			    granularity (e.g. arm64 MTE)
 * @uaddr: start of address range
 * @size: size of address range
 *
 * Returns 0 on success, the number of bytes not probed on fault.
 *
 * It is expected that the caller checked for the write permission of each
 * page in the range either by put_user() or GUP.  The architecture port can
 * implement a more efficient get_user() probing if the same sub-page faults
 * are triggered by either a read or a write.
 */
static inline size_t probe_subpage_writeable(char __user *uaddr, size_t size)
{
	return 0;
}

#endif /* CONFIG_ARCH_HAS_SUBPAGE_FAULTS */

#ifndef ARCH_HAS_NOCACHE_UACCESS

static inline __must_check unsigned long
__copy_from_user_inatomic_nocache(void *to, const void __user *from,
				  unsigned long n)
{
	return __copy_from_user_inatomic(to, from, n);
}

#endif /* ARCH_HAS_NOCACHE_UACCESS */

extern __must_check int check_zeroed_user(const void __user *from, size_t size);
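/*
 * Illustrative sketch (hypothetical caller): check_zeroed_user() returns
 * 1 if the range is entirely zeroed, 0 if it contains a non-zero byte,
 * and a negative error (e.g. -EFAULT) on failure:
 *
 *	int ret = check_zeroed_user(uaddr + ksize, usize - ksize);
 *	if (ret < 0)
 *		return ret;
 *	if (ret == 0)
 *		return -E2BIG;	// unknown non-zero trailing data
 */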
/**
 * copy_struct_from_user: copy a struct from userspace
 * @dst:   Destination address, in kernel space. This buffer must be @ksize
 *         bytes long.
 * @ksize: Size of @dst struct.
 * @src:   Source address, in userspace.
 * @usize: (Alleged) size of @src struct.
 *
 * Copies a struct from userspace to kernel space, in a way that guarantees
 * backwards-compatibility for struct syscall arguments (as long as future
 * struct extensions are made such that all new fields are *appended* to the
 * old struct, and zeroed-out new fields have the same meaning as the old
 * struct).
 *
 * @ksize is just sizeof(*dst), and @usize should've been passed by userspace.
 * The recommended usage is something like the following:
 *
 *   SYSCALL_DEFINE2(foobar, const struct foo __user *, uarg, size_t, usize)
 *   {
 *      int err;
 *      struct foo karg = {};
 *
 *      if (usize > PAGE_SIZE)
 *        return -E2BIG;
 *      if (usize < FOO_SIZE_VER0)
 *        return -EINVAL;
 *
 *      err = copy_struct_from_user(&karg, sizeof(karg), uarg, usize);
 *      if (err)
 *        return err;
 *
 *      // ...
 *   }
 *
 * There are three cases to consider:
 * * If @usize == @ksize, then it's copied verbatim.
 * * If @usize < @ksize, then userspace has passed an old struct to a
 *   newer kernel. The rest of the trailing bytes in @dst (@ksize - @usize)
 *   are to be zero-filled.
 * * If @usize > @ksize, then userspace has passed a new struct to an
 *   older kernel. The trailing bytes unknown to the kernel (@usize - @ksize)
 *   are checked to ensure they are zeroed, otherwise -E2BIG is returned.
 *
 * Returns (in all cases, some data may have been copied):
 * * -E2BIG:  (@usize > @ksize) and there are non-zero trailing bytes in @src.
 * * -EFAULT: access to userspace failed.
 */
static __always_inline __must_check int
copy_struct_from_user(void *dst, size_t ksize, const void __user *src,
		      size_t usize)
{
	size_t size = min(ksize, usize);
	size_t rest = max(ksize, usize) - size;

	/* Double check if ksize is larger than a known object size. */
	if (WARN_ON_ONCE(ksize > __builtin_object_size(dst, 1)))
		return -E2BIG;

	/* Deal with trailing bytes. */
	if (usize < ksize) {
		memset(dst + size, 0, rest);
	} else if (usize > ksize) {
		int ret = check_zeroed_user(src + size, rest);
		if (ret <= 0)
			return ret ?: -E2BIG;
	}
	/* Copy the interoperable parts of the struct. */
	if (copy_from_user(dst, src, size))
		return -EFAULT;
	return 0;
}
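/*
 * Illustrative sketch (hypothetical struct, names invented): the
 * append-only extension rule above looks like this in practice:
 *
 *	struct foo {
 *		__aligned_u64 flags;		// FOO_SIZE_VER0 ends here
 *		__aligned_u64 new_feature;	// appended later; 0 == "off"
 *	};
 *	#define FOO_SIZE_VER0	8	// original size
 *	#define FOO_SIZE_VER1	16	// after the extension
 *
 * An old kernel given usize == 16 accepts it only if new_feature is zero;
 * a new kernel given usize == 8 zero-fills new_feature.
 */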
/**
 * copy_struct_to_user: copy a struct to userspace
 * @dst:   Destination address, in userspace. This buffer must be @ksize
 *         bytes long.
 * @usize: (Alleged) size of @dst struct.
 * @src:   Source address, in kernel space.
 * @ksize: Size of @src struct.
 * @ignored_trailing: Set to %true if there was a non-zero byte in @src that
 * userspace cannot see because they are using a smaller struct.
 *
 * Copies a struct from kernel space to userspace, in a way that guarantees
 * backwards-compatibility for struct syscall arguments (as long as future
 * struct extensions are made such that all new fields are *appended* to the
 * old struct, and zeroed-out new fields have the same meaning as the old
 * struct).
 *
 * Some syscalls may wish to make sure that userspace knows about everything in
 * the struct, and if there is a non-zero value that userspace doesn't know
 * about, they want to return an error (such as -EMSGSIZE) or have some other
 * fallback (such as adding a "you're missing some information" flag). If
 * @ignored_trailing is non-%NULL, it will be set to %true if there was a
 * non-zero byte that could not be copied to userspace (ie. was past @usize).
 *
 * While unconditionally returning an error in this case is the simplest
 * solution, for maximum backward compatibility you should try to only return
 * -EMSGSIZE if the user explicitly requested the data that couldn't be copied.
 * Note that structure sizes can change due to header changes and simple
 * recompilations without code changes(!), so if you care about
 * @ignored_trailing you probably want to make sure that any new field data is
 * associated with a flag. Otherwise you might assume that a program knows
 * about data it does not.
 *
 * @ksize is just sizeof(*src), and @usize should've been passed by userspace.
 * The recommended usage is something like the following:
 *
 *   SYSCALL_DEFINE2(foobar, struct foo __user *, uarg, size_t, usize)
 *   {
 *      int err;
 *      bool ignored_trailing;
 *      struct foo karg = {};
 *
 *      if (usize > PAGE_SIZE)
 *        return -E2BIG;
 *      if (usize < FOO_SIZE_VER0)
 *        return -EINVAL;
 *
 *      // ... modify karg somehow ...
 *
 *      err = copy_struct_to_user(uarg, usize, &karg, sizeof(karg),
 *                                &ignored_trailing);
 *      if (err)
 *        return err;
 *      if (ignored_trailing)
 *        return -EMSGSIZE;
 *
 *      // ...
 *   }
 *
 * There are three cases to consider:
 * * If @usize == @ksize, then it's copied verbatim.
 * * If @usize < @ksize, then the kernel is trying to pass userspace a newer
 *   struct than it supports. Thus we only copy the interoperable portions
 *   (@usize) and ignore the rest (but @ignored_trailing is set to %true if
 *   any of the trailing (@ksize - @usize) bytes are non-zero).
 * * If @usize > @ksize, then the kernel is trying to pass userspace an older
 *   struct than userspace supports. In order to make sure the
 *   unknown-to-the-kernel fields don't contain garbage values, we zero the
 *   trailing (@usize - @ksize) bytes.
 *
 * Returns (in all cases, some data may have been copied):
 * * -EFAULT: access to userspace failed.
 */
static __always_inline __must_check int
copy_struct_to_user(void __user *dst, size_t usize, const void *src,
		    size_t ksize, bool *ignored_trailing)
{
	size_t size = min(ksize, usize);
	size_t rest = max(ksize, usize) - size;

	/* Double check if ksize is larger than a known object size. */
	if (WARN_ON_ONCE(ksize > __builtin_object_size(src, 1)))
		return -E2BIG;

	/* Deal with trailing bytes. */
	if (usize > ksize) {
		if (clear_user(dst + size, rest))
			return -EFAULT;
	}
	if (ignored_trailing)
		*ignored_trailing = usize < ksize &&
			memchr_inv(src + size, 0, rest) != NULL;
	/* Copy the interoperable parts of the struct. */
	if (copy_to_user(dst, src, size))
		return -EFAULT;
	return 0;
}

bool copy_from_kernel_nofault_allowed(const void *unsafe_src, size_t size);

long copy_from_kernel_nofault(void *dst, const void *src, size_t size);
long notrace copy_to_kernel_nofault(void *dst, const void *src, size_t size);

long copy_from_user_nofault(void *dst, const void __user *src, size_t size);
long notrace copy_to_user_nofault(void __user *dst, const void *src,
				  size_t size);

long strncpy_from_kernel_nofault(char *dst, const void *unsafe_addr,
				 long count);

long strncpy_from_user_nofault(char *dst, const void __user *unsafe_addr,
			       long count);
long strnlen_user_nofault(const void __user *unsafe_addr, long count);

#ifndef __get_kernel_nofault
#define __get_kernel_nofault(dst, src, type, label)	\
do {							\
	type __user *p = (type __force __user *)(src);	\
	type data;					\
	if (__get_user(data, p))			\
		goto label;				\
	*(type *)dst = data;				\
} while (0)

#define __put_kernel_nofault(dst, src, type, label)	\
do {							\
	type __user *p = (type __force __user *)(dst);	\
	type data = *(type *)src;			\
	if (__put_user(data, p))			\
		goto label;				\
} while (0)
#endif
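/*
 * Illustrative sketch (hypothetical caller): the _nofault helpers never
 * sleep and may be used where faulting is not allowed, e.g. a tracer
 * sampling a user variable from atomic context:
 *
 *	u64 val;
 *
 *	if (copy_from_user_nofault(&val, uptr, sizeof(val)))
 *		val = 0;	// inaccessible: record a placeholder
 */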
/**
 * get_kernel_nofault(): safely attempt to read from a location
 * @val: read into this variable
 * @ptr: address to read from
 *
 * Returns 0 on success, or -EFAULT.
 */
#define get_kernel_nofault(val, ptr) ({				\
	const typeof(val) *__gk_ptr = (ptr);			\
	copy_from_kernel_nofault(&(val), __gk_ptr, sizeof(val));\
})

#ifndef user_access_begin
#define user_access_begin(ptr,len) access_ok(ptr, len)
#define user_access_end() do { } while (0)
#define unsafe_op_wrap(op, err) do { if (unlikely(op)) goto err; } while (0)
#define unsafe_get_user(x,p,e) unsafe_op_wrap(__get_user(x,p),e)
#define unsafe_put_user(x,p,e) unsafe_op_wrap(__put_user(x,p),e)
#define unsafe_copy_to_user(d,s,l,e) unsafe_op_wrap(__copy_to_user(d,s,l),e)
#define unsafe_copy_from_user(d,s,l,e) unsafe_op_wrap(__copy_from_user(d,s,l),e)
static inline unsigned long user_access_save(void) { return 0UL; }
static inline void user_access_restore(unsigned long flags) { }
#endif
#ifndef user_write_access_begin
#define user_write_access_begin user_access_begin
#define user_write_access_end user_access_end
#endif
#ifndef user_read_access_begin
#define user_read_access_begin user_access_begin
#define user_read_access_end user_access_end
#endif

#ifdef CONFIG_HARDENED_USERCOPY
void __noreturn usercopy_abort(const char *name, const char *detail,
			       bool to_user, unsigned long offset,
			       unsigned long len);
#endif

#endif /* __LINUX_UACCESS_H__ */
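/*
 * Illustrative sketch (hypothetical caller): user_access_begin() and the
 * unsafe_*_user() helpers batch several accesses under a single
 * access_ok() check (and, on arches like x86, a single STAC/CLAC pair);
 * each unsafe access jumps to the given label on fault:
 *
 *	u32 lo, hi;
 *
 *	if (!user_access_begin(uptr, 2 * sizeof(u32)))
 *		return -EFAULT;
 *	unsafe_get_user(lo, &uptr[0], efault);
 *	unsafe_get_user(hi, &uptr[1], efault);
 *	user_access_end();
 *	return 0;
 * efault:
 *	user_access_end();
 *	return -EFAULT;
 */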