Linux kernel mirror (for testing) git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel os linux

NFSD: fix race between nfsd registration and exports_proc

Currently nfsd calls create_proc_exports_entry() at the start of init_nfsd()
and cleans up with remove_proc_entry() at the end of exit_nfsd().

This causes a kernel oops if the following two operations race:
(i) exportfs -r
(ii) mount -t nfsd none /proc/fs/nfsd

For the 5.4 kernel on ARM64:

CPU 1:
el1_irq+0xbc/0x180
arch_counter_get_cntvct+0x14/0x18
running_clock+0xc/0x18
preempt_count_add+0x88/0x110
prep_new_page+0xb0/0x220
get_page_from_freelist+0x2d8/0x1778
__alloc_pages_nodemask+0x15c/0xef0
__vmalloc_node_range+0x28c/0x478
__vmalloc_node_flags_caller+0x8c/0xb0
kvmalloc_node+0x88/0xe0
nfsd_init_net+0x6c/0x108 [nfsd]
ops_init+0x44/0x170
register_pernet_operations+0x114/0x270
register_pernet_subsys+0x34/0x50
init_nfsd+0xa8/0x718 [nfsd]
do_one_initcall+0x54/0x2e0

CPU 2 :
Unable to handle kernel NULL pointer dereference at virtual address 0000000000000010

PC is at : exports_net_open+0x50/0x68 [nfsd]

Call trace:
exports_net_open+0x50/0x68 [nfsd]
exports_proc_open+0x2c/0x38 [nfsd]
proc_reg_open+0xb8/0x198
do_dentry_open+0x1c4/0x418
vfs_open+0x38/0x48
path_openat+0x28c/0xf18
do_filp_open+0x70/0xe8
do_sys_open+0x154/0x248

Sometimes it crashes in exports_net_open() and sometimes in cache_seq_next_rcu().

The same happens on the latest 6.14 kernel as well:

[ 0.000000] Linux version 6.14.0-rc5-next-20250304-dirty
...
[ 285.455918] Unable to handle kernel paging request at virtual address 00001f4800001f48
...
[ 285.464902] pc : cache_seq_next_rcu+0x78/0xa4
...
[ 285.469695] Call trace:
[ 285.470083] cache_seq_next_rcu+0x78/0xa4 (P)
[ 285.470488] seq_read+0xe0/0x11c
[ 285.470675] proc_reg_read+0x9c/0xf0
[ 285.470874] vfs_read+0xc4/0x2fc
[ 285.471057] ksys_read+0x6c/0xf4
[ 285.471231] __arm64_sys_read+0x1c/0x28
[ 285.471428] invoke_syscall+0x44/0x100
[ 285.471633] el0_svc_common.constprop.0+0x40/0xe0
[ 285.471870] do_el0_svc_compat+0x1c/0x34
[ 285.472073] el0_svc_compat+0x2c/0x80
[ 285.472265] el0t_32_sync_handler+0x90/0x140
[ 285.472473] el0t_32_sync+0x19c/0x1a0
[ 285.472887] Code: f9400885 93407c23 937d7c27 11000421 (f86378a3)
[ 285.473422] ---[ end trace 0000000000000000 ]---

It can be reproduced easily with the script below:
while [ 1 ]
do
/exportfs -r
done &

while [ 1 ]
do
insmod /nfsd.ko
mount -t nfsd none /proc/fs/nfsd
umount /proc/fs/nfsd
rmmod nfsd
done &

So interfaces should be exported to user space last during initialization
and removed first during cleanup.

With this change there is no kernel oops.

Co-developed-by: Shubham Rana <s9.rana@samsung.com>
Signed-off-by: Shubham Rana <s9.rana@samsung.com>
Signed-off-by: Maninder Singh <maninder1.s@samsung.com>
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Cc: stable@vger.kernel.org
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>

authored by

Maninder Singh and committed by
Chuck Lever
f7fb730c ff12eb37

+8 -9
+8 -9
fs/nfsd/nfsctl.c
··· 2291 2291 if (retval) 2292 2292 goto out_free_pnfs; 2293 2293 nfsd_lockd_init(); /* lockd->nfsd callbacks */ 2294 - retval = create_proc_exports_entry(); 2295 - if (retval) 2296 - goto out_free_lockd; 2297 2294 retval = register_pernet_subsys(&nfsd_net_ops); 2298 2295 if (retval < 0) 2299 - goto out_free_exports; 2296 + goto out_free_lockd; 2300 2297 retval = register_cld_notifier(); 2301 2298 if (retval) 2302 2299 goto out_free_subsys; ··· 2305 2308 goto out_free_nfsd4; 2306 2309 retval = genl_register_family(&nfsd_nl_family); 2307 2310 if (retval) 2311 + goto out_free_filesystem; 2312 + retval = create_proc_exports_entry(); 2313 + if (retval) 2308 2314 goto out_free_all; 2309 2315 nfsd_localio_ops_init(); 2310 2316 2311 2317 return 0; 2312 2318 out_free_all: 2319 + genl_unregister_family(&nfsd_nl_family); 2320 + out_free_filesystem: 2313 2321 unregister_filesystem(&nfsd_fs_type); 2314 2322 out_free_nfsd4: 2315 2323 nfsd4_destroy_laundry_wq(); ··· 2322 2320 unregister_cld_notifier(); 2323 2321 out_free_subsys: 2324 2322 unregister_pernet_subsys(&nfsd_net_ops); 2325 - out_free_exports: 2326 - remove_proc_entry("fs/nfs/exports", NULL); 2327 - remove_proc_entry("fs/nfs", NULL); 2328 2323 out_free_lockd: 2329 2324 nfsd_lockd_shutdown(); 2330 2325 nfsd_drc_slab_free(); ··· 2334 2335 2335 2336 static void __exit exit_nfsd(void) 2336 2337 { 2338 + remove_proc_entry("fs/nfs/exports", NULL); 2339 + remove_proc_entry("fs/nfs", NULL); 2337 2340 genl_unregister_family(&nfsd_nl_family); 2338 2341 unregister_filesystem(&nfsd_fs_type); 2339 2342 nfsd4_destroy_laundry_wq(); 2340 2343 unregister_cld_notifier(); 2341 2344 unregister_pernet_subsys(&nfsd_net_ops); 2342 2345 nfsd_drc_slab_free(); 2343 - remove_proc_entry("fs/nfs/exports", NULL); 2344 - remove_proc_entry("fs/nfs", NULL); 2345 2346 nfsd_lockd_shutdown(); 2346 2347 nfsd4_free_slabs(); 2347 2348 nfsd4_exit_pnfs();