Linux kernel mirror (for testing)
git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
kernel
os
linux
1// SPDX-License-Identifier: GPL-2.0-or-later
2/* AFS server record management
3 *
4 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved.
5 * Written by David Howells (dhowells@redhat.com)
6 */
7
8#include <linux/sched.h>
9#include <linux/slab.h>
10#include "afs_fs.h"
11#include "internal.h"
12#include "protocol_yfs.h"
13
14static unsigned afs_server_gc_delay = 10; /* Server record timeout in seconds */
15static atomic_t afs_server_debug_id;
16
17static void __afs_put_server(struct afs_net *, struct afs_server *);
18static void afs_server_timer(struct timer_list *timer);
19static void afs_server_destroyer(struct work_struct *work);
20
21/*
22 * Find a server by one of its addresses.
23 */
24struct afs_server *afs_find_server(const struct rxrpc_peer *peer)
25{
26 struct afs_server *server = (struct afs_server *)rxrpc_kernel_get_peer_data(peer);
27
28 if (!server)
29 return NULL;
30 return afs_use_server(server, false, afs_server_trace_use_cm_call);
31}
32
33/*
34 * Look up a server by its UUID and mark it active. The caller must hold
35 * cell->fs_lock.
36 */
37static struct afs_server *afs_find_server_by_uuid(struct afs_cell *cell, const uuid_t *uuid)
38{
39 struct afs_server *server;
40 struct rb_node *p;
41 int diff;
42
43 _enter("%pU", uuid);
44
45 p = cell->fs_servers.rb_node;
46 while (p) {
47 server = rb_entry(p, struct afs_server, uuid_rb);
48
49 diff = memcmp(uuid, &server->uuid, sizeof(*uuid));
50 if (diff < 0) {
51 p = p->rb_left;
52 } else if (diff > 0) {
53 p = p->rb_right;
54 } else {
55 if (test_bit(AFS_SERVER_FL_UNCREATED, &server->flags))
56 return NULL; /* Need a write lock */
57 afs_use_server(server, true, afs_server_trace_use_by_uuid);
58 return server;
59 }
60 }
61
62 return NULL;
63}
64
65/*
66 * Install a server record in the cell tree. The caller must hold an exclusive
67 * lock on cell->fs_lock.
68 */
69static struct afs_server *afs_install_server(struct afs_cell *cell,
70 struct afs_server **candidate)
71{
72 struct afs_server *server;
73 struct afs_net *net = cell->net;
74 struct rb_node **pp, *p;
75 int diff;
76
77 _enter("%p", candidate);
78
79 /* Firstly install the server in the UUID lookup tree */
80 pp = &cell->fs_servers.rb_node;
81 p = NULL;
82 while (*pp) {
83 p = *pp;
84 _debug("- consider %p", p);
85 server = rb_entry(p, struct afs_server, uuid_rb);
86 diff = memcmp(&(*candidate)->uuid, &server->uuid, sizeof(uuid_t));
87 if (diff < 0)
88 pp = &(*pp)->rb_left;
89 else if (diff > 0)
90 pp = &(*pp)->rb_right;
91 else
92 goto exists;
93 }
94
95 server = *candidate;
96 *candidate = NULL;
97 rb_link_node(&server->uuid_rb, p, pp);
98 rb_insert_color(&server->uuid_rb, &cell->fs_servers);
99 write_seqlock(&net->fs_lock);
100 hlist_add_head_rcu(&server->proc_link, &net->fs_proc);
101 write_sequnlock(&net->fs_lock);
102
103 afs_get_cell(cell, afs_cell_trace_get_server);
104
105exists:
106 afs_use_server(server, true, afs_server_trace_use_install);
107 return server;
108}
109
110/*
111 * Allocate a new server record and mark it as active but uncreated.
112 */
113static struct afs_server *afs_alloc_server(struct afs_cell *cell, const uuid_t *uuid)
114{
115 struct afs_server *server;
116 struct afs_net *net = cell->net;
117
118 _enter("");
119
120 server = kzalloc(sizeof(struct afs_server), GFP_KERNEL);
121 if (!server)
122 return NULL;
123
124 refcount_set(&server->ref, 1);
125 atomic_set(&server->active, 0);
126 __set_bit(AFS_SERVER_FL_UNCREATED, &server->flags);
127 server->debug_id = atomic_inc_return(&afs_server_debug_id);
128 server->uuid = *uuid;
129 rwlock_init(&server->fs_lock);
130 INIT_WORK(&server->destroyer, &afs_server_destroyer);
131 timer_setup(&server->timer, afs_server_timer, 0);
132 INIT_LIST_HEAD(&server->volumes);
133 init_waitqueue_head(&server->probe_wq);
134 INIT_LIST_HEAD(&server->probe_link);
135 INIT_HLIST_NODE(&server->proc_link);
136 spin_lock_init(&server->probe_lock);
137 server->cell = cell;
138 server->rtt = UINT_MAX;
139 server->service_id = FS_SERVICE;
140 server->probe_counter = 1;
141 server->probed_at = jiffies - LONG_MAX / 2;
142
143 afs_inc_servers_outstanding(net);
144 _leave(" = %p", server);
145 return server;
146}
147
148/*
149 * Look up an address record for a server
150 */
151static struct afs_addr_list *afs_vl_lookup_addrs(struct afs_server *server,
152 struct key *key)
153{
154 struct afs_vl_cursor vc;
155 struct afs_addr_list *alist = NULL;
156 int ret;
157
158 ret = -ERESTARTSYS;
159 if (afs_begin_vlserver_operation(&vc, server->cell, key)) {
160 while (afs_select_vlserver(&vc)) {
161 if (test_bit(AFS_VLSERVER_FL_IS_YFS, &vc.server->flags))
162 alist = afs_yfsvl_get_endpoints(&vc, &server->uuid);
163 else
164 alist = afs_vl_get_addrs_u(&vc, &server->uuid);
165 }
166
167 ret = afs_end_vlserver_operation(&vc);
168 }
169
170 return ret < 0 ? ERR_PTR(ret) : alist;
171}
172
173/*
174 * Get or create a fileserver record and return it with an active-use count on
175 * it.
176 */
177struct afs_server *afs_lookup_server(struct afs_cell *cell, struct key *key,
178 const uuid_t *uuid, u32 addr_version)
179{
180 struct afs_addr_list *alist = NULL;
181 struct afs_server *server, *candidate = NULL;
182 bool creating = false;
183 int ret;
184
185 _enter("%p,%pU", cell->net, uuid);
186
187 down_read(&cell->fs_lock);
188 server = afs_find_server_by_uuid(cell, uuid);
189 /* Won't see servers marked uncreated. */
190 up_read(&cell->fs_lock);
191
192 if (server) {
193 timer_delete_sync(&server->timer);
194 if (test_bit(AFS_SERVER_FL_CREATING, &server->flags))
195 goto wait_for_creation;
196 if (server->addr_version != addr_version)
197 set_bit(AFS_SERVER_FL_NEEDS_UPDATE, &server->flags);
198 return server;
199 }
200
201 candidate = afs_alloc_server(cell, uuid);
202 if (!candidate) {
203 afs_put_addrlist(alist, afs_alist_trace_put_server_oom);
204 return ERR_PTR(-ENOMEM);
205 }
206
207 down_write(&cell->fs_lock);
208 server = afs_install_server(cell, &candidate);
209 if (test_bit(AFS_SERVER_FL_CREATING, &server->flags)) {
210 /* We need to wait for creation to complete. */
211 up_write(&cell->fs_lock);
212 goto wait_for_creation;
213 }
214 if (test_bit(AFS_SERVER_FL_UNCREATED, &server->flags)) {
215 set_bit(AFS_SERVER_FL_CREATING, &server->flags);
216 clear_bit(AFS_SERVER_FL_UNCREATED, &server->flags);
217 creating = true;
218 }
219 up_write(&cell->fs_lock);
220 timer_delete_sync(&server->timer);
221
222 /* If we get to create the server, we look up the addresses and then
223 * immediately dispatch an asynchronous probe to each interface on the
224 * fileserver. This will make sure the repeat-probing service is
225 * started.
226 */
227 if (creating) {
228 alist = afs_vl_lookup_addrs(server, key);
229 if (IS_ERR(alist)) {
230 ret = PTR_ERR(alist);
231 goto create_failed;
232 }
233
234 ret = afs_fs_probe_fileserver(cell->net, server, alist, key);
235 if (ret)
236 goto create_failed;
237
238 clear_and_wake_up_bit(AFS_SERVER_FL_CREATING, &server->flags);
239 }
240
241out:
242 afs_put_addrlist(alist, afs_alist_trace_put_server_create);
243 if (candidate) {
244 kfree(rcu_access_pointer(server->endpoint_state));
245 kfree(candidate);
246 afs_dec_servers_outstanding(cell->net);
247 }
248 return server ?: ERR_PTR(ret);
249
250wait_for_creation:
251 afs_see_server(server, afs_server_trace_wait_create);
252 wait_on_bit(&server->flags, AFS_SERVER_FL_CREATING, TASK_UNINTERRUPTIBLE);
253 if (test_bit_acquire(AFS_SERVER_FL_UNCREATED, &server->flags)) {
254 /* Barrier: read flag before error */
255 ret = READ_ONCE(server->create_error);
256 afs_put_server(cell->net, server, afs_server_trace_unuse_create_fail);
257 server = NULL;
258 goto out;
259 }
260
261 ret = 0;
262 goto out;
263
264create_failed:
265 down_write(&cell->fs_lock);
266
267 WRITE_ONCE(server->create_error, ret);
268 smp_wmb(); /* Barrier: set error before flag. */
269 set_bit(AFS_SERVER_FL_UNCREATED, &server->flags);
270
271 clear_and_wake_up_bit(AFS_SERVER_FL_CREATING, &server->flags);
272
273 if (test_bit(AFS_SERVER_FL_UNCREATED, &server->flags)) {
274 clear_bit(AFS_SERVER_FL_UNCREATED, &server->flags);
275 creating = true;
276 }
277 afs_unuse_server(cell->net, server, afs_server_trace_unuse_create_fail);
278 server = NULL;
279
280 up_write(&cell->fs_lock);
281 goto out;
282}
283
284/*
285 * Set/reduce a server's timer.
286 */
287static void afs_set_server_timer(struct afs_server *server, unsigned int delay_secs)
288{
289 mod_timer(&server->timer, jiffies + delay_secs * HZ);
290}
291
292/*
293 * Get a reference on a server object.
294 */
295struct afs_server *afs_get_server(struct afs_server *server,
296 enum afs_server_trace reason)
297{
298 unsigned int a;
299 int r;
300
301 __refcount_inc(&server->ref, &r);
302 a = atomic_read(&server->active);
303 trace_afs_server(server->debug_id, r + 1, a, reason);
304 return server;
305}
306
307/*
308 * Get an active count on a server object and maybe remove from the inactive
309 * list.
310 */
311struct afs_server *afs_use_server(struct afs_server *server, bool activate,
312 enum afs_server_trace reason)
313{
314 unsigned int a;
315 int r;
316
317 __refcount_inc(&server->ref, &r);
318 a = atomic_inc_return(&server->active);
319 if (a == 1 && activate &&
320 !test_bit(AFS_SERVER_FL_EXPIRED, &server->flags))
321 timer_delete(&server->timer);
322
323 trace_afs_server(server->debug_id, r + 1, a, reason);
324 return server;
325}
326
327/*
328 * Release a reference on a server record.
329 */
330void afs_put_server(struct afs_net *net, struct afs_server *server,
331 enum afs_server_trace reason)
332{
333 unsigned int a, debug_id = server->debug_id;
334 bool zero;
335 int r;
336
337 if (!server)
338 return;
339
340 a = atomic_read(&server->active);
341 zero = __refcount_dec_and_test(&server->ref, &r);
342 trace_afs_server(debug_id, r - 1, a, reason);
343 if (unlikely(zero))
344 __afs_put_server(net, server);
345}
346
347/*
348 * Drop an active count on a server object without updating the last-unused
349 * time.
350 */
351void afs_unuse_server_notime(struct afs_net *net, struct afs_server *server,
352 enum afs_server_trace reason)
353{
354 if (!server)
355 return;
356
357 if (atomic_dec_and_test(&server->active)) {
358 if (test_bit(AFS_SERVER_FL_EXPIRED, &server->flags) ||
359 READ_ONCE(server->cell->state) >= AFS_CELL_REMOVING)
360 schedule_work(&server->destroyer);
361 }
362
363 afs_put_server(net, server, reason);
364}
365
366/*
367 * Drop an active count on a server object.
368 */
369void afs_unuse_server(struct afs_net *net, struct afs_server *server,
370 enum afs_server_trace reason)
371{
372 if (!server)
373 return;
374
375 if (atomic_dec_and_test(&server->active)) {
376 if (!test_bit(AFS_SERVER_FL_EXPIRED, &server->flags) &&
377 READ_ONCE(server->cell->state) < AFS_CELL_REMOVING) {
378 time64_t unuse_time = ktime_get_real_seconds();
379
380 server->unuse_time = unuse_time;
381 afs_set_server_timer(server, afs_server_gc_delay);
382 } else {
383 schedule_work(&server->destroyer);
384 }
385 }
386
387 afs_put_server(net, server, reason);
388}
389
390static void afs_server_rcu(struct rcu_head *rcu)
391{
392 struct afs_server *server = container_of(rcu, struct afs_server, rcu);
393
394 trace_afs_server(server->debug_id, refcount_read(&server->ref),
395 atomic_read(&server->active), afs_server_trace_free);
396 afs_put_endpoint_state(rcu_access_pointer(server->endpoint_state),
397 afs_estate_trace_put_server);
398 afs_put_cell(server->cell, afs_cell_trace_put_server);
399 kfree(server);
400}
401
402static void __afs_put_server(struct afs_net *net, struct afs_server *server)
403{
404 call_rcu(&server->rcu, afs_server_rcu);
405 afs_dec_servers_outstanding(net);
406}
407
408static void afs_give_up_callbacks(struct afs_net *net, struct afs_server *server)
409{
410 struct afs_endpoint_state *estate = rcu_access_pointer(server->endpoint_state);
411 struct afs_addr_list *alist = estate->addresses;
412
413 afs_fs_give_up_all_callbacks(net, server, &alist->addrs[alist->preferred], NULL);
414}
415
416/*
417 * Check to see if the server record has expired.
418 */
419static bool afs_has_server_expired(const struct afs_server *server)
420{
421 time64_t expires_at;
422
423 if (atomic_read(&server->active))
424 return false;
425
426 if (server->cell->net->live ||
427 server->cell->state >= AFS_CELL_REMOVING) {
428 trace_afs_server(server->debug_id, refcount_read(&server->ref),
429 0, afs_server_trace_purging);
430 return true;
431 }
432
433 expires_at = server->unuse_time;
434 if (!test_bit(AFS_SERVER_FL_VL_FAIL, &server->flags) &&
435 !test_bit(AFS_SERVER_FL_NOT_FOUND, &server->flags))
436 expires_at += afs_server_gc_delay;
437
438 return ktime_get_real_seconds() > expires_at;
439}
440
441/*
442 * Remove a server record from it's parent cell's database.
443 */
444static bool afs_remove_server_from_cell(struct afs_server *server)
445{
446 struct afs_cell *cell = server->cell;
447
448 down_write(&cell->fs_lock);
449
450 if (!afs_has_server_expired(server)) {
451 up_write(&cell->fs_lock);
452 return false;
453 }
454
455 set_bit(AFS_SERVER_FL_EXPIRED, &server->flags);
456 _debug("expire %pU %u", &server->uuid, atomic_read(&server->active));
457 afs_see_server(server, afs_server_trace_see_expired);
458 rb_erase(&server->uuid_rb, &cell->fs_servers);
459 up_write(&cell->fs_lock);
460 return true;
461}
462
463static void afs_server_destroyer(struct work_struct *work)
464{
465 struct afs_endpoint_state *estate;
466 struct afs_server *server = container_of(work, struct afs_server, destroyer);
467 struct afs_net *net = server->cell->net;
468
469 afs_see_server(server, afs_server_trace_see_destroyer);
470
471 if (test_bit(AFS_SERVER_FL_EXPIRED, &server->flags))
472 return;
473
474 if (!afs_remove_server_from_cell(server))
475 return;
476
477 timer_shutdown_sync(&server->timer);
478 cancel_work(&server->destroyer);
479
480 if (test_bit(AFS_SERVER_FL_MAY_HAVE_CB, &server->flags))
481 afs_give_up_callbacks(net, server);
482
483 /* Unbind the rxrpc_peer records from the server. */
484 estate = rcu_access_pointer(server->endpoint_state);
485 if (estate)
486 afs_set_peer_appdata(server, estate->addresses, NULL);
487
488 write_seqlock(&net->fs_lock);
489 list_del_init(&server->probe_link);
490 if (!hlist_unhashed(&server->proc_link))
491 hlist_del_rcu(&server->proc_link);
492 write_sequnlock(&net->fs_lock);
493
494 afs_put_server(net, server, afs_server_trace_destroy);
495}
496
497static void afs_server_timer(struct timer_list *timer)
498{
499 struct afs_server *server = container_of(timer, struct afs_server, timer);
500
501 afs_see_server(server, afs_server_trace_see_timer);
502 if (!test_bit(AFS_SERVER_FL_EXPIRED, &server->flags))
503 schedule_work(&server->destroyer);
504}
505
506/*
507 * Wake up all the servers in a cell so that they can purge themselves.
508 */
509void afs_purge_servers(struct afs_cell *cell)
510{
511 struct afs_server *server;
512 struct rb_node *rb;
513
514 down_read(&cell->fs_lock);
515 for (rb = rb_first(&cell->fs_servers); rb; rb = rb_next(rb)) {
516 server = rb_entry(rb, struct afs_server, uuid_rb);
517 afs_see_server(server, afs_server_trace_see_purge);
518 schedule_work(&server->destroyer);
519 }
520 up_read(&cell->fs_lock);
521}
522
523/*
524 * Wait for outstanding servers.
525 */
526void afs_wait_for_servers(struct afs_net *net)
527{
528 _enter("");
529
530 atomic_dec(&net->servers_outstanding);
531 wait_var_event(&net->servers_outstanding,
532 !atomic_read(&net->servers_outstanding));
533 _leave("");
534}
535
536/*
537 * Get an update for a server's address list.
538 */
539static noinline bool afs_update_server_record(struct afs_operation *op,
540 struct afs_server *server,
541 struct key *key)
542{
543 struct afs_endpoint_state *estate;
544 struct afs_addr_list *alist;
545 bool has_addrs;
546
547 _enter("");
548
549 trace_afs_server(server->debug_id, refcount_read(&server->ref),
550 atomic_read(&server->active),
551 afs_server_trace_update);
552
553 alist = afs_vl_lookup_addrs(server, op->key);
554 if (IS_ERR(alist)) {
555 rcu_read_lock();
556 estate = rcu_dereference(server->endpoint_state);
557 has_addrs = estate->addresses;
558 rcu_read_unlock();
559
560 if ((PTR_ERR(alist) == -ERESTARTSYS ||
561 PTR_ERR(alist) == -EINTR) &&
562 (op->flags & AFS_OPERATION_UNINTR) &&
563 has_addrs) {
564 _leave(" = t [intr]");
565 return true;
566 }
567 afs_op_set_error(op, PTR_ERR(alist));
568 _leave(" = f [%d]", afs_op_error(op));
569 return false;
570 }
571
572 if (server->addr_version != alist->version)
573 afs_fs_probe_fileserver(op->net, server, alist, key);
574
575 afs_put_addrlist(alist, afs_alist_trace_put_server_update);
576 _leave(" = t");
577 return true;
578}
579
580/*
581 * See if a server's address list needs updating.
582 */
583bool afs_check_server_record(struct afs_operation *op, struct afs_server *server,
584 struct key *key)
585{
586 bool success;
587 int ret, retries = 0;
588
589 _enter("");
590
591 ASSERT(server);
592
593retry:
594 if (test_bit(AFS_SERVER_FL_UPDATING, &server->flags))
595 goto wait;
596 if (test_bit(AFS_SERVER_FL_NEEDS_UPDATE, &server->flags))
597 goto update;
598 _leave(" = t [good]");
599 return true;
600
601update:
602 if (!test_and_set_bit_lock(AFS_SERVER_FL_UPDATING, &server->flags)) {
603 clear_bit(AFS_SERVER_FL_NEEDS_UPDATE, &server->flags);
604 success = afs_update_server_record(op, server, key);
605 clear_bit_unlock(AFS_SERVER_FL_UPDATING, &server->flags);
606 wake_up_bit(&server->flags, AFS_SERVER_FL_UPDATING);
607 _leave(" = %d", success);
608 return success;
609 }
610
611wait:
612 ret = wait_on_bit(&server->flags, AFS_SERVER_FL_UPDATING,
613 (op->flags & AFS_OPERATION_UNINTR) ?
614 TASK_UNINTERRUPTIBLE : TASK_INTERRUPTIBLE);
615 if (ret == -ERESTARTSYS) {
616 afs_op_set_error(op, ret);
617 _leave(" = f [intr]");
618 return false;
619 }
620
621 retries++;
622 if (retries == 4) {
623 _leave(" = f [stale]");
624 ret = -ESTALE;
625 return false;
626 }
627 goto retry;
628}