1 // SPDX-License-Identifier: GPL-2.0-or-later 2 /* AFS server record management 3 * 4 * Copyright (C) 2002, 2007 Red Hat, Inc. All Rights Reserved. 5 * Written by David Howells (dhowells@redhat.com) 6 */ 7 8 #include <linux/sched.h> 9 #include <linux/slab.h> 10 #include "afs_fs.h" 11 #include "internal.h" 12 #include "protocol_yfs.h" 13 14 static unsigned afs_server_gc_delay = 10; /* Server record timeout in seconds */ 15 static atomic_t afs_server_debug_id; 16 17 static void __afs_put_server(struct afs_net *, struct afs_server *); 18 static void afs_server_timer(struct timer_list *timer); 19 static void afs_server_destroyer(struct work_struct *work); 20 21 /* 22 * Find a server by one of its addresses. 23 */ 24 struct afs_server *afs_find_server(const struct rxrpc_peer *peer) 25 { 26 struct afs_server *server = (struct afs_server *)rxrpc_kernel_get_peer_data(peer); 27 28 if (!server) 29 return NULL; 30 return afs_use_server(server, false, afs_server_trace_use_cm_call); 31 } 32 33 /* 34 * Look up a server by its UUID and mark it active. The caller must hold 35 * cell->fs_lock. 36 */ 37 static struct afs_server *afs_find_server_by_uuid(struct afs_cell *cell, const uuid_t *uuid) 38 { 39 struct afs_server *server; 40 struct rb_node *p; 41 int diff; 42 43 _enter("%pU", uuid); 44 45 p = cell->fs_servers.rb_node; 46 while (p) { 47 server = rb_entry(p, struct afs_server, uuid_rb); 48 49 diff = memcmp(uuid, &server->uuid, sizeof(*uuid)); 50 if (diff < 0) { 51 p = p->rb_left; 52 } else if (diff > 0) { 53 p = p->rb_right; 54 } else { 55 if (test_bit(AFS_SERVER_FL_UNCREATED, &server->flags)) 56 return NULL; /* Need a write lock */ 57 afs_use_server(server, true, afs_server_trace_use_by_uuid); 58 return server; 59 } 60 } 61 62 return NULL; 63 } 64 65 /* 66 * Install a server record in the cell tree. The caller must hold an exclusive 67 * lock on cell->fs_lock. 68 */ 69 static struct afs_server *afs_install_server(struct afs_cell *cell, 70 struct afs_server **candidate) 71 { 72 struct afs_server *server; 73 struct afs_net *net = cell->net; 74 struct rb_node **pp, *p; 75 int diff; 76 77 _enter("%p", candidate); 78 79 /* Firstly install the server in the UUID lookup tree */ 80 pp = &cell->fs_servers.rb_node; 81 p = NULL; 82 while (*pp) { 83 p = *pp; 84 _debug("- consider %p", p); 85 server = rb_entry(p, struct afs_server, uuid_rb); 86 diff = memcmp(&(*candidate)->uuid, &server->uuid, sizeof(uuid_t)); 87 if (diff < 0) 88 pp = &(*pp)->rb_left; 89 else if (diff > 0) 90 pp = &(*pp)->rb_right; 91 else 92 goto exists; 93 } 94 95 server = *candidate; 96 *candidate = NULL; 97 rb_link_node(&server->uuid_rb, p, pp); 98 rb_insert_color(&server->uuid_rb, &cell->fs_servers); 99 write_seqlock(&net->fs_lock); 100 hlist_add_head_rcu(&server->proc_link, &net->fs_proc); 101 write_sequnlock(&net->fs_lock); 102 103 afs_get_cell(cell, afs_cell_trace_get_server); 104 105 exists: 106 afs_use_server(server, true, afs_server_trace_use_install); 107 return server; 108 } 109 110 /* 111 * Allocate a new server record and mark it as active but uncreated. 112 */ 113 static struct afs_server *afs_alloc_server(struct afs_cell *cell, const uuid_t *uuid) 114 { 115 struct afs_server *server; 116 struct afs_net *net = cell->net; 117 118 _enter(""); 119 120 server = kzalloc(sizeof(struct afs_server), GFP_KERNEL); 121 if (!server) 122 return NULL; 123 124 refcount_set(&server->ref, 1); 125 atomic_set(&server->active, 0); 126 __set_bit(AFS_SERVER_FL_UNCREATED, &server->flags); 127 server->debug_id = atomic_inc_return(&afs_server_debug_id); 128 server->uuid = *uuid; 129 rwlock_init(&server->fs_lock); 130 INIT_WORK(&server->destroyer, &afs_server_destroyer); 131 timer_setup(&server->timer, afs_server_timer, 0); 132 INIT_LIST_HEAD(&server->volumes); 133 init_waitqueue_head(&server->probe_wq); 134 INIT_LIST_HEAD(&server->probe_link); 135 INIT_HLIST_NODE(&server->proc_link); 136 spin_lock_init(&server->probe_lock); 137 server->cell = cell; 138 server->rtt = UINT_MAX; 139 server->service_id = FS_SERVICE; 140 server->probe_counter = 1; 141 server->probed_at = jiffies - LONG_MAX / 2; 142 143 afs_inc_servers_outstanding(net); 144 _leave(" = %p", server); 145 return server; 146 } 147 148 /* 149 * Look up an address record for a server 150 */ 151 static struct afs_addr_list *afs_vl_lookup_addrs(struct afs_server *server, 152 struct key *key) 153 { 154 struct afs_vl_cursor vc; 155 struct afs_addr_list *alist = NULL; 156 int ret; 157 158 ret = -ERESTARTSYS; 159 if (afs_begin_vlserver_operation(&vc, server->cell, key)) { 160 while (afs_select_vlserver(&vc)) { 161 if (test_bit(AFS_VLSERVER_FL_IS_YFS, &vc.server->flags)) 162 alist = afs_yfsvl_get_endpoints(&vc, &server->uuid); 163 else 164 alist = afs_vl_get_addrs_u(&vc, &server->uuid); 165 } 166 167 ret = afs_end_vlserver_operation(&vc); 168 } 169 170 return ret < 0 ? ERR_PTR(ret) : alist; 171 } 172 173 /* 174 * Get or create a fileserver record and return it with an active-use count on 175 * it. 176 */ 177 struct afs_server *afs_lookup_server(struct afs_cell *cell, struct key *key, 178 const uuid_t *uuid, u32 addr_version) 179 { 180 struct afs_addr_list *alist = NULL; 181 struct afs_server *server, *candidate = NULL; 182 bool creating = false; 183 int ret; 184 185 _enter("%p,%pU", cell->net, uuid); 186 187 down_read(&cell->fs_lock); 188 server = afs_find_server_by_uuid(cell, uuid); 189 /* Won't see servers marked uncreated. */ 190 up_read(&cell->fs_lock); 191 192 if (server) { 193 timer_delete_sync(&server->timer); 194 if (test_bit(AFS_SERVER_FL_CREATING, &server->flags)) 195 goto wait_for_creation; 196 if (server->addr_version != addr_version) 197 set_bit(AFS_SERVER_FL_NEEDS_UPDATE, &server->flags); 198 return server; 199 } 200 201 candidate = afs_alloc_server(cell, uuid); 202 if (!candidate) { 203 afs_put_addrlist(alist, afs_alist_trace_put_server_oom); 204 return ERR_PTR(-ENOMEM); 205 } 206 207 down_write(&cell->fs_lock); 208 server = afs_install_server(cell, &candidate); 209 if (test_bit(AFS_SERVER_FL_CREATING, &server->flags)) { 210 /* We need to wait for creation to complete. */ 211 up_write(&cell->fs_lock); 212 goto wait_for_creation; 213 } 214 if (test_bit(AFS_SERVER_FL_UNCREATED, &server->flags)) { 215 set_bit(AFS_SERVER_FL_CREATING, &server->flags); 216 clear_bit(AFS_SERVER_FL_UNCREATED, &server->flags); 217 creating = true; 218 } 219 up_write(&cell->fs_lock); 220 timer_delete_sync(&server->timer); 221 222 /* If we get to create the server, we look up the addresses and then 223 * immediately dispatch an asynchronous probe to each interface on the 224 * fileserver. This will make sure the repeat-probing service is 225 * started. 226 */ 227 if (creating) { 228 alist = afs_vl_lookup_addrs(server, key); 229 if (IS_ERR(alist)) { 230 ret = PTR_ERR(alist); 231 goto create_failed; 232 } 233 234 ret = afs_fs_probe_fileserver(cell->net, server, alist, key); 235 if (ret) 236 goto create_failed; 237 238 clear_and_wake_up_bit(AFS_SERVER_FL_CREATING, &server->flags); 239 } 240 241 out: 242 afs_put_addrlist(alist, afs_alist_trace_put_server_create); 243 if (candidate) { 244 kfree(rcu_access_pointer(server->endpoint_state)); 245 kfree(candidate); 246 afs_dec_servers_outstanding(cell->net); 247 } 248 return server ?: ERR_PTR(ret); 249 250 wait_for_creation: 251 afs_see_server(server, afs_server_trace_wait_create); 252 wait_on_bit(&server->flags, AFS_SERVER_FL_CREATING, TASK_UNINTERRUPTIBLE); 253 if (test_bit_acquire(AFS_SERVER_FL_UNCREATED, &server->flags)) { 254 /* Barrier: read flag before error */ 255 ret = READ_ONCE(server->create_error); 256 afs_put_server(cell->net, server, afs_server_trace_unuse_create_fail); 257 server = NULL; 258 goto out; 259 } 260 261 ret = 0; 262 goto out; 263 264 create_failed: 265 down_write(&cell->fs_lock); 266 267 WRITE_ONCE(server->create_error, ret); 268 smp_wmb(); /* Barrier: set error before flag. */ 269 set_bit(AFS_SERVER_FL_UNCREATED, &server->flags); 270 271 clear_and_wake_up_bit(AFS_SERVER_FL_CREATING, &server->flags); 272 273 if (test_bit(AFS_SERVER_FL_UNCREATED, &server->flags)) { 274 clear_bit(AFS_SERVER_FL_UNCREATED, &server->flags); 275 creating = true; 276 } 277 afs_unuse_server(cell->net, server, afs_server_trace_unuse_create_fail); 278 server = NULL; 279 280 up_write(&cell->fs_lock); 281 goto out; 282 } 283 284 /* 285 * Set/reduce a server's timer. 286 */ 287 static void afs_set_server_timer(struct afs_server *server, unsigned int delay_secs) 288 { 289 mod_timer(&server->timer, jiffies + delay_secs * HZ); 290 } 291 292 /* 293 * Get a reference on a server object. 294 */ 295 struct afs_server *afs_get_server(struct afs_server *server, 296 enum afs_server_trace reason) 297 { 298 unsigned int a; 299 int r; 300 301 __refcount_inc(&server->ref, &r); 302 a = atomic_read(&server->active); 303 trace_afs_server(server->debug_id, r + 1, a, reason); 304 return server; 305 } 306 307 /* 308 * Get an active count on a server object and maybe remove from the inactive 309 * list. 310 */ 311 struct afs_server *afs_use_server(struct afs_server *server, bool activate, 312 enum afs_server_trace reason) 313 { 314 unsigned int a; 315 int r; 316 317 __refcount_inc(&server->ref, &r); 318 a = atomic_inc_return(&server->active); 319 if (a == 1 && activate && 320 !test_bit(AFS_SERVER_FL_EXPIRED, &server->flags)) 321 timer_delete(&server->timer); 322 323 trace_afs_server(server->debug_id, r + 1, a, reason); 324 return server; 325 } 326 327 /* 328 * Release a reference on a server record. 329 */ 330 void afs_put_server(struct afs_net *net, struct afs_server *server, 331 enum afs_server_trace reason) 332 { 333 unsigned int a, debug_id = server->debug_id; 334 bool zero; 335 int r; 336 337 if (!server) 338 return; 339 340 a = atomic_read(&server->active); 341 zero = __refcount_dec_and_test(&server->ref, &r); 342 trace_afs_server(debug_id, r - 1, a, reason); 343 if (unlikely(zero)) 344 __afs_put_server(net, server); 345 } 346 347 /* 348 * Drop an active count on a server object without updating the last-unused 349 * time. 350 */ 351 void afs_unuse_server_notime(struct afs_net *net, struct afs_server *server, 352 enum afs_server_trace reason) 353 { 354 if (!server) 355 return; 356 357 if (atomic_dec_and_test(&server->active)) { 358 if (test_bit(AFS_SERVER_FL_EXPIRED, &server->flags) || 359 READ_ONCE(server->cell->state) >= AFS_CELL_REMOVING) 360 schedule_work(&server->destroyer); 361 } 362 363 afs_put_server(net, server, reason); 364 } 365 366 /* 367 * Drop an active count on a server object. 368 */ 369 void afs_unuse_server(struct afs_net *net, struct afs_server *server, 370 enum afs_server_trace reason) 371 { 372 if (!server) 373 return; 374 375 if (atomic_dec_and_test(&server->active)) { 376 if (!test_bit(AFS_SERVER_FL_EXPIRED, &server->flags) && 377 READ_ONCE(server->cell->state) < AFS_CELL_REMOVING) { 378 time64_t unuse_time = ktime_get_real_seconds(); 379 380 server->unuse_time = unuse_time; 381 afs_set_server_timer(server, afs_server_gc_delay); 382 } else { 383 schedule_work(&server->destroyer); 384 } 385 } 386 387 afs_put_server(net, server, reason); 388 } 389 390 static void afs_server_rcu(struct rcu_head *rcu) 391 { 392 struct afs_server *server = container_of(rcu, struct afs_server, rcu); 393 394 trace_afs_server(server->debug_id, refcount_read(&server->ref), 395 atomic_read(&server->active), afs_server_trace_free); 396 afs_put_endpoint_state(rcu_access_pointer(server->endpoint_state), 397 afs_estate_trace_put_server); 398 afs_put_cell(server->cell, afs_cell_trace_put_server); 399 kfree(server); 400 } 401 402 static void __afs_put_server(struct afs_net *net, struct afs_server *server) 403 { 404 call_rcu(&server->rcu, afs_server_rcu); 405 afs_dec_servers_outstanding(net); 406 } 407 408 static void afs_give_up_callbacks(struct afs_net *net, struct afs_server *server) 409 { 410 struct afs_endpoint_state *estate = rcu_access_pointer(server->endpoint_state); 411 struct afs_addr_list *alist = estate->addresses; 412 413 afs_fs_give_up_all_callbacks(net, server, &alist->addrs[alist->preferred], NULL); 414 } 415 416 /* 417 * Check to see if the server record has expired. 418 */ 419 static bool afs_has_server_expired(const struct afs_server *server) 420 { 421 time64_t expires_at; 422 423 if (atomic_read(&server->active)) 424 return false; 425 426 if (server->cell->net->live || 427 server->cell->state >= AFS_CELL_REMOVING) { 428 trace_afs_server(server->debug_id, refcount_read(&server->ref), 429 0, afs_server_trace_purging); 430 return true; 431 } 432 433 expires_at = server->unuse_time; 434 if (!test_bit(AFS_SERVER_FL_VL_FAIL, &server->flags) && 435 !test_bit(AFS_SERVER_FL_NOT_FOUND, &server->flags)) 436 expires_at += afs_server_gc_delay; 437 438 return ktime_get_real_seconds() > expires_at; 439 } 440 441 /* 442 * Remove a server record from it's parent cell's database. 443 */ 444 static bool afs_remove_server_from_cell(struct afs_server *server) 445 { 446 struct afs_cell *cell = server->cell; 447 448 down_write(&cell->fs_lock); 449 450 if (!afs_has_server_expired(server)) { 451 up_write(&cell->fs_lock); 452 return false; 453 } 454 455 set_bit(AFS_SERVER_FL_EXPIRED, &server->flags); 456 _debug("expire %pU %u", &server->uuid, atomic_read(&server->active)); 457 afs_see_server(server, afs_server_trace_see_expired); 458 rb_erase(&server->uuid_rb, &cell->fs_servers); 459 up_write(&cell->fs_lock); 460 return true; 461 } 462 463 static void afs_server_destroyer(struct work_struct *work) 464 { 465 struct afs_endpoint_state *estate; 466 struct afs_server *server = container_of(work, struct afs_server, destroyer); 467 struct afs_net *net = server->cell->net; 468 469 afs_see_server(server, afs_server_trace_see_destroyer); 470 471 if (test_bit(AFS_SERVER_FL_EXPIRED, &server->flags)) 472 return; 473 474 if (!afs_remove_server_from_cell(server)) 475 return; 476 477 timer_shutdown_sync(&server->timer); 478 cancel_work(&server->destroyer); 479 480 if (test_bit(AFS_SERVER_FL_MAY_HAVE_CB, &server->flags)) 481 afs_give_up_callbacks(net, server); 482 483 /* Unbind the rxrpc_peer records from the server. */ 484 estate = rcu_access_pointer(server->endpoint_state); 485 if (estate) 486 afs_set_peer_appdata(server, estate->addresses, NULL); 487 488 write_seqlock(&net->fs_lock); 489 list_del_init(&server->probe_link); 490 if (!hlist_unhashed(&server->proc_link)) 491 hlist_del_rcu(&server->proc_link); 492 write_sequnlock(&net->fs_lock); 493 494 afs_put_server(net, server, afs_server_trace_destroy); 495 } 496 497 static void afs_server_timer(struct timer_list *timer) 498 { 499 struct afs_server *server = container_of(timer, struct afs_server, timer); 500 501 afs_see_server(server, afs_server_trace_see_timer); 502 if (!test_bit(AFS_SERVER_FL_EXPIRED, &server->flags)) 503 schedule_work(&server->destroyer); 504 } 505 506 /* 507 * Wake up all the servers in a cell so that they can purge themselves. 508 */ 509 void afs_purge_servers(struct afs_cell *cell) 510 { 511 struct afs_server *server; 512 struct rb_node *rb; 513 514 down_read(&cell->fs_lock); 515 for (rb = rb_first(&cell->fs_servers); rb; rb = rb_next(rb)) { 516 server = rb_entry(rb, struct afs_server, uuid_rb); 517 afs_see_server(server, afs_server_trace_see_purge); 518 schedule_work(&server->destroyer); 519 } 520 up_read(&cell->fs_lock); 521 } 522 523 /* 524 * Wait for outstanding servers. 525 */ 526 void afs_wait_for_servers(struct afs_net *net) 527 { 528 _enter(""); 529 530 atomic_dec(&net->servers_outstanding); 531 wait_var_event(&net->servers_outstanding, 532 !atomic_read(&net->servers_outstanding)); 533 _leave(""); 534 } 535 536 /* 537 * Get an update for a server's address list. 538 */ 539 static noinline bool afs_update_server_record(struct afs_operation *op, 540 struct afs_server *server, 541 struct key *key) 542 { 543 struct afs_endpoint_state *estate; 544 struct afs_addr_list *alist; 545 bool has_addrs; 546 547 _enter(""); 548 549 trace_afs_server(server->debug_id, refcount_read(&server->ref), 550 atomic_read(&server->active), 551 afs_server_trace_update); 552 553 alist = afs_vl_lookup_addrs(server, op->key); 554 if (IS_ERR(alist)) { 555 rcu_read_lock(); 556 estate = rcu_dereference(server->endpoint_state); 557 has_addrs = estate->addresses; 558 rcu_read_unlock(); 559 560 if ((PTR_ERR(alist) == -ERESTARTSYS || 561 PTR_ERR(alist) == -EINTR) && 562 (op->flags & AFS_OPERATION_UNINTR) && 563 has_addrs) { 564 _leave(" = t [intr]"); 565 return true; 566 } 567 afs_op_set_error(op, PTR_ERR(alist)); 568 _leave(" = f [%d]", afs_op_error(op)); 569 return false; 570 } 571 572 if (server->addr_version != alist->version) 573 afs_fs_probe_fileserver(op->net, server, alist, key); 574 575 afs_put_addrlist(alist, afs_alist_trace_put_server_update); 576 _leave(" = t"); 577 return true; 578 } 579 580 /* 581 * See if a server's address list needs updating. 582 */ 583 bool afs_check_server_record(struct afs_operation *op, struct afs_server *server, 584 struct key *key) 585 { 586 bool success; 587 int ret, retries = 0; 588 589 _enter(""); 590 591 ASSERT(server); 592 593 retry: 594 if (test_bit(AFS_SERVER_FL_UPDATING, &server->flags)) 595 goto wait; 596 if (test_bit(AFS_SERVER_FL_NEEDS_UPDATE, &server->flags)) 597 goto update; 598 _leave(" = t [good]"); 599 return true; 600 601 update: 602 if (!test_and_set_bit_lock(AFS_SERVER_FL_UPDATING, &server->flags)) { 603 clear_bit(AFS_SERVER_FL_NEEDS_UPDATE, &server->flags); 604 success = afs_update_server_record(op, server, key); 605 clear_bit_unlock(AFS_SERVER_FL_UPDATING, &server->flags); 606 wake_up_bit(&server->flags, AFS_SERVER_FL_UPDATING); 607 _leave(" = %d", success); 608 return success; 609 } 610 611 wait: 612 ret = wait_on_bit(&server->flags, AFS_SERVER_FL_UPDATING, 613 (op->flags & AFS_OPERATION_UNINTR) ? 614 TASK_UNINTERRUPTIBLE : TASK_INTERRUPTIBLE); 615 if (ret == -ERESTARTSYS) { 616 afs_op_set_error(op, ret); 617 _leave(" = f [intr]"); 618 return false; 619 } 620 621 retries++; 622 if (retries == 4) { 623 _leave(" = f [stale]"); 624 ret = -ESTALE; 625 return false; 626 } 627 goto retry; 628 } 629