250 lines
		
	
	
		
			6.2 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			250 lines
		
	
	
		
			6.2 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| // SPDX-License-Identifier: GPL-2.0-or-later
 | |
| /* AFS fileserver list management.
 | |
|  *
 | |
|  * Copyright (C) 2017 Red Hat, Inc. All Rights Reserved.
 | |
|  * Written by David Howells (dhowells@redhat.com)
 | |
|  */
 | |
| 
 | |
| #include <linux/kernel.h>
 | |
| #include <linux/slab.h>
 | |
| #include "internal.h"
 | |
| 
 | |
| void afs_put_serverlist(struct afs_net *net, struct afs_server_list *slist)
 | |
| {
 | |
| 	int i;
 | |
| 
 | |
| 	if (slist && refcount_dec_and_test(&slist->usage)) {
 | |
| 		for (i = 0; i < slist->nr_servers; i++)
 | |
| 			afs_unuse_server(net, slist->servers[i].server,
 | |
| 					 afs_server_trace_put_slist);
 | |
| 		kfree_rcu(slist, rcu);
 | |
| 	}
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Build a server list from a VLDB record.
 | |
|  */
 | |
| struct afs_server_list *afs_alloc_server_list(struct afs_volume *volume,
 | |
| 					      struct key *key,
 | |
| 					      struct afs_vldb_entry *vldb)
 | |
| {
 | |
| 	struct afs_server_list *slist;
 | |
| 	struct afs_server *server;
 | |
| 	unsigned int type_mask = 1 << volume->type;
 | |
| 	bool use_newrepsites = false;
 | |
| 	int ret = -ENOMEM, nr_servers = 0, newrep = 0, i, j, usable = 0;
 | |
| 
 | |
| 	/* Work out if we're going to restrict to NEWREPSITE-marked servers or
 | |
| 	 * not.  If at least one site is marked as NEWREPSITE, then it's likely
 | |
| 	 * that "vos release" is busy updating RO sites.  We cut over from one
 | |
| 	 * to the other when >=50% of the sites have been updated.  Sites that
 | |
| 	 * are in the process of being updated are marked DONTUSE.
 | |
| 	 */
 | |
| 	for (i = 0; i < vldb->nr_servers; i++) {
 | |
| 		if (!(vldb->fs_mask[i] & type_mask))
 | |
| 			continue;
 | |
| 		nr_servers++;
 | |
| 		if (vldb->vlsf_flags[i] & AFS_VLSF_DONTUSE)
 | |
| 			continue;
 | |
| 		usable++;
 | |
| 		if (vldb->vlsf_flags[i] & AFS_VLSF_NEWREPSITE)
 | |
| 			newrep++;
 | |
| 	}
 | |
| 
 | |
| 	slist = kzalloc(struct_size(slist, servers, nr_servers), GFP_KERNEL);
 | |
| 	if (!slist)
 | |
| 		goto error;
 | |
| 
 | |
| 	if (newrep) {
 | |
| 		if (newrep < usable / 2) {
 | |
| 			slist->ro_replicating = AFS_RO_REPLICATING_USE_OLD;
 | |
| 		} else {
 | |
| 			slist->ro_replicating = AFS_RO_REPLICATING_USE_NEW;
 | |
| 			use_newrepsites = true;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	refcount_set(&slist->usage, 1);
 | |
| 	rwlock_init(&slist->lock);
 | |
| 
 | |
| 	/* Make sure a records exists for each server in the list. */
 | |
| 	for (i = 0; i < vldb->nr_servers; i++) {
 | |
| 		unsigned long se_flags = 0;
 | |
| 		bool newrepsite = vldb->vlsf_flags[i] & AFS_VLSF_NEWREPSITE;
 | |
| 
 | |
| 		if (!(vldb->fs_mask[i] & type_mask))
 | |
| 			continue;
 | |
| 		if (vldb->vlsf_flags[i] & AFS_VLSF_DONTUSE)
 | |
| 			__set_bit(AFS_SE_EXCLUDED, &se_flags);
 | |
| 		if (newrep && (newrepsite ^ use_newrepsites))
 | |
| 			__set_bit(AFS_SE_EXCLUDED, &se_flags);
 | |
| 
 | |
| 		server = afs_lookup_server(volume->cell, key, &vldb->fs_server[i],
 | |
| 					   vldb->addr_version[i]);
 | |
| 		if (IS_ERR(server)) {
 | |
| 			ret = PTR_ERR(server);
 | |
| 			if (ret == -ENOENT ||
 | |
| 			    ret == -ENOMEDIUM)
 | |
| 				continue;
 | |
| 			goto error_2;
 | |
| 		}
 | |
| 
 | |
| 		/* Insertion-sort by UUID */
 | |
| 		for (j = 0; j < slist->nr_servers; j++)
 | |
| 			if (memcmp(&slist->servers[j].server->uuid,
 | |
| 				   &server->uuid,
 | |
| 				   sizeof(server->uuid)) >= 0)
 | |
| 				break;
 | |
| 		if (j < slist->nr_servers) {
 | |
| 			if (slist->servers[j].server == server) {
 | |
| 				afs_put_server(volume->cell->net, server,
 | |
| 					       afs_server_trace_put_slist_isort);
 | |
| 				continue;
 | |
| 			}
 | |
| 
 | |
| 			memmove(slist->servers + j + 1,
 | |
| 				slist->servers + j,
 | |
| 				(slist->nr_servers - j) * sizeof(struct afs_server_entry));
 | |
| 		}
 | |
| 
 | |
| 		slist->servers[j].server = server;
 | |
| 		slist->servers[j].volume = volume;
 | |
| 		slist->servers[j].flags = se_flags;
 | |
| 		slist->servers[j].cb_expires_at = AFS_NO_CB_PROMISE;
 | |
| 		slist->nr_servers++;
 | |
| 	}
 | |
| 
 | |
| 	if (slist->nr_servers == 0) {
 | |
| 		ret = -EDESTADDRREQ;
 | |
| 		goto error_2;
 | |
| 	}
 | |
| 
 | |
| 	return slist;
 | |
| 
 | |
| error_2:
 | |
| 	afs_put_serverlist(volume->cell->net, slist);
 | |
| error:
 | |
| 	return ERR_PTR(ret);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Copy the annotations from an old server list to its potential replacement.
 | |
|  */
 | |
| bool afs_annotate_server_list(struct afs_server_list *new,
 | |
| 			      struct afs_server_list *old)
 | |
| {
 | |
| 	unsigned long mask = 1UL << AFS_SE_EXCLUDED;
 | |
| 	int i;
 | |
| 
 | |
| 	if (old->nr_servers != new->nr_servers ||
 | |
| 	    old->ro_replicating != new->ro_replicating)
 | |
| 		goto changed;
 | |
| 
 | |
| 	for (i = 0; i < old->nr_servers; i++) {
 | |
| 		if (old->servers[i].server != new->servers[i].server)
 | |
| 			goto changed;
 | |
| 		if ((old->servers[i].flags & mask) != (new->servers[i].flags & mask))
 | |
| 			goto changed;
 | |
| 	}
 | |
| 	return false;
 | |
| changed:
 | |
| 	return true;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Attach a volume to the servers it is going to use.
 | |
|  */
 | |
| void afs_attach_volume_to_servers(struct afs_volume *volume, struct afs_server_list *slist)
 | |
| {
 | |
| 	struct afs_server_entry *se, *pe;
 | |
| 	struct afs_server *server;
 | |
| 	struct list_head *p;
 | |
| 	unsigned int i;
 | |
| 
 | |
| 	down_write(&volume->cell->vs_lock);
 | |
| 
 | |
| 	for (i = 0; i < slist->nr_servers; i++) {
 | |
| 		se = &slist->servers[i];
 | |
| 		server = se->server;
 | |
| 
 | |
| 		list_for_each(p, &server->volumes) {
 | |
| 			pe = list_entry(p, struct afs_server_entry, slink);
 | |
| 			if (volume->vid <= pe->volume->vid)
 | |
| 				break;
 | |
| 		}
 | |
| 		list_add_tail(&se->slink, p);
 | |
| 	}
 | |
| 
 | |
| 	slist->attached = true;
 | |
| 	up_write(&volume->cell->vs_lock);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Reattach a volume to the servers it is going to use when server list is
 | |
|  * replaced.  We try to switch the attachment points to avoid rewalking the
 | |
|  * lists.
 | |
|  */
 | |
| void afs_reattach_volume_to_servers(struct afs_volume *volume, struct afs_server_list *new,
 | |
| 				    struct afs_server_list *old)
 | |
| {
 | |
| 	unsigned int n = 0, o = 0;
 | |
| 
 | |
| 	down_write(&volume->cell->vs_lock);
 | |
| 
 | |
| 	while (n < new->nr_servers || o < old->nr_servers) {
 | |
| 		struct afs_server_entry *pn = n < new->nr_servers ? &new->servers[n] : NULL;
 | |
| 		struct afs_server_entry *po = o < old->nr_servers ? &old->servers[o] : NULL;
 | |
| 		struct afs_server_entry *s;
 | |
| 		struct list_head *p;
 | |
| 		int diff;
 | |
| 
 | |
| 		if (pn && po && pn->server == po->server) {
 | |
| 			pn->cb_expires_at = po->cb_expires_at;
 | |
| 			list_replace(&po->slink, &pn->slink);
 | |
| 			n++;
 | |
| 			o++;
 | |
| 			continue;
 | |
| 		}
 | |
| 
 | |
| 		if (pn && po)
 | |
| 			diff = memcmp(&pn->server->uuid, &po->server->uuid,
 | |
| 				      sizeof(pn->server->uuid));
 | |
| 		else
 | |
| 			diff = pn ? -1 : 1;
 | |
| 
 | |
| 		if (diff < 0) {
 | |
| 			list_for_each(p, &pn->server->volumes) {
 | |
| 				s = list_entry(p, struct afs_server_entry, slink);
 | |
| 				if (volume->vid <= s->volume->vid)
 | |
| 					break;
 | |
| 			}
 | |
| 			list_add_tail(&pn->slink, p);
 | |
| 			n++;
 | |
| 		} else {
 | |
| 			list_del(&po->slink);
 | |
| 			o++;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	up_write(&volume->cell->vs_lock);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Detach a volume from the servers it has been using.
 | |
|  */
 | |
| void afs_detach_volume_from_servers(struct afs_volume *volume, struct afs_server_list *slist)
 | |
| {
 | |
| 	unsigned int i;
 | |
| 
 | |
| 	if (!slist->attached)
 | |
| 		return;
 | |
| 
 | |
| 	down_write(&volume->cell->vs_lock);
 | |
| 
 | |
| 	for (i = 0; i < slist->nr_servers; i++)
 | |
| 		list_del(&slist->servers[i].slink);
 | |
| 
 | |
| 	slist->attached = false;
 | |
| 	up_write(&volume->cell->vs_lock);
 | |
| }
 |