2 * Copyright 2000, International Business Machines Corporation and others.
5 * This software has been released under the terms of the IBM Public
6 * License. For details, see the LICENSE file in the top-level source
7 * directory or online at http://www.openafs.org/dl/license10.html
10 #include <afs/param.h>
18 #include <sys/socket.h>
/* Read/write lock taken around walks of cm_allServersp and around changes
 * to server refCount fields in this file; set up in cm_InitServer(). */
28 osi_rwlock_t cm_serverLock;
/* Head of the list of servers created by cm_NewServer(), linked through
 * the allNextp field. */
30 cm_server_t *cm_allServersp;
/*
 * cm_PingServer: probe one server and record whether it is up or down.
 *
 * tsp - server to probe.  tsp->mx is obtained and released inside this
 *       function.
 *
 * CM_SERVERFLAG_PINGING marks a probe in progress.  A caller that finds the
 * flag already set sleeps on tsp rather than starting a second probe.
 * CM_SERVER_VLDB servers are probed with VL_ProbeServer; the other visible
 * probe is RXAFS_GetCapabilities, retried as RXAFS_GetTime when the answer
 * is RXGEN_OPCODE.  The connection dead time is set to 10 for the probe and
 * put back to ConnDeadtimeout afterwards.
 *
 * NOTE(review): this listing skips some original lines (the embedded line
 * numbers are not contiguous), so the return type, several declarations and
 * the conditions selecting the up and down sections are not visible here.
 */
33 cm_PingServer(cm_server_t *tsp)
38 struct rx_connection * callp;
41 Capabilities caps = {0, 0};
44 lock_ObtainMutex(&tsp->mx);
/* a probe is already in progress: sleep on tsp until woken */
45 if (tsp->flags & CM_SERVERFLAG_PINGING) {
47 osi_SleepM((LONG_PTR)tsp, &tsp->mx);
/* NOTE(review): the mutex is re-obtained here, so osi_SleepM presumably
 * returns with it released - confirm */
48 lock_ObtainMutex(&tsp->mx);
/* no waiters left: clear the in-progress flag, then wake sleepers on tsp */
50 if (tsp->waitCount == 0)
51 tsp->flags &= ~CM_SERVERFLAG_PINGING;
53 osi_Wakeup((LONG_PTR)tsp);
54 lock_ReleaseMutex(&tsp->mx);
/* claim the probe and remember the prior state and address for logging */
57 tsp->flags |= CM_SERVERFLAG_PINGING;
58 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
59 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
/* the mutex is released before the connection lookup and the RPCs */
60 lock_ReleaseMutex(&tsp->mx);
62 code = cm_ConnByServer(tsp, cm_rootUserp, &connp);
64 /* now call the appropriate ping call. Drop the timeout if
65 * the server is known to be down, so that we don't waste a
66 * lot of time retiming out down servers.
69 osi_Log4(afsd_logp, "cm_PingServer server %s (%s) was %s with caps 0x%x",
70 osi_LogSaveString(afsd_logp, hoststr),
71 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
72 wasDown ? "down" : "up",
76 rx_SetConnDeadTime(connp->callp, 10);
77 if (tsp->type == CM_SERVER_VLDB) {
78 code = VL_ProbeServer(connp->callp);
82 callp = cm_GetRxConn(connp);
83 code = RXAFS_GetCapabilities(callp, &caps);
84 if (code == RXGEN_OPCODE)
85 code = RXAFS_GetTime(callp, &secs, &usecs);
86 rx_PutConnection(callp);
89 rx_SetConnDeadTime(connp->callp, ConnDeadtimeout);
91 } /* got an unauthenticated connection to this server */
/* record the outcome under the server mutex */
93 lock_ObtainMutex(&tsp->mx);
95 /* mark server as up */
96 tsp->flags &= ~CM_SERVERFLAG_DOWN;
98 /* we currently handle 32-bits of capabilities */
99 if (caps.Capabilities_len > 0) {
100 tsp->capabilities = caps.Capabilities_val[0];
/* only the first word is kept; the array handed back through caps is
 * freed and the descriptor reset */
101 free(caps.Capabilities_val);
102 caps.Capabilities_len = 0;
103 caps.Capabilities_val = 0;
/* NOTE(review): presumably the branch for an empty capability list; the
 * line introducing it is not visible */
105 tsp->capabilities = 0;
108 osi_Log3(afsd_logp, "cm_PingServer server %s (%s) is up with caps 0x%x",
109 osi_LogSaveString(afsd_logp, hoststr),
110 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
113 /* mark server as down */
114 tsp->flags |= CM_SERVERFLAG_DOWN;
/* cm_ForceNewConnections is skipped when the error is VRESTARTING */
115 if (code != VRESTARTING)
116 cm_ForceNewConnections(tsp);
118 osi_Log3(afsd_logp, "cm_PingServer server %s (%s) is down with caps 0x%x",
119 osi_LogSaveString(afsd_logp, hoststr),
120 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
/* probe finished: clear PINGING when nobody is waiting, wake sleepers */
124 if (tsp->waitCount == 0)
125 tsp->flags &= ~CM_SERVERFLAG_PINGING;
127 osi_Wakeup((LONG_PTR)tsp);
128 lock_ReleaseMutex(&tsp->mx);
/*
 * cm_CheckServers: walk cm_allServersp and check the servers selected by
 * flags and cellp.
 *
 * flags - CM_FLAG_CHECKDOWNSERVERS selects servers that have
 *         CM_SERVERFLAG_DOWN set, CM_FLAG_CHECKUPSERVERS selects servers
 *         that do not.
 * cellp - only servers whose cellp field equals this pointer are selected;
 *         NULL selects every cell.
 *
 * A reference is taken on each server with cm_GetServerNoLock() before
 * cm_serverLock is released for the per-server work, and dropped with
 * cm_PutServerNoLock() once the lock has been obtained again.
 * cm_GCConnections() is also called on the server.
 *
 * NOTE(review): the statement executed for a selected server (original
 * line 160) and the ping call itself are not visible in this listing.
 */
132 void cm_CheckServers(long flags, cm_cell_t *cellp)
134 /* ping all file servers, up or down, with unauthenticated connection,
135 * to find out whether we have all our callbacks from the server still.
136 * Also, ping down VLDBs.
142 lock_ObtainWrite(&cm_serverLock);
143 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
144 cm_GetServerNoLock(tsp);
145 lock_ReleaseWrite(&cm_serverLock);
147 /* now process the server */
148 lock_ObtainMutex(&tsp->mx);
/* sample the down flag while the server mutex is held */
151 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
153 /* only do the ping if the cell matches the requested cell, or we're
154 * matching all cells (cellp == NULL), and if we've requested to ping
155 * this type of {up, down} servers.
157 if ((cellp == NULL || cellp == tsp->cellp) &&
158 ((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
159 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS)))) {
161 } /* we're supposed to check this up/down server */
162 lock_ReleaseMutex(&tsp->mx);
164 /* at this point, we've adjusted the server state, so do the ping and
170 /* also, run the GC function for connections on all of the
171 * server's connections.
173 cm_GCConnections(tsp);
175 lock_ObtainWrite(&cm_serverLock);
176 cm_PutServerNoLock(tsp);
178 lock_ReleaseWrite(&cm_serverLock);
/*
 * cm_InitServer: set up module state; the visible work is initializing
 * cm_serverLock.
 *
 * The body is guarded by osi_Once() on a function-local static, presumably
 * so that repeated calls perform the initialization only once - confirm
 * against the osi_Once contract.
 */
181 void cm_InitServer(void)
183 static osi_once_t once;
185 if (osi_Once(&once)) {
186 lock_InitializeRWLock(&cm_serverLock, "cm_serverLock");
/*
 * cm_GetServer: operate on serverp while holding cm_serverLock for write.
 *
 * NOTE(review): the statement between the lock and unlock (original line
 * 194) is not visible in this listing.  Given the pairing with
 * cm_PutServer(), which decrements refCount, it presumably takes a
 * reference on serverp - confirm.
 */
191 void cm_GetServer(cm_server_t *serverp)
193 lock_ObtainWrite(&cm_serverLock);
195 lock_ReleaseWrite(&cm_serverLock);
/*
 * cm_GetServerNoLock: variant of cm_GetServer() that does no locking of
 * its own.  cm_CheckServers() and cm_FindServer() call it while they hold
 * cm_serverLock for write.
 *
 * NOTE(review): the body is not visible in this listing; presumably it
 * increments serverp->refCount - confirm.
 */
198 void cm_GetServerNoLock(cm_server_t *serverp)
/*
 * cm_PutServer: drop one reference on serverp while holding cm_serverLock
 * for write.  The assertion checks that refCount was positive before the
 * decrement.
 *
 * NOTE(review): the decrement is a side effect inside the osi_assert()
 * argument.  If osi_assert can ever be compiled out, the reference would
 * no longer be dropped - confirm that osi_assert always evaluates its
 * argument.
 */
203 void cm_PutServer(cm_server_t *serverp)
205 lock_ObtainWrite(&cm_serverLock);
206 osi_assert(serverp->refCount-- > 0);
207 lock_ReleaseWrite(&cm_serverLock);
/*
 * cm_PutServerNoLock: drop one reference on serverp without taking
 * cm_serverLock; callers in this file hold the lock for write around the
 * call.  The assertion checks that refCount was positive before the
 * decrement.
 *
 * NOTE(review): the decrement lives inside the osi_assert() argument -
 * confirm that osi_assert always evaluates its argument.
 */
210 void cm_PutServerNoLock(cm_server_t *serverp)
212 osi_assert(serverp->refCount-- > 0);
/*
 * cm_SetServerPrefs: compute serverp->ipRank from how close the server
 * address is to the client interfaces reported by syscfg_GetIFInfo().
 *
 * serverp - server whose ipRank is written; its address is read from
 *           serverp->addr.
 *
 * The rank starts at CM_IPRANK_LOW and is lowered with min() for each
 * interface that matches: CM_IPRANK_TOP when the addresses are equal,
 * CM_IPRANK_HI when they share the interface subnet mask, CM_IPRANK_MED
 * when they share only the classful network.  A random amount is then
 * added to the rank.
 *
 * NOTE(review): the value returned by syscfg_GetIFInfo() is stored in code
 * but no check of it is visible in this listing.
 */
215 void cm_SetServerPrefs(cm_server_t * serverp)
217 unsigned long serverAddr; /* in host byte order */
218 unsigned long myAddr, myNet, mySubnet;/* in host byte order */
219 unsigned long netMask;
222 int cm_noIPAddr; /* number of client network interfaces */
223 int cm_IPAddr[CM_MAXINTERFACE_ADDR]; /* client's IP address in host order */
224 int cm_SubnetMask[CM_MAXINTERFACE_ADDR];/* client's subnet mask in host order*/
225 int cm_NetMtu[CM_MAXINTERFACE_ADDR]; /* client's MTU sizes */
226 int cm_NetFlags[CM_MAXINTERFACE_ADDR]; /* network flags */
229 /* get network related info */
/* cm_noIPAddr goes in as the array capacity and is passed by address;
 * presumably it comes back as the number of interfaces found - confirm */
230 cm_noIPAddr = CM_MAXINTERFACE_ADDR;
231 code = syscfg_GetIFInfo(&cm_noIPAddr,
232 cm_IPAddr, cm_SubnetMask,
233 cm_NetMtu, cm_NetFlags);
235 serverAddr = ntohl(serverp->addr.sin_addr.s_addr);
236 serverp->ipRank = CM_IPRANK_LOW; /* default settings */
238 for ( i=0; i < cm_noIPAddr; i++)
240 /* loop through all the client's IP address and compare
241 ** each of them against the server's IP address */
243 myAddr = cm_IPAddr[i];
/* pick the classful (A, B or C) network mask for this interface address */
244 if ( IN_CLASSA(myAddr) )
245 netMask = IN_CLASSA_NET;
246 else if ( IN_CLASSB(myAddr) )
247 netMask = IN_CLASSB_NET;
248 else if ( IN_CLASSC(myAddr) )
249 netMask = IN_CLASSC_NET;
253 myNet = myAddr & netMask;
254 mySubnet = myAddr & cm_SubnetMask[i];
/* narrowing tests: same network, then same subnet, then same address */
256 if ( (serverAddr & netMask) == myNet )
258 if ( (serverAddr & cm_SubnetMask[i]) == mySubnet)
260 if ( serverAddr == myAddr )
261 serverp->ipRank = min(serverp->ipRank,
262 CM_IPRANK_TOP);/* same machine */
263 else serverp->ipRank = min(serverp->ipRank,
264 CM_IPRANK_HI); /* same subnet */
266 else serverp->ipRank = min(serverp->ipRank,CM_IPRANK_MED);
269 /* random value in 0..14 (rand() % 0x000f), capped at the current ipRank */
270 serverp->ipRank += min(serverp->ipRank, rand() % 0x000f);
271 } /* end of for loop */
/*
 * cm_NewServer: allocate a cm_server_t for the given address and add it to
 * the global server list.
 *
 * socketp - address of the server; must be AF_INET (asserted).  The
 *           structure is copied into the new entry.
 * type    - server type.  NOTE(review): no use of type is visible in this
 *           listing.
 * cellp   - owning cell.  NOTE(review): no use of cellp is visible in this
 *           listing.
 *
 * The entry is zero-filled, flagged CM_SERVERFLAG_DOWN, ranked with
 * cm_SetServerPrefs(), pushed on the head of cm_allServersp under
 * cm_serverLock and then probed with cm_PingServer().
 *
 * NOTE(review): the malloc() result is passed to memset() on the next
 * original line with no NULL check in between.
 */
274 cm_server_t *cm_NewServer(struct sockaddr_in *socketp, int type, cm_cell_t *cellp) {
277 osi_assert(socketp->sin_family == AF_INET);
279 tsp = malloc(sizeof(*tsp));
280 memset(tsp, 0, sizeof(*tsp));
284 lock_InitializeMutex(&tsp->mx, "cm_server_t mutex");
285 tsp->addr = *socketp;
286 tsp->flags = CM_SERVERFLAG_DOWN; /* assume down; ping will mark up if available */
288 cm_SetServerPrefs(tsp);
290 lock_ObtainWrite(&cm_serverLock); /* get server lock */
/* push the new entry on the head of the global list */
291 tsp->allNextp = cm_allServersp;
292 cm_allServersp = tsp;
293 lock_ReleaseWrite(&cm_serverLock); /* release server lock */
295 cm_PingServer(tsp); /* Obtain Capabilities and check up/down state */
/*
 * cm_FindServer: search cm_allServersp for an entry with the given type
 * and IPv4 address.
 *
 * addrp - address to look for; must be AF_INET (asserted).  Only
 *         sin_addr.s_addr is compared in the visible test.
 * type  - server type that must match tsp->type.
 *
 * The walk runs under cm_serverLock held for write, and a reference is
 * taken with cm_GetServerNoLock() on the entry that was found.
 *
 * NOTE(review): the return statement is not visible in this listing.
 */
299 /* find a server based on its properties */
300 cm_server_t *cm_FindServer(struct sockaddr_in *addrp, int type)
304 osi_assert(addrp->sin_family == AF_INET);
306 lock_ObtainWrite(&cm_serverLock);
307 for (tsp = cm_allServersp; tsp; tsp=tsp->allNextp) {
308 if (tsp->type == type &&
309 tsp->addr.sin_addr.s_addr == addrp->sin_addr.s_addr)
313 /* bump ref count if we found the server */
315 cm_GetServerNoLock(tsp);
317 /* drop big table lock */
318 lock_ReleaseWrite(&cm_serverLock);
320 /* return what we found */
/*
 * cm_NewServerRef: allocate a cm_serverRef_t that points at serverp.
 *
 * serverp - server to reference; cm_GetServer() is called on it first.
 *
 * The new entry starts with status not_busy.
 *
 * NOTE(review): the malloc() result is dereferenced on the next original
 * line with no NULL check in between.  The remaining field setup and the
 * return statement are not visible in this listing.
 */
324 cm_serverRef_t *cm_NewServerRef(cm_server_t *serverp)
326 cm_serverRef_t *tsrp;
328 cm_GetServer(serverp);
329 tsrp = malloc(sizeof(*tsrp));
330 tsrp->server = serverp;
331 tsrp->status = not_busy;
/*
 * cm_ChecksumServerList: fold a server reference list into one LONG_PTR
 * by XOR-ing the cm_server_t pointer values of its entries.
 *
 * serversp - head of the list, walked through the next field while
 *            cm_serverLock is held for write.
 *
 * NOTE(review): original lines between the loop header and the XOR are not
 * visible here, so some entries may be skipped; the initial value of sum
 * and the return statement are not visible either.
 */
338 LONG_PTR cm_ChecksumServerList(cm_serverRef_t *serversp)
342 cm_serverRef_t *tsrp;
344 lock_ObtainWrite(&cm_serverLock);
345 for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
/* XOR makes the result independent of the order of the entries */
350 sum ^= (LONG_PTR) tsrp->server;
353 lock_ReleaseWrite(&cm_serverLock);
358 ** Insert a server into the server list keeping the list sorted in
359 ** ascending order of ipRank.
361 ** The refCount of the cm_serverRef_t is increased
/*
 * cm_InsertServerList: link element into *list at the position given by
 * element->server->ipRank, and increment element->refCount.
 *
 * list    - address of the list head pointer.
 * element - entry to insert; its next field is overwritten.
 *
 * An entry goes in front of the first existing entry whose server ipRank
 * is strictly greater than its own.
 *
 * NOTE(review): *list and the rank are read into locals before
 * cm_serverLock is obtained.
 */
363 void cm_InsertServerList(cm_serverRef_t** list, cm_serverRef_t* element)
365 cm_serverRef_t *current=*list;
366 unsigned short ipRank = element->server->ipRank;
368 lock_ObtainWrite(&cm_serverLock);
369 element->refCount++; /* increase refCount */
371 /* insertion into empty list or at the beginning of the list */
372 if ( !current || (current->server->ipRank > ipRank) )
374 element->next = *list;
376 lock_ReleaseWrite(&cm_serverLock);
380 while ( current->next ) /* find appropriate place to insert */
382 if ( current->next->server->ipRank > ipRank )
384 else current = current->next;
/* splice element in directly after current */
386 element->next = current->next;
387 current->next = element;
388 lock_ReleaseWrite(&cm_serverLock);
391 ** Re-sort the server list with the modified rank
392 ** returns 0 if element was changed successfully.
393 ** returns 1 if list remained unchanged.
/*
 * cm_ChangeRankServer: move the entry for server to the position in *list
 * that matches its current ipRank.
 *
 * list   - address of the list head pointer.
 * server - server whose entry should be repositioned.
 *
 * Returns 1 when the list has fewer than two entries or the server is not
 * on it.  The entry is unlinked under cm_serverLock and put back with
 * cm_InsertServerList(); the lock is then taken again to undo the refCount
 * increment made by that call.
 *
 * NOTE(review): the length check on *list runs before cm_serverLock is
 * obtained.  The loop header, the refCount adjustment and the final return
 * are not visible in this listing.
 */
395 long cm_ChangeRankServer(cm_serverRef_t** list, cm_server_t* server)
397 cm_serverRef_t **current=list;
398 cm_serverRef_t *element=0;
400 /* if there is max of one element in the list, nothing to sort */
401 if ( (!*current) || !((*current)->next) )
402 return 1; /* list unchanged: nothing to re-sort */
404 lock_ObtainWrite(&cm_serverLock);
405 /* if the server is on the list, delete it from list */
408 if ( (*current)->server == server)
410 element = (*current);
411 *current = (*current)->next; /* delete it */
/* current is the address of the link being examined, so the unlink above
 * needs no special case for the list head */
414 current = & ( (*current)->next);
416 lock_ReleaseWrite(&cm_serverLock);
418 /* if this volume is not replicated on this server */
420 return 1; /* server is not on list */
422 /* re-insert deleted element into the list with modified rank*/
423 cm_InsertServerList(list, element);
425 /* reduce refCount which was increased by cm_InsertServerList */
426 lock_ObtainWrite(&cm_serverLock);
428 lock_ReleaseWrite(&cm_serverLock);
432 ** If there is more than one server on the list and the first n servers on
433 ** the list have the same rank (n > 1), then randomise among the first n servers.
/*
 * cm_RandomizeServer: pick one of the leading entries of *list that share
 * the rank of the first entry, and move it to the front.
 *
 * list - address of the list head pointer.
 *
 * The leading run is counted from the ipRank of the first entry, an index
 * is drawn with rand() % count, and the chosen entry is unlinked and
 * re-linked ahead of the old head.  Lists with fewer than two entries are
 * rejected before cm_serverLock is obtained.
 *
 * NOTE(review): several statements (the counting body, the early returns,
 * the walk body and the final head update) are not visible in this listing.
 */
435 void cm_RandomizeServer(cm_serverRef_t** list)
438 cm_serverRef_t* tsrp = *list, *lastTsrp;
439 unsigned short lowestRank;
441 /* an empty list or a list with only one element */
442 if ( !tsrp || ! tsrp->next )
445 lock_ObtainWrite(&cm_serverLock);
447 /* count the number of servers with the lowest rank */
448 lowestRank = tsrp->server->ipRank;
449 for ( count=1, tsrp=tsrp->next; tsrp; tsrp=tsrp->next)
451 if ( tsrp->server->ipRank != lowestRank)
457 /* if there is only one server with the lowest rank, we are done */
459 lock_ReleaseWrite(&cm_serverLock);
/* index of the entry to promote, in the range 0..count-1 */
463 picked = rand() % count;
465 lock_ReleaseWrite(&cm_serverLock);
/* step picked entries into the list */
470 while (--picked >= 0)
475 lastTsrp->next = tsrp->next; /* delete random element from list*/
476 tsrp->next = *list; /* insert element at the beginning of list */
478 lock_ReleaseWrite(&cm_serverLock);
/*
 * cm_FreeServer: drop one reference on serverp and, when refCount reaches
 * zero, tear the server down.
 *
 * serverp - server being released.  The caller must hold cm_serverLock for
 *           write; the reference is dropped with cm_PutServerNoLock().
 *
 * At refCount zero cm_GCConnections() is called on the server.  Only
 * servers without CM_SERVERFLAG_PREF_SET then have their mutex finalized
 * and are unlinked from cm_allServersp.
 *
 * NOTE(review): the unlink loop dereferences tsp->allNextp in its
 * condition, so it assumes cm_allServersp is non-NULL at that point.  The
 * statement that frees serverp is not visible in this listing.
 */
481 /* call cm_FreeServer while holding a write lock on cm_serverLock */
482 void cm_FreeServer(cm_server_t* serverp)
484 cm_PutServerNoLock(serverp);
485 if (serverp->refCount == 0)
487 /* we need to check to ensure that all of the connections
488 * for this server have a 0 refCount; otherwise, they will
489 * not be garbage collected
491 cm_GCConnections(serverp); /* connsp */
493 if (!(serverp->flags & CM_SERVERFLAG_PREF_SET)) {
494 lock_FinalizeMutex(&serverp->mx);
/* unlink from the global list: head case first, then a predecessor search */
495 if ( cm_allServersp == serverp )
496 cm_allServersp = serverp->allNextp;
500 for(tsp = cm_allServersp; tsp->allNextp; tsp=tsp->allNextp) {
501 if ( tsp->allNextp == serverp ) {
502 tsp->allNextp = serverp->allNextp;
/*
 * cm_FreeServerList: walk *list under cm_serverLock held for write and
 * drop one reference from each entry.
 *
 * list - address of the list head pointer.
 *
 * When the refCount of an entry reaches zero, cm_FreeServer() is called on
 * the server it points at.
 *
 * NOTE(review): the loop header, the unlinking and freeing of the entry
 * itself, and the end of the function are not visible in this listing.
 */
512 void cm_FreeServerList(cm_serverRef_t** list)
514 cm_serverRef_t **current = list;
515 cm_serverRef_t **nextp = 0;
516 cm_serverRef_t * next = 0;
518 lock_ObtainWrite(&cm_serverLock);
/* remember the address of the next link before the entry may be released */
522 nextp = &(*current)->next;
523 if (--((*current)->refCount) == 0) {
525 cm_FreeServer((*current)->server);
533 lock_ReleaseWrite(&cm_serverLock);