2 * Copyright 2000, International Business Machines Corporation and others.
5 * This software has been released under the terms of the IBM Public
6 * License. For details, see the LICENSE file in the top-level source
7 * directory or online at http://www.openafs.org/dl/license10.html
10 #include <afs/param.h>
21 #include <WINNT\syscfg.h>
22 #include <WINNT/afsreg.h>
/* Reader/writer lock held while the cm_allServersp list is walked or modified. */
26 osi_rwlock_t cm_serverLock;
/* Reader/writer lock protecting the cached client network-interface data. */
27 osi_rwlock_t cm_syscfgLock;
/* Head of the list of every known server; entries are chained by allNextp. */
29 cm_server_t *cm_allServersp;
/*
 * Server counters.  cm_CheckServersMulti() sizes its work arrays from the
 * larger of the two and cm_FreeServer() decrements them.
 */
30 afs_uint32 cm_numFileServers = 0;
31 afs_uint32 cm_numVldbServers = 0;
/*
 * Call cm_ForceNewConnections() on every server in the global list.
 *
 * The list is walked under a read lock on cm_serverLock.  Each server is
 * pinned with a reference so the lock can be dropped around the per-server
 * call; the lock is taken again before the reference is released and the
 * walk moves on to allNextp.
 */
34 cm_ForceNewConnectionsAllServers(void)
38 lock_ObtainRead(&cm_serverLock);
39 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
40 cm_GetServerNoLock(tsp);
41 lock_ReleaseRead(&cm_serverLock);
/* cm_serverLock is not held across this call */
42 cm_ForceNewConnections(tsp);
43 lock_ObtainRead(&cm_serverLock);
44 cm_PutServerNoLock(tsp);
46 lock_ReleaseRead(&cm_serverLock);
/*
 * Probe a single server and record whether it is up or down.
 *
 * tsp - the server to probe.
 *
 * CM_SERVERFLAG_PINGING is set under tsp->mx while a probe is running; a
 * caller that finds the flag already set sleeps on tsp until it is woken.
 * VLDB servers are probed with VL_ProbeServer().  Other servers are probed
 * with RXAFS_GetCapabilities(), and RXAFS_GetTime() is tried when that
 * call returns RXGEN_OPCODE.
 *
 * The outcome updates CM_SERVERFLAG_DOWN, downTime and capabilities on the
 * server, and cm_UpdateVolumeStatus() is called for the non-zero volume
 * ids recorded in tsp->vols.  tsp->mx is released around calls that go
 * back into other subsystems (cm_FindVolumeByID, cm_ForceNewConnections).
 *
 * NOTE(review): several guarding statements (for example the test that
 * selects the up path versus the down path) are not visible in this
 * excerpt; the description above covers only the visible lines.
 */
50 cm_PingServer(cm_server_t *tsp)
55 struct rx_connection * rxconnp;
58 Capabilities caps = {0, 0};
62 lock_ObtainMutex(&tsp->mx);
/* a probe of this server is already in progress: sleep on tsp */
63 if (tsp->flags & CM_SERVERFLAG_PINGING) {
65 osi_SleepM((LONG_PTR)tsp, &tsp->mx);
/* the mutex is obtained again once the sleep ends */
66 lock_ObtainMutex(&tsp->mx);
68 if (tsp->waitCount == 0)
69 tsp->flags &= ~CM_SERVERFLAG_PINGING;
71 osi_Wakeup((LONG_PTR)tsp);
72 lock_ReleaseMutex(&tsp->mx);
/* claim the probe and snapshot the state needed later while tsp->mx is held */
75 tsp->flags |= CM_SERVERFLAG_PINGING;
76 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
77 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
78 lock_ReleaseMutex(&tsp->mx);
/* the connection is obtained on behalf of cm_rootUserp */
80 code = cm_ConnByServer(tsp, cm_rootUserp, &connp);
82 /* now call the appropriate ping call. Drop the timeout if
83 * the server is known to be down, so that we don't waste a
84 * lot of time retiming out down servers.
87 osi_Log4(afsd_logp, "cm_PingServer server %s (%s) was %s with caps 0x%x",
88 osi_LogSaveString(afsd_logp, hoststr),
89 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
90 wasDown ? "down" : "up",
93 rxconnp = cm_GetRxConn(connp);
95 rx_SetConnDeadTime(rxconnp, 10);
96 if (tsp->type == CM_SERVER_VLDB) {
97 code = VL_ProbeServer(rxconnp);
101 code = RXAFS_GetCapabilities(rxconnp, &caps);
102 if (code == RXGEN_OPCODE)
103 code = RXAFS_GetTime(rxconnp, &secs, &usecs);
106 rx_SetConnDeadTime(rxconnp, ConnDeadtimeout);
107 rx_PutConnection(rxconnp);
109 } /* got an unauthenticated connection to this server */
111 lock_ObtainMutex(&tsp->mx);
113 /* mark server as up */
114 tsp->flags &= ~CM_SERVERFLAG_DOWN;
117 /* we currently handle 32-bits of capabilities */
/* only the first capability word is kept; the returned array is then freed */
118 if (caps.Capabilities_len > 0) {
119 tsp->capabilities = caps.Capabilities_val[0];
120 xdr_free(caps.Capabilities_val, caps.Capabilities_len);
121 caps.Capabilities_len = 0;
122 caps.Capabilities_val = 0;
124 tsp->capabilities = 0;
127 osi_Log3(afsd_logp, "cm_PingServer server %s (%s) is up with caps 0x%x",
128 osi_LogSaveString(afsd_logp, hoststr),
129 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
132 /* Now update the volume status if necessary */
134 cm_server_vols_t * tsrvp;
/* visit every non-zero volume id on each page of the server's volume list */
138 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
139 for (i=0; i<NUM_SERVER_VOLS; i++) {
140 if (tsrvp->ids[i] != 0) {
/* tsp->mx is dropped for the duration of the volume lookup */
143 lock_ReleaseMutex(&tsp->mx);
144 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
145 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
146 lock_ObtainMutex(&tsp->mx);
148 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
156 /* mark server as down */
/* downTime is stamped only on the transition from up to down */
157 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
158 tsp->flags |= CM_SERVERFLAG_DOWN;
159 tsp->downTime = time(NULL);
/* for any failure other than VRESTARTING, force new connections with tsp->mx released */
161 if (code != VRESTARTING) {
162 lock_ReleaseMutex(&tsp->mx);
163 cm_ForceNewConnections(tsp);
164 lock_ObtainMutex(&tsp->mx);
166 osi_Log3(afsd_logp, "cm_PingServer server %s (%s) is down with caps 0x%x",
167 osi_LogSaveString(afsd_logp, hoststr),
168 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
171 /* Now update the volume status if necessary */
173 cm_server_vols_t * tsrvp;
177 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
178 for (i=0; i<NUM_SERVER_VOLS; i++) {
179 if (tsrvp->ids[i] != 0) {
182 lock_ReleaseMutex(&tsp->mx);
183 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
184 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
185 lock_ObtainMutex(&tsp->mx);
187 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
/* end of probe: PINGING is cleared when waitCount is zero; sleepers on tsp are woken */
196 if (tsp->waitCount == 0)
197 tsp->flags &= ~CM_SERVERFLAG_PINGING;
199 osi_Wakeup((LONG_PTR)tsp);
200 lock_ReleaseMutex(&tsp->mx);
/*
 * Check servers one at a time.
 *
 * flags - CM_FLAG_CHECKDOWNSERVERS / CM_FLAG_CHECKUPSERVERS select servers
 *         by their current CM_SERVERFLAG_DOWN state.
 *         CM_FLAG_CHECKVLDBSERVERS / CM_FLAG_CHECKFILESERVERS, when set,
 *         require the server to be of that type.
 * cellp - when non-NULL only servers belonging to this cell match;
 *         NULL matches every cell.
 *
 * Every server on cm_allServersp is referenced so that cm_serverLock can
 * be released while the server is examined under tsp->mx.
 * cm_GCConnections() is run on the server before the reference is dropped
 * under the re-acquired read lock.
 *
 * NOTE(review): as the selection test is written, setting both type flags
 * requires a server to be both VLDB and FILE at once - confirm that callers
 * never pass both.
 * NOTE(review): the statements that act on a matching server are not
 * visible in this excerpt.
 */
203 static void cm_CheckServersSingular(afs_uint32 flags, cm_cell_t *cellp)
205 /* ping all file servers, up or down, with unauthenticated connection,
206 * to find out whether we have all our callbacks from the server still.
207 * Also, ping down VLDBs.
215 lock_ObtainRead(&cm_serverLock);
216 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
217 cm_GetServerNoLock(tsp);
218 lock_ReleaseRead(&cm_serverLock);
220 /* now process the server */
221 lock_ObtainMutex(&tsp->mx);
/* snapshot state and type while the server mutex is held */
224 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
225 isFS = tsp->type == CM_SERVER_FILE;
226 isVLDB = tsp->type == CM_SERVER_VLDB;
228 /* only do the ping if the cell matches the requested cell, or we're
229 * matching all cells (cellp == NULL), and if we've requested to ping
230 * this type of {up, down} servers.
232 if ((cellp == NULL || cellp == tsp->cellp) &&
233 ((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
234 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS))) &&
235 ((!(flags & CM_FLAG_CHECKVLDBSERVERS) ||
236 isVLDB && (flags & CM_FLAG_CHECKVLDBSERVERS)) &&
237 (!(flags & CM_FLAG_CHECKFILESERVERS) ||
238 isFS && (flags & CM_FLAG_CHECKFILESERVERS)))) {
240 } /* we're supposed to check this up/down server */
241 lock_ReleaseMutex(&tsp->mx);
243 /* at this point, we've adjusted the server state, so do the ping and
249 /* also, run the GC function for connections on all of the
250 * server's connections.
252 cm_GCConnections(tsp);
254 lock_ObtainRead(&cm_serverLock);
255 cm_PutServerNoLock(tsp);
257 lock_ReleaseRead(&cm_serverLock);
// Probe many servers at once using Rx multi calls.
//
// flags - CM_FLAG_CHECKUPSERVERS / CM_FLAG_CHECKDOWNSERVERS select servers
//         by their current CM_SERVERFLAG_DOWN state.  The file-server pass
//         runs when CM_FLAG_CHECKFILESERVERS is set, the VLDB pass when
//         CM_FLAG_CHECKVLDBSERVERS is set, and both run when neither type
//         flag is set.
// cellp - when non-NULL only servers of this cell are probed.  Servers
//         whose cellp is NULL are always skipped.
//
// Each pass collects up to maxconns matching servers that are not already
// marked CM_SERVERFLAG_PINGING, marks them PINGING, issues one multi call
// and then processes the per-server results.  File servers that answer
// RXGEN_OPCODE to GetCapabilities are retried with GetTime.
//
// NOTE(review): the inner volume loops use the index name i while the
// enclosing result loops also iterate on i.  The declaration of the inner
// index is not visible in this excerpt - confirm it is a separate variable.
// NOTE(review): the "code != VRESTARTING" tests read code, which the
// visible lines assign from cm_ConnByServer() and cm_FindVolumeByID().
// The probe outcome is stored in results[i] - confirm which was intended.
// NOTE(review): none of the malloc() results below is tested in the
// visible lines, and no matching free() is visible in this excerpt.
260 static void cm_CheckServersMulti(afs_uint32 flags, cm_cell_t *cellp)
263 * The goal of this function is to probe simultaneously
264 * probe all of the up/down servers (vldb/file) as
265 * specified by flags in the minimum number of RPCs.
266 * Effectively that means use one multi_RXAFS_GetCapabilities()
267 * followed by possibly one multi_RXAFS_GetTime() and
268 * one multi_VL_ProbeServer().
270 * To make this work we must construct the list of vldb
271 * and file servers that are to be probed as well as the
272 * associated data structures.
275 int srvAddrCount = 0;
276 struct srvAddr **addrs = NULL;
277 cm_conn_t **conns = NULL;
278 struct rx_connection **rxconns = NULL;
280 afs_int32 i, j, nconns = 0, maxconns;
281 afs_int32 *conntimer, *results;
282 Capabilities *caps = NULL;
283 cm_server_t ** serversp, *tsp;
284 afs_uint32 isDown, wasDown;
286 time_t start, end, *deltas;
// one slot per server of the more numerous type; the arrays are reused by both passes
292 maxconns = max(cm_numFileServers,cm_numVldbServers);
296 conns = (cm_conn_t **)malloc(maxconns * sizeof(cm_conn_t *));
297 rxconns = (struct rx_connection **)malloc(maxconns * sizeof(struct rx_connection *));
298 conntimer = (afs_int32 *)malloc(maxconns * sizeof (afs_int32));
299 deltas = (time_t *)malloc(maxconns * sizeof (time_t));
300 results = (afs_int32 *)malloc(maxconns * sizeof (afs_int32));
301 serversp = (cm_server_t **)malloc(maxconns * sizeof(cm_server_t *));
302 caps = (Capabilities *)malloc(maxconns * sizeof(Capabilities));
304 memset(caps, 0, maxconns * sizeof(Capabilities));
// ---- file server pass ----
306 if ((flags & CM_FLAG_CHECKFILESERVERS) ||
307 !(flags & (CM_FLAG_CHECKFILESERVERS|CM_FLAG_CHECKVLDBSERVERS)))
309 lock_ObtainRead(&cm_serverLock);
310 for (nconns=0, tsp = cm_allServersp; tsp && nconns < maxconns; tsp = tsp->allNextp) {
311 if (tsp->type != CM_SERVER_FILE ||
312 tsp->cellp == NULL || /* SetPref only */
313 cellp && cellp != tsp->cellp)
/* pin the server so cm_serverLock can be dropped while it is examined */
316 cm_GetServerNoLock(tsp);
317 lock_ReleaseRead(&cm_serverLock);
319 lock_ObtainMutex(&tsp->mx);
320 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
/* skip servers already being probed or not in the requested up/down state */
322 if ((tsp->flags & CM_SERVERFLAG_PINGING) ||
323 !((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
324 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS)))) {
325 lock_ReleaseMutex(&tsp->mx);
326 lock_ObtainRead(&cm_serverLock);
327 cm_PutServerNoLock(tsp);
331 tsp->flags |= CM_SERVERFLAG_PINGING;
332 lock_ReleaseMutex(&tsp->mx);
334 serversp[nconns] = tsp;
335 code = cm_ConnByServer(tsp, cm_rootUserp, &conns[nconns]);
337 lock_ObtainRead(&cm_serverLock);
338 cm_PutServerNoLock(tsp);
341 lock_ObtainRead(&cm_serverLock);
342 rxconns[nconns] = cm_GetRxConn(conns[nconns]);
/* the assignment inside the test records in conntimer[] whether the server was down */
343 if (conntimer[nconns] = (isDown ? 1 : 0))
344 rx_SetConnDeadTime(rxconns[nconns], 10);
348 lock_ReleaseRead(&cm_serverLock);
351 /* Perform the multi call */
353 multi_Rx(rxconns,nconns)
355 multi_RXAFS_GetCapabilities(&caps[multi_i]);
356 results[multi_i]=multi_error;
360 /* Process results of servers that support RXAFS_GetCapabilities */
361 for (i=0; i<nconns; i++) {
362 /* Leave the servers that did not support GetCapabilities alone */
363 if (results[i] == RXGEN_OPCODE)
/* restore the normal dead time and release the connection references */
367 rx_SetConnDeadTime(rxconns[i], ConnDeadtimeout);
368 rx_PutConnection(rxconns[i]);
369 cm_PutConn(conns[i]);
372 cm_GCConnections(tsp);
374 lock_ObtainMutex(&tsp->mx);
375 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
377 if (results[i] >= 0) {
378 /* mark server as up */
379 tsp->flags &= ~CM_SERVERFLAG_DOWN;
382 /* we currently handle 32-bits of capabilities */
383 if (caps[i].Capabilities_len > 0) {
384 tsp->capabilities = caps[i].Capabilities_val[0];
385 xdr_free(caps[i].Capabilities_val, caps[i].Capabilities_len);
386 caps[i].Capabilities_len = 0;
387 caps[i].Capabilities_val = 0;
389 tsp->capabilities = 0;
392 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
393 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is up with caps 0x%x",
394 osi_LogSaveString(afsd_logp, hoststr),
395 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
398 /* Now update the volume status if necessary */
400 cm_server_vols_t * tsrvp;
404 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
405 for (i=0; i<NUM_SERVER_VOLS; i++) {
406 if (tsrvp->ids[i] != 0) {
/* tsp->mx is dropped for the duration of the volume lookup */
409 lock_ReleaseMutex(&tsp->mx);
410 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
411 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
412 lock_ObtainMutex(&tsp->mx);
414 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
422 /* mark server as down */
423 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
424 tsp->flags |= CM_SERVERFLAG_DOWN;
425 tsp->downTime = time(NULL);
427 if (code != VRESTARTING) {
428 lock_ReleaseMutex(&tsp->mx);
429 cm_ForceNewConnections(tsp);
430 lock_ObtainMutex(&tsp->mx);
432 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
433 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is down with caps 0x%x",
434 osi_LogSaveString(afsd_logp, hoststr),
435 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
438 /* Now update the volume status if necessary */
440 cm_server_vols_t * tsrvp;
444 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
445 for (i=0; i<NUM_SERVER_VOLS; i++) {
446 if (tsrvp->ids[i] != 0) {
449 lock_ReleaseMutex(&tsp->mx);
450 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
451 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
452 lock_ObtainMutex(&tsp->mx);
454 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
/* this server's probe is finished: clear PINGING when waitCount is zero, wake sleepers on tsp */
463 if (tsp->waitCount == 0)
464 tsp->flags &= ~CM_SERVERFLAG_PINGING;
466 osi_Wakeup((LONG_PTR)tsp);
468 lock_ReleaseMutex(&tsp->mx);
474 * At this point we have handled any responses that did not indicate
475 * that RXAFS_GetCapabilities is not supported.
/* move the entries that answered RXGEN_OPCODE to the front of the arrays */
477 for ( i=0, j=0; i<nconns; i++) {
478 if (results[i] == RXGEN_OPCODE) {
481 rxconns[j] = rxconns[i];
482 serversp[j] = serversp[i];
490 /* Perform the multi call */
492 multi_Rx(rxconns,nconns)
495 multi_RXAFS_GetTime(&secs, &usecs);
497 results[multi_i]=multi_error;
/* a time delta is recorded only for a successful reply when start equals end */
498 if ((start == end) && !multi_error)
499 deltas[multi_i] = end - secs;
503 /* Process Results of servers that only support RXAFS_GetTime */
504 for (i=0; i<nconns; i++) {
505 /* Leave the servers that did not support GetCapabilities alone */
507 rx_SetConnDeadTime(rxconns[i], ConnDeadtimeout);
508 rx_PutConnection(rxconns[i]);
509 cm_PutConn(conns[i]);
512 cm_GCConnections(tsp);
514 lock_ObtainMutex(&tsp->mx);
515 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
517 if (results[i] >= 0) {
518 /* mark server as up */
519 tsp->flags &= ~CM_SERVERFLAG_DOWN;
/* GetTime carries no capability data, so the recorded capabilities are reset */
521 tsp->capabilities = 0;
523 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
524 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is up with caps 0x%x",
525 osi_LogSaveString(afsd_logp, hoststr),
526 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
529 /* Now update the volume status if necessary */
531 cm_server_vols_t * tsrvp;
535 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
536 for (i=0; i<NUM_SERVER_VOLS; i++) {
537 if (tsrvp->ids[i] != 0) {
540 lock_ReleaseMutex(&tsp->mx);
541 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
542 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
543 lock_ObtainMutex(&tsp->mx);
545 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
553 /* mark server as down */
554 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
555 tsp->flags |= CM_SERVERFLAG_DOWN;
556 tsp->downTime = time(NULL);
558 if (code != VRESTARTING) {
559 lock_ReleaseMutex(&tsp->mx);
560 cm_ForceNewConnections(tsp);
561 lock_ObtainMutex(&tsp->mx);
563 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
564 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is down with caps 0x%x",
565 osi_LogSaveString(afsd_logp, hoststr),
566 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
569 /* Now update the volume status if necessary */
571 cm_server_vols_t * tsrvp;
575 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
576 for (i=0; i<NUM_SERVER_VOLS; i++) {
577 if (tsrvp->ids[i] != 0) {
580 lock_ReleaseMutex(&tsp->mx);
581 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
582 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
583 lock_ObtainMutex(&tsp->mx);
585 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
594 if (tsp->waitCount == 0)
595 tsp->flags &= ~CM_SERVERFLAG_PINGING;
597 osi_Wakeup((LONG_PTR)tsp);
599 lock_ReleaseMutex(&tsp->mx);
/* ---- VLDB server pass: same collection scheme, probed with VL_ProbeServer ---- */
605 if ((flags & CM_FLAG_CHECKVLDBSERVERS) ||
606 !(flags & (CM_FLAG_CHECKFILESERVERS|CM_FLAG_CHECKVLDBSERVERS)))
608 lock_ObtainRead(&cm_serverLock);
609 for (nconns=0, tsp = cm_allServersp; tsp && nconns < maxconns; tsp = tsp->allNextp) {
610 if (tsp->type != CM_SERVER_VLDB ||
611 tsp->cellp == NULL || /* SetPref only */
612 cellp && cellp != tsp->cellp)
615 cm_GetServerNoLock(tsp);
616 lock_ReleaseRead(&cm_serverLock);
618 lock_ObtainMutex(&tsp->mx);
619 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
621 if ((tsp->flags & CM_SERVERFLAG_PINGING) ||
622 !((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
623 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS)))) {
624 lock_ReleaseMutex(&tsp->mx);
625 lock_ObtainRead(&cm_serverLock);
626 cm_PutServerNoLock(tsp);
630 tsp->flags |= CM_SERVERFLAG_PINGING;
631 lock_ReleaseMutex(&tsp->mx);
633 serversp[nconns] = tsp;
634 code = cm_ConnByServer(tsp, cm_rootUserp, &conns[nconns]);
636 lock_ObtainRead(&cm_serverLock);
637 cm_PutServerNoLock(tsp);
640 lock_ObtainRead(&cm_serverLock);
641 rxconns[nconns] = cm_GetRxConn(conns[nconns]);
642 conntimer[nconns] = (isDown ? 1 : 0);
644 rx_SetConnDeadTime(rxconns[nconns], 10);
648 lock_ReleaseRead(&cm_serverLock);
651 /* Perform the multi call */
653 multi_Rx(rxconns,nconns)
655 multi_VL_ProbeServer();
656 results[multi_i]=multi_error;
660 /* Process results of servers that support VL_ProbeServer */
661 for (i=0; i<nconns; i++) {
663 rx_SetConnDeadTime(rxconns[i], ConnDeadtimeout);
664 rx_PutConnection(rxconns[i]);
665 cm_PutConn(conns[i]);
668 cm_GCConnections(tsp);
670 lock_ObtainMutex(&tsp->mx);
671 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
673 if (results[i] >= 0) {
674 /* mark server as up */
675 tsp->flags &= ~CM_SERVERFLAG_DOWN;
677 tsp->capabilities = 0;
679 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
680 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is up with caps 0x%x",
681 osi_LogSaveString(afsd_logp, hoststr),
682 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
685 /* mark server as down */
686 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
687 tsp->flags |= CM_SERVERFLAG_DOWN;
688 tsp->downTime = time(NULL);
690 if (code != VRESTARTING) {
691 lock_ReleaseMutex(&tsp->mx);
692 cm_ForceNewConnections(tsp);
693 lock_ObtainMutex(&tsp->mx);
695 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
696 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is down with caps 0x%x",
697 osi_LogSaveString(afsd_logp, hoststr),
698 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
702 if (tsp->waitCount == 0)
703 tsp->flags &= ~CM_SERVERFLAG_PINGING;
705 osi_Wakeup((LONG_PTR)tsp);
707 lock_ReleaseMutex(&tsp->mx);
/*
 * Entry point for server checking.
 *
 * flags, cellp - passed through unchanged to the implementation that runs.
 *
 * The "MultiCheckServers" value under the AFS client parameter registry
 * key is read into multi, and the work is handed to either
 * cm_CheckServersMulti() or cm_CheckServersSingular().
 * NOTE(review): the test that chooses between the two calls is not visible
 * in this excerpt; presumably it is driven by multi - confirm.
 */
722 void cm_CheckServers(afs_uint32 flags, cm_cell_t *cellp)
729 code = RegOpenKeyEx(HKEY_LOCAL_MACHINE, AFSREG_CLT_SVC_PARAM_SUBKEY,
730 0, KEY_QUERY_VALUE, &parmKey);
731 if (code == ERROR_SUCCESS) {
/* dummyLen tells RegQueryValueEx how large the multi buffer is */
732 dummyLen = sizeof(multi);
733 code = RegQueryValueEx(parmKey, "MultiCheckServers", NULL, NULL,
734 (BYTE *) &multi, &dummyLen);
735 RegCloseKey (parmKey);
739 cm_CheckServersMulti(flags, cellp);
741 cm_CheckServersSingular(flags, cellp);
/*
 * Initialize the two global reader/writer locks used by this module.
 * The work is guarded by osi_Once() on a function-local static.
 */
744 void cm_InitServer(void)
746 static osi_once_t once;
748 if (osi_Once(&once)) {
749 lock_InitializeRWLock(&cm_serverLock, "cm_serverLock", LOCK_HIERARCHY_SERVER_GLOBAL);
750 lock_InitializeRWLock(&cm_syscfgLock, "cm_syscfgLock", LOCK_HIERARCHY_SYSCFG_GLOBAL);
755 /* Protected by cm_syscfgLock (rw) */
/* The arrays below are filled by syscfg_GetIFInfo() in cm_SetServerPrefs(). */
756 int cm_noIPAddr; /* number of client network interfaces */
757 int cm_IPAddr[CM_MAXINTERFACE_ADDR]; /* client's IP address in host order */
758 int cm_SubnetMask[CM_MAXINTERFACE_ADDR];/* client's subnet mask in host order*/
759 int cm_NetMtu[CM_MAXINTERFACE_ADDR]; /* client's MTU sizes */
760 int cm_NetFlags[CM_MAXINTERFACE_ADDR]; /* network flags */
/*
 * Non-zero when the interface data above must be re-read.  It starts at 1
 * so the first cm_SetServerPrefs() call loads the data, and is reset to 0
 * there after the reload.
 */
761 int cm_LanAdapterChangeDetected = 1;
/*
 * Flag that the cached interface information is stale.  The flag is set
 * under a write lock on cm_syscfgLock and is consumed by
 * cm_SetServerPrefs().
 */
763 void cm_SetLanAdapterChangeDetected(void)
765 lock_ObtainWrite(&cm_syscfgLock);
766 cm_LanAdapterChangeDetected = 1;
767 lock_ReleaseWrite(&cm_syscfgLock);
/*
 * Take a reference on serverp.  The increment is done with
 * InterlockedIncrement() while a read lock on cm_serverLock is held.
 */
770 void cm_GetServer(cm_server_t *serverp)
772 lock_ObtainRead(&cm_serverLock);
773 InterlockedIncrement(&serverp->refCount);
774 lock_ReleaseRead(&cm_serverLock);
/*
 * Take a reference on serverp without touching cm_serverLock.  The callers
 * in this file invoke it while already holding that lock.
 */
777 void cm_GetServerNoLock(cm_server_t *serverp)
779 InterlockedIncrement(&serverp->refCount);
/*
 * Drop a reference on serverp under a read lock on cm_serverLock.
 * Asserts that the count did not go below zero.  The server is not freed
 * here.
 */
782 void cm_PutServer(cm_server_t *serverp)
785 lock_ObtainRead(&cm_serverLock);
786 refCount = InterlockedDecrement(&serverp->refCount);
787 osi_assertx(refCount >= 0, "cm_server_t refCount underflow");
788 lock_ReleaseRead(&cm_serverLock);
/*
 * Drop a reference on serverp without touching cm_serverLock.
 * Asserts that the count did not go below zero.
 */
791 void cm_PutServerNoLock(cm_server_t *serverp)
793 afs_int32 refCount = InterlockedDecrement(&serverp->refCount);
794 osi_assertx(refCount >= 0, "cm_server_t refCount underflow");
/*
 * Set or clear CM_SERVERFLAG_NO64BIT on serverp while holding serverp->mx.
 * NOTE(review): the test that selects between setting and clearing is not
 * visible in this excerpt; presumably it is "if (no64bit) ... else" -
 * confirm.
 */
797 void cm_SetServerNo64Bit(cm_server_t * serverp, int no64bit)
799 lock_ObtainMutex(&serverp->mx);
801 serverp->flags |= CM_SERVERFLAG_NO64BIT;
803 serverp->flags &= ~CM_SERVERFLAG_NO64BIT;
804 lock_ReleaseMutex(&serverp->mx);
/*
 * Set or clear CM_SERVERFLAG_NOINLINEBULK on serverp while holding
 * serverp->mx.
 * NOTE(review): the test that selects between setting and clearing is not
 * visible in this excerpt; presumably it is "if (no) ... else" - confirm.
 */
807 void cm_SetServerNoInlineBulk(cm_server_t * serverp, int no)
809 lock_ObtainMutex(&serverp->mx);
811 serverp->flags |= CM_SERVERFLAG_NOINLINEBULK;
813 serverp->flags &= ~CM_SERVERFLAG_NOINLINEBULK;
814 lock_ReleaseMutex(&serverp->mx);
/*
 * Compute serverp->ipRank from how close the server's address is to the
 * client's network interfaces.
 *
 * If cm_LanAdapterChangeDetected is set, the cached interface data is first
 * reloaded with syscfg_GetIFInfo().  The flag is tested again after the
 * read lock on cm_syscfgLock has been converted to a write lock.
 *
 * The rank starts at CM_IPRANK_LOW and is lowered, via min(), for every
 * interface the server matches:
 *   same address            -> CM_IPRANK_TOP
 *   same subnet             -> CM_IPRANK_HI
 *   same classful network   -> CM_IPRANK_MED
 * A small random offset is then added.
 *
 * NOTE(review): the return code of syscfg_GetIFInfo() is stored in code but
 * no use of it is visible in this excerpt.
 */
817 void cm_SetServerPrefs(cm_server_t * serverp)
819 unsigned long serverAddr; /* in host byte order */
820 unsigned long myAddr, myNet, mySubnet;/* in host byte order */
821 unsigned long netMask;
826 lock_ObtainRead(&cm_syscfgLock);
827 if (cm_LanAdapterChangeDetected) {
828 lock_ConvertRToW(&cm_syscfgLock);
/* tested again now that the write lock is held */
830 if (cm_LanAdapterChangeDetected) {
831 /* get network related info */
/* cm_noIPAddr is passed by address, preset to the capacity of the arrays */
832 cm_noIPAddr = CM_MAXINTERFACE_ADDR;
833 code = syscfg_GetIFInfo(&cm_noIPAddr,
834 cm_IPAddr, cm_SubnetMask,
835 cm_NetMtu, cm_NetFlags);
836 cm_LanAdapterChangeDetected = 0;
838 lock_ConvertWToR(&cm_syscfgLock);
841 serverAddr = ntohl(serverp->addr.sin_addr.s_addr);
842 serverp->ipRank = CM_IPRANK_LOW; /* default settings */
844 for ( i=0; i < cm_noIPAddr; i++)
846 /* loop through all the client's IP address and compare
847 ** each of them against the server's IP address */
849 myAddr = cm_IPAddr[i];
/* choose the classful network mask for this interface address */
850 if ( IN_CLASSA(myAddr) )
851 netMask = IN_CLASSA_NET;
852 else if ( IN_CLASSB(myAddr) )
853 netMask = IN_CLASSB_NET;
854 else if ( IN_CLASSC(myAddr) )
855 netMask = IN_CLASSC_NET;
859 myNet = myAddr & netMask;
860 mySubnet = myAddr & cm_SubnetMask[i];
862 if ( (serverAddr & netMask) == myNet )
864 if ( (serverAddr & cm_SubnetMask[i]) == mySubnet)
866 if ( serverAddr == myAddr )
867 serverp->ipRank = min(serverp->ipRank,
868 CM_IPRANK_TOP);/* same machine */
869 else serverp->ipRank = min(serverp->ipRank,
870 CM_IPRANK_HI); /* same subnet */
872 else serverp->ipRank = min(serverp->ipRank,CM_IPRANK_MED);
875 } /* end of for loop */
877 /* random offset in 0..14: rand() % 0x000f never yields 15 */
878 serverp->ipRank += (rand() % 0x000f);
879 lock_ReleaseRead(&cm_syscfgLock);
/*
 * Allocate a server record and link it at the head of cm_allServersp.
 *
 * socketp - address of the server; must be AF_INET (asserted).
 * type    - server type; the other functions in this file compare
 *           tsp->type against CM_SERVER_VLDB and CM_SERVER_FILE.
 * cellp   - cell the server belongs to.
 * uuidp   - optional UUID; when non-NULL and not nil,
 *           CM_SERVERFLAG_UUID is set on the new record.
 * flags   - unless CM_FLAG_NOPROBE is set the new server is marked down
 *           and probed immediately with cm_PingServer().
 *
 * The record is zero-filled, its mutex is initialized, and the rank is
 * computed with cm_SetServerPrefs() before it is inserted under a write
 * lock on cm_serverLock.
 * NOTE(review): the assignments of type, cellp and the UUID, the reference
 * count setup and the return statement are not visible in this excerpt.
 */
882 cm_server_t *cm_NewServer(struct sockaddr_in *socketp, int type, cm_cell_t *cellp, afsUUID *uuidp, afs_uint32 flags) {
885 osi_assertx(socketp->sin_family == AF_INET, "unexpected socket family");
887 tsp = malloc(sizeof(*tsp));
889 memset(tsp, 0, sizeof(*tsp));
892 if (uuidp && !afs_uuid_is_nil(uuidp)) {
894 tsp->flags |= CM_SERVERFLAG_UUID;
897 lock_InitializeMutex(&tsp->mx, "cm_server_t mutex", LOCK_HIERARCHY_SERVER);
898 tsp->addr = *socketp;
/* the rank is computed before the record becomes visible on the global list */
900 cm_SetServerPrefs(tsp);
902 lock_ObtainWrite(&cm_serverLock); /* get server lock */
903 tsp->allNextp = cm_allServersp;
904 cm_allServersp = tsp;
915 lock_ReleaseWrite(&cm_serverLock); /* release server lock */
/* the probe runs after cm_serverLock has been released */
917 if ( !(flags & CM_FLAG_NOPROBE) ) {
918 tsp->flags |= CM_SERVERFLAG_DOWN; /* assume down; ping will mark up if available */
919 cm_PingServer(tsp); /* Obtain Capabilities and check up/down state */
/*
 * Look up a server by type, IP address and port.
 *
 * ipaddr - compared directly against the stored sin_addr value.
 * port   - compared directly against the stored sin_port; a stored port
 *          of 0 matches any requested port.
 * type   - required server type.
 *
 * The list is searched under a read lock on cm_serverLock and a reference
 * is taken on the entry that is found.
 * NOTE(review): the statements that end the search and return the result
 * are not visible in this excerpt.
 */
926 cm_FindServerByIP(afs_uint32 ipaddr, unsigned short port, int type)
930 lock_ObtainRead(&cm_serverLock);
931 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
932 if (tsp->type == type &&
933 tsp->addr.sin_addr.S_un.S_addr == ipaddr &&
934 (tsp->addr.sin_port == port || tsp->addr.sin_port == 0))
938 /* bump ref count if we found the server */
940 cm_GetServerNoLock(tsp);
942 lock_ReleaseRead(&cm_serverLock);
/*
 * Look up a server by type and UUID.
 *
 * serverUuid - UUID to look for.
 * type       - required server type.
 *
 * The list is searched under a read lock on cm_serverLock and a reference
 * is taken on the entry that is found.
 *
 * NOTE(review): the UUID test below is negated.  If afs_uuid_equal()
 * returns non-zero for equal UUIDs, this selects the first server of the
 * requested type whose UUID differs from serverUuid - confirm the helper's
 * return convention and whether the "!" is intended.
 * NOTE(review): the statements that end the search and return the result
 * are not visible in this excerpt.
 */
948 cm_FindServerByUuid(afsUUID *serverUuid, int type)
952 lock_ObtainRead(&cm_serverLock);
953 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
954 if (tsp->type == type && !afs_uuid_equal(&tsp->uuid, serverUuid))
958 /* bump ref count if we found the server */
960 cm_GetServerNoLock(tsp);
962 lock_ReleaseRead(&cm_serverLock);
967 /* find a server based on its properties */
/*
 * addrp - socket address to match; must be AF_INET (asserted).  The
 *         address must be equal, and the port must be equal unless the
 *         stored port is 0, which matches any port.
 * type  - required server type.
 *
 * The list is searched under a read lock on cm_serverLock and a reference
 * is taken on the entry that is found.
 */
968 cm_server_t *cm_FindServer(struct sockaddr_in *addrp, int type)
972 osi_assertx(addrp->sin_family == AF_INET, "unexpected socket value");
974 lock_ObtainRead(&cm_serverLock);
975 for (tsp = cm_allServersp; tsp; tsp=tsp->allNextp) {
976 if (tsp->type == type &&
977 tsp->addr.sin_addr.s_addr == addrp->sin_addr.s_addr &&
978 (tsp->addr.sin_port == addrp->sin_port || tsp->addr.sin_port == 0))
982 /* bump ref count if we found the server */
984 cm_GetServerNoLock(tsp);
986 /* drop big table lock */
987 lock_ReleaseRead(&cm_serverLock);
989 /* return what we found */
/*
 * Allocate one zero-filled page of volume-id slots (cm_server_vols_t).
 * NOTE(review): the handling of a failed malloc() and the return statement
 * are not visible in this excerpt.
 */
993 cm_server_vols_t *cm_NewServerVols(void) {
994 cm_server_vols_t *tsvp;
996 tsvp = malloc(sizeof(*tsvp));
998 memset(tsvp, 0, sizeof(*tsvp));
/*
 * Create a server reference (cm_serverRef_t) for serverp.
 *
 * serverp - server to reference; a reference is taken with cm_GetServer().
 * volID   - volume id the reference is for.  The id is also recorded in
 *           the server's list of volume-id pages: if it is not already
 *           present it goes into an empty slot, or into slot 0 of a newly
 *           allocated page.
 *
 * The new reference starts with status srv_not_busy.
 *
 * NOTE(review): the result of malloc() is dereferenced on the very next
 * line without a NULL check.
 * NOTE(review): the result of cm_NewServerVols() is dereferenced in the
 * visible lines; whether a check sits between them cannot be seen here.
 */
1003 cm_serverRef_t *cm_NewServerRef(cm_server_t *serverp, afs_uint32 volID)
1005 cm_serverRef_t *tsrp;
1006 cm_server_vols_t **tsrvpp = NULL;
1007 afs_uint32 *slotp = NULL;
1010 cm_GetServer(serverp);
1011 tsrp = malloc(sizeof(*tsrp));
1012 tsrp->server = serverp;
1013 tsrp->status = srv_not_busy;
1015 tsrp->volID = volID;
1018 /* if we have a non-zero volID, we need to add it to the list
1019 * of volumes maintained by the server. There are two phases:
1020 * (1) see if the volID is already in the list and (2) insert
1021 * it into the first empty slot if it is not.
1024 lock_ObtainMutex(&serverp->mx);
1026 tsrvpp = &serverp->vols;
1030 for (i=0; i<NUM_SERVER_VOLS; i++) {
1031 if ((*tsrvpp)->ids[i] == volID) {
1034 } else if (!slotp && (*tsrvpp)->ids[i] == 0) {
1035 slotp = &(*tsrvpp)->ids[i];
1042 tsrvpp = &(*tsrvpp)->nextp;
1049 /* if we didn't find an empty slot in a current
1050 * page we must need a new page */
1051 *tsrvpp = cm_NewServerVols();
1053 (*tsrvpp)->ids[0] = volID;
1057 lock_ReleaseMutex(&serverp->mx);
/*
 * Compute a checksum over a server reference list.
 *
 * serversp - head of the list, chained through next.
 *
 * The list is walked under a read lock on cm_serverLock and the server
 * pointer of each entry is folded into sum with XOR.  Entries are tested
 * for status srv_deleted.
 * NOTE(review): the action taken for deleted entries, any other mixing
 * step and the return statement are not visible in this excerpt.
 */
1063 LONG_PTR cm_ChecksumServerList(cm_serverRef_t *serversp)
1067 cm_serverRef_t *tsrp;
1069 lock_ObtainRead(&cm_serverLock);
1070 for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
1071 if (tsrp->status == srv_deleted)
1077 sum ^= (LONG_PTR) tsrp->server;
1080 lock_ReleaseRead(&cm_serverLock);
1085 ** Insert a server into the server list keeping the list sorted in
1086 ** ascending order of ipRank.
1088 ** The refCount of the cm_serverRef_t is increased
/*
 * list    - address of the list head; updated when the element becomes the
 *           new first entry.
 * element - reference to insert; its refCount is incremented.
 *
 * The element is placed in front of the first entry whose server has a
 * strictly greater ipRank, so it follows entries of equal rank.
 * NOTE(review): *list and element->server->ipRank are read in the
 * initializers, before the write lock on cm_serverLock is obtained.
 */
1090 void cm_InsertServerList(cm_serverRef_t** list, cm_serverRef_t* element)
1092 cm_serverRef_t *current=*list;
1093 unsigned short ipRank = element->server->ipRank;
1095 lock_ObtainWrite(&cm_serverLock);
1096 element->refCount++; /* increase refCount */
1098 /* insertion into empty list or at the beginning of the list */
1099 if ( !current || (current->server->ipRank > ipRank) )
1101 element->next = *list;
1103 lock_ReleaseWrite(&cm_serverLock);
1107 while ( current->next ) /* find appropriate place to insert */
1109 if ( current->next->server->ipRank > ipRank )
1111 else current = current->next;
/* splice the element in after current */
1113 element->next = current->next;
1114 current->next = element;
1115 lock_ReleaseWrite(&cm_serverLock);
1118 ** Re-sort the server list with the modified rank
1119 ** returns 0 if element was changed successfully.
1120 ** returns 1 if list remained unchanged.
/*
 * list   - address of the head of a server reference list.
 * server - server whose rank has changed.
 *
 * The reference for server is unlinked under a write lock on
 * cm_serverLock and re-inserted with cm_InsertServerList(), which places
 * it according to the server's current ipRank.  The extra refCount added
 * by that call is then removed again.
 * Returns 1 when the list has fewer than two entries or the server is not
 * on it.
 * NOTE(review): the first test reads *list before the lock is obtained,
 * and the lock is released between the unlink and the re-insert.
 */
1122 long cm_ChangeRankServer(cm_serverRef_t** list, cm_server_t* server)
1124 cm_serverRef_t **current=list;
1125 cm_serverRef_t *element=0;
1127 /* if there is max of one element in the list, nothing to sort */
1128 if ( (!*current) || !((*current)->next) )
1129 return 1; /* list unchanged: return success */
1131 lock_ObtainWrite(&cm_serverLock);
1132 /* if the server is on the list, delete it from list */
1135 if ( (*current)->server == server)
1137 element = (*current);
1138 *current = (*current)->next; /* delete it */
1141 current = & ( (*current)->next);
1143 lock_ReleaseWrite(&cm_serverLock);
1145 /* if this volume is not replicated on this server */
1147 return 1; /* server is not on list */
1149 /* re-insert deleted element into the list with modified rank*/
1150 cm_InsertServerList(list, element);
1152 /* reduce refCount which was increased by cm_InsertServerList */
1153 lock_ObtainWrite(&cm_serverLock);
1154 element->refCount--;
1155 lock_ReleaseWrite(&cm_serverLock);
1159 ** If there are more than one server on the list and the first n servers on
1160 ** the list have the same rank( n>1), then randomise among the first n servers.
/*
 * list - address of the head of a server reference list.
 *
 * The entries at the front of the list that share the first entry's ipRank
 * are counted under a write lock on cm_serverLock.  One of them is chosen
 * with rand() % count, unlinked and moved to the front.
 * NOTE(review): the initializer and the first test read *list before the
 * lock is obtained.
 * NOTE(review): the tests guarding the two early lock releases and the
 * final update of *list are not visible in this excerpt.
 */
1162 void cm_RandomizeServer(cm_serverRef_t** list)
1165 cm_serverRef_t* tsrp = *list, *lastTsrp;
1166 unsigned short lowestRank;
1168 /* an empty list or a list with only one element */
1169 if ( !tsrp || ! tsrp->next )
1172 lock_ObtainWrite(&cm_serverLock);
1174 /* count the number of servers with the lowest rank */
1175 lowestRank = tsrp->server->ipRank;
1176 for ( count=1, tsrp=tsrp->next; tsrp; tsrp=tsrp->next)
1178 if ( tsrp->server->ipRank != lowestRank)
1184 /* if there is only one server with the lowest rank, we are done */
1186 lock_ReleaseWrite(&cm_serverLock);
/* index of the entry to promote, in 0..count-1 */
1190 picked = rand() % count;
1192 lock_ReleaseWrite(&cm_serverLock);
1197 while (--picked >= 0)
1202 lastTsrp->next = tsrp->next; /* delete random element from list*/
1203 tsrp->next = *list; /* insert element at the beginning of list */
1205 lock_ReleaseWrite(&cm_serverLock);
1208 /* call cm_FreeServer while holding a write lock on cm_serverLock */
/*
 * Drop one reference on serverp and, if the count reaches zero, tear the
 * server down.
 *
 * cm_serverLock is released around cm_GCConnections() and taken again, so
 * refCount is tested a second time before anything is removed.  Teardown
 * decrements the per-type server counter (unless CM_SERVERFLAG_PREF_SET is
 * set), finalizes the mutex, unlinks the record from cm_allServersp and
 * walks the volume-id pages.
 * NOTE(review): the statements that free the pages and the record itself
 * are not visible in this excerpt.
 */
1209 void cm_FreeServer(cm_server_t* serverp)
1211 cm_server_vols_t * tsrvp, *nextp;
1214 cm_PutServerNoLock(serverp);
1215 if (serverp->refCount == 0)
1218 * we need to check to ensure that all of the connections
1219 * for this server have a 0 refCount; otherwise, they will
1220 * not be garbage collected
1222 * must drop the cm_serverLock because cm_GCConnections
1223 * obtains the cm_connLock and that comes first in the
1226 lock_ReleaseWrite(&cm_serverLock);
1227 cm_GCConnections(serverp); /* connsp */
1228 lock_ObtainWrite(&cm_serverLock);
1233 * Once we have the cm_serverLock locked check to make
1234 * sure the refCount is still zero before removing the
1237 if (serverp->refCount == 0) {
/* servers flagged CM_SERVERFLAG_PREF_SET are left out of the counters */
1238 if (!(serverp->flags & CM_SERVERFLAG_PREF_SET)) {
1239 switch (serverp->type) {
1240 case CM_SERVER_VLDB:
1241 cm_numVldbServers--;
1243 case CM_SERVER_FILE:
1244 cm_numFileServers--;
1248 lock_FinalizeMutex(&serverp->mx);
/* unlink from the global list: either the head or an interior entry */
1249 if ( cm_allServersp == serverp )
1250 cm_allServersp = serverp->allNextp;
1254 for(tsp = cm_allServersp; tsp->allNextp; tsp=tsp->allNextp) {
1255 if ( tsp->allNextp == serverp ) {
1256 tsp->allNextp = serverp->allNextp;
1262 /* free the volid list */
/* nextp is saved first so the walk can continue past the current page */
1263 for ( tsrvp = serverp->vols; tsrvp; tsrvp = nextp) {
1264 nextp = tsrvp->nextp;
1273 /* Called with cm_serverLock write locked */
/*
 * serverp - server whose volume-id pages are searched.
 * volID   - volume id to look for.
 *
 * Every slot of every page in serverp->vols is compared against volID.
 * NOTE(review): the action taken on a match is not visible in this
 * excerpt.
 */
1274 void cm_RemoveVolumeFromServer(cm_server_t * serverp, afs_uint32 volID)
1276 cm_server_vols_t * tsrvp;
1282 for (tsrvp = serverp->vols; tsrvp; tsrvp = tsrvp->nextp) {
1283 for (i=0; i<NUM_SERVER_VOLS; i++) {
1284 if (tsrvp->ids[i] == volID) {
/*
 * Release the references held by a server reference list.
 *
 * list  - address of the list head.
 * flags - with CM_FREESERVERLIST_DELETE, entries that are still referenced
 *         are marked srv_deleted and their volume id is removed from the
 *         server.
 *
 * The whole walk runs under a write lock on cm_serverLock.  Each entry's
 * refCount is decremented; when it reaches zero the volume id is removed
 * from the server and cm_FreeServer() is called on the server.
 * NOTE(review): the loop construct, the unlinking and the freeing of the
 * list entries are not visible in this excerpt.
 */
1292 void cm_FreeServerList(cm_serverRef_t** list, afs_uint32 flags)
1294 cm_serverRef_t **current = list;
1295 cm_serverRef_t **nextp = 0;
1296 cm_serverRef_t * next = 0;
1301 lock_ObtainWrite(&cm_serverLock);
1305 nextp = &(*current)->next;
1306 if (--((*current)->refCount) == 0) {
1309 if ((*current)->volID)
1310 cm_RemoveVolumeFromServer((*current)->server, (*current)->volID);
1311 cm_FreeServer((*current)->server);
1315 if (flags & CM_FREESERVERLIST_DELETE) {
1316 (*current)->status = srv_deleted;
1317 if ((*current)->volID)
1318 cm_RemoveVolumeFromServer((*current)->server, (*current)->volID);
1324 lock_ReleaseWrite(&cm_serverLock);
1327 /* dump all servers to a file.
1328 * cookie is used to identify this batch for easy parsing,
1329 * and is a string provided by the caller
 *
 * outputFile is handed directly to WriteFile(), so it is used as a
 * Win32 file handle even though it is declared FILE *.
 * One header line, one line per server on cm_allServersp and one
 * trailer line are written, each prefixed with cookie.
 * The list is read under a read lock on cm_serverLock.
 * NOTE(review): presumably the lock calls are conditional on the lock
 * argument - the test is not visible in this excerpt.
 * NOTE(review): the value returned by ctime() is indexed without a
 * NULL check when its trailing newline is stripped.
 * NOTE(review): the trailer is formatted with sprintf(), which does
 * not bound the write into output; the declaration of output is not
 * visible in this excerpt.
1331 int cm_DumpServers(FILE *outputFile, char *cookie, int lock)
1340 lock_ObtainRead(&cm_serverLock);
1343 "%s - dumping servers - cm_numFileServers=%d, cm_numVldbServers=%d\r\n",
1344 cookie, cm_numFileServers, cm_numVldbServers);
1345 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1347 for (tsp = cm_allServersp; tsp; tsp=tsp->allNextp)
1352 switch (tsp->type) {
1353 case CM_SERVER_VLDB:
1356 case CM_SERVER_FILE:
1363 afsUUID_to_string(&tsp->uuid, uuidstr, sizeof(uuidstr));
1364 afs_inet_ntoa_r(tsp->addr.sin_addr.s_addr, hoststr);
1365 down = ctime(&tsp->downTime);
1366 down[strlen(down)-1] = '\0';
1369 "%s - tsp=0x%p cell=%s addr=%-15s port=%u uuid=%s type=%s caps=0x%x "
1370 "flags=0x%x waitCount=%u rank=%u downTime=\"%s\" refCount=%u\r\n",
1371 cookie, tsp, tsp->cellp ? tsp->cellp->name : "", hoststr,
1372 ntohs(tsp->addr.sin_port), uuidstr, type,
1373 tsp->capabilities, tsp->flags, tsp->waitCount, tsp->ipRank,
1374 (tsp->flags & CM_SERVERFLAG_DOWN) ? down : "up",
1376 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1378 sprintf(output, "%s - Done dumping servers.\r\n", cookie);
1379 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1382 lock_ReleaseRead(&cm_serverLock);
1388 * Determine if two servers are in fact the same.
1390 * Returns 1 if they match, 0 if they do not
1392 int cm_ServerEqual(cm_server_t *srv1, cm_server_t *srv2)
1396 if (srv1 == NULL || srv2 == NULL)
1402 if (srv1->flags & CM_SERVERFLAG_UUID) {
1403 if (!(srv2->flags & CM_SERVERFLAG_UUID))
1406 /* Both support UUID */
1407 if (UuidEqual((UUID *)&srv1->uuid, (UUID *)&srv2->uuid, &status))