2 * Copyright 2000, International Business Machines Corporation and others.
5 * This software has been released under the terms of the IBM Public
6 * License. For details, see the LICENSE file in the top-level source
7 * directory or online at http://www.openafs.org/dl/license10.html
10 #include <afsconfig.h>
11 #include <afs/param.h>
24 #include <WINNT\syscfg.h>
25 #include <WINNT/afsreg.h>
/* Read/write locks, both initialized in cm_InitServer.  cm_serverLock is
 * taken around walks and updates of the cm_allServersp list; cm_syscfgLock
 * is taken around the cached network-interface data. */
30 osi_rwlock_t cm_serverLock;
31 osi_rwlock_t cm_syscfgLock;
/* Head of the list of all known servers, linked through allNextp. */
33 cm_server_t *cm_allServersp;
/* Server counts by type; cm_CheckServersMulti sizes its probe arrays from
 * the larger of the two. */
34 afs_uint32 cm_numFileServers = 0;
35 afs_uint32 cm_numVldbServers = 0;
/*
 * Call cm_ForceNewConnections on every server on the cm_allServersp list.
 * A reference is held on each server while cm_serverLock is dropped around
 * the call; the reference is released once the read lock is held again.
 */
38 cm_ForceNewConnectionsAllServers(void)
42 lock_ObtainRead(&cm_serverLock);
43 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
44 cm_GetServerNoLock(tsp);
45 lock_ReleaseRead(&cm_serverLock);
46 cm_ForceNewConnections(tsp);
47 lock_ObtainRead(&cm_serverLock);
48 cm_PutServerNoLock(tsp);
50 lock_ReleaseRead(&cm_serverLock);
54 * lock_ObtainMutex must be held prior to calling
/*
 * Recompute tsp->ipRank from the round-trip time that rx_GetLocalPeers
 * reports for the server's address.
 * tsp->mx is expected to be held on entry: it is released before the
 * cm_ChangeRankVolume / cm_ChangeRankCellVLServer calls and obtained again
 * afterwards.
 */
58 cm_RankServer(cm_server_t * tsp)
60 afs_int32 code = 0; /* start with "success" */
61 struct rx_debugPeer tpeer;
76 code = rx_GetLocalPeers(tsp->addr.sin_addr.s_addr, port, &tpeer);
/* NOTE(review): the test below only covers rtt == 0 together with
 * rtt_dev == 0; confirm log(tpeer.rtt) further down can never see rtt == 0. */
78 /*check if rx_GetLocalPeers succeeded and if there is data for tsp */
79 if(code == 0 && (tpeer.rtt == 0 && tpeer.rtt_dev == 0))
83 if((tsp->flags & CM_SERVERFLAG_PREF_SET))
84 newRank = tsp->adminRank +
85 ((int)(623 * log(tpeer.rtt) / 10) * 10 + 5);
86 else /* rank has not been set by admin, derive rank from rtt */
87 newRank = (int)(7200 * log(tpeer.rtt) / 5000) * 5000 + 5000;
89 newRank += (rand() & 0x000f); /* randomize */
/* only store the new rank when it moved by more than the 0..15 random part */
91 if (abs(newRank - tsp->ipRank) > 0xf) {
92 tsp->ipRank = newRank;
94 lock_ReleaseMutex(&tsp->mx);
98 * find volumes which might have RO copy
99 * on server and change the ordering of
102 cm_ChangeRankVolume(tsp);
105 /* set preferences for an existing vlserver */
106 cm_ChangeRankCellVLServer(tsp);
109 lock_ObtainMutex(&tsp->mx);
/*
 * Probe a single server and record whether it is up or down.
 * A connection for cm_rootUserp is obtained with cm_ConnByServer; VLDB
 * servers are probed with VL_ProbeServer, other servers with
 * RXAFS_GetCapabilities, falling back to RXAFS_GetTime when the reply is
 * RXGEN_OPCODE.  The connection dead time is set to 10 for the probe and
 * restored to ConnDeadtimeout afterwards.
 * CM_SERVERFLAG_PINGING marks a probe in progress; a caller that finds it
 * already set sleeps on tsp (osi_SleepM) instead of probing.
 */
117 cm_PingServer(cm_server_t *tsp)
122 struct rx_connection * rxconnp;
125 Capabilities caps = {0, 0};
129 lock_ObtainMutex(&tsp->mx);
130 if (tsp->flags & CM_SERVERFLAG_PINGING) {
132 osi_SleepM((LONG_PTR)tsp, &tsp->mx);
133 lock_ObtainMutex(&tsp->mx);
135 if (tsp->waitCount == 0)
136 tsp->flags &= ~CM_SERVERFLAG_PINGING;
138 osi_Wakeup((LONG_PTR)tsp);
139 lock_ReleaseMutex(&tsp->mx);
/* this thread performs the probe: mark it in progress and remember the
 * previous up/down state and the printable address before dropping mx */
142 tsp->flags |= CM_SERVERFLAG_PINGING;
143 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
144 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
145 lock_ReleaseMutex(&tsp->mx);
147 code = cm_ConnByServer(tsp, cm_rootUserp, &connp);
149 /* now call the appropriate ping call. Drop the timeout if
150 * the server is known to be down, so that we don't waste a
151 * lot of time retiming out down servers.
154 osi_Log4(afsd_logp, "cm_PingServer server %s (%s) was %s with caps 0x%x",
155 osi_LogSaveString(afsd_logp, hoststr),
156 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
157 wasDown ? "down" : "up",
160 rxconnp = cm_GetRxConn(connp);
162 rx_SetConnDeadTime(rxconnp, 10);
163 if (tsp->type == CM_SERVER_VLDB) {
164 code = VL_ProbeServer(rxconnp);
168 code = RXAFS_GetCapabilities(rxconnp, &caps);
169 if (code == RXGEN_OPCODE)
170 code = RXAFS_GetTime(rxconnp, &secs, &usecs);
173 rx_SetConnDeadTime(rxconnp, ConnDeadtimeout);
174 rx_PutConnection(rxconnp);
176 } /* got an unauthenticated connection to this server */
178 lock_ObtainMutex(&tsp->mx);
180 /* mark server as up */
181 tsp->flags &= ~CM_SERVERFLAG_DOWN;
184 /* we currently handle 32-bits of capabilities */
185 if (caps.Capabilities_len > 0) {
186 tsp->capabilities = caps.Capabilities_val[0];
187 xdr_free((xdrproc_t) xdr_Capabilities, &caps);
188 caps.Capabilities_len = 0;
189 caps.Capabilities_val = 0;
191 tsp->capabilities = 0;
194 osi_Log3(afsd_logp, "cm_PingServer server %s (%s) is up with caps 0x%x",
195 osi_LogSaveString(afsd_logp, hoststr),
196 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
199 /* Now update the volume status if necessary */
201 cm_server_vols_t * tsrvp;
/* tsp->mx is dropped around each cm_FindVolumeByID call.
 * NOTE(review): the tsp->vols list is walked across that unlock; confirm
 * it cannot be modified in the meantime. */
205 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
206 for (i=0; i<NUM_SERVER_VOLS; i++) {
207 if (tsrvp->ids[i] != 0) {
210 lock_ReleaseMutex(&tsp->mx);
211 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
212 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
213 lock_ObtainMutex(&tsp->mx);
215 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
223 /* mark server as down */
224 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
225 tsp->flags |= CM_SERVERFLAG_DOWN;
226 tsp->downTime = time(NULL);
228 if (code != VRESTARTING) {
229 lock_ReleaseMutex(&tsp->mx);
230 cm_ForceNewConnections(tsp);
231 lock_ObtainMutex(&tsp->mx);
233 osi_Log3(afsd_logp, "cm_PingServer server %s (%s) is down with caps 0x%x",
234 osi_LogSaveString(afsd_logp, hoststr),
235 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
238 /* Now update the volume status if necessary */
240 cm_server_vols_t * tsrvp;
244 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
245 for (i=0; i<NUM_SERVER_VOLS; i++) {
246 if (tsrvp->ids[i] != 0) {
249 lock_ReleaseMutex(&tsp->mx);
250 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
251 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
252 lock_ObtainMutex(&tsp->mx);
254 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
/* probe finished: clear PINGING once no waiters remain, then wake sleepers */
263 if (tsp->waitCount == 0)
264 tsp->flags &= ~CM_SERVERFLAG_PINGING;
266 osi_Wakeup((LONG_PTR)tsp);
267 lock_ReleaseMutex(&tsp->mx);
275 lock_ObtainRead(&cm_serverLock);
276 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
277 cm_GetServerNoLock(tsp);
278 lock_ReleaseRead(&cm_serverLock);
280 lock_ObtainMutex(&tsp->mx);
282 /* if the server is not down, rank the server */
283 if(!(tsp->flags & CM_SERVERFLAG_DOWN))
286 lock_ReleaseMutex(&tsp->mx);
288 lock_ObtainRead(&cm_serverLock);
289 cm_PutServerNoLock(tsp);
291 lock_ReleaseRead(&cm_serverLock);
/*
 * Probe servers one at a time.
 *   flags - CM_FLAG_CHECKDOWNSERVERS / CM_FLAG_CHECKUPSERVERS select servers
 *           by current state; CM_FLAG_CHECKVLDBSERVERS /
 *           CM_FLAG_CHECKFILESERVERS restrict the server type when set
 *   cellp - cell to restrict the check to; NULL matches every cell
 * Walks cm_allServersp holding a reference on each server while
 * cm_serverLock is dropped, and runs cm_GCConnections on each server.
 */
294 static void cm_CheckServersSingular(afs_uint32 flags, cm_cell_t *cellp)
296 /* ping all file servers, up or down, with unauthenticated connection,
297 * to find out whether we have all our callbacks from the server still.
298 * Also, ping down VLDBs.
306 lock_ObtainRead(&cm_serverLock);
307 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
308 cm_GetServerNoLock(tsp);
309 lock_ReleaseRead(&cm_serverLock);
311 /* now process the server */
312 lock_ObtainMutex(&tsp->mx);
/* snapshot the server's state and type while tsp->mx is held */
315 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
316 isFS = tsp->type == CM_SERVER_FILE;
317 isVLDB = tsp->type == CM_SERVER_VLDB;
319 /* only do the ping if the cell matches the requested cell, or we're
320 * matching all cells (cellp == NULL), and if we've requested to ping
321 * this type of {up, down} servers.
323 if ((cellp == NULL || cellp == tsp->cellp) &&
324 ((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
325 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS))) &&
326 ((!(flags & CM_FLAG_CHECKVLDBSERVERS) ||
327 isVLDB && (flags & CM_FLAG_CHECKVLDBSERVERS)) &&
328 (!(flags & CM_FLAG_CHECKFILESERVERS) ||
329 isFS && (flags & CM_FLAG_CHECKFILESERVERS)))) {
331 } /* we're supposed to check this up/down server */
332 lock_ReleaseMutex(&tsp->mx);
334 /* at this point, we've adjusted the server state, so do the ping and
340 /* also, run the GC function for connections on all of the
341 * server's connections.
343 cm_GCConnections(tsp);
345 lock_ObtainRead(&cm_serverLock);
346 cm_PutServerNoLock(tsp);
348 lock_ReleaseRead(&cm_serverLock);
/*
 * Probe many servers at once using rx multi-calls.
 *   flags - CM_FLAG_CHECKDOWNSERVERS / CM_FLAG_CHECKUPSERVERS select servers
 *           by current state; CM_FLAG_CHECKFILESERVERS /
 *           CM_FLAG_CHECKVLDBSERVERS select the type, and when neither type
 *           bit is set both types are probed
 *   cellp - restricts the probe to one cell when non-NULL
 * File servers are probed with multi_RXAFS_GetCapabilities; those answering
 * RXGEN_OPCODE are probed again with multi_RXAFS_GetTime.  VLDB servers are
 * probed with multi_VL_ProbeServer.  Servers that already have
 * CM_SERVERFLAG_PINGING set, or that have no cell, are not selected.
 */
351 static void cm_CheckServersMulti(afs_uint32 flags, cm_cell_t *cellp)
354 * The goal of this function is to probe simultaneously
355 * probe all of the up/down servers (vldb/file) as
356 * specified by flags in the minimum number of RPCs.
357 * Effectively that means use one multi_RXAFS_GetCapabilities()
358 * followed by possibly one multi_RXAFS_GetTime() and
359 * one multi_VL_ProbeServer().
361 * To make this work we must construct the list of vldb
362 * and file servers that are to be probed as well as the
363 * associated data structures.
366 int srvAddrCount = 0;
367 struct srvAddr **addrs = NULL;
368 cm_conn_t **conns = NULL;
369 struct rx_connection **rxconns = NULL;
371 afs_int32 i, j, nconns = 0, maxconns;
372 afs_int32 *conntimer, *results;
373 Capabilities *caps = NULL;
374 cm_server_t ** serversp, *tsp;
375 afs_uint32 isDown, wasDown;
377 time_t start, end, *deltas;
383 maxconns = max(cm_numFileServers,cm_numVldbServers);
/* per-connection work arrays, each maxconns entries long.
 * NOTE(review): no NULL checks are visible between these allocations and
 * their first use; confirm how allocation failure is handled. */
387 conns = (cm_conn_t **)malloc(maxconns * sizeof(cm_conn_t *));
388 rxconns = (struct rx_connection **)malloc(maxconns * sizeof(struct rx_connection *));
389 conntimer = (afs_int32 *)malloc(maxconns * sizeof (afs_int32));
390 deltas = (time_t *)malloc(maxconns * sizeof (time_t));
391 results = (afs_int32 *)malloc(maxconns * sizeof (afs_int32));
392 serversp = (cm_server_t **)malloc(maxconns * sizeof(cm_server_t *));
393 caps = (Capabilities *)malloc(maxconns * sizeof(Capabilities));
395 memset(caps, 0, maxconns * sizeof(Capabilities));
/* ---- file servers: GetCapabilities first, GetTime as fallback ---- */
397 if ((flags & CM_FLAG_CHECKFILESERVERS) ||
398 !(flags & (CM_FLAG_CHECKFILESERVERS|CM_FLAG_CHECKVLDBSERVERS)))
400 lock_ObtainRead(&cm_serverLock);
401 for (nconns=0, tsp = cm_allServersp; tsp && nconns < maxconns; tsp = tsp->allNextp) {
402 if (tsp->type != CM_SERVER_FILE ||
403 tsp->cellp == NULL || /* SetPref only */
404 cellp && cellp != tsp->cellp)
407 cm_GetServerNoLock(tsp);
408 lock_ReleaseRead(&cm_serverLock);
410 lock_ObtainMutex(&tsp->mx);
411 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
413 if ((tsp->flags & CM_SERVERFLAG_PINGING) ||
414 !((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
415 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS)))) {
416 lock_ReleaseMutex(&tsp->mx);
417 lock_ObtainRead(&cm_serverLock);
418 cm_PutServerNoLock(tsp);
422 tsp->flags |= CM_SERVERFLAG_PINGING;
423 lock_ReleaseMutex(&tsp->mx);
425 serversp[nconns] = tsp;
426 code = cm_ConnByServer(tsp, cm_rootUserp, &conns[nconns]);
428 lock_ObtainRead(&cm_serverLock);
429 cm_PutServerNoLock(tsp);
432 lock_ObtainRead(&cm_serverLock);
433 rxconns[nconns] = cm_GetRxConn(conns[nconns]);
434 if (conntimer[nconns] = (isDown ? 1 : 0))
435 rx_SetConnDeadTime(rxconns[nconns], 10);
439 lock_ReleaseRead(&cm_serverLock);
442 /* Perform the multi call */
444 multi_Rx(rxconns,nconns)
446 multi_RXAFS_GetCapabilities(&caps[multi_i]);
447 results[multi_i]=multi_error;
451 /* Process results of servers that support RXAFS_GetCapabilities */
452 for (i=0; i<nconns; i++) {
453 /* Leave the servers that did not support GetCapabilities alone */
454 if (results[i] == RXGEN_OPCODE)
458 rx_SetConnDeadTime(rxconns[i], ConnDeadtimeout);
459 rx_PutConnection(rxconns[i]);
460 cm_PutConn(conns[i]);
463 cm_GCConnections(tsp);
465 lock_ObtainMutex(&tsp->mx);
466 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
468 if (results[i] >= 0) {
469 /* mark server as up */
470 tsp->flags &= ~CM_SERVERFLAG_DOWN;
473 /* we currently handle 32-bits of capabilities */
474 if (caps[i].Capabilities_len > 0) {
475 tsp->capabilities = caps[i].Capabilities_val[0];
476 xdr_free((xdrproc_t) xdr_Capabilities, &caps[i]);
477 caps[i].Capabilities_len = 0;
478 caps[i].Capabilities_val = 0;
480 tsp->capabilities = 0;
483 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
484 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is up with caps 0x%x",
485 osi_LogSaveString(afsd_logp, hoststr),
486 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
489 /* Now update the volume status if necessary */
491 cm_server_vols_t * tsrvp;
/* NOTE(review): the inner loop index below has the same name as the
 * per-connection index of the enclosing loop; confirm a block-local `i`
 * is declared here (the same pattern repeats in the later volume loops). */
495 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
496 for (i=0; i<NUM_SERVER_VOLS; i++) {
497 if (tsrvp->ids[i] != 0) {
500 lock_ReleaseMutex(&tsp->mx);
501 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
502 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
503 lock_ObtainMutex(&tsp->mx);
505 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
513 /* mark server as down */
514 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
515 tsp->flags |= CM_SERVERFLAG_DOWN;
516 tsp->downTime = time(NULL);
/* NOTE(review): the multi-call result for this server is results[i]; `code`
 * was last assigned by cm_ConnByServer / cm_FindVolumeByID in the visible
 * lines.  Confirm VRESTARTING is being compared with the intended value
 * (the same test recurs in the GetTime and VLDB sections). */
518 if (code != VRESTARTING) {
519 lock_ReleaseMutex(&tsp->mx);
520 cm_ForceNewConnections(tsp);
521 lock_ObtainMutex(&tsp->mx);
523 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
524 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is down with caps 0x%x",
525 osi_LogSaveString(afsd_logp, hoststr),
526 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
529 /* Now update the volume status if necessary */
531 cm_server_vols_t * tsrvp;
535 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
536 for (i=0; i<NUM_SERVER_VOLS; i++) {
537 if (tsrvp->ids[i] != 0) {
540 lock_ReleaseMutex(&tsp->mx);
541 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
542 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
543 lock_ObtainMutex(&tsp->mx);
545 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
554 if (tsp->waitCount == 0)
555 tsp->flags &= ~CM_SERVERFLAG_PINGING;
557 osi_Wakeup((LONG_PTR)tsp);
559 lock_ReleaseMutex(&tsp->mx);
565 * At this point we have handled any responses that did not indicate
566 * that RXAFS_GetCapabilities is not supported.
568 for ( i=0, j=0; i<nconns; i++) {
569 if (results[i] == RXGEN_OPCODE) {
572 rxconns[j] = rxconns[i];
573 serversp[j] = serversp[i];
581 /* Perform the multi call */
583 multi_Rx(rxconns,nconns)
586 multi_RXAFS_GetTime(&secs, &usecs);
588 results[multi_i]=multi_error;
589 if ((start == end) && !multi_error)
590 deltas[multi_i] = end - secs;
594 /* Process Results of servers that only support RXAFS_GetTime */
595 for (i=0; i<nconns; i++) {
596 /* Leave the servers that did not support GetCapabilities alone */
598 rx_SetConnDeadTime(rxconns[i], ConnDeadtimeout);
599 rx_PutConnection(rxconns[i]);
600 cm_PutConn(conns[i]);
603 cm_GCConnections(tsp);
605 lock_ObtainMutex(&tsp->mx);
606 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
608 if (results[i] >= 0) {
609 /* mark server as up */
610 tsp->flags &= ~CM_SERVERFLAG_DOWN;
612 tsp->capabilities = 0;
614 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
615 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is up with caps 0x%x",
616 osi_LogSaveString(afsd_logp, hoststr),
617 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
620 /* Now update the volume status if necessary */
622 cm_server_vols_t * tsrvp;
626 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
627 for (i=0; i<NUM_SERVER_VOLS; i++) {
628 if (tsrvp->ids[i] != 0) {
631 lock_ReleaseMutex(&tsp->mx);
632 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
633 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
634 lock_ObtainMutex(&tsp->mx);
636 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
644 /* mark server as down */
645 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
646 tsp->flags |= CM_SERVERFLAG_DOWN;
647 tsp->downTime = time(NULL);
649 if (code != VRESTARTING) {
650 lock_ReleaseMutex(&tsp->mx);
651 cm_ForceNewConnections(tsp);
652 lock_ObtainMutex(&tsp->mx);
654 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
655 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is down with caps 0x%x",
656 osi_LogSaveString(afsd_logp, hoststr),
657 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
660 /* Now update the volume status if necessary */
662 cm_server_vols_t * tsrvp;
666 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
667 for (i=0; i<NUM_SERVER_VOLS; i++) {
668 if (tsrvp->ids[i] != 0) {
671 lock_ReleaseMutex(&tsp->mx);
672 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
673 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
674 lock_ObtainMutex(&tsp->mx);
676 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
685 if (tsp->waitCount == 0)
686 tsp->flags &= ~CM_SERVERFLAG_PINGING;
688 osi_Wakeup((LONG_PTR)tsp);
690 lock_ReleaseMutex(&tsp->mx);
/* ---- VLDB servers: VL_ProbeServer ---- */
696 if ((flags & CM_FLAG_CHECKVLDBSERVERS) ||
697 !(flags & (CM_FLAG_CHECKFILESERVERS|CM_FLAG_CHECKVLDBSERVERS)))
699 lock_ObtainRead(&cm_serverLock);
700 for (nconns=0, tsp = cm_allServersp; tsp && nconns < maxconns; tsp = tsp->allNextp) {
701 if (tsp->type != CM_SERVER_VLDB ||
702 tsp->cellp == NULL || /* SetPref only */
703 cellp && cellp != tsp->cellp)
706 cm_GetServerNoLock(tsp);
707 lock_ReleaseRead(&cm_serverLock);
709 lock_ObtainMutex(&tsp->mx);
710 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
712 if ((tsp->flags & CM_SERVERFLAG_PINGING) ||
713 !((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
714 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS)))) {
715 lock_ReleaseMutex(&tsp->mx);
716 lock_ObtainRead(&cm_serverLock);
717 cm_PutServerNoLock(tsp);
721 tsp->flags |= CM_SERVERFLAG_PINGING;
722 lock_ReleaseMutex(&tsp->mx);
724 serversp[nconns] = tsp;
725 code = cm_ConnByServer(tsp, cm_rootUserp, &conns[nconns]);
727 lock_ObtainRead(&cm_serverLock);
728 cm_PutServerNoLock(tsp);
731 lock_ObtainRead(&cm_serverLock);
732 rxconns[nconns] = cm_GetRxConn(conns[nconns]);
733 conntimer[nconns] = (isDown ? 1 : 0);
735 rx_SetConnDeadTime(rxconns[nconns], 10);
739 lock_ReleaseRead(&cm_serverLock);
742 /* Perform the multi call */
744 multi_Rx(rxconns,nconns)
746 multi_VL_ProbeServer();
747 results[multi_i]=multi_error;
751 /* Process results of servers that support VL_ProbeServer */
752 for (i=0; i<nconns; i++) {
754 rx_SetConnDeadTime(rxconns[i], ConnDeadtimeout);
755 rx_PutConnection(rxconns[i]);
756 cm_PutConn(conns[i]);
759 cm_GCConnections(tsp);
761 lock_ObtainMutex(&tsp->mx);
762 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
764 if (results[i] >= 0) {
765 /* mark server as up */
766 tsp->flags &= ~CM_SERVERFLAG_DOWN;
768 tsp->capabilities = 0;
770 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
771 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is up with caps 0x%x",
772 osi_LogSaveString(afsd_logp, hoststr),
773 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
776 /* mark server as down */
777 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
778 tsp->flags |= CM_SERVERFLAG_DOWN;
779 tsp->downTime = time(NULL);
781 if (code != VRESTARTING) {
782 lock_ReleaseMutex(&tsp->mx);
783 cm_ForceNewConnections(tsp);
784 lock_ObtainMutex(&tsp->mx);
786 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
787 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is down with caps 0x%x",
788 osi_LogSaveString(afsd_logp, hoststr),
789 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
793 if (tsp->waitCount == 0)
794 tsp->flags &= ~CM_SERVERFLAG_PINGING;
796 osi_Wakeup((LONG_PTR)tsp);
798 lock_ReleaseMutex(&tsp->mx);
/*
 * Entry point for server probing.
 * Reads the "MultiCheckServers" value from the AFSREG_CLT_SVC_PARAM_SUBKEY
 * registry key under HKEY_LOCAL_MACHINE and hands flags / cellp to
 * cm_CheckServersMulti or cm_CheckServersSingular.
 * NOTE(review): the selecting condition is not visible here; presumably it
 * tests the value read into `multi` - confirm.
 */
813 void cm_CheckServers(afs_uint32 flags, cm_cell_t *cellp)
820 code = RegOpenKeyEx(HKEY_LOCAL_MACHINE, AFSREG_CLT_SVC_PARAM_SUBKEY,
821 0, KEY_QUERY_VALUE, &parmKey);
822 if (code == ERROR_SUCCESS) {
823 dummyLen = sizeof(multi);
824 code = RegQueryValueEx(parmKey, "MultiCheckServers", NULL, NULL,
825 (BYTE *) &multi, &dummyLen);
826 RegCloseKey (parmKey);
830 cm_CheckServersMulti(flags, cellp);
832 cm_CheckServersSingular(flags, cellp);
/*
 * Initialize the module's two global read/write locks.  The work is guarded
 * by osi_Once on a function-local static.
 */
835 void cm_InitServer(void)
837 static osi_once_t once;
839 if (osi_Once(&once)) {
840 lock_InitializeRWLock(&cm_serverLock, "cm_serverLock", LOCK_HIERARCHY_SERVER_GLOBAL);
841 lock_InitializeRWLock(&cm_syscfgLock, "cm_syscfgLock", LOCK_HIERARCHY_SYSCFG_GLOBAL);
/* Cached description of the client's network interfaces, filled in by
 * syscfg_GetIFInfo from cm_SetServerPrefs. */
846 /* Protected by cm_syscfgLock (rw) */
847 int cm_noIPAddr; /* number of client network interfaces */
848 int cm_IPAddr[CM_MAXINTERFACE_ADDR]; /* client's IP address in host order */
849 int cm_SubnetMask[CM_MAXINTERFACE_ADDR];/* client's subnet mask in host order*/
850 int cm_NetMtu[CM_MAXINTERFACE_ADDR]; /* client's MTU sizes */
851 int cm_NetFlags[CM_MAXINTERFACE_ADDR]; /* network flags */
/* Non-zero when the arrays above must be reloaded; starts at 1 so that the
 * first cm_SetServerPrefs call loads them. */
852 int cm_LanAdapterChangeDetected = 1;
/*
 * Mark the cached network-interface data as stale.  The flag is set while
 * holding the cm_syscfgLock write lock; cm_SetServerPrefs reloads the data
 * when it next sees the flag.
 */
854 void cm_SetLanAdapterChangeDetected(void)
856 lock_ObtainWrite(&cm_syscfgLock);
857 cm_LanAdapterChangeDetected = 1;
858 lock_ReleaseWrite(&cm_syscfgLock);
/*
 * Take a reference on serverp: refCount is incremented with
 * InterlockedIncrement while the cm_serverLock read lock is held.
 */
861 void cm_GetServer(cm_server_t *serverp)
863 lock_ObtainRead(&cm_serverLock);
864 InterlockedIncrement(&serverp->refCount);
865 lock_ReleaseRead(&cm_serverLock);
/*
 * Take a reference on serverp without touching cm_serverLock; the callers
 * in this file invoke it with cm_serverLock already held.
 */
868 void cm_GetServerNoLock(cm_server_t *serverp)
870 InterlockedIncrement(&serverp->refCount);
/*
 * Release a reference on serverp while holding the cm_serverLock read lock.
 * Asserts that the decremented refCount did not go negative.
 */
873 void cm_PutServer(cm_server_t *serverp)
876 lock_ObtainRead(&cm_serverLock);
877 refCount = InterlockedDecrement(&serverp->refCount);
878 osi_assertx(refCount >= 0, "cm_server_t refCount underflow");
879 lock_ReleaseRead(&cm_serverLock);
/*
 * Release a reference on serverp without touching cm_serverLock.
 * Asserts that the decremented refCount did not go negative.
 */
882 void cm_PutServerNoLock(cm_server_t *serverp)
884 afs_int32 refCount = InterlockedDecrement(&serverp->refCount);
885 osi_assertx(refCount >= 0, "cm_server_t refCount underflow");
/*
 * Set or clear CM_SERVERFLAG_NO64BIT on serverp while holding serverp->mx.
 * NOTE(review): the condition choosing between set and clear is not visible
 * here; presumably it is the no64bit argument - confirm.
 */
888 void cm_SetServerNo64Bit(cm_server_t * serverp, int no64bit)
890 lock_ObtainMutex(&serverp->mx);
892 serverp->flags |= CM_SERVERFLAG_NO64BIT;
894 serverp->flags &= ~CM_SERVERFLAG_NO64BIT;
895 lock_ReleaseMutex(&serverp->mx);
/*
 * Set or clear CM_SERVERFLAG_NOINLINEBULK on serverp while holding
 * serverp->mx.
 * NOTE(review): the condition choosing between set and clear is not visible
 * here; presumably it is the `no` argument - confirm.
 */
898 void cm_SetServerNoInlineBulk(cm_server_t * serverp, int no)
900 lock_ObtainMutex(&serverp->mx);
902 serverp->flags |= CM_SERVERFLAG_NOINLINEBULK;
904 serverp->flags &= ~CM_SERVERFLAG_NOINLINEBULK;
905 lock_ReleaseMutex(&serverp->mx);
/*
 * Assign serverp->ipRank from how close the server's address is to the
 * client's interfaces: CM_IPRANK_TOP for the same address, CM_IPRANK_HI for
 * the same subnet, CM_IPRANK_MED for the same classful network, otherwise
 * the CM_IPRANK_LOW default; the lowest value over all interfaces is kept
 * and a small random offset is added.
 * The cached interface data is reloaded with syscfg_GetIFInfo when
 * cm_LanAdapterChangeDetected is set.
 */
908 void cm_SetServerPrefs(cm_server_t * serverp)
910 unsigned long serverAddr; /* in host byte order */
911 unsigned long myAddr, myNet, mySubnet;/* in host byte order */
912 unsigned long netMask;
917 lock_ObtainRead(&cm_syscfgLock);
/* the flag is tested again after upgrading to the write lock, so only one
 * thread performs the reload */
918 if (cm_LanAdapterChangeDetected) {
919 lock_ConvertRToW(&cm_syscfgLock);
921 if (cm_LanAdapterChangeDetected) {
922 /* get network related info */
923 cm_noIPAddr = CM_MAXINTERFACE_ADDR;
924 code = syscfg_GetIFInfo(&cm_noIPAddr,
925 cm_IPAddr, cm_SubnetMask,
926 cm_NetMtu, cm_NetFlags);
927 cm_LanAdapterChangeDetected = 0;
929 lock_ConvertWToR(&cm_syscfgLock);
932 serverAddr = ntohl(serverp->addr.sin_addr.s_addr);
933 serverp->ipRank = CM_IPRANK_LOW; /* default settings */
935 for ( i=0; i < cm_noIPAddr; i++)
937 /* loop through all the client's IP address and compare
938 ** each of them against the server's IP address */
940 myAddr = cm_IPAddr[i];
/* classful network mask derived from the client's own address.
 * NOTE(review): no branch is visible for addresses outside classes A-C;
 * confirm netMask is always assigned before it is used below. */
941 if ( IN_CLASSA(myAddr) )
942 netMask = IN_CLASSA_NET;
943 else if ( IN_CLASSB(myAddr) )
944 netMask = IN_CLASSB_NET;
945 else if ( IN_CLASSC(myAddr) )
946 netMask = IN_CLASSC_NET;
950 myNet = myAddr & netMask;
951 mySubnet = myAddr & cm_SubnetMask[i];
953 if ( (serverAddr & netMask) == myNet )
955 if ( (serverAddr & cm_SubnetMask[i]) == mySubnet)
957 if ( serverAddr == myAddr )
958 serverp->ipRank = min(serverp->ipRank,
959 CM_IPRANK_TOP);/* same machine */
960 else serverp->ipRank = min(serverp->ipRank,
961 CM_IPRANK_HI); /* same subnet */
963 else serverp->ipRank = min(serverp->ipRank,CM_IPRANK_MED);
966 } /* end of for loop */
968 /* random between 0..14: rand() % 0x000f never yields 15. NOTE(review): cm_RankServer uses rand() & 0x000f (0..15) - confirm which range is intended */
969 serverp->ipRank += (rand() % 0x000f);
970 lock_ReleaseRead(&cm_syscfgLock);
/*
 * Create a cm_server_t for the given address and add it to the global list.
 *   socketp - server address; sin_family must be AF_INET (asserted)
 *   type    - server type (CM_SERVER_FILE is one of the values handled below)
 *   cellp   - cell the server belongs to
 *   uuidp   - optional UUID; a non-nil UUID sets CM_SERVERFLAG_UUID
 *   flags   - CM_FLAG_NOPROBE suppresses the initial probe
 * The new entry is zero-filled, ranked with cm_SetServerPrefs and pushed on
 * the head of cm_allServersp under the cm_serverLock write lock.  Unless
 * CM_FLAG_NOPROBE is given it is marked down and probed with cm_PingServer.
 */
973 cm_server_t *cm_NewServer(struct sockaddr_in *socketp, int type, cm_cell_t *cellp, afsUUID *uuidp, afs_uint32 flags) {
976 osi_assertx(socketp->sin_family == AF_INET, "unexpected socket family");
978 tsp = malloc(sizeof(*tsp));
980 memset(tsp, 0, sizeof(*tsp));
983 if (uuidp && !afs_uuid_is_nil(uuidp)) {
985 tsp->flags |= CM_SERVERFLAG_UUID;
988 lock_InitializeMutex(&tsp->mx, "cm_server_t mutex", LOCK_HIERARCHY_SERVER);
989 tsp->addr = *socketp;
991 cm_SetServerPrefs(tsp);
993 lock_ObtainWrite(&cm_serverLock); /* get server lock */
994 tsp->allNextp = cm_allServersp;
995 cm_allServersp = tsp;
1001 case CM_SERVER_FILE:
1002 cm_numFileServers++;
1006 lock_ReleaseWrite(&cm_serverLock); /* release server lock */
1008 if ( !(flags & CM_FLAG_NOPROBE) ) {
1009 tsp->flags |= CM_SERVERFLAG_DOWN; /* assume down; ping will mark up if available */
1010 cm_PingServer(tsp); /* Obtain Capabilities and check up/down state */
/*
 * Look up a server by type, IPv4 address and port.
 *   ipaddr - compared directly with the stored sin_addr value
 *   port   - compared with the stored sin_port; a stored port of 0 matches
 *            any port
 *   type   - server type to match
 * The list is walked under the cm_serverLock read lock and a reference is
 * taken on the server that is found.
 */
1017 cm_FindServerByIP(afs_uint32 ipaddr, unsigned short port, int type)
1021 lock_ObtainRead(&cm_serverLock);
1022 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
1023 if (tsp->type == type &&
1024 tsp->addr.sin_addr.S_un.S_addr == ipaddr &&
1025 (tsp->addr.sin_port == port || tsp->addr.sin_port == 0))
1029 /* bump ref count if we found the server */
1031 cm_GetServerNoLock(tsp);
1033 lock_ReleaseRead(&cm_serverLock);
/*
 * Look up a server by type and UUID.
 *   serverUuid - UUID to search for
 *   type       - server type to match
 * The list is walked under the cm_serverLock read lock and a reference is
 * taken on the server that is found.
 */
1039 cm_FindServerByUuid(afsUUID *serverUuid, int type)
1043 lock_ObtainRead(&cm_serverLock);
1044 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
/* select the entry whose UUID equals *serverUuid.  A negated test here
 * would select the first same-type server whose UUID differs.
 * (assumes afs_uuid_equal returns non-zero when the two UUIDs match) */
1045 if (tsp->type == type && afs_uuid_equal(&tsp->uuid, serverUuid))
1049 /* bump ref count if we found the server */
1051 cm_GetServerNoLock(tsp);
1053 lock_ReleaseRead(&cm_serverLock);
/*
 * Look up a server by socket address and type.
 *   addrp - address to match; sin_family must be AF_INET (asserted).  A
 *           stored port of 0 matches any port.
 *   type  - server type to match
 * A reference is taken on the server that is found.
 */
1058 /* find a server based on its properties */
1059 cm_server_t *cm_FindServer(struct sockaddr_in *addrp, int type)
1063 osi_assertx(addrp->sin_family == AF_INET, "unexpected socket value");
1065 lock_ObtainRead(&cm_serverLock);
1066 for (tsp = cm_allServersp; tsp; tsp=tsp->allNextp) {
1067 if (tsp->type == type &&
1068 tsp->addr.sin_addr.s_addr == addrp->sin_addr.s_addr &&
1069 (tsp->addr.sin_port == addrp->sin_port || tsp->addr.sin_port == 0))
1073 /* bump ref count if we found the server */
1075 cm_GetServerNoLock(tsp);
1077 /* drop big table lock */
1078 lock_ReleaseRead(&cm_serverLock);
1080 /* return what we found */
/*
 * Allocate one zero-filled cm_server_vols_t (a page of volume-id slots that
 * is chained from a server's vols list).
 */
1084 cm_server_vols_t *cm_NewServerVols(void) {
1085 cm_server_vols_t *tsvp;
1087 tsvp = malloc(sizeof(*tsvp));
1089 memset(tsvp, 0, sizeof(*tsvp));
/*
 * Create a cm_serverRef_t that refers to serverp for volume volID.
 * A reference is taken on serverp (cm_GetServer) and the new entry starts
 * with status srv_not_busy.  volID is also recorded in the server's list of
 * volume-id pages, under serverp->mx: the pages are searched for volID and
 * the first empty slot is remembered; a new page is allocated with
 * cm_NewServerVols when needed.
 */
1094 cm_serverRef_t *cm_NewServerRef(cm_server_t *serverp, afs_uint32 volID)
1096 cm_serverRef_t *tsrp;
1097 cm_server_vols_t **tsrvpp = NULL;
1098 afs_uint32 *slotp = NULL;
1101 cm_GetServer(serverp);
/* NOTE(review): the malloc result is dereferenced on the next line without
 * a NULL check. */
1102 tsrp = malloc(sizeof(*tsrp));
1103 tsrp->server = serverp;
1104 tsrp->status = srv_not_busy;
1106 tsrp->volID = volID;
1109 /* if we have a non-zero volID, we need to add it to the list
1110 * of volumes maintained by the server. There are two phases:
1111 * (1) see if the volID is already in the list and (2) insert
1112 * it into the first empty slot if it is not.
1115 lock_ObtainMutex(&serverp->mx);
1117 tsrvpp = &serverp->vols;
1121 for (i=0; i<NUM_SERVER_VOLS; i++) {
1122 if ((*tsrvpp)->ids[i] == volID) {
1125 } else if (!slotp && (*tsrvpp)->ids[i] == 0) {
1126 slotp = &(*tsrvpp)->ids[i];
1133 tsrvpp = &(*tsrvpp)->nextp;
1140 /* if we didn't find an empty slot in a current
1141 * page we must need a new page */
1142 *tsrvpp = cm_NewServerVols();
1144 (*tsrvpp)->ids[0] = volID;
1148 lock_ReleaseMutex(&serverp->mx);
/*
 * Compute a checksum of a server reference list by XOR-ing the server
 * pointers of its entries, under the cm_serverLock read lock.
 * Entries whose status is srv_deleted are tested for separately; presumably
 * they are skipped - confirm.
 */
1154 LONG_PTR cm_ChecksumServerList(cm_serverRef_t *serversp)
1158 cm_serverRef_t *tsrp;
1160 lock_ObtainRead(&cm_serverLock);
1161 for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
1162 if (tsrp->status == srv_deleted)
1168 sum ^= (LONG_PTR) tsrp->server;
1171 lock_ReleaseRead(&cm_serverLock);
1176 ** Insert a server into the server list keeping the list sorted in
1177 ** ascending order of ipRank.
1179 ** The refCount of the cm_serverRef_t is increased
/*
 *   list    - address of the list head; updated when element becomes the
 *             first entry
 *   element - entry to insert; its refCount is incremented
 * The element is placed before the first entry whose server has a greater
 * ipRank, so it follows entries of equal rank.
 * NOTE(review): *list and element->server->ipRank are read in the
 * initializers, before cm_serverLock is obtained - confirm this is safe
 * against concurrent list changes.
 */
1181 void cm_InsertServerList(cm_serverRef_t** list, cm_serverRef_t* element)
1183 cm_serverRef_t *current=*list;
1184 unsigned short ipRank = element->server->ipRank;
1186 lock_ObtainWrite(&cm_serverLock);
1187 element->refCount++; /* increase refCount */
1189 /* insertion into empty list or at the beginning of the list */
1190 if ( !current || (current->server->ipRank > ipRank) )
1192 element->next = *list;
1194 lock_ReleaseWrite(&cm_serverLock);
1198 while ( current->next ) /* find appropriate place to insert */
1200 if ( current->next->server->ipRank > ipRank )
1202 else current = current->next;
1204 element->next = current->next;
1205 current->next = element;
1206 lock_ReleaseWrite(&cm_serverLock);
1209 ** Re-sort the server list with the modified rank
1210 ** returns 0 if element was changed successfully.
1211 ** returns 1 if list remained unchanged.
/*
 *   list   - address of the head of the server reference list
 *   server - server whose rank was changed
 * The entry for `server` is unlinked under the cm_serverLock write lock and
 * inserted again with cm_InsertServerList; the reference count that the
 * insert adds is then taken back off.
 * NOTE(review): the "at most one element" test reads *list before
 * cm_serverLock is obtained - confirm this is safe.
 */
1213 long cm_ChangeRankServer(cm_serverRef_t** list, cm_server_t* server)
1215 cm_serverRef_t **current=list;
1216 cm_serverRef_t *element=0;
1218 /* if there is max of one element in the list, nothing to sort */
1219 if ( (!*current) || !((*current)->next) )
1220 return 1; /* list unchanged: return success */
1222 lock_ObtainWrite(&cm_serverLock);
1223 /* if the server is on the list, delete it from list */
1226 if ( (*current)->server == server)
1228 element = (*current);
1229 *current = (*current)->next; /* delete it */
1232 current = & ( (*current)->next);
1234 lock_ReleaseWrite(&cm_serverLock);
1236 /* if this volume is not replicated on this server */
1238 return 1; /* server is not on list */
1240 /* re-insert deleted element into the list with modified rank*/
1241 cm_InsertServerList(list, element);
1243 /* reduce refCount which was increased by cm_InsertServerList */
1244 lock_ObtainWrite(&cm_serverLock);
1245 element->refCount--;
1246 lock_ReleaseWrite(&cm_serverLock);
1250 ** If there is more than one server on the list and the first n servers on
1251 ** the list have the same rank (n>1), then randomize among the first n servers.
/*
 *   list - address of the head of a server reference list
 * Counts the leading entries that share the first entry's ipRank, picks one
 * with rand() % count, and moves the picked entry to the front of the list.
 * Lists with fewer than two entries are left alone.
 * NOTE(review): *list is read in the initializer before cm_serverLock is
 * obtained - confirm this is safe.
 */
1253 void cm_RandomizeServer(cm_serverRef_t** list)
1256 cm_serverRef_t* tsrp = *list, *lastTsrp;
1257 unsigned short lowestRank;
1259 /* an empty list or a list with only one element */
1260 if ( !tsrp || ! tsrp->next )
1263 lock_ObtainWrite(&cm_serverLock);
1265 /* count the number of servers with the lowest rank */
1266 lowestRank = tsrp->server->ipRank;
1267 for ( count=1, tsrp=tsrp->next; tsrp; tsrp=tsrp->next)
1269 if ( tsrp->server->ipRank != lowestRank)
1275 /* if there is only one server with the lowest rank, we are done */
1277 lock_ReleaseWrite(&cm_serverLock);
1281 picked = rand() % count;
1283 lock_ReleaseWrite(&cm_serverLock);
1288 while (--picked >= 0)
1293 lastTsrp->next = tsrp->next; /* delete random element from list*/
1294 tsrp->next = *list; /* insert element at the beginning of list */
1296 lock_ReleaseWrite(&cm_serverLock);
1299 /* call cm_FreeServer while holding a write lock on cm_serverLock */
/*
 * Drop one reference on serverp and tear the server down when none remain.
 * When refCount reaches zero the cm_serverLock write lock is released around
 * cm_GCConnections and then obtained again; if refCount is still zero the
 * per-type server count is decremented (only for servers without
 * CM_SERVERFLAG_PREF_SET), the mutex is finalized, the server is unlinked
 * from cm_allServersp and its volume-id pages are walked for release.
 */
1300 void cm_FreeServer(cm_server_t* serverp)
1302 cm_server_vols_t * tsrvp, *nextp;
1305 cm_PutServerNoLock(serverp);
1306 if (serverp->refCount == 0)
1309 * we need to check to ensure that all of the connections
1310 * for this server have a 0 refCount; otherwise, they will
1311 * not be garbage collected
1313 * must drop the cm_serverLock because cm_GCConnections
1314 * obtains the cm_connLock and that comes first in the
1317 lock_ReleaseWrite(&cm_serverLock);
1318 cm_GCConnections(serverp); /* connsp */
1319 lock_ObtainWrite(&cm_serverLock);
1324 * Once we have the cm_serverLock locked check to make
1325 * sure the refCount is still zero before removing the
1328 if (serverp->refCount == 0) {
1329 if (!(serverp->flags & CM_SERVERFLAG_PREF_SET)) {
1330 switch (serverp->type) {
1331 case CM_SERVER_VLDB:
1332 cm_numVldbServers--;
1334 case CM_SERVER_FILE:
1335 cm_numFileServers--;
1339 lock_FinalizeMutex(&serverp->mx);
1340 if ( cm_allServersp == serverp )
1341 cm_allServersp = serverp->allNextp;
1345 for(tsp = cm_allServersp; tsp->allNextp; tsp=tsp->allNextp) {
1346 if ( tsp->allNextp == serverp ) {
1347 tsp->allNextp = serverp->allNextp;
1353 /* free the volid list */
1354 for ( tsrvp = serverp->vols; tsrvp; tsrvp = nextp) {
1355 nextp = tsrvp->nextp;
1364 /* Called with cm_serverLock write locked */
/*
 * Search every volume-id page of serverp for a slot holding volID.
 * NOTE(review): the action taken on a match is not visible here; presumably
 * the slot is cleared - confirm.
 */
1365 void cm_RemoveVolumeFromServer(cm_server_t * serverp, afs_uint32 volID)
1367 cm_server_vols_t * tsrvp;
1373 for (tsrvp = serverp->vols; tsrvp; tsrvp = tsrvp->nextp) {
1374 for (i=0; i<NUM_SERVER_VOLS; i++) {
1375 if (tsrvp->ids[i] == volID) {
/*
 * Release one reference on each entry of a server reference list, under the
 * cm_serverLock write lock.
 *   list  - address of the list head
 *   flags - with CM_FREESERVERLIST_DELETE, entries are marked srv_deleted
 *           and their volume id is removed from the server
 * For an entry whose refCount drops to zero, its volume id (when non-zero)
 * is removed from the server and cm_FreeServer is called on the server.
 */
1383 void cm_FreeServerList(cm_serverRef_t** list, afs_uint32 flags)
1385 cm_serverRef_t **current = list;
1386 cm_serverRef_t **nextp = 0;
1387 cm_serverRef_t * next = 0;
1389 lock_ObtainWrite(&cm_serverLock);
1396 nextp = &(*current)->next;
1397 if (--((*current)->refCount) == 0) {
1400 if ((*current)->volID)
1401 cm_RemoveVolumeFromServer((*current)->server, (*current)->volID);
1402 cm_FreeServer((*current)->server);
1406 if (flags & CM_FREESERVERLIST_DELETE) {
1407 (*current)->status = srv_deleted;
1408 if ((*current)->volID)
1409 cm_RemoveVolumeFromServer((*current)->server, (*current)->volID);
1417 lock_ReleaseWrite(&cm_serverLock);
1420 /* dump all servers to a file.
1421 * cookie is used to identify this batch for easy parsing,
1422 * and is a string provided by the caller
/*
 *   outputFile - destination handed to WriteFile
 *   cookie     - string placed at the start of every output line
 *   lock       - NOTE(review): presumably selects whether cm_serverLock is
 *                taken here; the test is not visible - confirm
 * Writes a header line with the server counts, one line per server on
 * cm_allServersp, and a trailer line.  Lines end in "\r\n".
 */
1424 int cm_DumpServers(FILE *outputFile, char *cookie, int lock)
1433 lock_ObtainRead(&cm_serverLock);
1436 "%s - dumping servers - cm_numFileServers=%d, cm_numVldbServers=%d\r\n",
1437 cookie, cm_numFileServers, cm_numVldbServers);
1438 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1440 for (tsp = cm_allServersp; tsp; tsp=tsp->allNextp)
1445 switch (tsp->type) {
1446 case CM_SERVER_VLDB:
1449 case CM_SERVER_FILE:
1456 afsUUID_to_string(&tsp->uuid, uuidstr, sizeof(uuidstr));
1457 afs_inet_ntoa_r(tsp->addr.sin_addr.s_addr, hoststr);
/* the last character of the ctime() text is overwritten with a terminator.
 * NOTE(review): the ctime() result is used without a NULL check. */
1458 down = ctime(&tsp->downTime);
1459 down[strlen(down)-1] = '\0';
1462 "%s - tsp=0x%p cell=%s addr=%-15s port=%u uuid=%s type=%s caps=0x%x "
1463 "flags=0x%x waitCount=%u rank=%u downTime=\"%s\" refCount=%u\r\n",
1464 cookie, tsp, tsp->cellp ? tsp->cellp->name : "", hoststr,
1465 ntohs(tsp->addr.sin_port), uuidstr, type,
1466 tsp->capabilities, tsp->flags, tsp->waitCount, tsp->ipRank,
1467 (tsp->flags & CM_SERVERFLAG_DOWN) ? down : "up",
1469 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
/* NOTE(review): sprintf writes into `output` with no length bound; the
 * buffer's size is not visible here - confirm it fits the longest line. */
1471 sprintf(output, "%s - Done dumping servers.\r\n", cookie);
1472 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1475 lock_ReleaseRead(&cm_serverLock);
1481 * Determine if two servers are in fact the same.
1483 * Returns 1 if they match, 0 if they do not
1485 int cm_ServerEqual(cm_server_t *srv1, cm_server_t *srv2)
1489 if (srv1 == NULL || srv2 == NULL)
1495 if (srv1->flags & CM_SERVERFLAG_UUID) {
1496 if (!(srv2->flags & CM_SERVERFLAG_UUID))
1499 /* Both support UUID */
1500 if (UuidEqual((UUID *)&srv1->uuid, (UUID *)&srv2->uuid, &status))