2 * Copyright 2000, International Business Machines Corporation and others.
5 * This software has been released under the terms of the IBM Public
6 * License. For details, see the LICENSE file in the top-level source
7 * directory or online at http://www.openafs.org/dl/license10.html
10 #include <afsconfig.h>
11 #include <afs/param.h>
24 #include <WINNT\syscfg.h>
25 #include <WINNT/afsreg.h>
30 osi_rwlock_t cm_serverLock;
31 osi_rwlock_t cm_syscfgLock;
33 cm_server_t *cm_allServersp;
34 afs_uint32 cm_numFileServers = 0;
35 afs_uint32 cm_numVldbServers = 0;
38 cm_ForceNewConnectionsAllServers(void)
42 lock_ObtainRead(&cm_serverLock);
43 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
44 cm_GetServerNoLock(tsp);
45 lock_ReleaseRead(&cm_serverLock);
46 cm_ForceNewConnections(tsp);
47 lock_ObtainRead(&cm_serverLock);
48 cm_PutServerNoLock(tsp);
50 lock_ReleaseRead(&cm_serverLock);
54 * lock_ObtainMutex must be held prior to calling
58 cm_RankServer(cm_server_t * tsp)
60 afs_int32 code = 0; /* start with "success" */
61 struct rx_debugPeer tpeer;
76 code = rx_GetLocalPeers(tsp->addr.sin_addr.s_addr, port, &tpeer);
78 /*check if rx_GetLocalPeers succeeded and if there is data for tsp */
79 if(code == 0 && (tpeer.rtt == 0 && tpeer.rtt_dev == 0))
83 if((tsp->flags & CM_SERVERFLAG_PREF_SET))
84 newRank = tsp->adminRank +
85 ((int)(623 * log(tpeer.rtt) / 10) * 10 + 5);
86 else /* rank has not been set by admin, derive rank from rtt */
87 newRank = (int)(7200 * log(tpeer.rtt) / 5000) * 5000 + 5000;
89 newRank += (rand() & 0x000f); /* randomize */
91 if (abs(newRank - tsp->ipRank) > 0xf) {
92 tsp->ipRank = newRank;
94 lock_ReleaseMutex(&tsp->mx);
98 * find volumes which might have RO copy
99 * on server and change the ordering of
102 cm_ChangeRankVolume(tsp);
105 /* set preferences for an existing vlserver */
106 cm_ChangeRankCellVLServer(tsp);
109 lock_ObtainMutex(&tsp->mx);
117 cm_PingServer(cm_server_t *tsp)
122 struct rx_connection * rxconnp;
123 Capabilities caps = {0, 0};
127 lock_ObtainMutex(&tsp->mx);
128 if (tsp->flags & CM_SERVERFLAG_PINGING) {
130 osi_SleepM((LONG_PTR)tsp, &tsp->mx);
131 lock_ObtainMutex(&tsp->mx);
133 if (tsp->waitCount == 0)
134 _InterlockedAnd(&tsp->flags, ~CM_SERVERFLAG_PINGING);
136 osi_Wakeup((LONG_PTR)tsp);
137 lock_ReleaseMutex(&tsp->mx);
140 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_PINGING);
141 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
142 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
143 lock_ReleaseMutex(&tsp->mx);
145 code = cm_ConnByServer(tsp, cm_rootUserp, FALSE, &connp);
147 /* now call the appropriate ping call. Drop the timeout if
148 * the server is known to be down, so that we don't waste a
149 * lot of time retiming out down servers.
152 osi_Log4(afsd_logp, "cm_PingServer server %s (%s) was %s with caps 0x%x",
153 osi_LogSaveString(afsd_logp, hoststr),
154 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
155 wasDown ? "down" : "up",
158 rxconnp = cm_GetRxConn(connp);
160 rx_SetConnDeadTime(rxconnp, 10);
161 if (tsp->type == CM_SERVER_VLDB) {
162 code = VL_ProbeServer(rxconnp);
166 code = RXAFS_GetCapabilities(rxconnp, &caps);
169 rx_SetConnDeadTime(rxconnp, ConnDeadtimeout);
170 rx_PutConnection(rxconnp);
172 } /* got an unauthenticated connection to this server */
174 lock_ObtainMutex(&tsp->mx);
175 if (code >= 0 || code == RXGEN_OPCODE || code == RX_CALL_BUSY) {
176 /* mark server as up */
177 _InterlockedAnd(&tsp->flags, ~CM_SERVERFLAG_DOWN);
180 /* we currently handle 32-bits of capabilities */
181 if (code != RXGEN_OPCODE && code != RX_CALL_BUSY &&
182 caps.Capabilities_len > 0) {
183 tsp->capabilities = caps.Capabilities_val[0];
184 xdr_free((xdrproc_t) xdr_Capabilities, &caps);
185 caps.Capabilities_len = 0;
186 caps.Capabilities_val = 0;
188 tsp->capabilities = 0;
191 osi_Log3(afsd_logp, "cm_PingServer server %s (%s) is up with caps 0x%x",
192 osi_LogSaveString(afsd_logp, hoststr),
193 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
196 /* Now update the volume status if necessary */
198 cm_server_vols_t * tsrvp;
202 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
203 for (i=0; i<NUM_SERVER_VOLS; i++) {
204 if (tsrvp->ids[i] != 0) {
207 lock_ReleaseMutex(&tsp->mx);
208 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
209 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
210 lock_ObtainMutex(&tsp->mx);
212 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
220 /* mark server as down */
221 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
222 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_DOWN);
223 tsp->downTime = time(NULL);
225 if (code != VRESTARTING) {
226 lock_ReleaseMutex(&tsp->mx);
227 cm_ForceNewConnections(tsp);
228 lock_ObtainMutex(&tsp->mx);
230 osi_Log3(afsd_logp, "cm_PingServer server %s (%s) is down with caps 0x%x",
231 osi_LogSaveString(afsd_logp, hoststr),
232 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
235 /* Now update the volume status if necessary */
237 cm_server_vols_t * tsrvp;
241 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
242 for (i=0; i<NUM_SERVER_VOLS; i++) {
243 if (tsrvp->ids[i] != 0) {
246 lock_ReleaseMutex(&tsp->mx);
247 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
248 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
249 lock_ObtainMutex(&tsp->mx);
251 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
260 if (tsp->waitCount == 0)
261 _InterlockedAnd(&tsp->flags, ~CM_SERVERFLAG_PINGING);
263 osi_Wakeup((LONG_PTR)tsp);
264 lock_ReleaseMutex(&tsp->mx);
272 lock_ObtainRead(&cm_serverLock);
273 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
274 cm_GetServerNoLock(tsp);
275 lock_ReleaseRead(&cm_serverLock);
277 lock_ObtainMutex(&tsp->mx);
279 /* if the server is not down, rank the server */
280 if(!(tsp->flags & CM_SERVERFLAG_DOWN))
283 lock_ReleaseMutex(&tsp->mx);
285 lock_ObtainRead(&cm_serverLock);
286 cm_PutServerNoLock(tsp);
288 lock_ReleaseRead(&cm_serverLock);
291 static void cm_CheckServersSingular(afs_uint32 flags, cm_cell_t *cellp)
293 /* ping all file servers, up or down, with unauthenticated connection,
294 * to find out whether we have all our callbacks from the server still.
295 * Also, ping down VLDBs.
303 lock_ObtainRead(&cm_serverLock);
304 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
305 cm_GetServerNoLock(tsp);
306 lock_ReleaseRead(&cm_serverLock);
308 /* now process the server */
309 lock_ObtainMutex(&tsp->mx);
312 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
313 isFS = tsp->type == CM_SERVER_FILE;
314 isVLDB = tsp->type == CM_SERVER_VLDB;
316 /* only do the ping if the cell matches the requested cell, or we're
317 * matching all cells (cellp == NULL), and if we've requested to ping
318 * this type of {up, down} servers.
320 if ((cellp == NULL || cellp == tsp->cellp) &&
321 ((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
322 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS))) &&
323 ((!(flags & CM_FLAG_CHECKVLDBSERVERS) ||
324 isVLDB && (flags & CM_FLAG_CHECKVLDBSERVERS)) &&
325 (!(flags & CM_FLAG_CHECKFILESERVERS) ||
326 isFS && (flags & CM_FLAG_CHECKFILESERVERS)))) {
328 } /* we're supposed to check this up/down server */
329 lock_ReleaseMutex(&tsp->mx);
331 /* at this point, we've adjusted the server state, so do the ping and
337 /* also, run the GC function for connections on all of the
338 * server's connections.
340 cm_GCConnections(tsp);
342 lock_ObtainRead(&cm_serverLock);
343 cm_PutServerNoLock(tsp);
345 lock_ReleaseRead(&cm_serverLock);
348 static void cm_CheckServersMulti(afs_uint32 flags, cm_cell_t *cellp)
351 * The goal of this function is to probe simultaneously
352 * probe all of the up/down servers (vldb/file) as
353 * specified by flags in the minimum number of RPCs.
354 * Effectively that means use one multi_RXAFS_GetCapabilities()
355 * followed by possibly one multi_RXAFS_GetTime() and
356 * one multi_VL_ProbeServer().
358 * To make this work we must construct the list of vldb
359 * and file servers that are to be probed as well as the
360 * associated data structures.
363 int srvAddrCount = 0;
364 struct srvAddr **addrs = NULL;
365 cm_conn_t **conns = NULL;
366 struct rx_connection **rxconns = NULL;
368 afs_int32 i, nconns = 0, maxconns;
369 afs_int32 *conntimer, *results;
370 Capabilities *caps = NULL;
371 cm_server_t ** serversp, *tsp;
372 afs_uint32 isDown, wasDown;
374 time_t start, *deltas;
378 maxconns = max(cm_numFileServers,cm_numVldbServers);
382 conns = (cm_conn_t **)malloc(maxconns * sizeof(cm_conn_t *));
383 rxconns = (struct rx_connection **)malloc(maxconns * sizeof(struct rx_connection *));
384 conntimer = (afs_int32 *)malloc(maxconns * sizeof (afs_int32));
385 deltas = (time_t *)malloc(maxconns * sizeof (time_t));
386 results = (afs_int32 *)malloc(maxconns * sizeof (afs_int32));
387 serversp = (cm_server_t **)malloc(maxconns * sizeof(cm_server_t *));
388 caps = (Capabilities *)malloc(maxconns * sizeof(Capabilities));
390 memset(caps, 0, maxconns * sizeof(Capabilities));
392 if ((flags & CM_FLAG_CHECKFILESERVERS) ||
393 !(flags & (CM_FLAG_CHECKFILESERVERS|CM_FLAG_CHECKVLDBSERVERS)))
395 lock_ObtainRead(&cm_serverLock);
396 for (nconns=0, tsp = cm_allServersp; tsp && nconns < maxconns; tsp = tsp->allNextp) {
397 if (tsp->type != CM_SERVER_FILE ||
398 tsp->cellp == NULL || /* SetPref only */
399 cellp && cellp != tsp->cellp)
402 cm_GetServerNoLock(tsp);
403 lock_ReleaseRead(&cm_serverLock);
405 lock_ObtainMutex(&tsp->mx);
406 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
408 if ((tsp->flags & CM_SERVERFLAG_PINGING) ||
409 !((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
410 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS)))) {
411 lock_ReleaseMutex(&tsp->mx);
412 lock_ObtainRead(&cm_serverLock);
413 cm_PutServerNoLock(tsp);
417 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_PINGING);
418 lock_ReleaseMutex(&tsp->mx);
420 serversp[nconns] = tsp;
421 code = cm_ConnByServer(tsp, cm_rootUserp, FALSE, &conns[nconns]);
423 lock_ObtainRead(&cm_serverLock);
424 cm_PutServerNoLock(tsp);
427 lock_ObtainRead(&cm_serverLock);
428 rxconns[nconns] = cm_GetRxConn(conns[nconns]);
429 if (conntimer[nconns] = (isDown ? 1 : 0))
430 rx_SetConnDeadTime(rxconns[nconns], 10);
434 lock_ReleaseRead(&cm_serverLock);
437 /* Perform the multi call */
439 multi_Rx(rxconns,nconns)
441 multi_RXAFS_GetCapabilities(&caps[multi_i]);
442 results[multi_i]=multi_error;
446 /* Process results of servers that support RXAFS_GetCapabilities */
447 for (i=0; i<nconns; i++) {
449 rx_SetConnDeadTime(rxconns[i], ConnDeadtimeout);
450 rx_PutConnection(rxconns[i]);
451 cm_PutConn(conns[i]);
454 cm_GCConnections(tsp);
456 lock_ObtainMutex(&tsp->mx);
457 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
459 if (results[i] >= 0 || results[i] == RXGEN_OPCODE ||
460 results[i] == RX_CALL_BUSY) {
461 /* mark server as up */
462 _InterlockedAnd(&tsp->flags, ~CM_SERVERFLAG_DOWN);
465 /* we currently handle 32-bits of capabilities */
466 if (results[i] != RXGEN_OPCODE && results[i] != RX_CALL_BUSY &&
467 caps[i].Capabilities_len > 0) {
468 tsp->capabilities = caps[i].Capabilities_val[0];
469 xdr_free((xdrproc_t) xdr_Capabilities, &caps[i]);
470 caps[i].Capabilities_len = 0;
471 caps[i].Capabilities_val = 0;
473 tsp->capabilities = 0;
476 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
477 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is up with caps 0x%x",
478 osi_LogSaveString(afsd_logp, hoststr),
479 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
482 /* Now update the volume status if necessary */
484 cm_server_vols_t * tsrvp;
488 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
489 for (i=0; i<NUM_SERVER_VOLS; i++) {
490 if (tsrvp->ids[i] != 0) {
493 lock_ReleaseMutex(&tsp->mx);
494 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
495 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
496 lock_ObtainMutex(&tsp->mx);
498 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
506 /* mark server as down */
507 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
508 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_DOWN);
509 tsp->downTime = time(NULL);
511 if (code != VRESTARTING) {
512 lock_ReleaseMutex(&tsp->mx);
513 cm_ForceNewConnections(tsp);
514 lock_ObtainMutex(&tsp->mx);
516 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
517 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is down with caps 0x%x",
518 osi_LogSaveString(afsd_logp, hoststr),
519 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
522 /* Now update the volume status if necessary */
524 cm_server_vols_t * tsrvp;
528 for (tsrvp = tsp->vols; tsrvp; tsrvp = tsrvp->nextp) {
529 for (i=0; i<NUM_SERVER_VOLS; i++) {
530 if (tsrvp->ids[i] != 0) {
533 lock_ReleaseMutex(&tsp->mx);
534 code = cm_FindVolumeByID(tsp->cellp, tsrvp->ids[i], cm_rootUserp,
535 &req, CM_GETVOL_FLAG_NO_LRU_UPDATE, &volp);
536 lock_ObtainMutex(&tsp->mx);
538 cm_UpdateVolumeStatus(volp, tsrvp->ids[i]);
547 if (tsp->waitCount == 0)
548 _InterlockedAnd(&tsp->flags, ~CM_SERVERFLAG_PINGING);
550 osi_Wakeup((LONG_PTR)tsp);
552 lock_ReleaseMutex(&tsp->mx);
558 if ((flags & CM_FLAG_CHECKVLDBSERVERS) ||
559 !(flags & (CM_FLAG_CHECKFILESERVERS|CM_FLAG_CHECKVLDBSERVERS)))
561 lock_ObtainRead(&cm_serverLock);
562 for (nconns=0, tsp = cm_allServersp; tsp && nconns < maxconns; tsp = tsp->allNextp) {
563 if (tsp->type != CM_SERVER_VLDB ||
564 tsp->cellp == NULL || /* SetPref only */
565 cellp && cellp != tsp->cellp)
568 cm_GetServerNoLock(tsp);
569 lock_ReleaseRead(&cm_serverLock);
571 lock_ObtainMutex(&tsp->mx);
572 isDown = tsp->flags & CM_SERVERFLAG_DOWN;
574 if ((tsp->flags & CM_SERVERFLAG_PINGING) ||
575 !((isDown && (flags & CM_FLAG_CHECKDOWNSERVERS)) ||
576 (!isDown && (flags & CM_FLAG_CHECKUPSERVERS)))) {
577 lock_ReleaseMutex(&tsp->mx);
578 lock_ObtainRead(&cm_serverLock);
579 cm_PutServerNoLock(tsp);
583 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_PINGING);
584 lock_ReleaseMutex(&tsp->mx);
586 serversp[nconns] = tsp;
587 code = cm_ConnByServer(tsp, cm_rootUserp, FALSE, &conns[nconns]);
589 lock_ObtainRead(&cm_serverLock);
590 cm_PutServerNoLock(tsp);
593 lock_ObtainRead(&cm_serverLock);
594 rxconns[nconns] = cm_GetRxConn(conns[nconns]);
595 conntimer[nconns] = (isDown ? 1 : 0);
597 rx_SetConnDeadTime(rxconns[nconns], 10);
601 lock_ReleaseRead(&cm_serverLock);
604 /* Perform the multi call */
606 multi_Rx(rxconns,nconns)
608 multi_VL_ProbeServer();
609 results[multi_i]=multi_error;
613 /* Process results of servers that support VL_ProbeServer */
614 for (i=0; i<nconns; i++) {
616 rx_SetConnDeadTime(rxconns[i], ConnDeadtimeout);
617 rx_PutConnection(rxconns[i]);
618 cm_PutConn(conns[i]);
621 cm_GCConnections(tsp);
623 lock_ObtainMutex(&tsp->mx);
624 wasDown = tsp->flags & CM_SERVERFLAG_DOWN;
626 if (results[i] >= 0 || results[i] == RX_CALL_BUSY) {
627 /* mark server as up */
628 _InterlockedAnd(&tsp->flags, ~CM_SERVERFLAG_DOWN);
630 tsp->capabilities = 0;
632 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
633 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is up with caps 0x%x",
634 osi_LogSaveString(afsd_logp, hoststr),
635 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
638 /* mark server as down */
639 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
640 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_DOWN);
641 tsp->downTime = time(NULL);
643 if (code != VRESTARTING) {
644 lock_ReleaseMutex(&tsp->mx);
645 cm_ForceNewConnections(tsp);
646 lock_ObtainMutex(&tsp->mx);
648 afs_inet_ntoa_r(tsp->addr.sin_addr.S_un.S_addr, hoststr);
649 osi_Log3(afsd_logp, "cm_MultiPingServer server %s (%s) is down with caps 0x%x",
650 osi_LogSaveString(afsd_logp, hoststr),
651 tsp->type == CM_SERVER_VLDB ? "vldb" : "file",
655 if (tsp->waitCount == 0)
656 _InterlockedAnd(&tsp->flags, ~CM_SERVERFLAG_PINGING);
658 osi_Wakeup((LONG_PTR)tsp);
660 lock_ReleaseMutex(&tsp->mx);
675 void cm_CheckServers(afs_uint32 flags, cm_cell_t *cellp)
682 code = RegOpenKeyEx(HKEY_LOCAL_MACHINE, AFSREG_CLT_SVC_PARAM_SUBKEY,
683 0, KEY_QUERY_VALUE, &parmKey);
684 if (code == ERROR_SUCCESS) {
685 dummyLen = sizeof(multi);
686 code = RegQueryValueEx(parmKey, "MultiCheckServers", NULL, NULL,
687 (BYTE *) &multi, &dummyLen);
688 RegCloseKey (parmKey);
692 cm_CheckServersMulti(flags, cellp);
694 cm_CheckServersSingular(flags, cellp);
697 void cm_InitServer(void)
699 static osi_once_t once;
701 if (osi_Once(&once)) {
702 lock_InitializeRWLock(&cm_serverLock, "cm_serverLock", LOCK_HIERARCHY_SERVER_GLOBAL);
703 lock_InitializeRWLock(&cm_syscfgLock, "cm_syscfgLock", LOCK_HIERARCHY_SYSCFG_GLOBAL);
708 /* Protected by cm_syscfgLock (rw) */
709 int cm_noIPAddr; /* number of client network interfaces */
710 int cm_IPAddr[CM_MAXINTERFACE_ADDR]; /* client's IP address in host order */
711 int cm_SubnetMask[CM_MAXINTERFACE_ADDR];/* client's subnet mask in host order*/
712 int cm_NetMtu[CM_MAXINTERFACE_ADDR]; /* client's MTU sizes */
713 int cm_NetFlags[CM_MAXINTERFACE_ADDR]; /* network flags */
714 int cm_LanAdapterChangeDetected = 1;
716 void cm_SetLanAdapterChangeDetected(void)
718 lock_ObtainWrite(&cm_syscfgLock);
719 cm_LanAdapterChangeDetected = 1;
720 lock_ReleaseWrite(&cm_syscfgLock);
723 void cm_GetServer(cm_server_t *serverp)
725 lock_ObtainRead(&cm_serverLock);
726 InterlockedIncrement(&serverp->refCount);
727 lock_ReleaseRead(&cm_serverLock);
730 void cm_GetServerNoLock(cm_server_t *serverp)
732 InterlockedIncrement(&serverp->refCount);
735 void cm_PutServer(cm_server_t *serverp)
738 lock_ObtainRead(&cm_serverLock);
739 refCount = InterlockedDecrement(&serverp->refCount);
740 osi_assertx(refCount >= 0, "cm_server_t refCount underflow");
741 lock_ReleaseRead(&cm_serverLock);
744 void cm_PutServerNoLock(cm_server_t *serverp)
746 afs_int32 refCount = InterlockedDecrement(&serverp->refCount);
747 osi_assertx(refCount >= 0, "cm_server_t refCount underflow");
750 void cm_SetServerNo64Bit(cm_server_t * serverp, int no64bit)
752 lock_ObtainMutex(&serverp->mx);
754 _InterlockedOr(&serverp->flags, CM_SERVERFLAG_NO64BIT);
756 _InterlockedAnd(&serverp->flags, ~CM_SERVERFLAG_NO64BIT);
757 lock_ReleaseMutex(&serverp->mx);
760 void cm_SetServerNoInlineBulk(cm_server_t * serverp, int no)
762 lock_ObtainMutex(&serverp->mx);
764 _InterlockedOr(&serverp->flags, CM_SERVERFLAG_NOINLINEBULK);
766 _InterlockedAnd(&serverp->flags, ~CM_SERVERFLAG_NOINLINEBULK);
767 lock_ReleaseMutex(&serverp->mx);
770 void cm_SetServerPrefs(cm_server_t * serverp)
772 unsigned long serverAddr; /* in host byte order */
773 unsigned long myAddr, myNet, mySubnet;/* in host byte order */
774 unsigned long netMask;
779 lock_ObtainRead(&cm_syscfgLock);
780 if (cm_LanAdapterChangeDetected) {
781 lock_ConvertRToW(&cm_syscfgLock);
783 if (cm_LanAdapterChangeDetected) {
784 /* get network related info */
785 cm_noIPAddr = CM_MAXINTERFACE_ADDR;
786 code = syscfg_GetIFInfo(&cm_noIPAddr,
787 cm_IPAddr, cm_SubnetMask,
788 cm_NetMtu, cm_NetFlags);
789 cm_LanAdapterChangeDetected = 0;
791 lock_ConvertWToR(&cm_syscfgLock);
794 serverAddr = ntohl(serverp->addr.sin_addr.s_addr);
795 serverp->ipRank = CM_IPRANK_LOW; /* default settings */
797 for ( i=0; i < cm_noIPAddr; i++)
799 /* loop through all the client's IP address and compare
800 ** each of them against the server's IP address */
802 myAddr = cm_IPAddr[i];
803 if ( IN_CLASSA(myAddr) )
804 netMask = IN_CLASSA_NET;
805 else if ( IN_CLASSB(myAddr) )
806 netMask = IN_CLASSB_NET;
807 else if ( IN_CLASSC(myAddr) )
808 netMask = IN_CLASSC_NET;
812 myNet = myAddr & netMask;
813 mySubnet = myAddr & cm_SubnetMask[i];
815 if ( (serverAddr & netMask) == myNet )
817 if ( (serverAddr & cm_SubnetMask[i]) == mySubnet)
819 if ( serverAddr == myAddr )
820 serverp->ipRank = min(serverp->ipRank,
821 CM_IPRANK_TOP);/* same machine */
822 else serverp->ipRank = min(serverp->ipRank,
823 CM_IPRANK_HI); /* same subnet */
825 else serverp->ipRank = min(serverp->ipRank,CM_IPRANK_MED);
828 } /* and of for loop */
830 /* random between 0..15*/
831 serverp->ipRank += (rand() % 0x000f);
832 lock_ReleaseRead(&cm_syscfgLock);
835 cm_server_t *cm_NewServer(struct sockaddr_in *socketp, int type, cm_cell_t *cellp, afsUUID *uuidp, afs_uint32 flags) {
838 osi_assertx(socketp->sin_family == AF_INET, "unexpected socket family");
840 lock_ObtainWrite(&cm_serverLock); /* get server lock */
841 tsp = cm_FindServer(socketp, type, TRUE);
843 /* we might have found a server created by set server prefs */
844 if (uuidp && !afs_uuid_is_nil(uuidp) &&
845 !(tsp->flags & CM_SERVERFLAG_UUID))
848 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_UUID);
850 lock_ReleaseWrite(&cm_serverLock);
854 tsp = malloc(sizeof(*tsp));
856 memset(tsp, 0, sizeof(*tsp));
859 if (uuidp && !afs_uuid_is_nil(uuidp)) {
861 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_UUID);
864 lock_InitializeMutex(&tsp->mx, "cm_server_t mutex", LOCK_HIERARCHY_SERVER);
865 tsp->addr = *socketp;
867 cm_SetServerPrefs(tsp);
869 tsp->allNextp = cm_allServersp;
870 cm_allServersp = tsp;
881 lock_ReleaseWrite(&cm_serverLock); /* release server lock */
883 if (!(flags & CM_FLAG_NOPROBE) && tsp) {
884 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_DOWN); /* assume down; ping will mark up if available */
885 cm_PingServer(tsp); /* Obtain Capabilities and check up/down state */
892 cm_FindServerByIP(afs_uint32 ipaddr, unsigned short port, int type, int locked)
897 lock_ObtainRead(&cm_serverLock);
899 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
900 if (tsp->type == type &&
901 tsp->addr.sin_addr.S_un.S_addr == ipaddr &&
902 (tsp->addr.sin_port == port || tsp->addr.sin_port == 0))
906 /* bump ref count if we found the server */
908 cm_GetServerNoLock(tsp);
911 lock_ReleaseRead(&cm_serverLock);
917 cm_FindServerByUuid(afsUUID *serverUuid, int type, int locked)
922 lock_ObtainRead(&cm_serverLock);
924 for (tsp = cm_allServersp; tsp; tsp = tsp->allNextp) {
925 if (tsp->type == type && !afs_uuid_equal(&tsp->uuid, serverUuid))
929 /* bump ref count if we found the server */
931 cm_GetServerNoLock(tsp);
934 lock_ReleaseRead(&cm_serverLock);
939 /* find a server based on its properties */
940 cm_server_t *cm_FindServer(struct sockaddr_in *addrp, int type, int locked)
942 osi_assertx(addrp->sin_family == AF_INET, "unexpected socket value");
944 return cm_FindServerByIP(addrp->sin_addr.s_addr, addrp->sin_port, type, locked);
947 cm_server_vols_t *cm_NewServerVols(void) {
948 cm_server_vols_t *tsvp;
950 tsvp = malloc(sizeof(*tsvp));
952 memset(tsvp, 0, sizeof(*tsvp));
958 * cm_NewServerRef() returns with the allocated cm_serverRef_t
959 * with a refCount of 1.
961 cm_serverRef_t *cm_NewServerRef(cm_server_t *serverp, afs_uint32 volID)
963 cm_serverRef_t *tsrp;
964 cm_server_vols_t **tsrvpp = NULL;
965 afs_uint32 *slotp = NULL;
968 cm_GetServer(serverp);
969 tsrp = malloc(sizeof(*tsrp));
970 tsrp->server = serverp;
971 tsrp->status = srv_not_busy;
976 /* if we have a non-zero volID, we need to add it to the list
977 * of volumes maintained by the server. There are two phases:
978 * (1) see if the volID is already in the list and (2) insert
979 * it into the first empty slot if it is not.
982 lock_ObtainMutex(&serverp->mx);
984 tsrvpp = &serverp->vols;
988 for (i=0; i<NUM_SERVER_VOLS; i++) {
989 if ((*tsrvpp)->ids[i] == volID) {
992 } else if (!slotp && (*tsrvpp)->ids[i] == 0) {
993 slotp = &(*tsrvpp)->ids[i];
1000 tsrvpp = &(*tsrvpp)->nextp;
1007 /* if we didn't find an empty slot in a current
1008 * page we must need a new page */
1009 *tsrvpp = cm_NewServerVols();
1011 (*tsrvpp)->ids[0] = volID;
1015 lock_ReleaseMutex(&serverp->mx);
1021 void cm_GetServerRef(cm_serverRef_t *tsrp, int locked)
1026 lock_ObtainRead(&cm_serverLock);
1027 refCount = InterlockedIncrement(&tsrp->refCount);
1029 lock_ReleaseRead(&cm_serverLock);
1032 afs_int32 cm_PutServerRef(cm_serverRef_t *tsrp, int locked)
1037 lock_ObtainRead(&cm_serverLock);
1038 refCount = InterlockedDecrement(&tsrp->refCount);
1039 osi_assertx(refCount >= 0, "cm_serverRef_t refCount underflow");
1042 lock_ReleaseRead(&cm_serverLock);
1049 LONG_PTR cm_ChecksumServerList(cm_serverRef_t *serversp)
1053 cm_serverRef_t *tsrp;
1055 lock_ObtainRead(&cm_serverLock);
1056 for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
1057 if (tsrp->status == srv_deleted)
1063 sum ^= (LONG_PTR) tsrp->server;
1066 lock_ReleaseRead(&cm_serverLock);
1071 ** Insert a server into the server list keeping the list sorted in
1072 ** ascending order of ipRank.
1074 ** The refCount of the cm_serverRef_t is not altered.
1076 void cm_InsertServerList(cm_serverRef_t** list, cm_serverRef_t* element)
1078 cm_serverRef_t *current;
1079 unsigned short ipRank;
1081 lock_ObtainWrite(&cm_serverLock);
1083 * Since we are grabbing the serverLock exclusively remove any
1084 * deleted serverRef objects with a zero refcount before
1085 * inserting the new item.
1088 cm_serverRef_t **currentp = list;
1089 cm_serverRef_t **nextp = NULL;
1090 cm_serverRef_t * next = NULL;
1092 for (currentp = list; *currentp; currentp = nextp)
1094 nextp = &(*currentp)->next;
1095 if ((*currentp)->refCount == 0 &&
1096 (*currentp)->status == srv_deleted) {
1099 if ((*currentp)->volID)
1100 cm_RemoveVolumeFromServer((*currentp)->server, (*currentp)->volID);
1101 cm_FreeServer((*currentp)->server);
1108 /* insertion into empty list or at the beginning of the list */
1111 element->next = NULL;
1117 * Now that deleted entries have been removed and we know that the
1118 * list was not empty, look for duplicates. If the element we are
1119 * inserting already exists, discard it.
1121 for ( current = *list; current; current = current->next)
1123 cm_server_t * server1 = current->server;
1124 cm_server_t * server2 = element->server;
1126 if (current->status == srv_deleted)
1129 if (server1->type != server2->type)
1132 if (server1->addr.sin_addr.s_addr != server2->addr.sin_addr.s_addr)
1135 if ((server1->flags & CM_SERVERFLAG_UUID) != (server2->flags & CM_SERVERFLAG_UUID))
1138 if ((server1->flags & CM_SERVERFLAG_UUID) &&
1139 !afs_uuid_equal(&server1->uuid, &server2->uuid))
1142 /* we must have a match, discard the new element */
1147 ipRank = element->server->ipRank;
1149 /* insertion at the beginning of the list */
1150 if ((*list)->server->ipRank > ipRank)
1152 element->next = *list;
1157 /* find appropriate place to insert */
1158 for ( current = *list; current->next; current = current->next)
1160 if ( current->next->server->ipRank > ipRank )
1163 element->next = current->next;
1164 current->next = element;
1167 lock_ReleaseWrite(&cm_serverLock);
1170 ** Re-sort the server list with the modified rank
1171 ** returns 0 if element was changed successfully.
1172 ** returns 1 if list remained unchanged.
1174 long cm_ChangeRankServer(cm_serverRef_t** list, cm_server_t* server)
1176 cm_serverRef_t **current;
1177 cm_serverRef_t *element;
1179 lock_ObtainWrite(&cm_serverLock);
1183 /* if there is max of one element in the list, nothing to sort */
1184 if ( (!*current) || !((*current)->next) ) {
1185 lock_ReleaseWrite(&cm_serverLock);
1186 return 1; /* list unchanged: return success */
1189 /* if the server is on the list, delete it from list */
1192 if ( (*current)->server == server)
1194 element = (*current);
1195 *current = element->next; /* delete it */
1198 current = & ( (*current)->next);
1200 lock_ReleaseWrite(&cm_serverLock);
1202 /* if this volume is not replicated on this server */
1204 return 1; /* server is not on list */
1206 /* re-insert deleted element into the list with modified rank*/
1207 cm_InsertServerList(list, element);
1212 ** If there are more than one server on the list and the first n servers on
1213 ** the list have the same rank( n>1), then randomise among the first n servers.
1215 void cm_RandomizeServer(cm_serverRef_t** list)
1218 cm_serverRef_t* tsrp, *lastTsrp;
1219 unsigned short lowestRank;
1221 lock_ObtainWrite(&cm_serverLock);
1224 /* an empty list or a list with only one element */
1225 if ( !tsrp || ! tsrp->next ) {
1226 lock_ReleaseWrite(&cm_serverLock);
1230 /* count the number of servers with the lowest rank */
1231 lowestRank = tsrp->server->ipRank;
1232 for ( count=1, tsrp=tsrp->next; tsrp; tsrp=tsrp->next)
1234 if ( tsrp->server->ipRank != lowestRank)
1240 /* if there is only one server with the lowest rank, we are done */
1242 lock_ReleaseWrite(&cm_serverLock);
1246 picked = rand() % count;
1248 lock_ReleaseWrite(&cm_serverLock);
1253 while (--picked >= 0)
1258 lastTsrp->next = tsrp->next; /* delete random element from list*/
1259 tsrp->next = *list; /* insert element at the beginning of list */
1261 lock_ReleaseWrite(&cm_serverLock);
1264 /* call cm_FreeServer while holding a write lock on cm_serverLock */
1265 void cm_FreeServer(cm_server_t* serverp)
1267 cm_server_vols_t * tsrvp, *nextp;
1270 cm_PutServerNoLock(serverp);
1271 if (serverp->refCount == 0)
1274 * we need to check to ensure that all of the connections
1275 * for this server have a 0 refCount; otherwise, they will
1276 * not be garbage collected
1278 * must drop the cm_serverLock because cm_GCConnections
1279 * obtains the cm_connLock and that comes first in the
1282 lock_ReleaseWrite(&cm_serverLock);
1283 cm_GCConnections(serverp); /* connsp */
1284 lock_ObtainWrite(&cm_serverLock);
1289 * Once we have the cm_serverLock locked check to make
1290 * sure the refCount is still zero before removing the
1293 if (serverp->refCount == 0) {
1294 if (!(serverp->flags & CM_SERVERFLAG_PREF_SET)) {
1295 switch (serverp->type) {
1296 case CM_SERVER_VLDB:
1297 cm_numVldbServers--;
1299 case CM_SERVER_FILE:
1300 cm_numFileServers--;
1304 lock_FinalizeMutex(&serverp->mx);
1305 if ( cm_allServersp == serverp )
1306 cm_allServersp = serverp->allNextp;
1310 for(tsp = cm_allServersp; tsp->allNextp; tsp=tsp->allNextp) {
1311 if ( tsp->allNextp == serverp ) {
1312 tsp->allNextp = serverp->allNextp;
1318 /* free the volid list */
1319 for ( tsrvp = serverp->vols; tsrvp; tsrvp = nextp) {
1320 nextp = tsrvp->nextp;
1329 /* Called with cm_serverLock write locked */
1330 void cm_RemoveVolumeFromServer(cm_server_t * serverp, afs_uint32 volID)
1332 cm_server_vols_t * tsrvp;
1338 for (tsrvp = serverp->vols; tsrvp; tsrvp = tsrvp->nextp) {
1339 for (i=0; i<NUM_SERVER_VOLS; i++) {
1340 if (tsrvp->ids[i] == volID) {
1348 int cm_IsServerListEmpty(cm_serverRef_t *serversp)
1350 cm_serverRef_t *tsrp;
1353 if (serversp == NULL)
1354 return CM_ERROR_EMPTY;
1356 lock_ObtainRead(&cm_serverLock);
1357 for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
1358 if (tsrp->status == srv_deleted)
1363 lock_ReleaseRead(&cm_serverLock);
1365 return ( allDeleted ? CM_ERROR_EMPTY : 0 );
1368 void cm_FreeServerList(cm_serverRef_t** list, afs_uint32 flags)
1370 cm_serverRef_t **current;
1371 cm_serverRef_t **nextp;
1372 cm_serverRef_t * next;
1375 lock_ObtainWrite(&cm_serverLock);
1385 nextp = &(*current)->next;
1386 refCount = cm_PutServerRef(*current, TRUE);
1387 if (refCount == 0) {
1390 if ((*current)->volID)
1391 cm_RemoveVolumeFromServer((*current)->server, (*current)->volID);
1392 cm_FreeServer((*current)->server);
1396 if (flags & CM_FREESERVERLIST_DELETE) {
1397 (*current)->status = srv_deleted;
1398 if ((*current)->volID)
1399 cm_RemoveVolumeFromServer((*current)->server, (*current)->volID);
1407 lock_ReleaseWrite(&cm_serverLock);
1410 /* dump all servers to a file.
1411 * cookie is used to identify this batch for easy parsing,
1412 * and it a string provided by a caller
1414 int cm_DumpServers(FILE *outputFile, char *cookie, int lock)
1423 lock_ObtainRead(&cm_serverLock);
1426 "%s - dumping servers - cm_numFileServers=%d, cm_numVldbServers=%d\r\n",
1427 cookie, cm_numFileServers, cm_numVldbServers);
1428 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1430 for (tsp = cm_allServersp; tsp; tsp=tsp->allNextp)
1435 switch (tsp->type) {
1436 case CM_SERVER_VLDB:
1439 case CM_SERVER_FILE:
1446 afsUUID_to_string(&tsp->uuid, uuidstr, sizeof(uuidstr));
1447 afs_inet_ntoa_r(tsp->addr.sin_addr.s_addr, hoststr);
1448 down = ctime(&tsp->downTime);
1449 down[strlen(down)-1] = '\0';
1452 "%s - tsp=0x%p cell=%s addr=%-15s port=%u uuid=%s type=%s caps=0x%x "
1453 "flags=0x%x waitCount=%u rank=%u downTime=\"%s\" refCount=%u\r\n",
1454 cookie, tsp, tsp->cellp ? tsp->cellp->name : "", hoststr,
1455 ntohs(tsp->addr.sin_port), uuidstr, type,
1456 tsp->capabilities, tsp->flags, tsp->waitCount, tsp->ipRank,
1457 (tsp->flags & CM_SERVERFLAG_DOWN) ? down : "up",
1459 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1461 sprintf(output, "%s - Done dumping servers.\r\n", cookie);
1462 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1465 lock_ReleaseRead(&cm_serverLock);
1471 * Determine if two servers are in fact the same.
1473 * Returns 1 if they match, 0 if they do not
1475 int cm_ServerEqual(cm_server_t *srv1, cm_server_t *srv2)
1479 if (srv1 == NULL || srv2 == NULL)
1485 if (srv1->flags & CM_SERVERFLAG_UUID) {
1486 if (!(srv2->flags & CM_SERVERFLAG_UUID))
1489 /* Both support UUID */
1490 if (UuidEqual((UUID *)&srv1->uuid, (UUID *)&srv2->uuid, &status))
1493 if (srv1->flags & CM_SERVERFLAG_UUID)
1496 /* Neither support UUID so perform an addr/port comparison */
1497 if ( srv1->addr.sin_family == srv2->addr.sin_family &&
1498 srv1->addr.sin_addr.s_addr == srv2->addr.sin_addr.s_addr &&
1499 srv1->addr.sin_port == srv2->addr.sin_port )