2 * Copyright 2000, International Business Machines Corporation and others.
5 * This software has been released under the terms of the IBM Public
6 * License. For details, see the LICENSE file in the top-level source
7 * directory or online at http://www.openafs.org/dl/license10.html
10 #include <afsconfig.h>
11 #include <afs/param.h>
26 osi_rwlock_t cm_volumeLock;
/*
 * Consistency check over the global volume list (cm_data.allVolumesp).
 *
 * For each volume on the list this checks the volume's own magic number,
 * the magic number of its cell (when a cell is attached) and the magic
 * number of the next list entry.  It also guards against a cycle in the
 * list and compares the number of entries counted with
 * cm_data.currentVolumes.  Every failed check is reported through both
 * afsi_log() and stderr.
 */
29 cm_ValidateVolume(void)
34 for (volp = cm_data.allVolumesp, count = 0; volp; volp=volp->allNextp, count++) {
35 if ( volp->magic != CM_VOLUME_MAGIC ) {
36 afsi_log("cm_ValidateVolume failure: volp->magic != CM_VOLUME_MAGIC");
37 fprintf(stderr, "cm_ValidateVolume failure: volp->magic != CM_VOLUME_MAGIC\n");
/* the cell pointer may be NULL; only a non-NULL cell is validated */
40 if ( volp->cellp && volp->cellp->magic != CM_CELL_MAGIC ) {
41 afsi_log("cm_ValidateVolume failure: volp->cellp->magic != CM_CELL_MAGIC");
42 fprintf(stderr, "cm_ValidateVolume failure: volp->cellp->magic != CM_CELL_MAGIC\n");
/* look one entry ahead so a corrupt successor is caught before it is visited */
45 if ( volp->allNextp && volp->allNextp->magic != CM_VOLUME_MAGIC ) {
46 afsi_log("cm_ValidateVolume failure: volp->allNextp->magic != CM_VOLUME_MAGIC");
47 fprintf(stderr, "cm_ValidateVolume failure: volp->allNextp->magic != CM_VOLUME_MAGIC\n");
/*
 * && binds tighter than ||, so this reads:
 *   (we are back at the list head after at least one step)
 *   OR (more entries were seen than cm_data.maxVolumes allows)
 */
50 if ( count != 0 && volp == cm_data.allVolumesp ||
51 count > cm_data.maxVolumes ) {
52 afsi_log("cm_ValidateVolume failure: cm_data.allVolumep loop detected");
53 fprintf(stderr, "cm_ValidateVolume failure: cm_data.allVolumep loop detected\n");
/* the number of entries counted must agree with the recorded volume count */
58 if ( count != cm_data.currentVolumes ) {
59 afsi_log("cm_ValidateVolume failure: count != cm_data.currentVolumes");
60 fprintf(stderr, "cm_ValidateVolume failure: count != cm_data.currentVolumes\n");
/*
 * Shutdown pass over every volume on cm_data.allVolumesp.
 *
 * For each volume type that has a non-zero ID a status notification is
 * sent announcing the transition from the current state to vl_alldown.
 * The read-only callback fields cbExpiresRO and cbServerpRO are cleared
 * and the per-volume rwlock is finalized.
 */
68 cm_ShutdownVolume(void)
72 for (volp = cm_data.allVolumesp; volp; volp=volp->allNextp) {
74 for ( volType = RWVOL; volType < NUM_VOL_TYPES; volType++) {
/* an ID of zero means this volume type is not present; nothing to announce */
75 if (volp->vol[volType].ID)
76 cm_VolumeStatusNotification(volp, volp->vol[volType].ID, volp->vol[volType].state, vl_alldown);
78 volp->cbExpiresRO = 0;
80 volp->cbServerpRO = NULL;
81 lock_FinalizeRWLock(&volp->rw);
/*
 * Initialize the volume subsystem.
 *
 * newFile - NOTE(review): presumably selects between starting with empty
 *           tables and re-initializing volumes already present in
 *           cm_data; the branch on it is not shown here - confirm.
 * maxVols - stored in cm_data.maxVolumes.
 *
 * The global cm_volumeLock is created exactly once, guarded by osi_Once().
 * The global list, counters, the four hash tables and the LRU pointers are
 * cleared; for volumes found on cm_data.allVolumesp the per-volume lock is
 * re-created, CM_VOLUMEFLAG_RESET is set, CM_VOLUMEFLAG_UPDATING_VL is
 * cleared, and the per-type state, server lists and RO callback fields are
 * reset.
 */
87 void cm_InitVolume(int newFile, long maxVols)
89 static osi_once_t once;
/* one-time creation of the global volume lock */
91 if (osi_Once(&once)) {
92 lock_InitializeRWLock(&cm_volumeLock, "cm global volume lock", LOCK_HIERARCHY_VOLUME_GLOBAL);
/* start from an empty volume list with all hash buckets and LRU ends cleared */
95 cm_data.allVolumesp = NULL;
96 cm_data.currentVolumes = 0;
97 cm_data.maxVolumes = maxVols;
98 memset(cm_data.volumeNameHashTablep, 0, sizeof(cm_volume_t *) * cm_data.volumeHashTableSize);
99 memset(cm_data.volumeRWIDHashTablep, 0, sizeof(cm_volume_t *) * cm_data.volumeHashTableSize);
100 memset(cm_data.volumeROIDHashTablep, 0, sizeof(cm_volume_t *) * cm_data.volumeHashTableSize);
101 memset(cm_data.volumeBKIDHashTablep, 0, sizeof(cm_volume_t *) * cm_data.volumeHashTableSize);
102 cm_data.volumeLRUFirstp = cm_data.volumeLRULastp = NULL;
/* per-volume re-initialization of every volume on the list */
106 for (volp = cm_data.allVolumesp; volp; volp=volp->allNextp) {
109 lock_InitializeRWLock(&volp->rw, "cm_volume_t rwlock", LOCK_HIERARCHY_VOLUME);
/* force a location refresh on first use and drop any stale in-progress marker */
110 _InterlockedOr(&volp->flags, CM_VOLUMEFLAG_RESET);
111 _InterlockedAnd(&volp->flags, ~CM_VOLUMEFLAG_UPDATING_VL);
112 volp->lastUpdateTime = 0;
113 for (volType = RWVOL; volType < NUM_VOL_TYPES; volType++) {
114 volp->vol[volType].state = vl_unknown;
115 volp->vol[volType].serversp = NULL;
/*
 * NOTE(review): state was set to vl_unknown two statements above, so both
 * state arguments of this notification are vl_unknown - confirm this is
 * intended.
 */
116 if (volp->vol[volType].ID)
117 cm_VolumeStatusNotification(volp, volp->vol[volType].ID, vl_unknown, volp->vol[volType].state);
119 volp->cbExpiresRO = 0;
120 volp->cbIssuedRO = 0;
121 volp->cbServerpRO = NULL;
129 /* Returns true if the name is a decimal integer, in which case we interpret
130 * it as a volume id.  This makes the cache manager much simpler.
131 * Stolen from src/volser/vlprocs.c */
133 cm_VolNameIsID(char *aname)
/* the assignment in the condition is intentional: the scan ends at the terminating NUL */
136 while (tc = *aname++) {
/* tests for any character outside the range of decimal digits */
137 if (tc > '9' || tc < '0')
145 * Update a volume. Caller holds a write lock on the volume (volp->rw).
148 * shadow / openafs / jhutz@CS.CMU.EDU {ANDREW.CMU.EDU} 01:38 (JHutz)
149 * Yes, we support multihomed fileservers.
150 * Since before we got the code from IBM.
151 * But to find out about multiple addresses on a multihomed server, you need
152 * to use VL_GetEntryByNameU and VL_GetAddrsU. If you use
153 * VL_GetEntryByNameO or VL_GetEntryByNameN, the vlserver just gives you one
154 * address per server.
155 * shadow / openafs / jhutz@CS.CMU.EDU {ANDREW.CMU.EDU} 01:39 (JHutz)
156 * see src/afs/afs_volume.c, paying particular attention to
157 * afs_NewVolumeByName, afs_SetupVolume, and InstallUVolumeEntry
158 * shadow / openafs / jaltman {ANDREW.CMU.EDU} 01:40 (Jeffrey Altman)
159 * thanks. The windows client calls the O versions.
160 * shadow / openafs / jhutz@CS.CMU.EDU {ANDREW.CMU.EDU} 01:51 (JHutz)
162 * By not using the N versions, you only get up to 8 sites instead of 13.
163 * By not using the U versions, you don't get to know about multihomed servers.
164 * shadow / openafs / jhutz@CS.CMU.EDU {ANDREW.CMU.EDU} 01:52 (JHutz)
165 * Of course, you probably want to support the older versions for backward
166 * compatibility. If you do that, you need to call the newest interface
167 * first, and fall back to successively older versions if you get
/*
 * Fetch the VLDB entry for the volume called name from the vlservers of
 * cellp.
 *
 * The newest RPC, VL_GetEntryByNameU, is tried first.  When a call comes
 * back with RXGEN_OPCODE the next older interface is tried:
 * VL_GetEntryByNameN, then VL_GetEntryByNameO.  Each variant fills its own
 * caller-supplied buffer (uvldbEntryp, nvldbEntryp, vldbEntryp).
 * NOTE(review): which buffer was filled is presumably reported through the
 * method out-parameter seen at the call sites - confirm.
 *
 * Retrying across vlservers is driven by cm_Analyze(); the final code is
 * translated with cm_MapVLRPCError() and the outcome is logged.
 */
171 cm_GetEntryByName( struct cm_cell *cellp, const char *name,
172 struct vldbentry *vldbEntryp,
173 struct nvldbentry *nvldbEntryp,
174 struct uvldbentry *uvldbEntryp,
182 struct rx_connection * rxconnp;
184 osi_Log2(afsd_logp, "CALL VL_GetEntryByName{UNO} name %s:%s",
185 osi_LogSaveString(afsd_logp,cellp->name),
186 osi_LogSaveString(afsd_logp,name));
/* pick a connection to one of the cell's vlservers */
189 code = cm_ConnByMServers(cellp->vlServersp, FALSE, userp, reqp, &connp);
193 rxconnp = cm_GetRxConn(connp);
194 code = VL_GetEntryByNameU(rxconnp, name, uvldbEntryp);
/* RXGEN_OPCODE from the U call: fall back to the N interface */
196 if ( code == RXGEN_OPCODE )
198 code = VL_GetEntryByNameN(rxconnp, name, nvldbEntryp);
/* RXGEN_OPCODE again: fall back to the oldest (O) interface */
201 if ( code == RXGEN_OPCODE ) {
202 code = VL_GetEntryByNameO(rxconnp, name, vldbEntryp);
/* the rx connection reference taken by cm_GetRxConn() is dropped on every pass */
205 rx_PutConnection(rxconnp);
206 } while (cm_Analyze(connp, userp, reqp, NULL, cellp, 0, NULL, NULL, &cellp->vlServersp, NULL, code));
207 code = cm_MapVLRPCError(code, reqp);
209 osi_Log3(afsd_logp, "CALL VL_GetEntryByName{UNO} name %s:%s FAILURE, code 0x%x",
210 osi_LogSaveString(afsd_logp,cellp->name),
211 osi_LogSaveString(afsd_logp,name), code);
213 osi_Log2(afsd_logp, "CALL VL_GetEntryByName{UNO} name %s:%s SUCCESS",
214 osi_LogSaveString(afsd_logp,cellp->name),
215 osi_LogSaveString(afsd_logp,name));
/*
 * Fetch the VLDB entry for a numeric volume id.
 *
 * The id is formatted as an unsigned decimal string and the lookup is
 * delegated to cm_GetEntryByName() with all other arguments passed
 * through unchanged; the result of that call is returned.
 */
220 cm_GetEntryByID( struct cm_cell *cellp, afs_uint32 id,
221 struct vldbentry *vldbEntryp,
222 struct nvldbentry *nvldbEntryp,
223 struct uvldbentry *uvldbEntryp,
/* sizeof(name) bounds the formatted output to the local buffer */
231 StringCbPrintf(name, sizeof(name), "%u", id);
233 return cm_GetEntryByName(cellp, name, vldbEntryp, nvldbEntryp, uvldbEntryp, methodp, userp, reqp);
/*
 * Refresh the location information of volp from the VLDB of cellp.
 *
 * Locking: the caller must hold volp->rw for writing (asserted below).
 * The lock is released while the VLDB RPCs are outstanding and re-obtained
 * afterwards, and it is also dropped around cm_NewServer().
 *
 * Short cuts taken before any RPC is made:
 *   - CM_ERROR_NOSUCHVOLUME is returned when the volume is flagged
 *     CM_VOLUMEFLAG_NOEXIST and the last update is less than 600 seconds
 *     old.
 *   - If another update is in progress (CM_VOLUMEFLAG_UPDATING_VL) this
 *     call sleeps on volp->flags until woken.
 *   - CM_ERROR_ALLDOWN is returned when the volume is still flagged
 *     CM_VOLUMEFLAG_RESET and the last attempt is less than 60 seconds old.
 *
 * Lookup order: by volume name; on CM_ERROR_NOSUCHVOLUME by the name with
 * ".readonly" appended (only when the extra conditions below hold); then
 * by the known RW id, or failing that the known RO id.
 *
 * With a reply in hand the old server lists are freed, the reply is
 * unpacked according to the interface that answered, the name hash and the
 * three id hashes are updated under cm_volumeLock, the per-type server
 * lists are rebuilt, and a status notification is sent for every volume
 * type whose state changed.  Finally CM_VOLUMEFLAG_UPDATING_VL is cleared
 * and sleepers on volp->flags are woken.
 */
236 long cm_UpdateVolumeLocation(struct cm_cell *cellp, cm_user_t *userp, cm_req_t *reqp,
239 struct rx_connection *rxconnp;
243 cm_serverRef_t *tsrp;
245 struct sockaddr_in tsockAddr;
248 struct vldbentry vldbEntry;
249 struct nvldbentry nvldbEntry;
250 struct uvldbentry uvldbEntry;
255 enum volstatus rwNewstate = vl_online;
256 enum volstatus roNewstate = vl_online;
257 enum volstatus bkNewstate = vl_online;
258 #ifdef AFS_FREELANCE_CLIENT
264 lock_AssertWrite(&volp->rw);
267 * If the last volume update was in the last five
268 * minutes and it did not exist, then avoid the RPC
269 * and return No Such Volume immediately.
/* NOTE(review): the window tested below is 600 seconds, i.e. ten minutes, not five */
272 if ((volp->flags & CM_VOLUMEFLAG_NOEXIST) &&
273 (now < volp->lastUpdateTime + 600))
275 return CM_ERROR_NOSUCHVOLUME;
278 #ifdef AFS_FREELANCE_CLIENT
279 if (cellp->cellID == AFS_FAKE_ROOT_CELL_ID)
282 memset(&vldbEntry, 0, sizeof(vldbEntry));
283 vldbEntry.flags |= VLF_RWEXISTS;
284 vldbEntry.volumeId[0] = AFS_FAKE_ROOT_VOL_ID;
/* an update of this volume is already in progress: sleep until it signals volp->flags */
290 while (volp->flags & CM_VOLUMEFLAG_UPDATING_VL) {
291 osi_Log3(afsd_logp, "cm_UpdateVolumeLocation sleeping name %s:%s flags 0x%x",
292 volp->cellp->name, volp->namep, volp->flags);
293 osi_SleepW((LONG_PTR) &volp->flags, &volp->rw);
294 lock_ObtainWrite(&volp->rw);
295 osi_Log3(afsd_logp, "cm_UpdateVolumeLocation awake name %s:%s flags 0x%x",
296 volp->cellp->name, volp->namep, volp->flags);
297 if (!(volp->flags & CM_VOLUMEFLAG_RESET)) {
298 osi_Log3(afsd_logp, "cm_UpdateVolumeLocation nothing to do, waking others name %s:%s flags 0x%x",
299 volp->cellp->name, volp->namep, volp->flags);
300 osi_Wakeup((LONG_PTR) &volp->flags);
306 /* Do not query again if the last update attempt failed in the last 60 seconds */
307 if ((volp->flags & CM_VOLUMEFLAG_RESET) && (volp->lastUpdateTime > now - 60))
309 osi_Log3(afsd_logp, "cm_UpdateVolumeLocation unsuccessful update in last 60 seconds -- name %s:%s flags 0x%x",
310 volp->cellp->name, volp->namep, volp->flags);
311 return(CM_ERROR_ALLDOWN);
/* mark the update as in progress; the flag is cleared again at the end of this function */
314 _InterlockedOr(&volp->flags, CM_VOLUMEFLAG_UPDATING_VL);
316 /* Do not hold the volume lock across the RPC calls */
317 lock_ReleaseWrite(&volp->rw);
319 if (cellp->flags & CM_CELLFLAG_VLSERVER_INVALID)
320 cm_UpdateCell(cellp, 0);
322 /* now we have volume structure locked and held; make RPC to fill it */
323 code = cm_GetEntryByName(cellp, volp->namep, &vldbEntry, &nvldbEntry,
325 &method, userp, reqp);
327 /* We can end up here with code == CM_ERROR_NOSUCHVOLUME if the base volume name
328 * does not exist and is not a numeric string but there might exist a .readonly volume.
329 * If the base name doesn't exist we will not care about the .backup that might be left
330 * behind since there should be no method to access it.
332 if (code == CM_ERROR_NOSUCHVOLUME &&
333 _atoi64(volp->namep) == 0 &&
334 volp->vol[RWVOL].ID == 0 &&
335 strlen(volp->namep) < (VL_MAXNAMELEN - 9)) {
336 char name[VL_MAXNAMELEN];
338 snprintf(name, VL_MAXNAMELEN, "%s.readonly", volp->namep);
340 /* now we have volume structure locked and held; make RPC to fill it */
341 code = cm_GetEntryByName(cellp, name, &vldbEntry, &nvldbEntry,
343 &method, userp, reqp);
347 * What if there was a volume rename? The volume name no longer exists but the
348 * volume id might. Try to refresh the volume location information based one
349 * of the readwrite or readonly volume id.
351 if (code == CM_ERROR_NOSUCHVOLUME) {
352 if (volp->vol[RWVOL].ID != 0) {
353 code = cm_GetEntryByID(cellp, volp->vol[RWVOL].ID, &vldbEntry, &nvldbEntry,
355 &method, userp, reqp);
356 } else if (volp->vol[ROVOL].ID != 0) {
357 code = cm_GetEntryByID(cellp, volp->vol[ROVOL].ID, &vldbEntry, &nvldbEntry,
359 &method, userp, reqp);
362 lock_ObtainWrite(&volp->rw);
371 afs_int32 serverNumber[NMAXNSERVERS];
372 afs_int32 serverFlags[NMAXNSERVERS];
373 afsUUID serverUUID[NMAXNSERVERS];
374 afs_int32 rwServers_alldown = 1;
375 afs_int32 roServers_alldown = 1;
376 afs_int32 bkServers_alldown = 1;
377 char name[VL_MAXNAMELEN];
379 #ifdef AFS_FREELANCE_CLIENT
381 rwServers_alldown = 0;
384 /* clear out old bindings */
385 for ( volType = RWVOL; volType < NUM_VOL_TYPES; volType++) {
386 if (volp->vol[volType].serversp)
387 cm_FreeServerList(&volp->vol[volType].serversp, CM_FREESERVERLIST_DELETE);
390 memset(serverUUID, 0, sizeof(serverUUID));
/* reply came back as a vldbentry: copy ids, server flags and addresses as they are */
394 flags = vldbEntry.flags;
395 nServers = vldbEntry.nServers;
396 rwID = vldbEntry.volumeId[0];
397 roID = vldbEntry.volumeId[1];
398 bkID = vldbEntry.volumeId[2];
399 for ( i=0; i<nServers; i++ ) {
400 serverFlags[i] = vldbEntry.serverFlags[i];
401 serverNumber[i] = vldbEntry.serverNumber[i];
403 strncpy(name, vldbEntry.name, VL_MAXNAMELEN);
404 name[VL_MAXNAMELEN - 1] = '\0';
/* reply came back as an nvldbentry: same unpacking as above */
407 flags = nvldbEntry.flags;
408 nServers = nvldbEntry.nServers;
409 rwID = nvldbEntry.volumeId[0];
410 roID = nvldbEntry.volumeId[1];
411 bkID = nvldbEntry.volumeId[2];
412 for ( i=0; i<nServers; i++ ) {
413 serverFlags[i] = nvldbEntry.serverFlags[i];
414 serverNumber[i] = nvldbEntry.serverNumber[i];
416 strncpy(name, nvldbEntry.name, VL_MAXNAMELEN);
417 name[VL_MAXNAMELEN - 1] = '\0';
/*
 * reply came back as a uvldbentry: entries without VLSF_UUID carry an
 * address directly; entries with VLSF_UUID are expanded into their
 * addresses with VL_GetAddrsU.  j counts the slots filled.
 */
420 flags = uvldbEntry.flags;
421 nServers = uvldbEntry.nServers;
422 rwID = uvldbEntry.volumeId[0];
423 roID = uvldbEntry.volumeId[1];
424 bkID = uvldbEntry.volumeId[2];
425 for ( i=0, j=0; code == 0 && i<nServers && j<NMAXNSERVERS; i++ ) {
426 if ( !(uvldbEntry.serverFlags[i] & VLSF_UUID) ) {
427 serverFlags[j] = uvldbEntry.serverFlags[i];
428 serverNumber[j] = uvldbEntry.serverNumber[i].time_low;
431 afs_uint32 * addrp, nentries, code, unique;
433 ListAddrByAttributes attrs;
436 memset(&attrs, 0, sizeof(attrs));
437 attrs.Mask = VLADDR_UUID;
438 attrs.uuid = uvldbEntry.serverNumber[i];
439 memset(&uuid, 0, sizeof(uuid));
440 memset(&addrs, 0, sizeof(addrs));
443 code = cm_ConnByMServers(cellp->vlServersp, FALSE, userp, reqp, &connp);
447 rxconnp = cm_GetRxConn(connp);
448 code = VL_GetAddrsU(rxconnp, &attrs, &uuid, &unique, &nentries, &addrs);
449 rx_PutConnection(rxconnp);
450 } while (cm_Analyze(connp, userp, reqp, NULL, cellp, 0, NULL, NULL, &cellp->vlServersp, NULL, code));
453 code = cm_MapVLRPCError(code, reqp);
454 osi_Log2(afsd_logp, "CALL VL_GetAddrsU serverNumber %u FAILURE, code 0x%x",
458 osi_Log1(afsd_logp, "CALL VL_GetAddrsU serverNumber %u SUCCESS", i);
460 addrp = addrs.bulkaddrs_val;
/* one slot per returned address; j stays bounded by NMAXNSERVERS */
461 for (k = 0; k < nentries && j < NMAXNSERVERS; j++, k++) {
462 serverFlags[j] = uvldbEntry.serverFlags[i];
463 serverNumber[j] = addrp[k];
464 serverUUID[j] = uuid;
467 xdr_free((xdrproc_t) xdr_bulkaddrs, &addrs);
470 code = CM_ERROR_INVAL;
473 nServers = j; /* update the server count */
474 strncpy(name, uvldbEntry.name, VL_MAXNAMELEN);
475 name[VL_MAXNAMELEN - 1] = '\0';
479 /* decode the response */
480 lock_ObtainWrite(&cm_volumeLock);
481 if (!cm_VolNameIsID(volp->namep)) {
/* strip a trailing ".backup" or ".readonly" so that the base name is what gets stored */
486 if (len >= 8 && strcmp(name + len - 7, ".backup") == 0) {
487 name[len - 7] = '\0';
488 } else if (len >= 10 && strcmp(name + len - 9, ".readonly") == 0) {
489 name[len - 9] = '\0';
492 osi_Log2(afsd_logp, "cm_UpdateVolume name %s -> %s",
493 osi_LogSaveString(afsd_logp,volp->namep), osi_LogSaveString(afsd_logp,name));
495 if (volp->qflags & CM_VOLUME_QFLAG_IN_HASH)
496 cm_RemoveVolumeFromNameHashTable(volp);
498 strcpy(volp->namep, name);
500 cm_AddVolumeToNameHashTable(volp);
503 if (flags & VLF_DFSFILESET) {
504 _InterlockedOr(&volp->flags, CM_VOLUMEFLAG_DFS_VOLUME);
505 osi_Log1(afsd_logp, "cm_UpdateVolume Volume Group '%s' is a DFS File Set. Correct behavior is not implemented.",
506 osi_LogSaveString(afsd_logp, volp->namep));
509 if (flags & VLF_RWEXISTS) {
510 if (volp->vol[RWVOL].ID != rwID) {
511 if (volp->vol[RWVOL].qflags & CM_VOLUME_QFLAG_IN_HASH)
512 cm_RemoveVolumeFromIDHashTable(volp, RWVOL);
513 volp->vol[RWVOL].ID = rwID;
514 cm_AddVolumeToIDHashTable(volp, RWVOL);
517 if (volp->vol[RWVOL].qflags & CM_VOLUME_QFLAG_IN_HASH)
518 cm_RemoveVolumeFromIDHashTable(volp, RWVOL);
519 volp->vol[RWVOL].ID = 0;
521 if (flags & VLF_ROEXISTS) {
522 if (volp->vol[ROVOL].ID != roID) {
523 if (volp->vol[ROVOL].qflags & CM_VOLUME_QFLAG_IN_HASH)
524 cm_RemoveVolumeFromIDHashTable(volp, ROVOL);
525 volp->vol[ROVOL].ID = roID;
526 cm_AddVolumeToIDHashTable(volp, ROVOL);
529 if (volp->vol[ROVOL].qflags & CM_VOLUME_QFLAG_IN_HASH)
530 cm_RemoveVolumeFromIDHashTable(volp, ROVOL);
531 volp->vol[ROVOL].ID = 0;
533 if (flags & VLF_BACKEXISTS) {
534 if (volp->vol[BACKVOL].ID != bkID) {
535 if (volp->vol[BACKVOL].qflags & CM_VOLUME_QFLAG_IN_HASH)
536 cm_RemoveVolumeFromIDHashTable(volp, BACKVOL);
537 volp->vol[BACKVOL].ID = bkID;
538 cm_AddVolumeToIDHashTable(volp, BACKVOL);
541 if (volp->vol[BACKVOL].qflags & CM_VOLUME_QFLAG_IN_HASH)
542 cm_RemoveVolumeFromIDHashTable(volp, BACKVOL);
543 volp->vol[BACKVOL].ID = 0;
545 lock_ReleaseWrite(&cm_volumeLock);
547 /* See if the replica sites are mixed versions */
548 for (i=0; i<nServers; i++) {
549 if (serverFlags[i] & VLSF_NEWREPSITE) {
555 for (i=0; i<nServers; i++) {
556 /* create a server entry */
557 tflags = serverFlags[i];
558 if (tflags & VLSF_DONTUSE)
/* build the socket address of the file server: port 7000, address in network byte order */
560 tsockAddr.sin_port = htons(7000);
561 tsockAddr.sin_family = AF_INET;
562 tempAddr = htonl(serverNumber[i]);
563 tsockAddr.sin_addr.s_addr = tempAddr;
564 tsp = cm_FindServer(&tsockAddr, CM_SERVER_FILE, FALSE);
565 if (tsp && (method == 2) && (tsp->flags & CM_SERVERFLAG_UUID)) {
567 * Check to see if the uuid of the server we know at this address
568 * matches the uuid of the server we are being told about by the
569 * vlserver. If not, ...?
571 if (!afs_uuid_equal(&serverUUID[i], &tsp->uuid)) {
572 char uuid1[128], uuid2[128];
575 afsUUID_to_string(&serverUUID[i], uuid1, sizeof(uuid1));
576 afsUUID_to_string(&tsp->uuid, uuid2, sizeof(uuid2));
577 afs_inet_ntoa_r(serverNumber[i], hoststr);
579 osi_Log3(afsd_logp, "cm_UpdateVolumeLocation UUIDs do not match! %s != %s (%s)",
580 osi_LogSaveString(afsd_logp, uuid1),
581 osi_LogSaveString(afsd_logp, uuid2),
582 osi_LogSaveString(afsd_logp, hoststr));
587 * cm_NewServer will probe the file server which in turn will
588 * update the state on the volume group object. Do not probe
589 * in this thread. It will block the thread and can result in
590 * a recursive call to cm_UpdateVolumeLocation().
592 lock_ReleaseWrite(&volp->rw);
593 tsp = cm_NewServer(&tsockAddr, CM_SERVER_FILE, cellp, &serverUUID[i], CM_FLAG_NOPROBE);
594 lock_ObtainWrite(&volp->rw);
596 osi_assertx(tsp != NULL, "null cm_server_t");
599 * if this server was created by fs setserverprefs
600 * then it won't have either a cell assignment or
605 if ( (method == 2) && !(tsp->flags & CM_SERVERFLAG_UUID) &&
606 !afs_uuid_is_nil(&serverUUID[i])) {
607 tsp->uuid = serverUUID[i];
608 _InterlockedOr(&tsp->flags, CM_SERVERFLAG_UUID);
611 /* and add it to the list(s). */
613 * Each call to cm_NewServerRef() increments the
614 * ref count of tsp. These reference will be dropped,
615 * if and when the volume is reset; see reset code
616 * earlier in this function.
618 if ((tflags & VLSF_RWVOL) && (flags & VLF_RWEXISTS)) {
619 tsrp = cm_NewServerRef(tsp, rwID);
620 cm_InsertServerList(&volp->vol[RWVOL].serversp, tsrp);
621 if (!(tsp->flags & CM_SERVERFLAG_DOWN))
622 rwServers_alldown = 0;
625 * If there are mixed versions of RO releases on the replica
626 * sites, skip the servers with the out of date versions.
628 if ((tflags & VLSF_ROVOL) && (flags & VLF_ROEXISTS) &&
629 (!isMixed || (tflags & VLSF_NEWREPSITE))) {
630 tsrp = cm_NewServerRef(tsp, roID);
631 cm_InsertServerList(&volp->vol[ROVOL].serversp, tsrp);
634 if (!(tsp->flags & CM_SERVERFLAG_DOWN))
635 roServers_alldown = 0;
637 /* We don't use VLSF_BACKVOL !?! */
638 /* Because only the backup on the server holding the RW
639 * volume can be valid. This check prevents errors if a
640 * RW is moved but the old backup is not removed.
642 if ((tflags & VLSF_RWVOL) && (flags & VLF_BACKEXISTS)) {
643 tsrp = cm_NewServerRef(tsp, bkID);
644 cm_InsertServerList(&volp->vol[BACKVOL].serversp, tsrp);
646 if (!(tsp->flags & CM_SERVERFLAG_DOWN))
647 bkServers_alldown = 0;
649 /* Drop the reference obtained by cm_FindServer() */
656 * If the first n servers have the same rank, then we
657 * randomly pick one among them and move it to the beginning.
658 * We don't bother to re-order the whole list because
659 * the rest of the list is used only if the first server is
660 * down. We only do this for the RO list; we assume the other
661 * lists are length 1.
664 cm_RandomizeServer(&volp->vol[ROVOL].serversp);
665 _InterlockedOr(&volp->vol[ROVOL].flags, CM_VOL_STATE_FLAG_REPLICATED);
668 _InterlockedAnd(&volp->vol[ROVOL].flags, ~CM_VOL_STATE_FLAG_REPLICATED);
/* a volume type counts as online as soon as one of its servers is not marked down */
671 rwNewstate = rwServers_alldown ? vl_alldown : vl_online;
672 roNewstate = roServers_alldown ? vl_alldown : vl_online;
673 bkNewstate = bkServers_alldown ? vl_alldown : vl_online;
675 _InterlockedAnd(&volp->flags, ~CM_VOLUMEFLAG_NOEXIST);
676 } else if (code == CM_ERROR_NOSUCHVOLUME || code == VL_NOENT || code == VL_BADNAME) {
677 _InterlockedOr(&volp->flags, CM_VOLUMEFLAG_NOEXIST);
679 rwNewstate = roNewstate = bkNewstate = vl_alldown;
682 * we are updating lastUpdateTime but didn't get an answer
683 * so clear the no exist flag.
685 _InterlockedAnd(&volp->flags, ~CM_VOLUMEFLAG_NOEXIST);
688 if (volp->vol[RWVOL].state != rwNewstate) {
689 if (volp->vol[RWVOL].ID)
690 cm_VolumeStatusNotification(volp, volp->vol[RWVOL].ID, volp->vol[RWVOL].state, rwNewstate);
691 volp->vol[RWVOL].state = rwNewstate;
693 if (volp->vol[ROVOL].state != roNewstate) {
694 if (volp->vol[ROVOL].ID)
695 cm_VolumeStatusNotification(volp, volp->vol[ROVOL].ID, volp->vol[ROVOL].state, roNewstate);
696 volp->vol[ROVOL].state = roNewstate;
698 if (volp->vol[BACKVOL].state != bkNewstate) {
699 if (volp->vol[BACKVOL].ID)
700 cm_VolumeStatusNotification(volp, volp->vol[BACKVOL].ID, volp->vol[BACKVOL].state, bkNewstate);
701 volp->vol[BACKVOL].state = bkNewstate;
704 volp->lastUpdateTime = time(NULL);
706 _InterlockedOr(&volp->flags, CM_VOLUMEFLAG_RO_MIXED);
708 _InterlockedAnd(&volp->flags, ~CM_VOLUMEFLAG_RO_MIXED);
711 _InterlockedAnd(&volp->flags, ~CM_VOLUMEFLAG_RESET);
/* update finished: drop the in-progress marker and wake every thread sleeping on volp->flags */
713 _InterlockedAnd(&volp->flags, ~CM_VOLUMEFLAG_UPDATING_VL);
714 osi_Log4(afsd_logp, "cm_UpdateVolumeLocation done, waking others name %s:%s flags 0x%x code 0x%x",
715 osi_LogSaveString(afsd_logp,volp->cellp->name),
716 osi_LogSaveString(afsd_logp,volp->namep), volp->flags, code);
717 osi_Wakeup((LONG_PTR) &volp->flags);
/*
 * Take a reference on volp by incrementing volp->refCount with
 * InterlockedIncrement().  cm_PutVolume() performs the matching decrement.
 */
722 /* Requires read or write lock on cm_volumeLock */
723 void cm_GetVolume(cm_volume_t *volp)
725 InterlockedIncrement(&volp->refCount);
/*
 * Look up the volume object that owns the file id fidp.
 *
 * With cm_volumeLock held for reading, the RO, RW and BK id hash tables
 * are searched in that order for an entry whose cell id equals fidp->cell
 * and whose id of the corresponding type equals fidp->volume.
 * NOTE(review): per the in-body comment a volume that is found is held
 * before the lock is released, and is presumably what gets returned to the
 * caller - confirm.
 */
728 cm_volume_t *cm_GetVolumeByFID(cm_fid_t *fidp)
733 lock_ObtainRead(&cm_volumeLock);
/* the three id hash tables are all indexed by the same hash of the volume id */
734 hash = CM_VOLUME_ID_HASH(fidp->volume);
735 /* The volumeID can be any one of the three types. So we must
736 * search the hash table for all three types until we find it.
737 * We will search in the order of RO, RW, BK.
739 for ( volp = cm_data.volumeROIDHashTablep[hash]; volp; volp = volp->vol[ROVOL].nextp) {
740 if ( fidp->cell == volp->cellp->cellID && fidp->volume == volp->vol[ROVOL].ID )
745 for ( volp = cm_data.volumeRWIDHashTablep[hash]; volp; volp = volp->vol[RWVOL].nextp) {
746 if ( fidp->cell == volp->cellp->cellID && fidp->volume == volp->vol[RWVOL].ID )
752 for ( volp = cm_data.volumeBKIDHashTablep[hash]; volp; volp = volp->vol[BACKVOL].nextp) {
753 if ( fidp->cell == volp->cellp->cellID && fidp->volume == volp->vol[BACKVOL].ID )
758 /* hold the volume if we found it */
762 lock_ReleaseRead(&cm_volumeLock);
/*
 * Find the volume object for volumeID in cellp.
 *
 * cellp     - cell to search.
 * volumeID  - may be the RW, RO or backup id of the volume.
 * userp,
 * reqp      - passed through to the VLDB lookup routines.
 * flags     - CM_GETVOL_FLAG_* bits; the ones tested here are
 *             CM_GETVOL_FLAG_NO_RESET, CM_GETVOL_FLAG_NO_LRU_UPDATE and
 *             CM_GETVOL_FLAG_IGNORE_LINKED_CELL.
 * outVolpp  - NOTE(review): presumably receives the volume that was found;
 *             the assignment is not shown here - confirm.
 *
 * The id hash tables are searched under a read lock on cm_volumeLock.  A
 * cached volume flagged CM_VOLUMEFLAG_RESET is refreshed through
 * cm_UpdateVolumeLocation() unless CM_GETVOL_FLAG_NO_RESET is given.  When
 * nothing is cached the id is formatted as a decimal string and handed to
 * cm_FindVolumeByName().  If that yields CM_ERROR_NOSUCHVOLUME and the cell
 * has a linked cell, the lookup is repeated once in the linked cell.
 */
766 long cm_FindVolumeByID(cm_cell_t *cellp, afs_uint32 volumeID, cm_user_t *userp,
767 cm_req_t *reqp, afs_uint32 flags, cm_volume_t **outVolpp)
770 #ifdef SEARCH_ALL_VOLUMES
773 char volNameString[VL_MAXNAMELEN];
777 lock_ObtainRead(&cm_volumeLock);
778 #ifdef SEARCH_ALL_VOLUMES
779 for(volp = cm_data.allVolumesp; volp; volp=volp->allNextp) {
780 if (cellp == volp->cellp &&
781 ((unsigned) volumeID == volp->vol[RWVOL].ID ||
782 (unsigned) volumeID == volp->vol[ROVOL].ID ||
783 (unsigned) volumeID == volp->vol[BACKVOL].ID))
788 #endif /* SEARCH_ALL_VOLUMES */
790 hash = CM_VOLUME_ID_HASH(volumeID);
791 /* The volumeID can be any one of the three types. So we must
792 * search the hash table for all three types until we find it.
793 * We will search in the order of RO, RW, BK.
795 for ( volp = cm_data.volumeROIDHashTablep[hash]; volp; volp = volp->vol[ROVOL].nextp) {
796 if ( cellp == volp->cellp && volumeID == volp->vol[ROVOL].ID )
801 for ( volp = cm_data.volumeRWIDHashTablep[hash]; volp; volp = volp->vol[RWVOL].nextp) {
802 if ( cellp == volp->cellp && volumeID == volp->vol[RWVOL].ID )
808 for ( volp = cm_data.volumeBKIDHashTablep[hash]; volp; volp = volp->vol[BACKVOL].nextp) {
809 if ( cellp == volp->cellp && volumeID == volp->vol[BACKVOL].ID )
814 #ifdef SEARCH_ALL_VOLUMES
815 osi_assertx(volp == volp2, "unexpected cm_vol_t");
818 /* hold the volume if we found it */
822 lock_ReleaseRead(&cm_volumeLock);
826 lock_ObtainWrite(&volp->rw);
/* refresh the location data first when the volume is flagged for reset, unless the caller opted out */
829 if ((volp->flags & CM_VOLUMEFLAG_RESET) && !(flags & CM_GETVOL_FLAG_NO_RESET)) {
830 code = cm_UpdateVolumeLocation(cellp, userp, reqp, volp);
832 lock_ReleaseWrite(&volp->rw);
/* the LRU position is adjusted unless the caller asked for it to be left alone */
836 if (!(flags & CM_GETVOL_FLAG_NO_LRU_UPDATE)) {
837 lock_ObtainWrite(&cm_volumeLock);
838 cm_AdjustVolumeLRU(volp);
839 lock_ReleaseWrite(&cm_volumeLock);
842 lock_ObtainRead(&cm_volumeLock);
844 lock_ReleaseRead(&cm_volumeLock);
849 /* otherwise, we didn't find it so consult the VLDB */
850 sprintf(volNameString, "%u", volumeID);
851 code = cm_FindVolumeByName(cellp, volNameString, userp, reqp,
852 flags | CM_GETVOL_FLAG_IGNORE_LINKED_CELL, outVolpp);
/*
 * not known in this cell: retry once in the linked cell, if one is
 * configured; the recursive call sets IGNORE_LINKED_CELL so it cannot
 * chain any further
 */
854 if (code == CM_ERROR_NOSUCHVOLUME && cellp->linkedName[0] &&
855 !(flags & CM_GETVOL_FLAG_IGNORE_LINKED_CELL)) {
856 cm_cell_t *linkedCellp = cm_GetCell(cellp->linkedName, flags);
859 code = cm_FindVolumeByID(linkedCellp, volumeID, userp, reqp,
860 flags | CM_GETVOL_FLAG_IGNORE_LINKED_CELL,
/*
 * Find the volume object named volumeNamep in cellp, optionally creating
 * it.
 *
 * cellp        - cell to search.
 * volumeNamep  - volume name; a trailing ".backup" or ".readonly" is
 *                stripped before the lookup.
 * userp, reqp  - passed through to cm_UpdateVolumeLocation().
 * flags        - CM_GETVOL_FLAG_* bits; the ones tested here are
 *                CM_GETVOL_FLAG_CREATE, CM_GETVOL_FLAG_NO_RESET,
 *                CM_GETVOL_FLAG_NO_LRU_UPDATE and
 *                CM_GETVOL_FLAG_IGNORE_LINKED_CELL.
 * outVolpp     - NOTE(review): presumably receives the volume on success;
 *                the assignment is not shown here - confirm.
 *
 * The name hash table is searched under a read lock on cm_volumeLock.  On
 * a miss with CM_GETVOL_FLAG_CREATE the lock is converted to a write lock
 * and the search is repeated.  If still missing, a volume object is
 * obtained either by recycling one whose refCount is zero (when
 * cm_data.currentVolumes has reached cm_data.maxVolumes) or by taking the
 * next slot of cm_data.volumeBaseAddress; it is then initialized, flagged
 * CM_VOLUMEFLAG_RESET and entered into the name hash table.  On a miss
 * without the create flag CM_ERROR_NOSUCHVOLUME is returned.
 *
 * A volume flagged CM_VOLUMEFLAG_RESET is refreshed through
 * cm_UpdateVolumeLocation() unless CM_GETVOL_FLAG_NO_RESET is given.  A
 * request for the backup or read-only type of a volume that has no such id
 * yields CM_ERROR_NOSUCHVOLUME.  If the final code is
 * CM_ERROR_NOSUCHVOLUME and the cell has a linked cell, the lookup is
 * repeated once in the linked cell.
 */
867 long cm_FindVolumeByName(struct cm_cell *cellp, char *volumeNamep,
868 struct cm_user *userp, struct cm_req *reqp,
869 afs_uint32 flags, cm_volume_t **outVolpp)
872 #ifdef SEARCH_ALL_VOLUMES
876 char name[VL_MAXNAMELEN];
/* work on a private copy of the requested name that is always NUL-terminated */
881 strncpy(name, volumeNamep, VL_MAXNAMELEN);
882 name[VL_MAXNAMELEN-1] = '\0';
/*
 * a ".backup" or ".readonly" suffix is cut off so that the base name is
 * looked up.  NOTE(review): the suffix presumably also selects the type
 * that is tested further down - confirm.
 */
885 if (len >= 8 && strcmp(name + len - 7, ".backup") == 0) {
887 name[len - 7] = '\0';
888 } else if (len >= 10 && strcmp(name + len - 9, ".readonly") == 0) {
890 name[len - 9] = '\0';
895 lock_ObtainRead(&cm_volumeLock);
896 #ifdef SEARCH_ALL_VOLUMES
897 for (volp = cm_data.allVolumesp; volp; volp=volp->allNextp) {
898 if (cellp == volp->cellp && strcmp(name, volp->namep) == 0) {
903 #endif /* SEARCH_ALL_VOLUMES */
905 hash = CM_VOLUME_NAME_HASH(name);
906 for (volp = cm_data.volumeNameHashTablep[hash]; volp; volp = volp->nameNextp) {
907 if (cellp == volp->cellp && strcmp(name, volp->namep) == 0)
911 #ifdef SEARCH_ALL_VOLUMES
912 osi_assertx(volp2 == volp, "unexpected cm_vol_t");
915 if (!volp && (flags & CM_GETVOL_FLAG_CREATE)) {
917 /* otherwise, get from VLDB */
920 * Change to a write lock so that we have exclusive use of
921 * the first cm_volume_t with a refCount of 0 so that we
922 * have time to increment it.
924 lock_ConvertRToW(&cm_volumeLock);
927 * While the lock was converted it may have been dropped
928 * Search again now that we are exclusive.
930 for (volp = cm_data.volumeNameHashTablep[hash]; volp; volp = volp->nameNextp) {
931 if (cellp == volp->cellp && strcmp(name, volp->namep) == 0)
937 lock_ReleaseWrite(&cm_volumeLock);
938 lock_ObtainWrite(&volp->rw);
/* every slot is in use: an object that nobody references has to be recycled */
940 if ( cm_data.currentVolumes >= cm_data.maxVolumes ) {
941 #ifdef RECYCLE_FROM_ALL_VOLUMES_LIST
942 for (volp = cm_data.allVolumesp; volp; volp=volp->allNextp) {
943 if ( volp->refCount == 0 ) {
944 /* There is one we can re-use */
949 for ( volp = cm_data.volumeLRULastp;
951 volp = (cm_volume_t *) osi_QPrev(&volp->q))
953 if ( volp->refCount == 0 ) {
954 /* There is one we can re-use */
960 osi_panic("Exceeded Max Volumes", __FILE__, __LINE__);
962 osi_Log2(afsd_logp, "Recycling Volume %s:%s",
963 volp->cellp->name, volp->namep);
965 /* The volp is removed from the LRU queue in order to
966 * prevent two threads from attempting to recycle the
967 * same object. This volp must be re-inserted back into
968 * the LRU queue before this function exits.
970 if (volp->qflags & CM_VOLUME_QFLAG_IN_LRU_QUEUE)
971 cm_RemoveVolumeFromLRU(volp);
972 if (volp->qflags & CM_VOLUME_QFLAG_IN_HASH)
973 cm_RemoveVolumeFromNameHashTable(volp);
975 for ( volType = RWVOL; volType < NUM_VOL_TYPES; volType++) {
976 if (volp->vol[volType].qflags & CM_VOLUME_QFLAG_IN_HASH)
977 cm_RemoveVolumeFromIDHashTable(volp, volType);
978 if (volp->vol[volType].ID)
979 cm_VolumeStatusNotification(volp, volp->vol[volType].ID, volp->vol[volType].state, vl_unknown);
980 volp->vol[volType].ID = 0;
981 cm_SetFid(&volp->vol[volType].dotdotFid, 0, 0, 0, 0);
984 volp = &cm_data.volumeBaseAddress[InterlockedIncrement(&cm_data.currentVolumes) - 1];
985 memset(volp, 0, sizeof(cm_volume_t));
986 volp->magic = CM_VOLUME_MAGIC;
987 volp->allNextp = cm_data.allVolumesp;
988 cm_data.allVolumesp = volp;
989 lock_InitializeRWLock(&volp->rw, "cm_volume_t rwlock", LOCK_HIERARCHY_VOLUME);
992 * no one else can find this object and we have not dropped
993 * cm_volumeLock in any case. The object is either new or
994 * recycled. Initialize its new values and put it into the
995 * name hash table before dropping cm_volumeLock which makes
996 * it visible to competing threads.
999 strncpy(volp->namep, name, VL_MAXNAMELEN);
1000 volp->namep[VL_MAXNAMELEN-1] = '\0';
1001 volp->flags = CM_VOLUMEFLAG_RESET;
1002 volp->lastUpdateTime = 0;
1004 for ( volType = RWVOL; volType < NUM_VOL_TYPES; volType++) {
1005 volp->vol[volType].state = vl_unknown;
1006 volp->vol[volType].nextp = NULL;
1007 volp->vol[volType].flags = 0;
1009 volp->cbExpiresRO = 0;
1010 volp->cbIssuedRO = 0;
1011 volp->cbServerpRO = NULL;
1012 volp->creationDateRO = 0;
1013 cm_AddVolumeToNameHashTable(volp);
1015 lock_ReleaseWrite(&cm_volumeLock);
1016 lock_ObtainWrite(&volp->rw);
1017 for ( volType = RWVOL; volType < NUM_VOL_TYPES; volType++) {
1018 cm_FreeServerList(&volp->vol[volType].serversp, CM_FREESERVERLIST_DELETE);
1024 lock_ReleaseRead(&cm_volumeLock);
1025 lock_ObtainWrite(&volp->rw);
1027 lock_ReleaseRead(&cm_volumeLock);
1028 return CM_ERROR_NOSUCHVOLUME;
1031 /* if we get here we are holding the mutex */
1032 if ((volp->flags & CM_VOLUMEFLAG_RESET) && !(flags & CM_GETVOL_FLAG_NO_RESET)) {
1033 code = cm_UpdateVolumeLocation(cellp, userp, reqp, volp);
1035 lock_ReleaseWrite(&volp->rw);
1037 if (code == 0 && (type == BACKVOL && volp->vol[BACKVOL].ID == 0 ||
1038 type == ROVOL && volp->vol[ROVOL].ID == 0))
1039 code = CM_ERROR_NOSUCHVOLUME;
1044 lock_ObtainWrite(&cm_volumeLock);
/*
 * NOTE(review): cm_FindVolumeByID adjusts the LRU when
 * CM_GETVOL_FLAG_NO_LRU_UPDATE is NOT set, whereas here (and in the
 * failure path below) the flag being set triggers the adjustment -
 * confirm which behavior is intended.
 */
1045 if (!(volp->qflags & CM_VOLUME_QFLAG_IN_LRU_QUEUE) ||
1046 (flags & CM_GETVOL_FLAG_NO_LRU_UPDATE))
1047 cm_AdjustVolumeLRU(volp);
1048 lock_ReleaseWrite(&cm_volumeLock);
1051 * do not return it to the caller but do insert it in the LRU
1052 * otherwise it will be lost
1054 lock_ObtainWrite(&cm_volumeLock);
1055 if (!(volp->qflags & CM_VOLUME_QFLAG_IN_LRU_QUEUE) ||
1056 (flags & CM_GETVOL_FLAG_NO_LRU_UPDATE))
1057 cm_AdjustVolumeLRU(volp);
1059 lock_ReleaseWrite(&cm_volumeLock);
/*
 * not known in this cell: retry once in the linked cell, if one is
 * configured; the recursive call sets IGNORE_LINKED_CELL so it cannot
 * chain any further
 */
1062 if (code == CM_ERROR_NOSUCHVOLUME && cellp->linkedName[0] &&
1063 !(flags & CM_GETVOL_FLAG_IGNORE_LINKED_CELL)) {
1064 cm_cell_t *linkedCellp = cm_GetCell(cellp->linkedName, flags);
1067 code = cm_FindVolumeByName(linkedCellp, volumeNamep, userp, reqp,
1068 flags | CM_GETVOL_FLAG_IGNORE_LINKED_CELL,
1075 * Only call this function in response to a VNOVOL or VMOVED error
1076 * from a file server. Do not call it in response to CM_ERROR_NOSUCHVOLUME
1077 * as that can lead to recursive calls.
/*
 * Force a fresh VLDB lookup for the volume that owns fidp.
 *
 * fidp         - file id; fidp->cell selects the cell and fidp->volume the
 *                volume (RW, RO or backup id).
 * userp, reqp  - passed through to cm_UpdateVolumeLocation().
 *
 * Returns CM_ERROR_INVAL, CM_ERROR_NOSUCHCELL (cm_FindCellByID() found no
 * cell) or CM_ERROR_NOSUCHVOLUME on the early-exit paths shown below.
 * NOTE(review): otherwise the result of cm_UpdateVolumeLocation() is
 * presumably returned - confirm.
 *
 * The volume is located through the id hash tables under a read lock on
 * cm_volumeLock, then flagged CM_VOLUMEFLAG_RESET and updated with
 * volp->rw held for writing.
 */
1079 long cm_ForceUpdateVolume(cm_fid_t *fidp, cm_user_t *userp, cm_req_t *reqp)
1083 #ifdef SEARCH_ALL_VOLUMES
1090 return CM_ERROR_INVAL;
1092 cellp = cm_FindCellByID(fidp->cell, 0);
1094 return CM_ERROR_NOSUCHCELL;
1096 /* search for the volume */
1097 lock_ObtainRead(&cm_volumeLock);
1098 #ifdef SEARCH_ALL_VOLUMES
1099 for(volp = cm_data.allVolumesp; volp; volp=volp->allNextp) {
1100 if (cellp == volp->cellp &&
1101 (fidp->volume == volp->vol[RWVOL].ID ||
1102 fidp->volume == volp->vol[ROVOL].ID ||
1103 fidp->volume == volp->vol[BACKVOL].ID))
1106 #endif /* SEARCH_ALL_VOLUMES */
1108 hash = CM_VOLUME_ID_HASH(fidp->volume);
1109 /* The volumeID can be any one of the three types. So we must
1110 * search the hash table for all three types until we find it.
1111 * We will search in the order of RO, RW, BK.
1113 for ( volp = cm_data.volumeROIDHashTablep[hash]; volp; volp = volp->vol[ROVOL].nextp) {
1114 if ( cellp == volp->cellp && fidp->volume == volp->vol[ROVOL].ID )
1118 /* try RW volumes */
1119 for ( volp = cm_data.volumeRWIDHashTablep[hash]; volp; volp = volp->vol[RWVOL].nextp) {
1120 if ( cellp == volp->cellp && fidp->volume == volp->vol[RWVOL].ID )
1125 /* try BK volumes */
1126 for ( volp = cm_data.volumeBKIDHashTablep[hash]; volp; volp = volp->vol[BACKVOL].nextp) {
1127 if ( cellp == volp->cellp && fidp->volume == volp->vol[BACKVOL].ID )
1132 #ifdef SEARCH_ALL_VOLUMES
1133 osi_assertx(volp == volp2, "unexpected cm_vol_t");
1135 /* hold the volume if we found it */
1139 lock_ReleaseRead(&cm_volumeLock);
1142 return CM_ERROR_NOSUCHVOLUME;
/* NOTE(review): stamping mountRootGen with the current time presumably forces mount point targets to be re-evaluated - confirm */
1145 cm_data.mountRootGen = time(NULL);
1146 lock_ObtainWrite(&volp->rw);
/*
 * flag the volume for reset and zero lastUpdateTime so that neither the
 * 600-second NOEXIST short cut nor the 60-second back-off in
 * cm_UpdateVolumeLocation() applies to this forced update
 */
1147 _InterlockedOr(&volp->flags, CM_VOLUMEFLAG_RESET);
1148 volp->lastUpdateTime = 0;
1150 code = cm_UpdateVolumeLocation(cellp, userp, reqp, volp);
1151 lock_ReleaseWrite(&volp->rw);
1153 lock_ObtainRead(&cm_volumeLock);
1155 lock_ReleaseRead(&cm_volumeLock);
1160 /* find the appropriate servers from a volume */
/*
 * cm_GetVolServers
 *
 * Hand back the server reference list belonging to the volume state of volp
 * that matches volid (looked up with cm_VolumeStateByID()).
 *
 * Under a write lock on cm_serverLock the function stores the state's
 * CM_VOL_STATE_FLAG_REPLICATED bit into *replicated, takes the address of the
 * state's serversp list head, and calls cm_GetServerRef(current, TRUE) on
 * every entry of that list - deleted entries included, as the comment
 * before the loop states.
 *
 * The visible code also contains a path that releases cm_serverLock, marks the
 * volume CM_VOLUMEFLAG_RESET with lastUpdateTime = 0 and calls
 * cm_UpdateVolumeLocation() under the volume's rw write lock.
 * NOTE(review): presumably this is the "no matching state" case followed by a
 * second lookup; the controlling conditions are not visible - confirm.
 */
1161 cm_serverRef_t **cm_GetVolServers(cm_volume_t *volp, afs_uint32 volid, cm_user_t *userp, cm_req_t *reqp, afs_uint32 *replicated)
1163 cm_serverRef_t **serverspp;
1164 cm_serverRef_t *current;
1166 cm_vol_state_t *volstatep = NULL;
1169 volstatep = cm_VolumeStateByID(volp, volid);
1171 lock_ObtainWrite(&cm_serverLock);
1174 *replicated = (volstatep->flags & CM_VOL_STATE_FLAG_REPLICATED);
1175 serverspp = &volstatep->serversp;
1177 lock_ReleaseWrite(&cm_serverLock);
1181 lock_ObtainWrite(&volp->rw);
1182 _InterlockedOr(&volp->flags, CM_VOLUMEFLAG_RESET);
1183 volp->lastUpdateTime = 0;
1184 code = cm_UpdateVolumeLocation(volp->cellp, userp, reqp, volp);
1185 lock_ReleaseWrite(&volp->rw);
1193 * Increment the refCount on deleted items as well.
1194 * They will be freed by cm_FreeServerList when they get to zero
1196 for (current = *serverspp; current; current = current->next)
1197 cm_GetServerRef(current, TRUE);
1199 lock_ReleaseWrite(&cm_serverLock);
/*
 * cm_PutVolume
 *
 * Drop one reference on volp.  The count is decremented atomically with
 * InterlockedDecrement() and the function asserts that the resulting value
 * did not go below zero.
 */
1204 void cm_PutVolume(cm_volume_t *volp)
1206 afs_int32 refCount = InterlockedDecrement(&volp->refCount);
1207 osi_assertx(refCount >= 0, "cm_volume_t refCount underflow has occurred");
1210 /* return the read-only volume, if there is one, or the read-write volume if
/*
 * cm_GetROVolumeID
 *
 * Choose a volume ID for volp while holding volp->rw for reading: the ROVOL
 * ID is used when it is non-zero and cm_IsServerListEmpty() reports that the
 * read-only server list is not empty; the RWVOL ID is the alternative.
 * NOTE(review): the branch joining the two assignments and the final return
 * are not visible; presumably an else followed by "return id" - confirm.
 */
1213 long cm_GetROVolumeID(cm_volume_t *volp)
1217 lock_ObtainRead(&volp->rw);
1218 if (volp->vol[ROVOL].ID && !cm_IsServerListEmpty(volp->vol[ROVOL].serversp))
1219 id = volp->vol[ROVOL].ID;
1221 id = volp->vol[RWVOL].ID;
1222 lock_ReleaseRead(&volp->rw);
/*
 * cm_RefreshVolumes
 *
 * Age out cached volume information.  lifetime is compared against time
 * stamps by plain addition (assumed to be in the same unit as "now",
 * presumably seconds - confirm).
 *
 *  - cm_data.mountRootGen is advanced to now once it is at least lifetime
 *    old, which per the comment below forces mount point target updates.
 *  - Every entry on cm_data.allVolumesp is visited.  cm_volumeLock is held
 *    for reading while walking the list and is released around the
 *    per-volume work.
 *  - Volumes that are not already flagged CM_VOLUMEFLAG_RESET, or that are
 *    flagged CM_VOLUMEFLAG_NOEXIST, are processed under their rw write lock:
 *    NOEXIST is cleared; volumes flagged CM_VOLUMEFLAG_RO_MIXED are tested
 *    against a fixed 300 interval and other volumes against lifetime; an
 *    expired volume gets CM_VOLUMEFLAG_RESET set and lastUpdateTime zeroed.
 *
 * NOTE(review): the exact nesting of the NOEXIST / RO_MIXED / lifetime
 * branches and the reference handling around the unlocked region are not
 * visible here - confirm before relying on this summary.
 */
1227 void cm_RefreshVolumes(int lifetime)
1235 /* force mount point target updates */
1236 if (cm_data.mountRootGen + lifetime <= now)
1237 cm_data.mountRootGen = now;
1240 * force a re-loading of volume data from the vldb
1241 * if the lifetime for the cached data has expired
1243 lock_ObtainRead(&cm_volumeLock);
1244 for (volp = cm_data.allVolumesp; volp; volp=volp->allNextp) {
1246 lock_ReleaseRead(&cm_volumeLock);
1248 if (!(volp->flags & CM_VOLUMEFLAG_RESET) ||
1249 (volp->flags & CM_VOLUMEFLAG_NOEXIST)) {
1250 lock_ObtainWrite(&volp->rw);
1251 if (volp->flags & CM_VOLUMEFLAG_NOEXIST) {
1252 _InterlockedAnd(&volp->flags, ~CM_VOLUMEFLAG_NOEXIST);
1255 if (volp->flags & CM_VOLUMEFLAG_RO_MIXED) {
1256 if (volp->lastUpdateTime + 300 <= now) {
1257 _InterlockedOr(&volp->flags, CM_VOLUMEFLAG_RESET);
1258 volp->lastUpdateTime = 0;
1261 if (volp->lastUpdateTime + lifetime <= now) {
1262 _InterlockedOr(&volp->flags, CM_VOLUMEFLAG_RESET);
1263 volp->lastUpdateTime = 0;
1266 lock_ReleaseWrite(&volp->rw);
1269 lock_ObtainRead(&cm_volumeLock);
1272 lock_ReleaseRead(&cm_volumeLock);
/*
 * cm_CheckOfflineVolumeState
 *
 * Re-evaluate the status of one volume instance (statep, one of the vol[]
 * entries of volp).  Work is done only when statep->ID is non-zero and volID
 * is either 0 or equal to statep->ID.
 *
 * Locking: the function releases and later re-obtains the write lock on
 * volp->rw around the network calls, so the caller is expected to enter with
 * that lock write-held (cm_CheckOfflineVolume does so).
 *
 * Visible steps:
 *  1. Build a FID for the volume root (vnode 1, unique 1) so that VNOVOL and
 *     VMOVED errors can be processed.
 *  2. If the state has no server list and the volume has not yet been
 *     refreshed in this pass (*volumeUpdatedp == 0), call
 *     cm_UpdateVolumeLocation() and set *volumeUpdatedp.
 *  3. Under a read lock on cm_serverLock, walk the server references:
 *     srv_deleted entries and the CM_SERVERFLAG_DOWN flag are examined
 *     (presumably feeding alldeleted / alldown - the assignments are not
 *     visible), and references marked srv_busy or srv_offline are reset to
 *     srv_not_busy.
 *  4. If every reference was deleted and no refresh happened yet, refresh the
 *     volume location as in step 2.
 *  5. When the recorded state is vl_busy, vl_offline or vl_unknown, or is
 *     vl_alldown although not all servers are down, query the file server
 *     with RXAFS_GetVolumeStatus() (retried through cm_Analyze(), with
 *     CM_REQ_OFFLINE_VOL_CHK set on the request) and update statep->state,
 *     calling cm_VolumeStatusNotification() for each transition: vl_online
 *     when the call succeeds and the volume reports Online, vl_unknown on
 *     CM_ERROR_NOACCESS, vl_alldown when all servers are down.
 *  6. On the path where the server list is empty the state is forced to
 *     vl_alldown.
 *
 * NOTE(review): *onlinep is never touched in the visible lines; presumably it
 * is set to 1 on the vl_online transition - confirm.
 */
1276 cm_CheckOfflineVolumeState(cm_volume_t *volp, cm_vol_state_t *statep, afs_uint32 volID,
1277 afs_uint32 *onlinep, afs_uint32 *volumeUpdatedp)
1281 AFSFetchVolumeStatus volStat;
1286 struct rx_connection * rxconnp;
1288 char offLineMsg[256];
1290 long alldown, alldeleted;
1291 cm_serverRef_t *serversp;
1293 cm_scache_t *vscp = NULL;
1296 OfflineMsg = offLineMsg;
1299 if (statep->ID != 0 && (!volID || volID == statep->ID)) {
1300 /* create fid for volume root so that VNOVOL and VMOVED errors can be processed */
1301 cm_SetFid(&vfid, volp->cellp->cellID, statep->ID, 1, 1);
1303 if (!statep->serversp && !(*volumeUpdatedp)) {
1305 code = cm_UpdateVolumeLocation(volp->cellp, cm_rootUserp, &req, volp);
1306 *volumeUpdatedp = 1;
1309 lock_ObtainRead(&cm_serverLock);
1310 if (statep->serversp) {
1313 for (serversp = statep->serversp; serversp; serversp = serversp->next) {
1314 if (serversp->status == srv_deleted)
1319 if (!(serversp->server->flags & CM_SERVERFLAG_DOWN))
1322 if (serversp->status == srv_busy || serversp->status == srv_offline)
1323 serversp->status = srv_not_busy;
1325 lock_ReleaseRead(&cm_serverLock);
1327 if (alldeleted && !(*volumeUpdatedp)) {
1329 code = cm_UpdateVolumeLocation(volp->cellp, cm_rootUserp, &req, volp);
1330 *volumeUpdatedp = 1;
1333 if (statep->state == vl_busy || statep->state == vl_offline || statep->state == vl_unknown ||
1334 (!alldown && statep->state == vl_alldown)) {
1336 req.flags |= CM_REQ_OFFLINE_VOL_CHK;
1337 lock_ReleaseWrite(&volp->rw);
1339 code = cm_GetSCache(&vfid, NULL, &vscp, cm_rootUserp, &req);
1341 lock_ObtainWrite(&vscp->rw);
1342 code = cm_SyncOp(vscp, NULL, cm_rootUserp, &req, PRSFS_READ,
1343 CM_SCACHESYNC_NEEDCALLBACK | CM_SCACHESYNC_GETSTATUS);
1344 lock_ReleaseWrite(&vscp->rw);
1347 code = cm_ConnFromVolume(volp, statep->ID, cm_rootUserp, &req, &connp);
1351 rxconnp = cm_GetRxConn(connp);
1352 code = RXAFS_GetVolumeStatus(rxconnp, statep->ID,
1353 &volStat, &Name, &OfflineMsg, &MOTD);
1354 rx_PutConnection(rxconnp);
1355 } while (cm_Analyze(connp, cm_rootUserp, &req, &vfid, NULL, 0, NULL, NULL, NULL, NULL, code));
1356 code = cm_MapRPCError(code, &req);
1359 lock_ObtainWrite(&vscp->rw);
1360 cm_SyncOpDone(vscp, NULL, CM_SCACHESYNC_NEEDCALLBACK | CM_SCACHESYNC_GETSTATUS);
1361 lock_ReleaseWrite(&vscp->rw);
1362 cm_ReleaseSCache(vscp);
1364 lock_ObtainWrite(&volp->rw);
1365 if (code == 0 && volStat.Online) {
1366 cm_VolumeStatusNotification(volp, statep->ID, statep->state, vl_online);
1367 statep->state = vl_online;
1369 } else if (code == CM_ERROR_NOACCESS) {
1370 cm_VolumeStatusNotification(volp, statep->ID, statep->state, vl_unknown);
1371 statep->state = vl_unknown;
1374 } else if (alldown && statep->state != vl_alldown) {
1375 cm_VolumeStatusNotification(volp, statep->ID, statep->state, vl_alldown);
1376 statep->state = vl_alldown;
1379 lock_ReleaseRead(&cm_serverLock);
1380 if (statep->state != vl_alldown) {
1381 cm_VolumeStatusNotification(volp, statep->ID, statep->state, vl_alldown);
1382 statep->state = vl_alldown;
1388 /* The return code is 0 if the volume is not online and
1389 * 1 if the volume is online
/*
 * cm_CheckOfflineVolume
 *
 * Check the RW, RO and BK instances of volp (in that order) with
 * cm_CheckOfflineVolumeState(), passing volID through as the filter.  The
 * whole operation runs with volp->rw write-locked at entry and exit of each
 * helper call.  If the volume is flagged CM_VOLUMEFLAG_RESET its location
 * data is refreshed first with cm_UpdateVolumeLocation().
 *
 * The "online" and "volumeUpdated" locals start at 0 and are shared by the
 * three helper calls.
 * NOTE(review): the return statement is not visible; presumably the function
 * returns "online" - confirm.
 */
1392 cm_CheckOfflineVolume(cm_volume_t *volp, afs_uint32 volID)
1396 afs_uint32 online = 0;
1397 afs_uint32 volumeUpdated = 0;
1399 lock_ObtainWrite(&volp->rw);
1401 if (volp->flags & CM_VOLUMEFLAG_RESET) {
1403 code = cm_UpdateVolumeLocation(volp->cellp, cm_rootUserp, &req, volp);
1407 cm_CheckOfflineVolumeState(volp, &volp->vol[RWVOL], volID, &online, &volumeUpdated);
1408 cm_CheckOfflineVolumeState(volp, &volp->vol[ROVOL], volID, &online, &volumeUpdated);
1409 cm_CheckOfflineVolumeState(volp, &volp->vol[BACKVOL], volID, &online, &volumeUpdated);
1411 lock_ReleaseWrite(&volp->rw);
1417 * called from the Daemon thread.
1418 * when checking the offline status, check those of the most recently used volumes first.
/*
 * cm_CheckOfflineVolumes
 *
 * Walk the volume LRU queue starting at cm_data.volumeLRULastp and following
 * osi_QPrev(), calling cm_CheckOfflineVolume(volp, 0) for every volume that
 * has CM_VOLUME_QFLAG_IN_HASH set and CM_VOLUMEFLAG_NOEXIST clear.
 *
 * The walk stops early as soon as daemon_ShutdownFlag or powerStateSuspended
 * becomes non-zero.  cm_volumeLock is held for reading while traversing the
 * queue and is dropped around each cm_CheckOfflineVolume() call.
 * NOTE(review): how the current entry is kept alive while the lock is
 * dropped is not visible here - confirm a reference is held.
 */
1420 void cm_CheckOfflineVolumes(void)
1424 extern int daemon_ShutdownFlag;
1425 extern int powerStateSuspended;
1427 lock_ObtainRead(&cm_volumeLock);
1428 for (volp = cm_data.volumeLRULastp;
1429 volp && !daemon_ShutdownFlag && !powerStateSuspended;
1430 volp=(cm_volume_t *) osi_QPrev(&volp->q)) {
1432 * Skip volume entries that did not exist last time
1433 * the vldb was queried. For those entries wait until
1434 * the next actual request is received for the volume
1435 * before checking its state.
1437 if ((volp->qflags & CM_VOLUME_QFLAG_IN_HASH) &&
1438 !(volp->flags & CM_VOLUMEFLAG_NOEXIST)) {
1440 lock_ReleaseRead(&cm_volumeLock);
1441 cm_CheckOfflineVolume(volp, 0);
1442 lock_ObtainRead(&cm_volumeLock);
1446 lock_ReleaseRead(&cm_volumeLock);
/*
 * cm_UpdateVolumeStatusInt
 *
 * Derive the status of one volume instance (statep) from the condition of
 * its server references and record it.
 *
 * Under a write lock on cm_serverLock each reference on statep->serversp is
 * inspected: its server's IPv4 address is formatted as a dotted quad for the
 * log, and the reference is classified and logged as deleted, busy, offline,
 * online or down (server flagged CM_SERVERFLAG_DOWN).  The server object is
 * pinned with cm_GetServerNoLock()/cm_PutServerNoLock() while it is examined.
 *
 * The aggregate flags start as someBusy = 0, someOffline = 0, allOffline = 1,
 * allBusy = 1, allDown = 1 (their per-reference updates are not visible).
 * The new status is then chosen in this priority order:
 *   vl_alldown, vl_busy (allBusy, or someBusy together with someOffline),
 *   vl_offline (allOffline), otherwise vl_online.
 * NOTE(review): the condition selecting vl_alldown is not visible;
 * presumably it is allDown - confirm.
 *
 * cm_VolumeStatusNotification() is called when statep->ID is non-zero and the
 * status actually changes; statep->state is then overwritten with the new
 * status.
 */
1451 cm_UpdateVolumeStatusInt(cm_volume_t *volp, struct cm_vol_state *statep)
1453 enum volstatus newStatus;
1454 cm_serverRef_t *tsrp;
1456 int someBusy = 0, someOffline = 0, allOffline = 1, allBusy = 1, allDown = 1;
1459 if (!volp || !statep) {
1466 lock_ObtainWrite(&cm_serverLock);
1467 for (tsrp = statep->serversp; tsrp; tsrp=tsrp->next) {
1469 sprintf(addr, "%d.%d.%d.%d",
1470 ((tsp->addr.sin_addr.s_addr & 0xff)),
1471 ((tsp->addr.sin_addr.s_addr & 0xff00)>> 8),
1472 ((tsp->addr.sin_addr.s_addr & 0xff0000)>> 16),
1473 ((tsp->addr.sin_addr.s_addr & 0xff000000)>> 24));
1475 if (tsrp->status == srv_deleted) {
1476 osi_Log2(afsd_logp, "cm_UpdateVolumeStatusInt volume %d server reference %s deleted",
1477 statep->ID, osi_LogSaveString(afsd_logp,addr));
1481 cm_GetServerNoLock(tsp);
1482 if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
1484 if (tsrp->status == srv_busy) {
1485 osi_Log2(afsd_logp, "cm_UpdateVolumeStatusInt volume %d server reference %s busy",
1486 statep->ID, osi_LogSaveString(afsd_logp,addr));
1489 } else if (tsrp->status == srv_offline) {
1490 osi_Log2(afsd_logp, "cm_UpdateVolumeStatusInt volume %d server reference %s offline",
1491 statep->ID, osi_LogSaveString(afsd_logp,addr));
1495 osi_Log2(afsd_logp, "cm_UpdateVolumeStatusInt volume %d server reference %s online",
1496 statep->ID, osi_LogSaveString(afsd_logp,addr));
1501 osi_Log2(afsd_logp, "cm_UpdateVolumeStatusInt volume %d server reference %s down",
1502 statep->ID, osi_LogSaveString(afsd_logp,addr));
1504 cm_PutServerNoLock(tsp);
1507 lock_ReleaseWrite(&cm_serverLock);
1509 osi_Log5(afsd_logp, "cm_UpdateVolumeStatusInt allDown %d allBusy %d someBusy %d someOffline %d allOffline %d",
1510 allDown, allBusy, someBusy, someOffline, allOffline);
1513 newStatus = vl_alldown;
1514 else if (allBusy || (someBusy && someOffline))
1515 newStatus = vl_busy;
1516 else if (allOffline)
1517 newStatus = vl_offline;
1519 newStatus = vl_online;
1521 if (statep->ID && statep->state != newStatus)
1522 cm_VolumeStatusNotification(volp, statep->ID, statep->state, newStatus);
1524 statep->state = newStatus;
/*
 * cm_UpdateVolumeStatus
 *
 * Recompute the status of the instance of volp whose ID equals volID by
 * calling cm_UpdateVolumeStatusInt() on the matching RW, RO or BK entry
 * (tested in that order).  When none of the three IDs matches, the fallback
 * described in the comment below refreshes every instance whose ID is
 * non-zero.
 */
1528 cm_UpdateVolumeStatus(cm_volume_t *volp, afs_uint32 volID)
1531 if (volp->vol[RWVOL].ID == volID) {
1532 cm_UpdateVolumeStatusInt(volp, &volp->vol[RWVOL]);
1533 } else if (volp->vol[ROVOL].ID == volID) {
1534 cm_UpdateVolumeStatusInt(volp, &volp->vol[ROVOL]);
1535 } else if (volp->vol[BACKVOL].ID == volID) {
1536 cm_UpdateVolumeStatusInt(volp, &volp->vol[BACKVOL]);
1539 * If we are called with volID == 0 then something has gone wrong.
1540 * Most likely a race occurred in the server volume list maintenance.
1541 * Since we don't know which volume's status should be updated,
1542 * just update all of them that are known to exist. Better to be
1543 * correct than fast.
1546 for ( volType = RWVOL; volType < NUM_VOL_TYPES; volType++) {
1547 if (volp->vol[volType].ID != 0)
1548 cm_UpdateVolumeStatusInt(volp, &volp->vol[volType]);
1554 ** Finds all volumes that reside on this server and reorders their
1555 ** RO list according to the changed rank of server.
/*
 * cm_ChangeRankVolume
 *
 * After the rank of server tsp has changed, visit every volume on
 * cm_data.allVolumesp.  For a volume in the same cell as tsp that has a
 * read-only server list, cm_ChangeRankServer() is applied to that list while
 * the volume's rw lock is write-held; cm_RandomizeServer() is then applied to
 * lists that were changed.
 *
 * "code" is preset to 1, meaning "list unchanged".
 * NOTE(review): the test that guards cm_RandomizeServer() is not visible;
 * presumably it is "code == 0" - confirm.
 *
 * cm_volumeLock is held for reading during the walk and dropped while each
 * volume is processed.
 */
1557 void cm_ChangeRankVolume(cm_server_t *tsp)
1563 /* find volumes which might have RO copy on server*/
1564 lock_ObtainRead(&cm_volumeLock);
1565 for(volp = cm_data.allVolumesp; volp; volp=volp->allNextp)
1567 code = 1 ; /* assume that list is unchanged */
1569 lock_ReleaseRead(&cm_volumeLock);
1570 lock_ObtainWrite(&volp->rw);
1572 if ((tsp->cellp==volp->cellp) && (volp->vol[ROVOL].serversp))
1573 code =cm_ChangeRankServer(&volp->vol[ROVOL].serversp, tsp);
1575 /* this volume list was changed */
1577 cm_RandomizeServer(&volp->vol[ROVOL].serversp);
1579 lock_ReleaseWrite(&volp->rw);
1580 lock_ObtainRead(&cm_volumeLock);
1583 lock_ReleaseRead(&cm_volumeLock);
1586 /* dump all volumes that have reference count > 0 to a file.
1587 * cookie is used to identify this batch for easy parsing,
1588 * and is a string provided by the caller
/*
 * cm_DumpVolumes
 *
 * Write a textual dump of the volume list to outputFile using WriteFile().
 * Every output line is prefixed with cookie.  A header line reports
 * cm_data.currentVolumes and cm_data.maxVolumes, one line is produced per
 * entry on cm_data.allVolumesp, and a trailer line marks the end.
 *
 * For each volume the line shows the volume pointer, cell name, volume name,
 * the RW/RO/BK IDs, flags and qflags, the RO callback server, the RO callback
 * expiration, the RO creation date and the reference count; "<none>" is
 * printed for values that are absent.
 *
 * The callback server is rendered with UuidToString() when the server has
 * CM_SERVERFLAG_UUID set and the conversion succeeds; otherwise its address
 * is formatted with afs_inet_ntoa_r() into a 16-byte heap buffer.  The last
 * character of the two time strings is overwritten with NUL (presumably a
 * trailing newline from the time formatter - confirm).
 *
 * cm_scacheLock and cm_volumeLock are taken for reading around the dump.
 * NOTE(review): presumably the locks are only taken when the "lock" argument
 * is non-zero, and srvStrRpc selects between RpcStringFree() and free() for
 * srvStr; neither condition is visible - confirm.
 */
1590 int cm_DumpVolumes(FILE *outputFile, char *cookie, int lock)
1597 lock_ObtainRead(&cm_scacheLock);
1598 lock_ObtainRead(&cm_volumeLock);
1601 sprintf(output, "%s - dumping volumes - cm_data.currentVolumes=%d, cm_data.maxVolumes=%d\r\n",
1602 cookie, cm_data.currentVolumes, cm_data.maxVolumes);
1603 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1605 for (volp = cm_data.allVolumesp; volp; volp=volp->allNextp)
1608 char *srvStr = NULL;
1609 afs_uint32 srvStrRpc = TRUE;
1613 if (volp->cbServerpRO) {
1614 if (!((volp->cbServerpRO->flags & CM_SERVERFLAG_UUID) &&
1615 UuidToString((UUID *)&volp->cbServerpRO->uuid, &srvStr) == RPC_S_OK)) {
1616 srvStr = malloc(16);
1618 afs_inet_ntoa_r(volp->cbServerpRO->addr.sin_addr.s_addr, srvStr);
1622 if (volp->cbExpiresRO) {
1623 t = volp->cbExpiresRO;
1627 cbt[strlen(cbt)-1] = '\0';
1630 if (volp->creationDateRO) {
1631 t = volp->creationDateRO;
1634 cdrot = strdup(cdrot);
1635 cdrot[strlen(cdrot)-1] = '\0';
1640 "%s - volp=0x%p cell=%s name=%s rwID=%u roID=%u bkID=%u flags=0x%x:%x "
1641 "cbServerpRO='%s' cbExpiresRO='%s' creationDateRO='%s' refCount=%u\r\n",
1642 cookie, volp, volp->cellp->name, volp->namep, volp->vol[RWVOL].ID,
1643 volp->vol[ROVOL].ID, volp->vol[BACKVOL].ID, volp->flags, volp->qflags,
1644 srvStr ? srvStr : "<none>", cbt ? cbt : "<none>", cdrot ? cdrot : "<none>",
1646 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1650 RpcStringFree(&srvStr);
1659 sprintf(output, "%s - Done dumping volumes.\r\n", cookie);
1660 WriteFile(outputFile, output, (DWORD)strlen(output), &zilch, NULL);
1663 lock_ReleaseRead(&cm_volumeLock);
1664 lock_ReleaseRead(&cm_scacheLock);
1671 * String hash function used by SDBM project.
1672 * It was chosen because it is fast and provides
/*
 * SDBMHash
 *
 * Hash a NUL-terminated string.  Starting from 0, each character c updates
 * the running value as
 *     hash = c + (hash << 6) + (hash << 16) - hash
 * and the final value is masked with 0x7FFFFFFF, so the result always has
 * its top bit clear.
 *
 * str[i] is a plain char, so characters above 0x7F contribute according to
 * the platform's char signedness.
 */
1675 afs_uint32 SDBMHash(const char * str)
1677 afs_uint32 hash = 0;
1683 for(i = 0, len = strlen(str); i < len; i++)
1685 hash = str[i] + (hash << 6) + (hash << 16) - hash;
1688 return (hash & 0x7FFFFFFF);
1691 /* call with volume write-locked and mutex held */
/*
 * cm_AddVolumeToNameHashTable
 *
 * Insert volp at the head of the name hash chain selected by
 * CM_VOLUME_NAME_HASH(volp->namep), linking through nameNextp, and set
 * CM_VOLUME_QFLAG_IN_HASH in volp->qflags.  The flag is tested first
 * (presumably returning early when the volume is already hashed - the
 * statement after the test is not visible).
 */
1692 void cm_AddVolumeToNameHashTable(cm_volume_t *volp)
1696 if (volp->qflags & CM_VOLUME_QFLAG_IN_HASH)
1699 i = CM_VOLUME_NAME_HASH(volp->namep);
1701 volp->nameNextp = cm_data.volumeNameHashTablep[i];
1702 cm_data.volumeNameHashTablep[i] = volp;
1703 _InterlockedOr(&volp->qflags, CM_VOLUME_QFLAG_IN_HASH);
1706 /* call with volume write-locked and mutex held */
/*
 * cm_RemoveVolumeFromNameHashTable
 *
 * If volp has CM_VOLUME_QFLAG_IN_HASH set, walk the name hash chain for
 * CM_VOLUME_NAME_HASH(volp->namep) while tracking the address of the link
 * that points at the current entry (lvolpp).  When volp is found it is
 * unlinked by storing volp->nameNextp through that link, the IN_HASH flag is
 * cleared and volp->nameNextp is reset to NULL.
 */
1707 void cm_RemoveVolumeFromNameHashTable(cm_volume_t *volp)
1709 cm_volume_t **lvolpp;
1713 if (volp->qflags & CM_VOLUME_QFLAG_IN_HASH) {
1714 /* hash it out first */
1715 i = CM_VOLUME_NAME_HASH(volp->namep);
1716 for (lvolpp = &cm_data.volumeNameHashTablep[i], tvolp = cm_data.volumeNameHashTablep[i];
1718 lvolpp = &tvolp->nameNextp, tvolp = tvolp->nameNextp) {
1719 if (tvolp == volp) {
1720 *lvolpp = volp->nameNextp;
1721 _InterlockedAnd(&volp->qflags, ~CM_VOLUME_QFLAG_IN_HASH);
1722 volp->nameNextp = NULL;
1729 /* call with volume write-locked and mutex held */
/*
 * cm_AddVolumeToIDHashTable
 *
 * Insert the volType instance of volp into one of the volume-ID hash tables.
 * The per-type state is obtained with cm_VolumeStateByType(); its own qflags
 * carry the CM_VOLUME_QFLAG_IN_HASH marker, which is tested first and set
 * after the insertion.  The bucket is CM_VOLUME_ID_HASH(statep->ID) and the
 * volume is pushed at the head of the RW, RO or BK table chain, linked
 * through statep->nextp.
 * NOTE(review): the selection between the three tables is not visible;
 * presumably a switch on volType - confirm.
 */
1730 void cm_AddVolumeToIDHashTable(cm_volume_t *volp, afs_uint32 volType)
1733 struct cm_vol_state * statep;
1735 statep = cm_VolumeStateByType(volp, volType);
1737 if (statep->qflags & CM_VOLUME_QFLAG_IN_HASH)
1740 i = CM_VOLUME_ID_HASH(statep->ID);
1744 statep->nextp = cm_data.volumeRWIDHashTablep[i];
1745 cm_data.volumeRWIDHashTablep[i] = volp;
1748 statep->nextp = cm_data.volumeROIDHashTablep[i];
1749 cm_data.volumeROIDHashTablep[i] = volp;
1752 statep->nextp = cm_data.volumeBKIDHashTablep[i];
1753 cm_data.volumeBKIDHashTablep[i] = volp;
1756 _InterlockedOr(&statep->qflags, CM_VOLUME_QFLAG_IN_HASH);
1760 /* call with volume write-locked and mutex held */
/*
 * cm_RemoveVolumeFromIDHashTable
 *
 * Remove the volType instance of volp from its volume-ID hash table, if the
 * instance's qflags say it is hashed (CM_VOLUME_QFLAG_IN_HASH).
 *
 * The chain head is taken from the RW, RO or BK table at bucket
 * CM_VOLUME_ID_HASH(statep->ID); an unrecognised type trips the
 * "invalid volume type" assertion.  The chain is walked through
 * vol[volType].nextp with lvolpp tracking the link that points at the
 * current entry; on a match the entry is unlinked, the IN_HASH flag is
 * cleared and statep->nextp is reset to NULL.
 */
1761 void cm_RemoveVolumeFromIDHashTable(cm_volume_t *volp, afs_uint32 volType)
1763 cm_volume_t **lvolpp;
1765 struct cm_vol_state * statep;
1768 statep = cm_VolumeStateByType(volp, volType);
1770 if (statep->qflags & CM_VOLUME_QFLAG_IN_HASH) {
1771 /* hash it out first */
1772 i = CM_VOLUME_ID_HASH(statep->ID);
1776 lvolpp = &cm_data.volumeRWIDHashTablep[i];
1777 tvolp = cm_data.volumeRWIDHashTablep[i];
1780 lvolpp = &cm_data.volumeROIDHashTablep[i];
1781 tvolp = cm_data.volumeROIDHashTablep[i];
1784 lvolpp = &cm_data.volumeBKIDHashTablep[i];
1785 tvolp = cm_data.volumeBKIDHashTablep[i];
1788 osi_assertx(0, "invalid volume type");
1791 if (tvolp == volp) {
1792 *lvolpp = statep->nextp;
1793 _InterlockedAnd(&statep->qflags, ~CM_VOLUME_QFLAG_IN_HASH);
1794 statep->nextp = NULL;
1798 lvolpp = &tvolp->vol[volType].nextp;
1799 tvolp = tvolp->vol[volType].nextp;
1804 /* must be called with cm_volumeLock write-locked! */
/*
 * cm_AdjustVolumeLRU
 *
 * Move volp to the head of the volume LRU queue.  Asserts that cm_volumeLock
 * is write-held.  A volume that is already at cm_data.volumeLRUFirstp is
 * tested for first (presumably returning immediately - the statement after
 * the test is not visible).  Otherwise the volume is removed from the queue
 * if CM_VOLUME_QFLAG_IN_LRU_QUEUE is set, added at the head with osi_QAddH()
 * and flagged as queued.  The function finally asserts that the queue tail
 * pointer is non-NULL.
 */
1805 void cm_AdjustVolumeLRU(cm_volume_t *volp)
1807 lock_AssertWrite(&cm_volumeLock);
1809 if (volp == cm_data.volumeLRUFirstp)
1812 if (volp->qflags & CM_VOLUME_QFLAG_IN_LRU_QUEUE)
1813 osi_QRemoveHT((osi_queue_t **) &cm_data.volumeLRUFirstp, (osi_queue_t **) &cm_data.volumeLRULastp, &volp->q);
1814 osi_QAddH((osi_queue_t **) &cm_data.volumeLRUFirstp, (osi_queue_t **) &cm_data.volumeLRULastp, &volp->q);
1815 _InterlockedOr(&volp->qflags, CM_VOLUME_QFLAG_IN_LRU_QUEUE);
1817 osi_assertx(cm_data.volumeLRULastp != NULL, "null cm_data.volumeLRULastp");
1820 /* must be called with cm_volumeLock write-locked! */
/*
 * cm_MoveVolumeToLRULast
 *
 * Move volp to the tail of the volume LRU queue.  Asserts that cm_volumeLock
 * is write-held.  A volume that is already at cm_data.volumeLRULastp is
 * tested for first (presumably returning immediately - the statement after
 * the test is not visible).  Otherwise the volume is removed from the queue
 * if CM_VOLUME_QFLAG_IN_LRU_QUEUE is set, appended with osi_QAddT() and
 * flagged as queued.  The function finally asserts that the queue tail
 * pointer is non-NULL.
 */
1821 void cm_MoveVolumeToLRULast(cm_volume_t *volp)
1823 lock_AssertWrite(&cm_volumeLock);
1825 if (volp == cm_data.volumeLRULastp)
1828 if (volp->qflags & CM_VOLUME_QFLAG_IN_LRU_QUEUE)
1829 osi_QRemoveHT((osi_queue_t **) &cm_data.volumeLRUFirstp, (osi_queue_t **) &cm_data.volumeLRULastp, &volp->q);
1830 osi_QAddT((osi_queue_t **) &cm_data.volumeLRUFirstp, (osi_queue_t **) &cm_data.volumeLRULastp, &volp->q);
1831 _InterlockedOr(&volp->qflags, CM_VOLUME_QFLAG_IN_LRU_QUEUE);
1833 osi_assertx(cm_data.volumeLRULastp != NULL, "null cm_data.volumeLRULastp");
1836 /* must be called with cm_volumeLock write-locked! */
/*
 * cm_RemoveVolumeFromLRU
 *
 * Take volp off the volume LRU queue when CM_VOLUME_QFLAG_IN_LRU_QUEUE is
 * set, and clear that flag.  Asserts that cm_volumeLock is write-held.
 *
 * NOTE(review): the closing assertion requires cm_data.volumeLRULastp to be
 * non-NULL after the removal.  If osi_QRemoveHT() clears the tail pointer
 * when the last entry is removed, taking the only queued volume off the
 * list would trip it - confirm the queue can never become empty here.
 */
1837 void cm_RemoveVolumeFromLRU(cm_volume_t *volp)
1839 lock_AssertWrite(&cm_volumeLock);
1841 if (volp->qflags & CM_VOLUME_QFLAG_IN_LRU_QUEUE) {
1842 osi_QRemoveHT((osi_queue_t **) &cm_data.volumeLRUFirstp, (osi_queue_t **) &cm_data.volumeLRULastp, &volp->q);
1843 _InterlockedAnd(&volp->qflags, ~CM_VOLUME_QFLAG_IN_LRU_QUEUE);
1846 osi_assertx(cm_data.volumeLRULastp != NULL, "null cm_data.volumeLRULastp");
/*
 * volstatus_str
 *
 * File-local helper taking an enum volstatus and returning a char pointer.
 * cm_VolumeStatusNotification() passes its results to a "%s" log format, so
 * it presumably yields a printable name for the status - the body is not
 * visible here; confirm.
 */
1849 static char * volstatus_str(enum volstatus vs)
/*
 * cm_VolumeStatusNotification
 *
 * Report a status transition (old -> new) for the instance of volp
 * identified by volID.
 *
 * A display name of the form "<cell name>:<volume name><ext>" is built in
 * volstr with snprintf(); ext depends on which of the RW, RO or BK IDs
 * matches volID (the suffix values themselves are not visible here).  The
 * transition is written to afsd_logp using volstatus_str() for both states,
 * and cm_VolStatus_Change_Notification() is then called with the cell ID,
 * volID and the new status.
 */
1865 void cm_VolumeStatusNotification(cm_volume_t * volp, afs_uint32 volID, enum volstatus old, enum volstatus new)
1867 char volstr[CELL_MAXNAMELEN + VL_MAXNAMELEN]="";
1870 if (volID == volp->vol[RWVOL].ID)
1872 else if (volID == volp->vol[ROVOL].ID)
1874 else if (volID == volp->vol[BACKVOL].ID)
1878 snprintf(volstr, sizeof(volstr), "%s:%s%s", volp->cellp->name, volp->namep, ext);
1880 osi_Log4(afsd_logp, "VolumeStatusNotification: %-48s [%10u] (%s -> %s)",
1881 osi_LogSaveString(afsd_logp, volstr), volID, volstatus_str(old), volstatus_str(new));
1883 cm_VolStatus_Change_Notification(volp->cellp->cellID, volID, new);
/*
 * cm_GetVolumeStatus
 *
 * Return the recorded status of the instance of volp whose ID equals volID,
 * as located by cm_VolumeStateByID().
 * NOTE(review): cm_VolumeStateByID() leaves its result NULL when no ID
 * matches; the handling of that case is not visible here - confirm that
 * statep is checked before it is dereferenced.
 */
1886 enum volstatus cm_GetVolumeStatus(cm_volume_t *volp, afs_uint32 volID)
1888 cm_vol_state_t * statep = cm_VolumeStateByID(volp, volID);
1890 return statep->state;
1895 /* Renew .readonly volume callbacks that are more than
1896 * 30 minutes old. (A volume callback is issued for 2 hours.)
/*
 * cm_VolumeRenewROCallbacks
 *
 * Renew read-only volume callbacks that are close to expiring.  The cut-off
 * minexp is the current time plus 90 * 60; every volume on
 * cm_data.allVolumesp whose cbExpiresRO is positive and earlier than minexp
 * is processed.
 *
 * For such a volume a FID for the root of its RO instance (vnode 1,
 * unique 1) is built, cm_volumeLock is dropped, and - if cm_GetSCache()
 * succeeds - cm_GetCallback() is invoked on the status cache entry with its
 * rw lock write-held before the entry is released again.
 *
 * The walk holds cm_volumeLock for reading and ends early when
 * daemon_ShutdownFlag or powerStateSuspended becomes non-zero.
 */
1899 cm_VolumeRenewROCallbacks(void)
1902 time_t minexp = time(NULL) + 90 * 60;
1903 extern int daemon_ShutdownFlag;
1904 extern int powerStateSuspended;
1906 lock_ObtainRead(&cm_volumeLock);
1907 for (volp = cm_data.allVolumesp;
1908 volp && !daemon_ShutdownFlag && !powerStateSuspended;
1909 volp=volp->allNextp) {
1910 if ( volp->cbExpiresRO > 0 && volp->cbExpiresRO < minexp) {
1915 cm_SetFid(&fid, volp->cellp->cellID, volp->vol[ROVOL].ID, 1, 1);
1919 lock_ReleaseRead(&cm_volumeLock);
1920 if (cm_GetSCache(&fid, NULL, &scp, cm_rootUserp, &req) == 0) {
1921 lock_ObtainWrite(&scp->rw);
1922 cm_GetCallback(scp, cm_rootUserp, &req, 1);
1923 lock_ReleaseWrite(&scp->rw);
1924 cm_ReleaseSCache(scp);
1926 lock_ObtainRead(&cm_volumeLock);
1929 lock_ReleaseRead(&cm_volumeLock);
/*
 * cm_VolumeStateByType
 *
 * Return the address of the per-type state entry volp->vol[volType].
 * volType is used as an array index without any range check, so callers
 * must pass a valid volume type.
 */
1933 cm_VolumeStateByType(cm_volume_t *volp, afs_uint32 volType)
1935 return &volp->vol[volType];
/*
 * cm_VolumeStateByID
 *
 * Find the per-type state entry of volp whose ID equals id.  The RW, RO and
 * BK entries are compared in that order; statep starts as NULL and stays
 * NULL when none of the three IDs matches.
 * NOTE(review): the return statement is not visible; presumably statep is
 * returned - confirm.
 */
1939 cm_VolumeStateByID(cm_volume_t *volp, afs_uint32 id)
1941 cm_vol_state_t * statep = NULL;
1943 if (id == volp->vol[RWVOL].ID)
1944 statep = &volp->vol[RWVOL];
1945 else if (id == volp->vol[ROVOL].ID)
1946 statep = &volp->vol[ROVOL];
1947 else if (id == volp->vol[BACKVOL].ID)
1948 statep = &volp->vol[BACKVOL];
1954 cm_VolumeStateByName(cm_volume_t *volp, char *volname)
1956 size_t len = strlen(volname);
1957 cm_vol_state_t *statep;
1959 if (cm_stricmp_utf8N(".readonly", &volname[len-9]) == 0)
1960 statep = &volp->vol[ROVOL];
1961 else if (cm_stricmp_utf8N(".backup", &volname[len-7]) == 0)
1962 statep = &volp->vol[BACKVOL];
1964 statep = &volp->vol[RWVOL];
/*
 * cm_VolumeType
 *
 * Classify id by comparing it with the RW, RO and BK IDs of volp, in that
 * order.
 * NOTE(review): the values returned for each match, and for the no-match
 * case, are not visible here; presumably the matching volume type constant -
 * confirm.
 */
1970 cm_VolumeType(cm_volume_t *volp, afs_uint32 id)
1972 if (id == volp->vol[RWVOL].ID)
1974 else if (id == volp->vol[ROVOL].ID)
1976 else if (id == volp->vol[BACKVOL].ID)
/*
 * cm_ChecksumVolumeServerList
 *
 * Compute a checksum over the server list that serves the volume named by
 * fidp.  The list is obtained with cm_GetServerList(), summarised with
 * cm_ChecksumServerList() and handed back with cm_FreeServerList().
 * NOTE(review): the handling of a cm_GetServerList() failure and the return
 * statement are not visible; presumably the checksum is only computed on
 * success and cksum is returned - confirm.
 */
1983 cm_ChecksumVolumeServerList(struct cm_fid *fidp, cm_user_t *userp, cm_req_t *reqp)
1987 afs_uint32 replicated;
1988 cm_serverRef_t **serverspp;
1990 code = cm_GetServerList(fidp, userp, reqp, &replicated, &serverspp);
1992 cksum = cm_ChecksumServerList(*serverspp);
1993 cm_FreeServerList(serverspp, 0);
1999 cm_IsVolumeReplicated(cm_fid_t *fidp)
2001 afs_int32 replicated = 0;
2003 cm_vol_state_t * volstatep;
2005 volp = cm_GetVolumeByFID(fidp);
2007 volstatep = cm_VolumeStateByID(volp, fidp->volume);
2008 replicated = (volstatep->flags & CM_VOL_STATE_FLAG_REPLICATED);