2 * Copyright 2000, International Business Machines Corporation and others.
5 * This software has been released under the terms of the IBM Public
6 * License. For details, see the LICENSE file in the top-level source
7 * directory or online at http://www.openafs.org/dl/license10.html
10 #include <afsconfig.h>
11 #include <afs/param.h>
17 #include <sys/types.h>
21 #include <sys/statfs.h>
28 #include <netinet/in.h>
32 #include <afs/voldefs.h>
35 #include <afs/vlserver.h>
37 #include <afs/cellconfig.h>
40 #include <afs/afsint.h>
44 #include <afs/com_err.h>
46 #include <afs/kautils.h>
49 #define ERRCODE_RANGE 8 /* from error_table.h */
50 #define CLOCKSKEW 2 /* not really skew, but resolution */
/* Subtract CLOCKSKEW from x, yielding 0 instead of a negative value when x is
 * smaller than CLOCKSKEW. Note that x is evaluated twice. */
51 #define CLOCKADJ(x) (((x) < CLOCKSKEW) ? 0 : (x) - CLOCKSKEW)
53 /* for UV_MoveVolume() recovery */
55 #include <afs/procmgmt.h> /* signal(), kill(), wait(), etc. */
58 #include "volser_prototypes.h"
59 #include "vsutils_prototypes.h"
60 #include "lockprocs_prototypes.h"
62 struct ubik_client *cstruct;
63 int verbose = 0, noresolve = 0;
68 afs_int32 vldbEntryIndex;
71 /* Utility macros used by rest of this source file */
72 #define EPRINT(ec, es) \
74 fprintf(STDERR, "\n"); \
75 fprintf(STDERR, (es)); \
79 #define EPRINT1(ec, es, ep1) \
81 fprintf(STDERR, "\n"); \
82 fprintf(STDERR, (es), (ep1)); \
86 #define EPRINT2(ec, es, ep1, ep2) \
88 fprintf(STDERR, "\n"); \
89 fprintf(STDERR, (es), (ep1), (ep2)); \
93 #define EPRINT3(ec, es, ep1, ep2, ep3) \
95 fprintf(STDERR, "\n"); \
96 fprintf(STDERR, (es), (ep1), (ep2), (ep3)); \
100 #define EGOTO(where, ec, es) \
109 #define EGOTO1(where, ec, es, ep1) \
112 EPRINT1((ec),(es),(ep1)); \
118 #define EGOTO2(where, ec, es, ep1, ep2) \
121 EPRINT2((ec),(es),(ep1),(ep2)); \
127 #define EGOTO3(where, ec, es, ep1, ep2, ep3) \
130 EPRINT3((ec),(es),(ep1),(ep2),(ep3)); \
137 { if (verbose) { fprintf(STDOUT, (es)); fflush(STDOUT); } }
/* Verbose-only output to STDOUT: when the global `verbose` is nonzero, print
 * the format string <es> with one, two or three arguments and flush STDOUT
 * right away. Each macro expands to a brace-enclosed block. */
138 #define VPRINT1(es, p) \
139 { if (verbose) { fprintf(STDOUT, (es), (p)); fflush(STDOUT); } }
140 #define VPRINT2(es, p1, p2) \
141 { if (verbose) { fprintf(STDOUT, (es), (p1), (p2)); fflush(STDOUT); } }
142 #define VPRINT3(es, p1, p2, p3) \
143 { if (verbose) { fprintf(STDOUT, (es), (p1), (p2), (p3)); fflush(STDOUT); } }
145 { if (verbose) { fprintf(STDOUT, " done\n"); fflush(STDOUT); } }
/* Verbose-only output to STDERR: when the global `verbose` is nonzero, print
 * the format string <es> with zero to three arguments and flush STDERR right
 * away. Each macro expands to a brace-enclosed block. */
146 #define VEPRINT(es) \
147 { if (verbose) { fprintf(STDERR, (es)); fflush(STDERR); } }
148 #define VEPRINT1(es, p) \
149 { if (verbose) { fprintf(STDERR, (es), (p)); fflush(STDERR); } }
150 #define VEPRINT2(es, p1, p2) \
151 { if (verbose) { fprintf(STDERR, (es), (p1), (p2)); fflush(STDERR); } }
152 #define VEPRINT3(es, p1, p2, p3) \
153 { if (verbose) { fprintf(STDERR, (es), (p1), (p2), (p3)); fflush(STDERR); } }
155 { if (verbose) { fprintf(STDERR, " done\n"); fflush(STDERR); } }
159 /* getting rid of this */
/* Store <code> in the variable `error` and jump to the label `error_exit`;
 * both names must be available in the function where the macro is expanded. */
160 #define ERROR_EXIT(code) {error=(code); goto error_exit;}
163 /* Protos for static routines */
164 static afs_int32 CheckAndDeleteVolume(struct rx_connection *aconn,
165 afs_int32 apart, afs_int32 okvol,
167 static int DelVol(struct rx_connection *conn, afs_int32 vid, afs_int32 part,
169 static int GetTrans(struct nvldbentry *vldbEntryPtr, afs_int32 index,
170 struct rx_connection **connPtr, afs_int32 * transPtr,
171 afs_int32 * crtimePtr, afs_int32 * uptimePtr);
172 static int SimulateForwardMultiple(struct rx_connection *fromconn,
173 afs_int32 fromtid, afs_int32 fromdate,
174 manyDests * tr, afs_int32 flags,
175 void *cookie, manyResults * results);
176 static afs_int32 CheckVolume(volintInfo * volumeinfo, afs_int32 aserver,
177 afs_int32 apart, afs_int32 * modentry,
178 afs_uint32 * maxvolid);
181 /*map the partition <partId> into partition name <partName>*/
183 MapPartIdIntoName(afs_int32 partId, char *partName)
185 if (partId < 26) { /* what if partId > = 26 ? */
186 strcpy(partName, "/vicep");
187 partName[6] = partId + 'a';
190 } else if (partId < VOLMAXPARTS) {
191 strcpy(partName, "/vicep");
193 partName[6] = 'a' + (partId / 26);
194 partName[7] = 'a' + (partId % 26);
206 fprintf(STDERR, "Do you want to %s? [yn](n): ", str);
207 response = c = getchar();
208 while (!(c == EOF || c == '\n'))
209 c = getchar(); /*skip to end of line */
210 code = (response == 'y' || response == 'Y');
216 PrintError(char *msg, afs_int32 errcode)
218 fprintf(STDERR, "%s", msg); /* print msg verbatim; never use caller text as the format string */
219 /*replace by a big switch statement */
224 fprintf(STDERR, "Possible communication failure\n");
227 fprintf(STDERR, "Volume needs to be salvaged\n");
230 fprintf(STDERR, "Bad vnode number quoted\n");
234 "Volume not attached, does not exist, or not on line\n");
237 fprintf(STDERR, "Volume already exists\n");
240 fprintf(STDERR, "Volume is not in service\n");
243 fprintf(STDERR, "Volume is off line\n");
246 fprintf(STDERR, "Volume is already on line\n");
249 fprintf(STDERR, "Partition is full\n");
252 fprintf(STDERR, "Volume max quota exceeded\n");
255 fprintf(STDERR, "Volume temporarily unavailable\n");
258 fprintf(STDERR, "Volume has moved to another server\n");
261 fprintf(STDERR, "VLDB: volume Id exists in the vldb\n");
264 fprintf(STDERR, "VLDB: a read terminated too early\n");
267 fprintf(STDERR, "VLDB: volume entry exists in the vldb\n");
270 fprintf(STDERR, "VLDB: internal creation failure\n");
273 fprintf(STDERR, "VLDB: no such entry\n");
276 fprintf(STDERR, "VLDB: vldb database is empty\n");
279 fprintf(STDERR, "VLDB: entry is deleted (soft delete)\n");
282 fprintf(STDERR, "VLDB: volume name is illegal\n");
285 fprintf(STDERR, "VLDB: index was out of range\n");
288 fprintf(STDERR, "VLDB: bad volume type\n");
291 fprintf(STDERR, "VLDB: illegal server number (not within limits)\n");
293 case VL_BADPARTITION:
294 fprintf(STDERR, "VLDB: bad partition number\n");
297 fprintf(STDERR, "VLDB: run out of space for replication sites\n");
300 fprintf(STDERR, "VLDB: no such repsite server exists\n");
302 case VL_DUPREPSERVER:
303 fprintf(STDERR, "VLDB: replication site server already exists\n");
306 fprintf(STDERR, "VLDB: parent r/w entry not found\n");
309 fprintf(STDERR, "VLDB: illegal reference count number\n");
311 case VL_SIZEEXCEEDED:
312 fprintf(STDERR, "VLDB: vldb size for attributes exceeded\n");
315 fprintf(STDERR, "VLDB: bad incoming vldb entry\n");
317 case VL_BADVOLIDBUMP:
318 fprintf(STDERR, "VLDB: illegal max volid increment\n");
320 case VL_IDALREADYHASHED:
321 fprintf(STDERR, "VLDB: (RO/BACK) Id already hashed\n");
324 fprintf(STDERR, "VLDB: vldb entry is already locked\n");
327 fprintf(STDERR, "VLDB: bad volume operation code\n");
329 case VL_BADRELLOCKTYPE:
330 fprintf(STDERR, "VLDB: bad release lock type\n");
333 fprintf(STDERR, "VLDB: status report: last release was aborted\n");
335 case VL_BADSERVERFLAG:
336 fprintf(STDERR, "VLDB: invalid replication site server flag\n");
339 fprintf(STDERR, "VLDB: no permission access for call\n");
341 case VOLSERREAD_DUMPERROR:
343 "VOLSER: Problems encountered in reading the dump file !\n");
345 case VOLSERDUMPERROR:
346 fprintf(STDERR, "VOLSER: Problems encountered in doing the dump !\n");
348 case VOLSERATTACH_ERROR:
349 fprintf(STDERR, "VOLSER: Could not attach the volume\n");
351 case VOLSERDETACH_ERROR:
352 fprintf(STDERR, "VOLSER: Could not detach the volume\n");
354 case VOLSERILLEGAL_PARTITION:
355 fprintf(STDERR, "VOLSER: encountered illegal partition number\n");
357 case VOLSERBAD_ACCESS:
358 fprintf(STDERR, "VOLSER: permission denied, not a super user\n");
360 case VOLSERVLDB_ERROR:
361 fprintf(STDERR, "VOLSER: error detected in the VLDB\n");
364 fprintf(STDERR, "VOLSER: error in volume name\n");
367 fprintf(STDERR, "VOLSER: volume has moved\n");
370 fprintf(STDERR, "VOLSER: illegal operation\n");
372 case VOLSERBADRELEASE:
373 fprintf(STDERR, "VOLSER: release could not be completed\n");
376 fprintf(STDERR, "VOLSER: volume is busy\n");
378 case VOLSERNO_MEMORY:
379 fprintf(STDERR, "VOLSER: volume server is out of memory\n");
383 "VOLSER: no such volume - location specified incorrectly or volume does not exist\n");
385 case VOLSERMULTIRWVOL:
387 "VOLSER: multiple RW volumes with same ID, one of which should be deleted\n");
391 "VOLSER: not all entries were successfully processed\n");
398 initialize_KA_error_table();
399 initialize_RXK_error_table();
400 initialize_KTC_error_table();
401 initialize_ACFG_error_table();
402 initialize_CMD_error_table();
403 initialize_VL_error_table();
405 offset = errcode & ((1 << ERRCODE_RANGE) - 1);
406 fprintf(STDERR, "%s: %s\n", afs_error_table_name(errcode),
407 afs_error_message(errcode));
414 void init_volintInfo(struct volintInfo *vinfo) {
415 memset(vinfo, 0, sizeof(struct volintInfo));
417 vinfo->maxquota = -1;
419 vinfo->creationDate = -1;
420 vinfo->updateDate = -1;
428 static struct rx_securityClass *uvclass = 0;
429 static int uvindex = -1;
430 /* called by VLDBClient_Init to set the security module to be used in the RPC */
432 UV_SetSecurity(register struct rx_securityClass *as, afs_int32 aindex)
439 /* bind to volser on <port> <aserver> */
440 /* takes server address in network order, port in host order. dumb */
441 struct rx_connection *
442 UV_Bind(afs_int32 aserver, afs_int32 port)
444 register struct rx_connection *tc;
446 tc = rx_NewConnection(aserver, htons(port), VOLSERVICE_ID, uvclass,
451 /* if <okvol> is all right (indicated by being able to
452 * start a transaction on it), delete the <delvol> */
454 CheckAndDeleteVolume(struct rx_connection *aconn, afs_int32 apart,
455 afs_int32 okvol, afs_int32 delvol)
457 afs_int32 error, code, tid, rcode;
463 code = AFSVolTransCreate(aconn, delvol, apart, ITOffline, &tid);
466 code = AFSVolDeleteVolume(aconn, tid);
469 code = AFSVolEndTrans(aconn, tid, &rcode);
476 code = AFSVolTransCreate(aconn, okvol, apart, ITOffline, &tid);
478 code = AFSVolEndTrans(aconn, tid, &rcode);
483 code = AFSVolTransCreate(aconn, delvol, apart, ITOffline, &tid);
486 code = AFSVolDeleteVolume(aconn, tid);
489 code = AFSVolEndTrans(aconn, tid, &rcode);
500 /* called by EnumerateEntry, show vldb entry in a reasonable format */
502 SubEnumerateEntry(struct nvldbentry *entry)
510 fprintf(STDOUT, " readWriteID %-10u ", entry->volumeId[RWVOL]);
511 if (entry->flags & RW_EXISTS)
512 fprintf(STDOUT, " valid \n");
514 fprintf(STDOUT, " invalid \n");
515 fprintf(STDOUT, " readOnlyID %-10u ", entry->volumeId[ROVOL]);
516 if (entry->flags & RO_EXISTS)
517 fprintf(STDOUT, " valid \n");
519 fprintf(STDOUT, " invalid \n");
520 fprintf(STDOUT, " backUpID %-10u ", entry->volumeId[BACKVOL]);
521 if (entry->flags & BACK_EXISTS)
522 fprintf(STDOUT, " valid \n");
524 fprintf(STDOUT, " invalid \n");
525 if ((entry->cloneId != 0) && (entry->flags & RO_EXISTS))
526 fprintf(STDOUT, " releaseClone %-10u \n", entry->cloneId);
528 if (entry->flags & RW_EXISTS)
529 fprintf(STDOUT, " RWrite: %-10u", entry->volumeId[RWVOL]);
530 if (entry->flags & RO_EXISTS)
531 fprintf(STDOUT, " ROnly: %-10u", entry->volumeId[ROVOL]);
532 if (entry->flags & BACK_EXISTS)
533 fprintf(STDOUT, " Backup: %-10u", entry->volumeId[BACKVOL]);
534 if ((entry->cloneId != 0) && (entry->flags & RO_EXISTS))
535 fprintf(STDOUT, " RClone: %-10lu", (unsigned long)entry->cloneId);
536 fprintf(STDOUT, "\n");
538 fprintf(STDOUT, " number of sites -> %lu\n",
539 (unsigned long)entry->nServers);
540 for (i = 0; i < entry->nServers; i++) {
541 if (entry->serverFlags[i] & NEW_REPSITE)
544 for (i = 0; i < entry->nServers; i++) {
545 MapPartIdIntoName(entry->serverPartition[i], pname);
546 fprintf(STDOUT, " server %s partition %s ",
547 noresolve ? afs_inet_ntoa_r(entry->serverNumber[i], hoststr) :
548 hostutil_GetNameByINet(entry->serverNumber[i]), pname);
549 if (entry->serverFlags[i] & ITSRWVOL)
550 fprintf(STDOUT, "RW Site ");
552 fprintf(STDOUT, "RO Site ");
554 if (entry->serverFlags[i] & NEW_REPSITE)
555 fprintf(STDOUT," -- New release");
557 if (!(entry->serverFlags[i] & ITSRWVOL))
558 fprintf(STDOUT," -- Old release");
560 if (entry->serverFlags[i] & RO_DONTUSE)
561 fprintf(STDOUT, " -- Not released");
563 fprintf(STDOUT, "\n");
570 /*enumerate the vldb entry corresponding to <entry> */
572 EnumerateEntry(struct nvldbentry *entry)
575 fprintf(STDOUT, "\n");
576 fprintf(STDOUT, "%s \n", entry->name);
577 SubEnumerateEntry(entry);
581 /* forcibly remove a volume. Very dangerous call */
583 UV_NukeVolume(afs_int32 server, afs_int32 partid, afs_int32 volid)
585 register struct rx_connection *tconn;
586 register afs_int32 code;
588 tconn = UV_Bind(server, AFSCONF_VOLUMEPORT);
590 code = AFSVolNukeVolume(tconn, partid, volid);
591 rx_DestroyConnection(tconn);
597 /* like df. Return usage of <pname> on <server> in <partition> */
599 UV_PartitionInfo64(afs_int32 server, char *pname,
600 struct diskPartition64 *partition)
602 register struct rx_connection *aconn;
605 aconn = (struct rx_connection *)0;
606 aconn = UV_Bind(server, AFSCONF_VOLUMEPORT);
607 code = AFSVolPartitionInfo64(aconn, pname, partition);
608 if (code == RXGEN_OPCODE) {
609 struct diskPartition *dpp =
610 (struct diskPartition *)malloc(sizeof(struct diskPartition));
611 code = AFSVolPartitionInfo(aconn, pname, dpp);
613 strncpy(partition->name, dpp->name, 32);
614 strncpy(partition->devName, dpp->devName, 32);
615 partition->lock_fd = dpp->lock_fd;
616 partition->free = dpp->free;
617 partition->minFree = dpp->minFree;
622 fprintf(STDERR, "Could not get information on partition %s\n", pname);
623 PrintError("", code);
626 rx_DestroyConnection(aconn);
630 /* old interface to create volume */
632 UV_CreateVolume(afs_int32 aserver, afs_int32 apart, char *aname,
636 code = UV_CreateVolume2(aserver, apart, aname, 5000, 0, 0, 0, 0, anewid);
640 /* create a volume, given a server, partition number, volume name --> sends
641 * back new vol id in <anewid>*/
643 UV_CreateVolume2(afs_int32 aserver, afs_int32 apart, char *aname,
644 afs_int32 aquota, afs_int32 aspare1, afs_int32 aspare2,
645 afs_int32 aspare3, afs_int32 aspare4, afs_int32 * anewid)
648 register struct rx_connection *aconn;
650 register afs_int32 code;
652 afs_int32 rcode, vcode;
653 struct nvldbentry entry, storeEntry; /*the new vldb entry */
654 struct volintInfo tstatus;
657 aconn = (struct rx_connection *)0;
660 init_volintInfo(&tstatus);
661 tstatus.maxquota = aquota;
663 aconn = UV_Bind(aserver, AFSCONF_VOLUMEPORT);
664 /* get the next 3 available ids from the VLDB */
665 vcode = ubik_VL_GetNewVolumeId(cstruct, 0, 3, anewid);
666 EGOTO1(cfail, vcode, "Could not get an Id for volume %s\n", aname);
669 AFSVolCreateVolume(aconn, apart, aname, volser_RW, 0, anewid, &tid);
670 EGOTO2(cfail, vcode, "Failed to create the volume %s %u \n", aname,
673 code = AFSVolSetInfo(aconn, tid, &tstatus);
675 EPRINT(code, "Could not change quota, continuing...\n");
/* Check `code`, the AFSVolSetFlags result; `vcode` is always 0 by this point,
 * so testing it would silently ignore a failure to bring the volume online. */
677 code = AFSVolSetFlags(aconn, tid, 0); /* bring it online (mark it InService */
678 EGOTO2(cfail, code, "Could not bring the volume %s %u online \n", aname,
681 VPRINT2("Volume %s %u created and brought online\n", aname, *anewid);
683 /* set up the vldb entry for this volume */
684 strncpy(entry.name, aname, VOLSER_OLDMAXVOLNAME);
686 entry.serverNumber[0] = aserver; /* this should have another
687 * level of indirection later */
688 entry.serverPartition[0] = apart; /* this should also have
689 * another indirection level */
690 entry.flags = RW_EXISTS; /* this records that rw volume exists */
691 entry.serverFlags[0] = ITSRWVOL; /*this rep site has rw vol */
692 entry.volumeId[RWVOL] = *anewid;
693 entry.volumeId[ROVOL] = *anewid + 1; /* rw,ro, bk id are related in the default case */
694 entry.volumeId[BACKVOL] = *anewid + 2;
696 /*map into right byte order, before passing to xdr, the stuff has to be in host
697 * byte order. Xdr converts it into network order */
698 MapNetworkToHost(&entry, &storeEntry);
699 /* create the vldb entry */
700 vcode = VLDB_CreateEntry(&storeEntry);
703 "Could not create a VLDB entry for the volume %s %lu\n",
704 aname, (unsigned long)*anewid);
705 /*destroy the created volume */
706 VPRINT1("Deleting the newly created volume %u\n", *anewid);
707 AFSVolDeleteVolume(aconn, tid);
711 VPRINT2("Created the VLDB entry for the volume %s %u\n", aname, *anewid);
712 /* volume created, now terminate the transaction and release the connection */
713 code = AFSVolEndTrans(aconn, tid, &rcode); /*if it crashes before this
714 * the volume will come online anyway when transaction timesout , so if
715 * vldb entry exists then the volume is guaranteed to exist too wrt create */
719 "Failed to end the transaction on the volume %s %lu\n", aname,
720 (unsigned long)*anewid);
727 code = AFSVolEndTrans(aconn, tid, &rcode);
729 fprintf(STDERR, "WARNING: could not end transaction\n");
732 rx_DestroyConnection(aconn);
733 PrintError("", error);
739 /* add a VLDB entry for volume id <aid>, given a server, partition number
740 * and volume name */
742 UV_AddVLDBEntry(afs_int32 aserver, afs_int32 apart, char *aname,
745 register struct rx_connection *aconn;
748 struct nvldbentry entry, storeEntry; /*the new vldb entry */
750 aconn = (struct rx_connection *)0;
753 /* set up the vldb entry for this volume */
754 strncpy(entry.name, aname, VOLSER_OLDMAXVOLNAME);
756 entry.serverNumber[0] = aserver; /* this should have another
757 * level of indirection later */
758 entry.serverPartition[0] = apart; /* this should also have
759 * another indirection level */
760 entry.flags = RW_EXISTS; /* this records that rw volume exists */
761 entry.serverFlags[0] = ITSRWVOL; /*this rep site has rw vol */
762 entry.volumeId[RWVOL] = aid;
764 entry.volumeId[ROVOL] = anewid + 1; /* rw,ro, bk id are related in the default case */
765 entry.volumeId[BACKVOL] = *anewid + 2;
767 entry.volumeId[ROVOL] = 0;
768 entry.volumeId[BACKVOL] = 0;
771 /*map into right byte order, before passing to xdr, the stuff has to be in host
772 * byte order. Xdr converts it into network order */
773 MapNetworkToHost(&entry, &storeEntry);
774 /* create the vldb entry */
775 vcode = VLDB_CreateEntry(&storeEntry);
778 "Could not create a VLDB entry for the volume %s %lu\n",
779 aname, (unsigned long)aid);
783 VPRINT2("Created the VLDB entry for the volume %s %u\n", aname, aid);
787 rx_DestroyConnection(aconn);
788 PrintError("", error);
792 /* Delete the volume <volid>on <aserver> <apart>
793 * the physical entry gets removed from the vldb only if the ref count
797 UV_DeleteVolume(afs_int32 aserver, afs_int32 apart, afs_int32 avolid)
799 struct rx_connection *aconn = (struct rx_connection *)0;
801 afs_int32 code, rcode;
803 struct nvldbentry entry, storeEntry;
805 afs_int32 avoltype = -1, vtype;
806 int notondisk = 0, notinvldb = 0;
808 /* Find and read the VLDB entry for this volume */
809 code = ubik_VL_SetLock(cstruct, 0, avolid, avoltype, VLOP_DELETE);
811 if (code != VL_NOENT) {
812 EGOTO1(error_exit, code,
813 "Could not lock VLDB entry for the volume %u\n", avolid);
819 code = VLDB_GetEntryByID(avolid, avoltype, &entry);
820 EGOTO1(error_exit, code, "Could not fetch VLDB entry for volume %u\n",
822 MapHostToNetwork(&entry);
825 EnumerateEntry(&entry);
828 /* Whether volume is in the VLDB or not. Delete the volume on disk */
829 aconn = UV_Bind(aserver, AFSCONF_VOLUMEPORT);
830 code = AFSVolTransCreate(aconn, avolid, apart, ITOffline, &ttid);
832 if (code == VNOVOL) {
835 EGOTO1(error_exit, code, "Transaction on volume %u failed\n",
839 VPRINT1("Trying to delete the volume %u ...", avolid);
841 code = AFSVolDeleteVolume(aconn, ttid);
842 EGOTO1(error_exit, code, "Could not delete the volume %u \n", avolid);
844 code = AFSVolEndTrans(aconn, ttid, &rcode);
845 code = (code ? code : rcode);
847 EGOTO1(error_exit, code,
848 "Could not end the transaction for the volume %u \n", avolid);
852 /* Now update the VLDB entry.
853 * But first, verify we have a VLDB entry.
854 * Whether volume is on disk or not. Delete the volume in VLDB.
859 if (avolid == entry.volumeId[BACKVOL]) {
860 /* It's a backup volume, modify the VLDB entry. Check that the
861 * backup volume is on the server/partition we asked to delete.
863 if (!(entry.flags & BACK_EXISTS) || !Lp_Match(aserver, apart, &entry)) {
864 notinvldb = 2; /* Not on this server and partition */
868 VPRINT1("Marking the backup volume %u deleted in the VLDB\n", avolid);
870 entry.flags &= ~BACK_EXISTS;
874 else if (avolid == entry.volumeId[ROVOL]) {
875 /* It's a read-only volume, modify the VLDB entry. Check that the
876 * readonly volume is on the server/partition we asked to delete.
877 * If flags does not have RO_EXISTS set, then this may mean the RO
878 * hasn't been released (and could exist in VLDB).
880 if (!Lp_ROMatch(aserver, apart, &entry)) {
881 notinvldb = 2; /* Not found on this server and partition */
887 "Marking the readonly volume %lu deleted in the VLDB\n",
888 (unsigned long)avolid);
890 Lp_SetROValue(&entry, aserver, apart, 0, 0); /* delete the site */
892 if (!Lp_ROMatch(0, 0, &entry))
893 entry.flags &= ~RO_EXISTS; /* This was the last ro volume */
897 else if (avolid == entry.volumeId[RWVOL]) {
898 /* It's a rw volume, delete the backup volume, modify the VLDB entry.
899 * Check that the readwrite volume is on the server/partition we
902 if (!(entry.flags & RW_EXISTS) || !Lp_Match(aserver, apart, &entry)) {
903 notinvldb = 2; /* Not found on this server and partition */
907 /* Delete backup if it exists */
909 AFSVolTransCreate(aconn, entry.volumeId[BACKVOL], apart,
913 fprintf(STDOUT, "Trying to delete the backup volume %u ...",
914 entry.volumeId[BACKVOL]);
917 code = AFSVolDeleteVolume(aconn, ttid);
918 EGOTO1(error_exit, code, "Could not delete the volume %u \n",
919 entry.volumeId[BACKVOL]);
921 code = AFSVolEndTrans(aconn, ttid, &rcode);
923 code = (code ? code : rcode);
924 EGOTO1(error_exit, code,
925 "Could not end the transaction for the volume %u \n",
926 entry.volumeId[BACKVOL]);
928 fprintf(STDOUT, " done\n");
933 "Marking the readwrite volume %lu%s deleted in the VLDB\n",
934 (unsigned long)avolid,
936 flags & BACK_EXISTS) ? ", and its backup volume," :
939 Lp_SetRWValue(&entry, aserver, apart, 0L, 0L);
941 entry.flags &= ~(BACK_EXISTS | RW_EXISTS);
944 if (entry.flags & RO_EXISTS)
945 fprintf(STDERR, "WARNING: ReadOnly copy(s) may still exist\n");
949 notinvldb = 2; /* Not found on this server and partition */
953 /* Either delete or replace the VLDB entry */
954 if ((entry.nServers <= 0) || !(entry.flags & (RO_EXISTS | RW_EXISTS))) {
957 "Last reference to the VLDB entry for %lu - deleting entry\n",
958 (unsigned long)avolid);
959 code = ubik_VL_DeleteEntry(cstruct, 0, avolid, vtype);
960 EGOTO1(error_exit, code,
961 "Could not delete the VLDB entry for the volume %u \n",
964 MapNetworkToHost(&entry, &storeEntry);
966 VLDB_ReplaceEntry(avolid, vtype, &storeEntry,
967 (LOCKREL_OPCODE | LOCKREL_AFSID |
969 EGOTO1(error_exit, code,
970 "Could not update the VLDB entry for the volume %u \n",
979 if (notondisk && notinvldb) {
980 EPRINT2(VOLSERNOVOL, "Volume %u does not exist %s\n", avolid,
981 ((notinvldb == 2) ? "on server and partition" : ""));
984 } else if (notondisk) {
986 "WARNING: Volume %lu did not exist on the partition\n",
987 (unsigned long)avolid);
988 } else if (notinvldb) {
989 fprintf(STDERR, "WARNING: Volume %lu does not exist in VLDB %s\n",
990 (unsigned long)avolid,
991 ((notinvldb == 2) ? "on server and partition" : ""));
995 code = AFSVolEndTrans(aconn, ttid, &rcode);
996 code = (code ? code : rcode);
998 fprintf(STDERR, "Could not end transaction on the volume %lu\n",
999 (unsigned long)avolid);
1000 PrintError("", code);
1008 ubik_VL_ReleaseLock(cstruct, 0, avolid, -1,
1009 (LOCKREL_OPCODE | LOCKREL_AFSID |
1010 LOCKREL_TIMESTAMP));
1013 "Could not release the lock on the VLDB entry for the volume %u \n",
1021 rx_DestroyConnection(aconn);
1025 /* add recovery to UV_MoveVolume */
1027 #define TESTC 0 /* set to test recovery code, clear for production */
1033 sigint_handler(int x)
1038 fprintf(STDOUT, "\nSIGINT handler: vos move operation in progress\n");
1040 "WARNING: may leave AFS storage and metadata in indeterminate state\n");
1041 fprintf(STDOUT, "enter second control-c to exit\n");
1045 (void)signal(SIGINT, sigint_handler);
1050 /* Move volume <afromvol> on <afromserver> <afrompart> to <atoserver>
1051 * <atopart>. The operation is almost idempotent. The following
1052 * flags are recognized:
1054 * RV_NOCLONE - don't use a copy clone
1058 UV_MoveVolume2(afs_int32 afromvol, afs_int32 afromserver, afs_int32 afrompart,
1059 afs_int32 atoserver, afs_int32 atopart, int flags)
1061 struct rx_connection *toconn, *fromconn;
1062 afs_int32 fromtid, totid, clonetid;
1065 char tmpName[VOLSER_MAXVOLNAME + 1];
1068 struct restoreCookie cookie;
1069 register afs_int32 vcode, code;
1070 afs_int32 newVol, volid, backupId;
1071 struct volser_status tstatus;
1072 struct destServer destination;
1074 struct nvldbentry entry, storeEntry;
1075 int i, islocked, pntg;
1077 char in, lf; /* for test code */
1081 #ifdef ENABLE_BUGFIX_1165
1082 volEntries volumeInfo;
1083 struct volintInfo *infop = 0;
1087 fromconn = (struct rx_connection *)0;
1088 toconn = (struct rx_connection *)0;
1098 /* support control-c processing */
1101 (void)signal(SIGINT, sigint_handler);
1105 "\nThere are three tests points - verifies all code paths through recovery.\n");
1106 fprintf(STDOUT, "First test point - operation not started.\n");
1107 fprintf(STDOUT, "...test here (y, n)? ");
1109 fscanf(stdin, "%c", &in);
1110 fscanf(stdin, "%c", &lf); /* toss away */
1112 fprintf(STDOUT, "type control-c\n");
1114 fprintf(stdout, ".");
1119 /* or drop through */
1122 vcode = VLDB_GetEntryByID(afromvol, -1, &entry);
1123 EGOTO1(mfail, vcode,
1124 "Could not fetch the entry for the volume %u from the VLDB \n",
1127 if (entry.volumeId[RWVOL] != afromvol) {
1128 fprintf(STDERR, "Only RW volume can be moved\n");
1132 vcode = ubik_VL_SetLock(cstruct, 0, afromvol, RWVOL, VLOP_MOVE);
1133 EGOTO1(mfail, vcode, "Could not lock entry for volume %u \n", afromvol);
1136 vcode = VLDB_GetEntryByID(afromvol, RWVOL, &entry);
1137 EGOTO1(mfail, vcode,
1138 "Could not fetch the entry for the volume %u from the VLDB \n",
1141 backupId = entry.volumeId[BACKVOL];
1142 MapHostToNetwork(&entry);
1144 if (!Lp_Match(afromserver, afrompart, &entry)) {
1145 /* the from server and partition do not exist in the vldb entry corresponding to volid */
1146 if (!Lp_Match(atoserver, atopart, &entry)) {
1147 /* the to server and partition do not exist in the vldb entry corresponding to volid */
1148 fprintf(STDERR, "The volume %lu is not on the specified site. \n",
1149 (unsigned long)afromvol);
1150 fprintf(STDERR, "The current site is :");
1151 for (i = 0; i < entry.nServers; i++) {
1152 if (entry.serverFlags[i] == ITSRWVOL) {
1154 MapPartIdIntoName(entry.serverPartition[i], pname);
1155 fprintf(STDERR, " server %s partition %s \n",
1156 noresolve ? afs_inet_ntoa_r(entry.serverNumber[i], hoststr) :
1157 hostutil_GetNameByINet(entry.serverNumber[i]),
1162 ubik_VL_ReleaseLock(cstruct, 0, afromvol, -1,
1163 (LOCKREL_OPCODE | LOCKREL_AFSID |
1164 LOCKREL_TIMESTAMP));
1165 EGOTO1(mfail, vcode,
1166 " Could not release lock on the VLDB entry for the volume %u \n",
1169 return VOLSERVOLMOVED;
1172 /* delete the volume afromvol on src_server */
1173 /* from-info does not exist but to-info does =>
1174 * we have already done the move, but the volume
1175 * may still be existing physically on from fileserver
1177 fromconn = UV_Bind(afromserver, AFSCONF_VOLUMEPORT);
1182 AFSVolTransCreate(fromconn, afromvol, afrompart, ITOffline,
1184 if (!code) { /* volume exists - delete it */
1185 VPRINT1("Setting flags on leftover source volume %u ...",
1188 AFSVolSetFlags(fromconn, fromtid,
1189 VTDeleteOnSalvage | VTOutOfService);
1191 "Failed to set flags on the leftover source volume %u\n",
1195 VPRINT1("Deleting leftover source volume %u ...", afromvol);
1196 code = AFSVolDeleteVolume(fromconn, fromtid);
1198 "Failed to delete the leftover source volume %u\n",
1202 VPRINT1("Ending transaction on leftover source volume %u ...",
1204 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
1209 "Could not end the transaction for the leftover source volume %u \n",
1214 /*delete the backup volume now */
1217 AFSVolTransCreate(fromconn, backupId, afrompart, ITOffline,
1219 if (!code) { /* backup volume exists - delete it */
1220 VPRINT1("Setting flags on leftover backup volume %u ...",
1223 AFSVolSetFlags(fromconn, fromtid,
1224 VTDeleteOnSalvage | VTOutOfService);
1226 "Failed to set flags on the backup volume %u\n", backupId);
1229 VPRINT1("Deleting leftover backup volume %u ...", backupId);
1230 code = AFSVolDeleteVolume(fromconn, fromtid);
1232 "Could not delete the leftover backup volume %u\n",
1236 VPRINT1("Ending transaction on leftover backup volume %u ...",
1238 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
1243 "Could not end the transaction for the leftover backup volume %u\n",
1253 /* From-info matches the vldb info about volid,
1254 * its ok start the move operation, the backup volume
1255 * on the old site is deleted in the process
1257 if (afrompart == atopart) {
1258 same = VLDB_IsSameAddrs(afromserver, atoserver, &error);
1259 EGOTO2(mfail, error,
1260 "Failed to get info about server's %d address(es) from vlserver (err=%d); aborting call!\n",
1261 afromserver, error);
1264 EGOTO1(mfail, VOLSERVOLMOVED,
1265 "Warning: Moving volume %u to its home partition ignored!\n",
1271 toconn = UV_Bind(atoserver, AFSCONF_VOLUMEPORT); /* get connections to the servers */
1272 fromconn = UV_Bind(afromserver, AFSCONF_VOLUMEPORT);
1273 fromtid = totid = 0; /* initialize to uncreated */
1276 * clone the read/write volume locally.
1279 VPRINT1("Starting transaction on source volume %u ...", afromvol);
1280 code = AFSVolTransCreate(fromconn, afromvol, afrompart, ITBusy, &fromtid);
1281 EGOTO1(mfail, code, "Failed to create transaction on the volume %u\n",
1285 if (!(flags & RV_NOCLONE)) {
1286 /* Get a clone id */
1287 VPRINT1("Allocating new volume id for clone of volume %u ...",
1290 vcode = ubik_VL_GetNewVolumeId(cstruct, 0, 1, &newVol);
1291 EGOTO1(mfail, vcode,
1292 "Could not get an ID for the clone of volume %u from the VLDB\n",
1296 /* Do the clone. Default flags on clone are set to delete on salvage and out of service */
1297 VPRINT1("Cloning source volume %u ...", afromvol);
1298 strcpy(vname, "move-clone-temp");
1300 AFSVolClone(fromconn, fromtid, 0, readonlyVolume, vname, &newVol);
1301 EGOTO1(mfail, code, "Failed to clone the source volume %u\n",
1306 /* lookup the name of the volume we just cloned */
1308 code = AFSVolGetName(fromconn, fromtid, &volName);
1309 EGOTO1(mfail, code, "Failed to get the name of the volume %u\n",
1312 VPRINT1("Ending the transaction on the source volume %u ...", afromvol);
1314 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
1319 "Failed to end the transaction on the source volume %u\n",
1324 * Create the destination volume
1327 if (!(flags & RV_NOCLONE)) {
1328 /* All of this is to get the fromDate */
1329 VPRINT1("Starting transaction on the cloned volume %u ...", newVol);
1331 AFSVolTransCreate(fromconn, newVol, afrompart, ITOffline,
1334 "Failed to start a transaction on the cloned volume%u\n",
1338 VPRINT1("Setting flags on cloned volume %u ...", newVol);
1340 AFSVolSetFlags(fromconn, clonetid,
1341 VTDeleteOnSalvage | VTOutOfService); /*redundant */
1342 EGOTO1(mfail, code, "Could not set flags on the cloned volume %u\n",
1346 /* remember time from which we've dumped the volume */
1347 VPRINT1("Getting status of cloned volume %u ...", newVol);
1348 code = AFSVolGetStatus(fromconn, clonetid, &tstatus);
1350 "Failed to get the status of the cloned volume %u\n",
1354 fromDate = CLOCKADJ(tstatus.creationDate);
1356 /* With RV_NOCLONE, just do a full copy from the source */
1361 #ifdef ENABLE_BUGFIX_1165
1363 * Get the internal volume state from the source volume. We'll use such info (i.e. dayUse)
1364 * to copy it to the new volume (via AFSSetInfo later on) so that when we move volumes we
1365 * don't lose this information...
1367 volumeInfo.volEntries_val = (volintInfo *) 0; /*this hints the stub to allocate space */
1368 volumeInfo.volEntries_len = 0;
1369 code = AFSVolListOneVolume(fromconn, afrompart, afromvol, &volumeInfo);
1371 "Failed to get the volint Info of the cloned volume %u\n",
1374 infop = (volintInfo *) volumeInfo.volEntries_val;
1375 infop->maxquota = -1; /* Else it will replace the default quota */
1376 infop->creationDate = -1; /* Else it will use the source creation date */
1377 infop->updateDate = -1; /* Else it will use the source update date */
1380 /* create a volume on the target machine */
1382 code = AFSVolTransCreate(toconn, volid, atopart, ITOffline, &totid);
1384 /* Delete the existing volume.
1385 * While we are deleting the volume in these steps, the transaction
1386 * we started against the cloned volume (clonetid above) will be
1387 * sitting idle. It will get cleaned up after 600 seconds
1389 VPRINT1("Deleting pre-existing volume %u on destination ...", volid);
1390 code = AFSVolDeleteVolume(toconn, totid);
1392 "Could not delete the pre-existing volume %u on destination\n",
1397 ("Ending transaction on pre-existing volume %u on destination ...",
1399 code = AFSVolEndTrans(toconn, totid, &rcode);
1404 "Could not end the transaction on pre-existing volume %u on destination\n",
1409 VPRINT1("Creating the destination volume %u ...", volid);
1411 AFSVolCreateVolume(toconn, atopart, volName, volser_RW, volid, &volid,
1413 EGOTO1(mfail, code, "Failed to create the destination volume %u\n",
1417 strncpy(tmpName, volName, VOLSER_OLDMAXVOLNAME);
1421 VPRINT1("Setting volume flags on destination volume %u ...", volid);
1423 AFSVolSetFlags(toconn, totid, (VTDeleteOnSalvage | VTOutOfService));
1425 "Failed to set the flags on the destination volume %u\n", volid);
1429 * Now dump the clone to the new volume
1432 destination.destHost = ntohl(atoserver);
1433 destination.destPort = AFSCONF_VOLUMEPORT;
1434 destination.destSSID = 1;
1436 strncpy(cookie.name, tmpName, VOLSER_OLDMAXVOLNAME);
1437 cookie.type = RWVOL;
1438 cookie.parent = entry.volumeId[RWVOL];
1441 if (!(flags & RV_NOCLONE)) {
1442 /* Copy the clone to the new volume */
1443 VPRINT2("Dumping from clone %u on source to volume %u on destination ...",
1446 AFSVolForward(fromconn, clonetid, 0, &destination, totid,
1448 EGOTO1(mfail, code, "Failed to move data for the volume %u\n", volid);
1451 VPRINT1("Ending transaction on cloned volume %u ...", newVol);
1452 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
1457 "Failed to end the transaction on the cloned volume %u\n",
1463 * reattach to the main-line volume, and incrementally dump it.
1466 VPRINT1("Starting transaction on source volume %u ...", afromvol);
1467 code = AFSVolTransCreate(fromconn, afromvol, afrompart, ITBusy, &fromtid);
1469 "Failed to create a transaction on the source volume %u\n",
1473 /* now do the incremental */
1475 ("Doing the%s dump from source to destination for volume %u ... ",
1476 (flags & RV_NOCLONE) ? "" : " incremental",
1479 AFSVolForward(fromconn, fromtid, fromDate, &destination, totid,
1482 "Failed to do the%s dump from rw volume on old site to rw volume on newsite\n",
1483 (flags & RV_NOCLONE) ? "" : " incremental");
1486 /* now adjust the flags so that the new volume becomes official */
1487 VPRINT1("Setting volume flags on old source volume %u ...", afromvol);
1488 code = AFSVolSetFlags(fromconn, fromtid, VTOutOfService);
1490 "Failed to set the flags to make old source volume offline\n");
1493 VPRINT1("Setting volume flags on new source volume %u ...", afromvol);
1494 code = AFSVolSetFlags(toconn, totid, 0);
1496 "Failed to set the flags to make new source volume online\n");
1499 #ifdef ENABLE_BUGFIX_1165
1500 VPRINT1("Setting volume status on destination volume %u ...", volid);
1501 code = AFSVolSetInfo(toconn, totid, infop);
1503 "Failed to set volume status on the destination volume %u\n",
1508 /* put new volume online */
1509 VPRINT1("Ending transaction on destination volume %u ...", afromvol);
1510 code = AFSVolEndTrans(toconn, totid, &rcode);
1515 "Failed to end the transaction on the volume %u on the new site\n",
1519 Lp_SetRWValue(&entry, afromserver, afrompart, atoserver, atopart);
1520 MapNetworkToHost(&entry, &storeEntry);
1521 storeEntry.flags &= ~BACK_EXISTS;
1525 "Second test point - operation in progress but not complete.\n");
1526 fprintf(STDOUT, "...test here (y, n)? ");
1528 fscanf(stdin, "%c", &in);
1529 fscanf(stdin, "%c", &lf); /* toss away */
1531 fprintf(STDOUT, "type control-c\n");
1533 fprintf(stdout, ".");
1538 /* or drop through */
1541 VPRINT1("Releasing lock on VLDB entry for volume %u ...", afromvol);
1543 VLDB_ReplaceEntry(afromvol, -1, &storeEntry,
1544 (LOCKREL_OPCODE | LOCKREL_AFSID |
1545 LOCKREL_TIMESTAMP));
1548 " Could not release the lock on the VLDB entry for the volume %s %lu \n",
1549 storeEntry.name, (unsigned long)afromvol);
1558 "Third test point - operation complete but no cleanup.\n");
1559 fprintf(STDOUT, "...test here (y, n)? ");
1561 fscanf(stdin, "%c", &in);
1562 fscanf(stdin, "%c", &lf); /* toss away */
1564 fprintf(STDOUT, "type control-c\n");
1566 fprintf(stdout, ".");
1571 /* or drop through */
1574 /* This is tricky. File server is very stupid, and if you mark the volume
1575 * as VTOutOfService, it may mark the *good* instance (if you're moving
1576 * between partitions on the same machine) as out of service. Since
1577 * we're cleaning this code up in DEcorum, we're just going to kludge around
1578 * it for now by removing this call. */
1579 /* already out of service, just zap it now */
1581 AFSVolSetFlags(fromconn, fromtid, VTDeleteOnSalvage | VTOutOfService);
1584 "Failed to set the flags to make the old source volume offline\n");
1588 if (atoserver != afromserver) {
1589 /* set forwarding pointer for moved volumes */
1590 VPRINT1("Setting forwarding pointer for volume %u ...", afromvol);
1591 code = AFSVolSetForwarding(fromconn, fromtid, atoserver);
1593 "Failed to set the forwarding pointer for the volume %u\n",
1598 VPRINT1("Deleting old volume %u on source ...", afromvol);
1599 code = AFSVolDeleteVolume(fromconn, fromtid); /* zap original volume */
1600 EGOTO1(mfail, code, "Failed to delete the old volume %u on source\n",
1604 VPRINT1("Ending transaction on old volume %u on the source ...",
1606 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
1611 "Failed to end the transaction on the old volume %u on the source\n",
1615 /* Delete the backup volume on the original site */
1616 VPRINT1("Creating transaction for backup volume %u on source ...",
1619 AFSVolTransCreate(fromconn, backupId, afrompart, ITOffline, &fromtid);
1622 VPRINT1("Setting flags on backup volume %u on source ...", backupId);
1624 AFSVolSetFlags(fromconn, fromtid,
1625 VTDeleteOnSalvage | VTOutOfService);
1627 "Failed to set the flags on the backup volume %u on the source\n",
1631 VPRINT1("Deleting the backup volume %u on the source ...", backupId);
1632 code = AFSVolDeleteVolume(fromconn, fromtid);
1634 "Failed to delete the backup volume %u on the source\n",
1638 VPRINT1("Ending transaction on backup volume %u on source ...",
1640 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
1645 "Failed to end the transaction on the backup volume %u on the source\n",
1649 code = 0; /* no backup volume? that's okay */
1652 if (!(flags & RV_NOCLONE)) {
1653 VPRINT1("Starting transaction on the cloned volume %u ...", newVol);
1655 AFSVolTransCreate(fromconn, newVol, afrompart, ITOffline,
1658 "Failed to start a transaction on the cloned volume%u\n",
1662 /* now delete the clone */
1663 VPRINT1("Deleting the cloned volume %u ...", newVol);
1664 code = AFSVolDeleteVolume(fromconn, clonetid);
1665 EGOTO1(mfail, code, "Failed to delete the cloned volume %u\n",
1669 VPRINT1("Ending transaction on cloned volume %u ...", newVol);
1670 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
1675 "Failed to end the transaction on the cloned volume %u\n",
1684 fprintf(STDOUT, "Fourth test point - operation complete.\n");
1685 fprintf(STDOUT, "...test here (y, n)? ");
1687 fscanf(stdin, "%c", &in);
1688 fscanf(stdin, "%c", &lf); /* toss away */
1690 fprintf(STDOUT, "type control-c\n");
1692 fprintf(stdout, ".");
1697 /* or drop through */
1700 /* normal cleanup code */
1702 if (entry.flags & RO_EXISTS)
1703 fprintf(STDERR, "WARNING : readOnly copies still exist \n");
1706 VPRINT1("Cleanup: Releasing VLDB lock on volume %u ...", afromvol);
1708 ubik_VL_ReleaseLock(cstruct, 0, afromvol, -1,
1709 (LOCKREL_OPCODE | LOCKREL_AFSID | LOCKREL_TIMESTAMP));
1713 " Could not release the lock on the VLDB entry for the volume %lu \n",
1714 (unsigned long)afromvol);
1722 VPRINT1("Cleanup: Ending transaction on source volume %u ...",
1724 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
1725 if (code || rcode) {
1728 "Could not end transaction on the source volume %lu\n",
1729 (unsigned long)afromvol);
1731 error = (code ? code : rcode);
1737 VPRINT1("Cleanup: Ending transaction on clone volume %u ...", newVol);
1738 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
1739 if (code || rcode) {
1742 "Could not end transaction on the source's clone volume %lu\n",
1743 (unsigned long)newVol);
1745 error = (code ? code : rcode);
1751 VPRINT1("Cleanup: Ending transaction on destination volume %u ...",
1753 code = AFSVolEndTrans(toconn, totid, &rcode);
1757 "Could not end transaction on destination volume %lu\n",
1758 (unsigned long)afromvol);
1760 error = (code ? code : rcode);
1766 #ifdef ENABLE_BUGFIX_1165
1771 rx_DestroyConnection(fromconn);
1773 rx_DestroyConnection(toconn);
1774 PrintError("", error);
1777 /* come here only when the sky falls */
1782 "vos move: operation interrupted, cleanup in progress...\n");
1783 fprintf(STDOUT, "clear transaction contexts\n");
1787 /* unlock VLDB entry */
1789 VPRINT1("Recovery: Releasing VLDB lock on volume %u ...", afromvol);
1790 ubik_VL_ReleaseLock(cstruct, 0, afromvol, -1,
1791 (LOCKREL_OPCODE | LOCKREL_AFSID | LOCKREL_TIMESTAMP));
1797 VPRINT("Recovery: Ending transaction on clone volume ...");
1798 AFSVolEndTrans(fromconn, clonetid, &rcode);
1802 VPRINT("Recovery: Ending transaction on destination volume ...");
1803 AFSVolEndTrans(toconn, totid, &rcode);
1806 if (fromtid) { /* put it on-line */
1807 VPRINT("Recovery: Setting volume flags on source volume ...");
1808 AFSVolSetFlags(fromconn, fromtid, 0);
1811 VPRINT("Recovery: Ending transaction on source volume ...");
1812 AFSVolEndTrans(fromconn, fromtid, &rcode);
1816 VPRINT("Recovery: Accessing VLDB.\n");
1817 vcode = VLDB_GetEntryByID(afromvol, -1, &entry);
1819 fprintf(STDOUT, "FATAL: VLDB access error: abort cleanup\n");
1823 MapHostToNetwork(&entry);
1825 /* Delete either the volume on the source location or the target location.
1826 * If the vldb entry still points to the source location, then we know the
1827 * volume move didn't finish so we remove the volume from the target
1828 * location. Otherwise, we remove the volume from the source location.
1830 if (Lp_Match(afromserver, afrompart, &entry)) { /* didn't move - delete target volume */
1833 "move incomplete - attempt cleanup of target partition - no guarantee\n");
1837 if (volid && toconn) {
1839 ("Recovery: Creating transaction for destination volume %u ...",
1842 AFSVolTransCreate(toconn, volid, atopart, ITOffline, &totid);
1848 ("Recovery: Setting flags on destination volume %u ...",
1850 AFSVolSetFlags(toconn, totid,
1851 VTDeleteOnSalvage | VTOutOfService);
1854 VPRINT1("Recovery: Deleting destination volume %u ...",
1856 AFSVolDeleteVolume(toconn, totid);
1860 ("Recovery: Ending transaction on destination volume %u ...",
1862 AFSVolEndTrans(toconn, totid, &rcode);
1866 ("\nRecovery: Unable to start transaction on destination volume %u.\n",
1871 /* put source volume on-line */
1873 VPRINT1("Recovery: Creating transaction on source volume %u ...",
1876 AFSVolTransCreate(fromconn, afromvol, afrompart, ITBusy,
1881 VPRINT1("Recovery: Setting flags on source volume %u ...",
1883 AFSVolSetFlags(fromconn, fromtid, 0);
1887 ("Recovery: Ending transaction on source volume %u ...",
1889 AFSVolEndTrans(fromconn, fromtid, &rcode);
1893 ("\nRecovery: Unable to start transaction on source volume %u.\n",
1897 } else { /* yep, move complete */
1900 "move complete - attempt cleanup of source partition - no guarantee\n");
1904 /* delete backup volume */
1906 VPRINT1("Recovery: Creating transaction on backup volume %u ...",
1909 AFSVolTransCreate(fromconn, backupId, afrompart, ITOffline,
1914 VPRINT1("Recovery: Setting flags on backup volume %u ...",
1916 AFSVolSetFlags(fromconn, fromtid,
1917 VTDeleteOnSalvage | VTOutOfService);
1920 VPRINT1("Recovery: Deleting backup volume %u ...", backupId);
1921 AFSVolDeleteVolume(fromconn, fromtid);
1925 ("Recovery: Ending transaction on backup volume %u ...",
1927 AFSVolEndTrans(fromconn, fromtid, &rcode);
1931 ("\nRecovery: Unable to start transaction on backup volume %u.\n",
1935 /* delete source volume */
1936 VPRINT1("Recovery: Creating transaction on source volume %u ...",
1939 AFSVolTransCreate(fromconn, afromvol, afrompart, ITBusy,
1944 VPRINT1("Recovery: Setting flags on backup volume %u ...",
1946 AFSVolSetFlags(fromconn, fromtid,
1947 VTDeleteOnSalvage | VTOutOfService);
1950 if (atoserver != afromserver) {
1951 VPRINT("Recovery: Setting volume forwarding pointer ...");
1952 AFSVolSetForwarding(fromconn, fromtid, atoserver);
1956 VPRINT1("Recovery: Deleting source volume %u ...", afromvol);
1957 AFSVolDeleteVolume(fromconn, fromtid);
1961 ("Recovery: Ending transaction on source volume %u ...",
1963 AFSVolEndTrans(fromconn, fromtid, &rcode);
1967 ("\nRecovery: Unable to start transaction on source volume %u.\n",
1973 /* common cleanup - delete local clone */
1975 VPRINT1("Recovery: Creating transaction on clone volume %u ...",
1978 AFSVolTransCreate(fromconn, newVol, afrompart, ITOffline,
1983 VPRINT1("Recovery: Deleting clone volume %u ...", newVol);
1984 AFSVolDeleteVolume(fromconn, clonetid);
1987 VPRINT1("Recovery: Ending transaction on clone volume %u ...",
1989 AFSVolEndTrans(fromconn, clonetid, &rcode);
1993 ("\nRecovery: Unable to start transaction on source volume %u.\n",
1998 /* unlock VLDB entry */
2000 VPRINT1("Recovery: Releasing lock on VLDB entry for volume %u ...",
2002 ubik_VL_ReleaseLock(cstruct, 0, afromvol, -1,
2003 (LOCKREL_OPCODE | LOCKREL_AFSID | LOCKREL_TIMESTAMP));
2007 done: /* routine cleanup */
2010 #ifdef ENABLE_BUGFIX_1165
2015 rx_DestroyConnection(fromconn);
2017 rx_DestroyConnection(toconn);
2020 fprintf(STDOUT, "cleanup complete - user verify desired result\n");
/* Move volume <afromvol> from <afromserver> <afrompart> to <atoserver>
 * <atopart>. Convenience entry point: every argument is forwarded
 * unchanged to UV_MoveVolume2 with a flags value of 0, and the result of
 * that call is returned to the caller. */
2028 UV_MoveVolume(afs_int32 afromvol, afs_int32 afromserver, afs_int32 afrompart,
2029 afs_int32 atoserver, afs_int32 atopart)
2031 return UV_MoveVolume2(afromvol, afromserver, afrompart,
2032 atoserver, atopart, 0);
2036 /* Copy volume <afromvol> from <afromserver> <afrompart> to <atoserver>
2037 * <atopart>. The new volume is named by <atovolname>. The new volume
2038 * has ID <atovolid> if that is nonzero; otherwise a new ID is allocated
2039 * from the VLDB. The following flags are supported:
2041 * RV_RDONLY - target volume is RO
2042 * RV_OFFLINE - leave target volume offline
2043 * RV_CPINCR - do incremental dump if target exists
2044 * RV_NOVLDB - don't create/update VLDB entry
2045 * RV_NOCLONE - don't use a copy clone
2048 UV_CopyVolume2(afs_int32 afromvol, afs_int32 afromserver, afs_int32 afrompart,
2049 char *atovolname, afs_int32 atoserver, afs_int32 atopart,
2050 afs_int32 atovolid, int flags)
2052 struct rx_connection *toconn, *fromconn;
2053 afs_int32 fromtid, totid, clonetid;
2056 afs_int32 fromDate, cloneFromDate;
2057 struct restoreCookie cookie;
2058 register afs_int32 vcode, code;
2059 afs_int32 cloneVol, newVol, volflag;
2060 struct volser_status tstatus;
2061 struct destServer destination;
2063 struct nvldbentry entry, newentry, storeEntry;
2069 fromconn = (struct rx_connection *)0;
2070 toconn = (struct rx_connection *)0;
2078 /* support control-c processing */
2081 (void)signal(SIGINT, sigint_handler);
/* Look up the VLDB entry of the source volume by ID before touching any
 * volume server; the error path for this call is the mfail label. */
2083 vcode = VLDB_GetEntryByID(afromvol, -1, &entry);
2084 EGOTO1(mfail, vcode,
2085 "Could not fetch the entry for the volume %u from the VLDB \n",
2087 MapHostToNetwork(&entry);
2090 toconn = UV_Bind(atoserver, AFSCONF_VOLUMEPORT); /* get connections to the servers */
2091 fromconn = UV_Bind(afromserver, AFSCONF_VOLUMEPORT);
2092 fromtid = totid = 0; /* initialize to uncreated */
2095 /* check if we can shortcut and use a local clone instead of a full copy */
2096 if (afromserver == atoserver && afrompart == atopart) {
2101 * clone the read/write volume locally.
2105 if (!(flags & RV_NOCLONE)) {
2106 VPRINT1("Starting transaction on source volume %u ...", afromvol);
2107 code = AFSVolTransCreate(fromconn, afromvol, afrompart, ITBusy,
2109 EGOTO1(mfail, code, "Failed to create transaction on the volume %u\n",
2113 /* Get a clone id */
2114 VPRINT1("Allocating new volume id for clone of volume %u ...",
2117 vcode = ubik_VL_GetNewVolumeId(cstruct, 0, 1, &cloneVol);
2118 EGOTO1(mfail, vcode,
2119 "Could not get an ID for the clone of volume %u from the VLDB\n",
2127 /* Get a new volume id */
2128 VPRINT1("Allocating new volume id for copy of volume %u ...", afromvol);
2130 vcode = ubik_VL_GetNewVolumeId(cstruct, 0, 1, &newVol);
2131 EGOTO1(mfail, vcode,
2132 "Could not get an ID for the copy of volume %u from the VLDB\n",
2137 if (!(flags & RV_NOCLONE)) {
2138 /* Do the clone. Default flags on clone are set to delete on salvage and out of service */
2139 VPRINT1("Cloning source volume %u ...", afromvol);
2140 strcpy(vname, "copy-clone-temp");
2142 AFSVolClone(fromconn, fromtid, 0, readonlyVolume, vname,
2144 EGOTO1(mfail, code, "Failed to clone the source volume %u\n",
2148 VPRINT1("Ending the transaction on the source volume %u ...", afromvol);
2150 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
2155 "Failed to end the transaction on the source volume %u\n",
2161 * Create the destination volume
2164 if (!(flags & RV_NOCLONE)) {
2165 VPRINT1("Starting transaction on the cloned volume %u ...", cloneVol);
2167 AFSVolTransCreate(fromconn, cloneVol, afrompart, ITOffline,
2170 "Failed to start a transaction on the cloned volume%u\n",
2174 VPRINT1("Setting flags on cloned volume %u ...", cloneVol);
2176 AFSVolSetFlags(fromconn, clonetid,
2177 VTDeleteOnSalvage | VTOutOfService); /*redundant */
2178 EGOTO1(mfail, code, "Could not set flags on the cloned volume %u\n",
2182 /* remember time from which we've dumped the volume */
2183 VPRINT1("Getting status of cloned volume %u ...", cloneVol);
2184 code = AFSVolGetStatus(fromconn, clonetid, &tstatus);
2186 "Failed to get the status of the cloned volume %u\n",
2190 fromDate = CLOCKADJ(tstatus.creationDate);
2195 /* create a volume on the target machine */
2197 code = AFSVolTransCreate(toconn, newVol, atopart, ITOffline, &totid);
/* Incremental copy requested (RV_CPINCR): read the status of the volume
 * already present on the destination so that its update date can be used
 * as the starting point of the dump. */
2199 if ((flags & RV_CPINCR)) {
2200 VPRINT1("Getting status of pre-existing volume %u ...", newVol);
2201 code = AFSVolGetStatus(toconn, totid, &tstatus);
2203 "Failed to get the status of the pre-existing volume %u\n",
2207 /* Using the update date should be OK here, but add some fudge */
2208 cloneFromDate = CLOCKADJ(tstatus.updateDate);
/* With RV_NOCLONE there is no clone dump, so the dump taken directly
 * from the source volume starts from the same date. */
2209 if ((flags & RV_NOCLONE))
2210 fromDate = cloneFromDate;
2212 /* XXX We should check that the source volume's creationDate is
2213 * XXX not newer than the existing target volume, and if not,
2214 * XXX throw away the existing target and do a full dump. */
2219 /* Delete the existing volume.
2220 * While we are deleting the volume in these steps, the transaction
2221 * we started against the cloned volume (clonetid above) will be
2222 * sitting idle. It will get cleaned up after 600 seconds
2224 VPRINT1("Deleting pre-existing volume %u on destination ...", newVol);
2225 code = AFSVolDeleteVolume(toconn, totid);
2227 "Could not delete the pre-existing volume %u on destination\n",
2232 ("Ending transaction on pre-existing volume %u on destination ...",
2234 code = AFSVolEndTrans(toconn, totid, &rcode);
2239 "Could not end the transaction on pre-existing volume %u on destination\n",
2244 VPRINT1("Creating the destination volume %u ...", newVol);
2246 AFSVolCreateVolume(toconn, atopart, atovolname,
2247 (flags & RV_RDONLY) ? volser_RO : volser_RW,
2248 newVol, &newVol, &totid);
2249 EGOTO1(mfail, code, "Failed to create the destination volume %u\n",
2253 VPRINT1("Setting volume flags on destination volume %u ...", newVol);
2255 AFSVolSetFlags(toconn, totid, (VTDeleteOnSalvage | VTOutOfService));
2257 "Failed to set the flags on the destination volume %u\n", newVol);
2262 destination.destHost = ntohl(atoserver);
2263 destination.destPort = AFSCONF_VOLUMEPORT;
2264 destination.destSSID = 1;
2266 strncpy(cookie.name, atovolname, VOLSER_OLDMAXVOLNAME);
2267 cookie.type = (flags & RV_RDONLY) ? ROVOL : RWVOL;
2272 * Now dump the clone to the new volume
2275 if (!(flags & RV_NOCLONE)) {
2276 /* XXX probably should have some code here that checks to see if
2277 * XXX we are copying to same server and partition - if so, just
2278 * XXX use a clone to save disk space */
2280 /* Copy the clone to the new volume */
2281 VPRINT2("Dumping from clone %u on source to volume %u on destination ...",
2284 AFSVolForward(fromconn, clonetid, cloneFromDate, &destination,
2286 EGOTO1(mfail, code, "Failed to move data for the volume %u\n",
2290 VPRINT1("Ending transaction on cloned volume %u ...", cloneVol);
2291 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
2296 "Failed to end the transaction on the cloned volume %u\n",
2302 * reattach to the main-line volume, and incrementally dump it.
2305 VPRINT1("Starting transaction on source volume %u ...", afromvol);
2306 code = AFSVolTransCreate(fromconn, afromvol, afrompart, ITBusy, &fromtid);
2308 "Failed to create a transaction on the source volume %u\n",
2312 /* now do the incremental */
2314 ("Doing the%s dump from source to destination for volume %u ... ",
2315 (flags & RV_NOCLONE) ? "" : " incremental",
2318 AFSVolForward(fromconn, fromtid, fromDate, &destination, totid,
2321 "Failed to do the%s dump from old site to new site\n",
2325 VPRINT1("Setting volume flags on destination volume %u ...", newVol);
2326 volflag = ((flags & RV_OFFLINE) ? VTOutOfService : 0); /* off or on-line */
2327 code = AFSVolSetFlags(toconn, totid, volflag);
2329 "Failed to set the flags to make destination volume online\n");
2332 /* put new volume online */
2333 VPRINT1("Ending transaction on destination volume %u ...", newVol);
2334 code = AFSVolEndTrans(toconn, totid, &rcode);
2339 "Failed to end the transaction on the destination volume %u\n",
2343 VPRINT1("Ending transaction on source volume %u ...", afromvol);
2344 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
2349 "Failed to end the transaction on the source volume %u\n",
2355 if (!(flags & RV_NOCLONE)) {
2356 VPRINT1("Starting transaction on the cloned volume %u ...", cloneVol);
2358 AFSVolTransCreate(fromconn, cloneVol, afrompart, ITOffline,
2361 "Failed to start a transaction on the cloned volume%u\n",
2365 /* now delete the clone */
2366 VPRINT1("Deleting the cloned volume %u ...", cloneVol);
2367 code = AFSVolDeleteVolume(fromconn, clonetid);
2368 EGOTO1(mfail, code, "Failed to delete the cloned volume %u\n",
2372 VPRINT1("Ending transaction on cloned volume %u ...", cloneVol);
2373 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
2378 "Failed to end the transaction on the cloned volume %u\n",
2383 if (!(flags & RV_NOVLDB)) {
2384 /* create the vldb entry for the copied volume */
2385 strncpy(newentry.name, atovolname, VOLSER_OLDMAXVOLNAME);
/* The new entry describes exactly one site: the destination server and
 * partition, typed RO or RW according to RV_RDONLY. */
2386 newentry.nServers = 1;
2387 newentry.serverNumber[0] = atoserver;
2388 newentry.serverPartition[0] = atopart;
2389 newentry.flags = (flags & RV_RDONLY) ? RO_EXISTS : RW_EXISTS;
2390 newentry.serverFlags[0] = (flags & RV_RDONLY) ? ITSROVOL : ITSRWVOL;
/* The RW slot always records the new volume id; the RO slot records it
 * only for a read-only copy, and no backup or clone id is assigned. */
2391 newentry.volumeId[RWVOL] = newVol;
2392 newentry.volumeId[ROVOL] = (flags & RV_RDONLY) ? newVol : 0;
2393 newentry.volumeId[BACKVOL] = 0;
2394 newentry.cloneId = 0;
2395 /* Map into the right byte order: before being passed to xdr the entry has
2396 * to be in host byte order. Xdr then converts it into network order. */
2397 MapNetworkToHost(&newentry, &storeEntry);
2398 /* create the vldb entry */
2399 vcode = VLDB_CreateEntry(&storeEntry);
2402 "Could not create a VLDB entry for the volume %s %lu\n",
2403 atovolname, (unsigned long)newVol);
2404 /*destroy the created volume */
2405 VPRINT1("Deleting the newly created volume %u\n", newVol);
2406 AFSVolDeleteVolume(toconn, totid);
2410 VPRINT2("Created the VLDB entry for the volume %s %u\n", atovolname,
2414 /* normal cleanup code */
2417 VPRINT1("Cleanup: Ending transaction on source volume %u ...",
2419 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
2420 if (code || rcode) {
2423 "Could not end transaction on the source volume %lu\n",
2424 (unsigned long)afromvol);
2426 error = (code ? code : rcode);
2432 VPRINT1("Cleanup: Ending transaction on clone volume %u ...",
2434 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
2435 if (code || rcode) {
2438 "Could not end transaction on the source's clone volume %lu\n",
2439 (unsigned long)cloneVol);
2441 error = (code ? code : rcode);
2447 VPRINT1("Cleanup: Ending transaction on destination volume %u ...",
2449 code = AFSVolEndTrans(toconn, totid, &rcode);
2453 "Could not end transaction on destination volume %lu\n",
2454 (unsigned long)newVol);
2456 error = (code ? code : rcode);
2461 rx_DestroyConnection(fromconn);
2463 rx_DestroyConnection(toconn);
2464 PrintError("", error);
2467 /* come here only when the sky falls */
2472 "vos copy: operation interrupted, cleanup in progress...\n");
2473 fprintf(STDOUT, "clear transaction contexts\n");
2478 VPRINT("Recovery: Ending transaction on clone volume ...");
2479 AFSVolEndTrans(fromconn, clonetid, &rcode);
2483 VPRINT("Recovery: Ending transaction on destination volume ...");
2484 AFSVolEndTrans(toconn, totid, &rcode);
2487 if (fromtid) { /* put it on-line */
2488 VPRINT("Recovery: Ending transaction on source volume ...");
2489 AFSVolEndTrans(fromconn, fromtid, &rcode);
2493 VPRINT("Recovery: Accessing VLDB.\n");
2494 vcode = VLDB_GetEntryByID(afromvol, -1, &entry);
2496 fprintf(STDOUT, "FATAL: VLDB access error: abort cleanup\n");
2500 MapHostToNetwork(&entry);
2502 /* common cleanup - delete local clone */
2504 VPRINT1("Recovery: Creating transaction on clone volume %u ...",
2507 AFSVolTransCreate(fromconn, cloneVol, afrompart, ITOffline,
2512 VPRINT1("Recovery: Deleting clone volume %u ...", cloneVol);
2513 AFSVolDeleteVolume(fromconn, clonetid);
2516 VPRINT1("Recovery: Ending transaction on clone volume %u ...",
2518 AFSVolEndTrans(fromconn, clonetid, &rcode);
2522 ("\nRecovery: Unable to start transaction on clone volume %u.\n",
2527 done: /* routine cleanup */
2529 rx_DestroyConnection(fromconn);
2531 rx_DestroyConnection(toconn);
2534 fprintf(STDOUT, "cleanup complete - user verify desired result\n");
/* Copy volume <afromvol> from <afromserver> <afrompart> to <atoserver>
 * <atopart> under the name <atovolname>. Convenience entry point: the
 * arguments are forwarded to UV_CopyVolume2 with an <atovolid> of 0 and
 * a flags value of 0, and the result of that call is returned. */
2542 UV_CopyVolume(afs_int32 afromvol, afs_int32 afromserver, afs_int32 afrompart,
2543 char *atovolname, afs_int32 atoserver, afs_int32 atopart)
2545 return UV_CopyVolume2(afromvol, afromserver, afrompart,
2546 atovolname, atoserver, atopart, 0, 0);
2551 /* Make a new backup of volume <avolid> on <aserver> and <apart>.
2552 * If one already exists, update it.
2556 UV_BackupVolume(afs_int32 aserver, afs_int32 apart, afs_int32 avolid)
2558 struct rx_connection *aconn = (struct rx_connection *)0;
2559 afs_int32 ttid = 0, btid = 0;
2561 afs_int32 code = 0, rcode = 0;
2562 char vname[VOLSER_MAXVOLNAME + 1];
2563 struct nvldbentry entry, storeEntry;
2564 afs_int32 error = 0;
2565 int vldblocked = 0, vldbmod = 0, backexists = 1;
2567 aconn = UV_Bind(aserver, AFSCONF_VOLUMEPORT);
2569 /* the calls to VLDB will succeed only if avolid is a RW volume,
2570 * since we are following the RW hash chain for searching */
2571 code = VLDB_GetEntryByID(avolid, RWVOL, &entry);
2574 "Could not fetch the entry for the volume %lu from the VLDB \n",
2575 (unsigned long)avolid);
2579 MapHostToNetwork(&entry);
2581 /* These operations require the VLDB be locked since it means the VLDB
2582 * will change or the vldb is already locked.
2584 if (!(entry.flags & BACK_EXISTS) || /* backup volume doesnt exist */
2585 (entry.flags & VLOP_ALLOPERS) || /* vldb lock already held */
2586 (entry.volumeId[BACKVOL] == INVALID_BID)) { /* no assigned backup volume id */
2588 code = ubik_VL_SetLock(cstruct, 0, avolid, RWVOL, VLOP_BACKUP);
2591 "Could not lock the VLDB entry for the volume %lu\n",
2592 (unsigned long)avolid);
2598 /* Reread the vldb entry */
2599 code = VLDB_GetEntryByID(avolid, RWVOL, &entry);
2602 "Could not fetch the entry for the volume %lu from the VLDB \n",
2603 (unsigned long)avolid);
2607 MapHostToNetwork(&entry);
/* Reject the request with VOLSERBADNAME when the volume name does not
 * pass the ISNAMEVALID check. */
2610 if (!ISNAMEVALID(entry.name)) {
2611 fprintf(STDERR, "Name of the volume %s exceeds the size limit\n",
2613 error = VOLSERBADNAME;
/* Start from the backup volume id recorded in the VLDB entry; a fresh id
 * is requested from the VLDB only when none has been assigned yet. */
2617 backupID = entry.volumeId[BACKVOL];
2618 if (backupID == INVALID_BID) {
2619 /* Get a backup volume id from the VLDB and update the vldb
2622 code = ubik_VL_GetNewVolumeId(cstruct, 0, 1, &backupID);
2625 "Could not allocate ID for the backup volume of %lu from the VLDB\n",
2626 (unsigned long)avolid);
2630 entry.volumeId[BACKVOL] = backupID;
2634 /* Test to see if the backup volume exists by trying to create
2635 * a transaction on the backup volume. We've assumed the backup exists.
2637 code = AFSVolTransCreate(aconn, backupID, apart, ITOffline, &btid);
2639 if (code != VNOVOL) {
2640 fprintf(STDERR, "Could not reach the backup volume %lu\n",
2641 (unsigned long)backupID);
2645 backexists = 0; /* backup volume does not exist */
/* Close the probe transaction that was opened on the existing backup
 * volume. */
2648 code = AFSVolEndTrans(aconn, btid, &rcode);
2650 if (code || rcode) {
2652 "Could not end transaction on the previous backup volume %lu\n",
2653 (unsigned long)backupID);
2654 error = (code ? code : rcode);
2659 /* Now go ahead and try to clone the RW volume.
2660 * First start a transaction on the RW volume
2662 code = AFSVolTransCreate(aconn, avolid, apart, ITBusy, &ttid);
2664 fprintf(STDERR, "Could not start a transaction on the volume %lu\n",
2665 (unsigned long)avolid);
2670 /* Clone or reclone the volume, depending on whether the backup
2671 * volume exists or not
2674 VPRINT1("Re-cloning backup volume %u ...", backupID);
2676 code = AFSVolReClone(aconn, ttid, backupID);
2678 fprintf(STDERR, "Could not re-clone backup volume %lu\n",
2679 (unsigned long)backupID);
2684 VPRINT1("Creating a new backup clone %u ...", backupID);
2686 strcpy(vname, entry.name);
2687 strcat(vname, ".backup");
2689 code = AFSVolClone(aconn, ttid, 0, backupVolume, vname, &backupID);
2691 fprintf(STDERR, "Failed to clone the volume %lu\n",
2692 (unsigned long)avolid);
2698 /* End the transaction on the RW volume */
2699 code = AFSVolEndTrans(aconn, ttid, &rcode);
2701 if (code || rcode) {
2703 "Failed to end the transaction on the rw volume %lu\n",
2704 (unsigned long)avolid);
2705 error = (code ? code : rcode);
2709 /* Mark the vldb entry as having a backup volume */
2710 if (!(entry.flags & BACK_EXISTS)) {
2711 entry.flags |= BACK_EXISTS;
2715 /* Now go back to the backup volume and bring it on line */
2716 code = AFSVolTransCreate(aconn, backupID, apart, ITOffline, &btid);
2719 "Failed to start a transaction on the backup volume %lu\n",
2720 (unsigned long)backupID);
2725 code = AFSVolSetFlags(aconn, btid, 0);
2727 fprintf(STDERR, "Could not mark the backup volume %lu on line \n",
2728 (unsigned long)backupID);
2733 code = AFSVolEndTrans(aconn, btid, &rcode);
2735 if (code || rcode) {
2737 "Failed to end the transaction on the backup volume %lu\n",
2738 (unsigned long)backupID);
2739 error = (code ? code : rcode);
2745 /* Will update the vldb below */
/* Cleanup: end whatever transaction is still open on the RW volume.
 * NOTE(review): presumably guarded by a check that ttid is set; the
 * guard line is not visible here - confirm. */
2749 code = AFSVolEndTrans(aconn, ttid, &rcode);
2750 if (code || rcode) {
2751 fprintf(STDERR, "Could not end transaction on the volume %lu\n",
2752 (unsigned long)avolid);
2754 error = (code ? code : rcode);
/* Cleanup: likewise for the transaction on the backup volume. */
2759 code = AFSVolEndTrans(aconn, btid, &rcode);
2760 if (code || rcode) {
2762 "Could not end transaction the backup volume %lu\n",
2763 (unsigned long)backupID);
2765 error = (code ? code : rcode);
2769 /* Now update the vldb - if modified */
2772 MapNetworkToHost(&entry, &storeEntry);
2774 VLDB_ReplaceEntry(avolid, RWVOL, &storeEntry,
2775 (LOCKREL_OPCODE | LOCKREL_AFSID |
2776 LOCKREL_TIMESTAMP));
2779 "Could not update the VLDB entry for the volume %lu \n",
2780 (unsigned long)avolid);
/* NOTE(review): presumably the alternative taken when the entry was
 * locked but there is nothing to store, so the lock is simply released;
 * the selecting condition is not visible here - confirm. */
2786 ubik_VL_ReleaseLock(cstruct, 0, avolid, RWVOL,
2787 (LOCKREL_OPCODE | LOCKREL_AFSID |
2788 LOCKREL_TIMESTAMP));
2791 "Could not unlock the VLDB entry for the volume %lu \n",
2792 (unsigned long)avolid);
2800 rx_DestroyConnection(aconn);
2802 PrintError("", error);
2806 /* Make a new clone of volume <avolid> on <aserver> and <apart>
2807 * using volume ID <acloneid>, or a new ID allocated from the VLDB.
2808 * The new volume is named by <aname>, or by appending ".clone" to
2809 * the existing name if <aname> is NULL. The following flags are
 * recognized in <flags>:
2812 * RV_RDONLY - target volume is RO
2813 * RV_OFFLINE - leave target volume offline
 *
 * When the name is derived from the existing one, that name is first
 * cut to VOLSER_OLDMAXVOLNAME - 7 characters before ".clone" is
 * appended.
 * The clone is made inside a transaction on <avolid>: AFSVolReClone()
 * refreshes a clone volume that is already there, AFSVolClone() creates
 * a new one (of type readonlyVolume when RV_RDONLY is set, backupVolume
 * otherwise). Failures are reported on STDERR.
2817 UV_CloneVolume(afs_int32 aserver, afs_int32 apart, afs_int32 avolid,
2818 afs_int32 acloneid, char *aname, int flags)
2820 struct rx_connection *aconn = (struct rx_connection *)0;
2821 afs_int32 ttid = 0, btid = 0;
2822 afs_int32 code = 0, rcode = 0;
2823 char vname[VOLSER_MAXVOLNAME + 1];
2824 afs_int32 error = 0;
2826 volEntries volumeInfo;
2828 aconn = UV_Bind(aserver, AFSCONF_VOLUMEPORT);
2831 volumeInfo.volEntries_val = (volintInfo *) 0;
2832 volumeInfo.volEntries_len = 0;
2833 code = AFSVolListOneVolume(aconn, apart, avolid, &volumeInfo);
2835 fprintf(stderr, "Could not get info for volume %lu\n",
2836 (unsigned long)avolid);
2840 strncpy(vname, volumeInfo.volEntries_val[0].name,
2841 VOLSER_OLDMAXVOLNAME - 7);
2842 vname[VOLSER_OLDMAXVOLNAME - 7] = 0;
2843 strcat(vname, ".clone");
2845 if (volumeInfo.volEntries_val)
2846 free(volumeInfo.volEntries_val);
2850 /* Get a clone id */
2851 VPRINT1("Allocating new volume id for clone of volume %u ...",
2853 code = ubik_VL_GetNewVolumeId(cstruct, 0, 1, &acloneid);
2855 "Could not get an ID for the clone of volume %u from the VLDB\n",
2860 /* Test to see if the clone volume exists by trying to create
2861 * a transaction on the clone volume. We've assumed the clone exists.
2863 /* XXX I wonder what happens if the clone has some other parent... */
2864 code = AFSVolTransCreate(aconn, acloneid, apart, ITOffline, &btid);
2866 if (code != VNOVOL) {
2867 fprintf(STDERR, "Could not reach the clone volume %lu\n",
2868 (unsigned long)acloneid);
2872 backexists = 0; /* clone volume does not exist */
2875 code = AFSVolEndTrans(aconn, btid, &rcode);
2877 if (code || rcode) {
2879 "Could not end transaction on the previous clone volume %lu\n",
2880 (unsigned long)acloneid);
2881 error = (code ? code : rcode);
2886 /* Now go ahead and try to clone the RW volume.
2887 * First start a transaction on the RW volume
2889 code = AFSVolTransCreate(aconn, avolid, apart, ITBusy, &ttid);
2891 fprintf(STDERR, "Could not start a transaction on the volume %lu\n",
2892 (unsigned long)avolid);
2897 /* Clone or reclone the volume, depending on whether the clone
2898 * volume exists or not
2901 VPRINT1("Re-cloning clone volume %u ...", acloneid);
2903 code = AFSVolReClone(aconn, ttid, acloneid);
2905 fprintf(STDERR, "Could not re-clone backup volume %lu\n",
2906 (unsigned long)acloneid);
2911 VPRINT1("Creating a new clone %u ...", acloneid);
2913 code = AFSVolClone(aconn, ttid, 0,
2914 (flags & RV_RDONLY) ? readonlyVolume : backupVolume,
2917 fprintf(STDERR, "Failed to clone the volume %lu\n",
2918 (unsigned long)avolid);
2924 /* End the transaction on the RW volume */
2925 code = AFSVolEndTrans(aconn, ttid, &rcode);
2927 if (code || rcode) {
2929 "Failed to end the transaction on the rw volume %lu\n",
2930 (unsigned long)avolid);
2931 error = (code ? code : rcode);
2935 /* Now go back to the clone volume and bring it on line, unless RV_OFFLINE was requested */
2936 if (!(flags & RV_OFFLINE)) {
2937 code = AFSVolTransCreate(aconn, acloneid, apart, ITOffline, &btid);
2940 "Failed to start a transaction on the clone volume %lu\n",
2941 (unsigned long)acloneid);
2946 code = AFSVolSetFlags(aconn, btid, 0);
2948 fprintf(STDERR, "Could not mark the clone volume %lu on line \n",
2949 (unsigned long)acloneid);
2954 code = AFSVolEndTrans(aconn, btid, &rcode);
2956 if (code || rcode) {
2958 "Failed to end the transaction on the clone volume %lu\n",
2959 (unsigned long)acloneid);
2960 error = (code ? code : rcode);
2969 code = AFSVolEndTrans(aconn, ttid, &rcode);
2970 if (code || rcode) {
2971 fprintf(STDERR, "Could not end transaction on the volume %lu\n",
2972 (unsigned long)avolid);
2974 error = (code ? code : rcode);
2979 code = AFSVolEndTrans(aconn, btid, &rcode);
2980 if (code || rcode) {
2982 "Could not end transaction on the clone volume %lu\n",
2983 (unsigned long)acloneid);
2985 error = (code ? code : rcode);
2990 rx_DestroyConnection(aconn);
2992 PrintError("", error);
/* Delete volume <vid> from partition <part> on the server reached through
 * <conn>: start a transaction on the volume with the given flags, call
 * AFSVolDeleteVolume() when the transaction could be started, then end
 * the transaction. Problems with the delete or with ending the
 * transaction are reported on STDERR and through PrintError().
 */
2997 DelVol(struct rx_connection *conn, afs_int32 vid, afs_int32 part,
3000 afs_int32 acode, ccode, rcode, tid;
3001 ccode = rcode = tid = 0;
3003 acode = AFSVolTransCreate(conn, vid, part, flags, &tid);
3004 if (!acode) { /* It really was there */
3005 acode = AFSVolDeleteVolume(conn, tid);
3007 fprintf(STDERR, "Failed to delete volume %lu.\n",
3008 (unsigned long)vid);
3009 PrintError("", acode);
3011 ccode = AFSVolEndTrans(conn, tid, &rcode);
3015 fprintf(STDERR, "Failed to end transaction on volume %lu.\n",
3016 (unsigned long)vid);
3017 PrintError("", ccode);
/* Error helpers used by the code below. Both expect the enclosing
 * function to have a local variable named "error" and a label named
 * "rfail".
 * ONERROR(ec, ep, es): when ec is non-zero, print format string es with
 * the single argument ep to STDERR, store ec in error and jump to rfail.
 * It expands to a bare "if" statement, so be careful when placing it
 * directly under another if that has an else branch.
 * ERROREXIT(ec): store ec in error and jump to rfail unconditionally.
 */
3024 #define ONERROR(ec, ep, es) if (ec) { fprintf(STDERR, (es), (ep)); error = (ec); goto rfail; }
3025 #define ERROREXIT(ec) { error = (ec); goto rfail; }
3027 /* Get a "transaction" on this replica. Create the volume
3028 * if necessary. Return the time from which a dump should
3029 * be made (0 if it's a new volume)
 *
 * vldbEntryPtr - VLDB entry of the volume; supplies the volume name,
 * the RW and RO volume IDs and the per-site server and partition
 * index - selects the site (serverNumber[index], serverPartition[index])
 * connPtr - cleared first, then receives the connection from UV_Bind()
 * transPtr - transaction used for the volume-server calls made here
 * crtimePtr, uptimePtr - receive the existing RO volume's creationDate
 * and updateDate, each passed through CLOCKADJ()
 *
 * A newly created RO volume gets the ID stored back into
 * vldbEntryPtr->volumeId[ROVOL] and has the VTDeleteOnSalvage and
 * VTOutOfService flags set.
3032 GetTrans(struct nvldbentry *vldbEntryPtr, afs_int32 index,
3033 struct rx_connection **connPtr, afs_int32 * transPtr,
3034 afs_int32 * crtimePtr, afs_int32 * uptimePtr)
3037 struct volser_status tstatus;
3042 *connPtr = (struct rx_connection *)0;
3047 /* get connection to the replication site */
3048 *connPtr = UV_Bind(vldbEntryPtr->serverNumber[index], AFSCONF_VOLUMEPORT);
3050 goto fail; /* server is down */
3052 volid = vldbEntryPtr->volumeId[ROVOL];
3055 AFSVolTransCreate(*connPtr, volid,
3056 vldbEntryPtr->serverPartition[index], ITOffline,
3059 /* If the volume does not exist, create it */
3060 if (!volid || code) {
3064 if (volid && (code != VNOVOL)) {
3065 PrintError("Failed to start a transaction on the RO volume.\n",
3070 strcpy(volname, vldbEntryPtr->name);
3071 strcat(volname, ".readonly");
3075 "Creating new volume %lu on replication site %s: ",
3076 (unsigned long)volid,
3077 noresolve ? afs_inet_ntoa_r(vldbEntryPtr->
3078 serverNumber[index], hoststr) :
3079 hostutil_GetNameByINet(vldbEntryPtr->
3080 serverNumber[index]));
3085 AFSVolCreateVolume(*connPtr, vldbEntryPtr->serverPartition[index],
3087 vldbEntryPtr->volumeId[RWVOL], &volid,
3090 PrintError("Failed to create the ro volume: ", code);
3093 vldbEntryPtr->volumeId[ROVOL] = volid;
3097 /* The following is a bit redundant, since create sets these flags by default */
3099 AFSVolSetFlags(*connPtr, *transPtr,
3100 VTDeleteOnSalvage | VTOutOfService);
3102 PrintError("Failed to set flags on the ro volume: ", code);
3107 /* Otherwise, the transaction did succeed, so get the creation date of the
3108 * latest RO volume on the replication site
3111 VPRINT2("Updating existing ro volume %u on %s ...\n", volid,
3112 noresolve ? afs_inet_ntoa_r(vldbEntryPtr->
3113 serverNumber[index], hoststr) :
3114 hostutil_GetNameByINet(vldbEntryPtr->serverNumber[index]));
3116 code = AFSVolGetStatus(*connPtr, *transPtr, &tstatus);
3118 PrintError("Failed to get status of volume on destination: ",
3122 *crtimePtr = CLOCKADJ(tstatus.creationDate);
3123 *uptimePtr = CLOCKADJ(tstatus.updateDate);
3130 tcode = AFSVolEndTrans(*connPtr, *transPtr, &rcode);
3135 PrintError("Could not end transaction on a ro volume: ", tcode);
/* Forward the dump of transaction <fromtid> (changes since <fromdate>) to
 * every destination listed in <tr>, one destination at a time, by calling
 * AFSVolForward() for each. The return code of each call is stored in the
 * matching slot of results->manyResults_val. UV_ReleaseVolume() calls
 * this when AFSVolForwardMultiple() returns RXGEN_OPCODE.
 */
3142 SimulateForwardMultiple(struct rx_connection *fromconn, afs_int32 fromtid,
3143 afs_int32 fromdate, manyDests * tr, afs_int32 flags,
3144 void *cookie, manyResults * results)
3148 for (i = 0; i < tr->manyDests_len; i++) {
3149 results->manyResults_val[i] =
3150 AFSVolForward(fromconn, fromtid, fromdate,
3151 &(tr->manyDests_val[i].server),
3152 tr->manyDests_val[i].trans, cookie);
3158 /* UV_ReleaseVolume()
3159 * Release volume <afromvol> on <afromserver> <afrompart> to all
3160 * its RO sites (full release). Unless the previous release was
3161 * incomplete: in which case we bring the remaining incomplete
3162 * volumes up to date with the volumes that were released
3164 * forceflag: Performs a full release.
3166 * Will create a clone from the RW, then dump the clone out to
3167 * the remaining replicas. If there is more than one RO site,
3168 * ensure that the VLDB says at least one RO is available all
3169 * the time: Influences when we write back the VLDB entry.
 *
 * afromvol - ID of the RW volume; the VLDB entry is locked with
 * VLOP_RELEASE and must list this ID as its RW volume
 * afromserver, afrompart - site of the RW volume; used for UV_Bind()
 * and for the transactions on the RW volume and on its clone
 *
 * Errors raised through ONERROR and ERROREXIT store the code in the
 * local variable error and jump to the common exit path.
3173 UV_ReleaseVolume(afs_int32 afromvol, afs_int32 afromserver,
3174 afs_int32 afrompart, int forceflag)
3178 afs_int32 vcode, rcode, tcode;
3179 afs_int32 cloneVolId, roVolId;
3180 struct replica *replicas = 0;
3181 struct nvldbentry entry, storeEntry;
3182 int i, volcount, m, fullrelease, vldbindex;
3184 struct restoreCookie cookie;
3185 struct rx_connection **toconns = 0;
3186 struct release *times = 0;
3188 struct rx_connection *fromconn = (struct rx_connection *)0;
3189 afs_int32 error = 0;
3191 afs_int32 clonetid = 0, onlinetid;
3192 afs_int32 fromtid = 0;
3193 afs_uint32 fromdate = 0;
3194 afs_uint32 thisdate;
3198 manyResults results;
3199 int rwindex, roindex, roclone, roexists;
3200 afs_int32 rwcrdate = 0;
3201 afs_int32 rwupdate, clcrdate;
3205 } remembertime[NMAXNSERVERS];
3206 int releasecount = 0;
3207 struct volser_status volstatus;
3210 memset((char *)remembertime, 0, sizeof(remembertime));
3211 memset((char *)&results, 0, sizeof(results));
3213 vcode = ubik_VL_SetLock(cstruct, 0, afromvol, RWVOL, VLOP_RELEASE);
3214 if (vcode != VL_RERELEASE)
3215 ONERROR(vcode, afromvol,
3216 "Could not lock the VLDB entry for the volume %u.\n");
3219 /* Get the vldb entry in readable format */
3220 vcode = VLDB_GetEntryByID(afromvol, RWVOL, &entry);
3221 ONERROR(vcode, afromvol,
3222 "Could not fetch the entry for the volume %u from the VLDB.\n");
3223 MapHostToNetwork(&entry);
3226 EnumerateEntry(&entry);
3228 if (!ISNAMEVALID(entry.name))
3229 ONERROR(VOLSERBADOP, entry.name,
3230 "Volume name %s is too long, rename before releasing.\n");
3231 if (entry.volumeId[RWVOL] != afromvol)
3232 ONERROR(VOLSERBADOP, afromvol,
3233 "The volume %u being released is not a read-write volume.\n");
3234 if (entry.nServers <= 1)
3235 ONERROR(VOLSERBADOP, afromvol,
3236 "Volume %u has no replicas - release operation is meaningless!\n");
3237 if (strlen(entry.name) > (VOLSER_OLDMAXVOLNAME - 10))
3238 ONERROR(VOLSERBADOP, entry.name,
3239 "RO volume name %s exceeds (VOLSER_OLDMAXVOLNAME - 10) character limit\n");
3241 /* roclone is true if one of the RO volumes is on the same
3242 * partition as the RW volume. In this case, we make the RO volume
3243 * on the same partition a clone instead of a complete copy.
3246 roindex = Lp_ROMatch(afromserver, afrompart, &entry) - 1;
3247 roclone = ((roindex == -1) ? 0 : 1);
3248 rwindex = Lp_GetRwIndex(&entry);
3250 ONERROR(VOLSERNOVOL, 0, "There is no RW volume \n");
3252 /* Make sure we have a RO volume id to work with */
3253 if (entry.volumeId[ROVOL] == INVALID_BID) {
3254 /* need to get a new RO volume id */
3255 vcode = ubik_VL_GetNewVolumeId(cstruct, 0, 1, &roVolId);
3256 ONERROR(vcode, entry.name, "Cant allocate ID for RO volume of %s\n");
3258 entry.volumeId[ROVOL] = roVolId;
3259 MapNetworkToHost(&entry, &storeEntry);
3260 vcode = VLDB_ReplaceEntry(afromvol, RWVOL, &storeEntry, 0);
3261 ONERROR(vcode, entry.name, "Could not update vldb entry for %s.\n");
3264 /* Will we be completing a previously unfinished release? -force overrides */
3265 for (s = 0, m = 0, fullrelease=0, i=0; (i<entry.nServers); i++) {
3266 if (entry.serverFlags[i] & ITSROVOL) {
3268 if (entry.serverFlags[i] & NEW_REPSITE) s++;
3271 if ((forceflag && !fullrelease) || (s == m) || (s == 0))
3274 /* Determine which volume id to use and see if it exists */
3277 || (entry.cloneId == 0)) ? entry.volumeId[ROVOL] : entry.cloneId);
3278 code = VolumeExists(afromserver, afrompart, cloneVolId);
3279 roexists = ((code == ENODEV) ? 0 : 1);
3281 fromconn = UV_Bind(afromserver, AFSCONF_VOLUMEPORT);
3283 ONERROR(-1, afromserver,
3284 "Cannot establish connection with server 0x%x\n");
3288 fullrelease = 1; /* Do a full release if RO clone does not exist */
3290 /* Begin transaction on RW and mark it busy while we query it */
3291 code = AFSVolTransCreate(
3292 fromconn, afromvol, afrompart, ITBusy, &fromtid
3294 ONERROR(code, afromvol,
3295 "Failed to start transaction on RW volume %u\n");
3297 /* Query the creation date for the RW */
3298 code = AFSVolGetStatus(fromconn, fromtid, &volstatus);
3299 ONERROR(code, afromvol,
3300 "Failed to get the status of RW volume %u\n");
3301 rwcrdate = volstatus.creationDate;
3302 rwupdate = volstatus.updateDate;
3304 /* End transaction on RW */
3305 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
3307 ONERROR((code ? code : rcode), afromvol,
3308 "Failed to end transaction on RW volume %u\n");
3310 /* Begin transaction on clone and mark it busy while we query it */
3311 code = AFSVolTransCreate(
3312 fromconn, cloneVolId, afrompart, ITBusy, &clonetid
3314 ONERROR(code, cloneVolId,
3315 "Failed to start transaction on RW clone %u\n");
3317 /* Query the creation date for the clone */
3318 code = AFSVolGetStatus(fromconn, clonetid, &volstatus);
3319 ONERROR(code, cloneVolId,
3320 "Failed to get the status of RW clone %u\n");
3321 clcrdate = volstatus.creationDate;
3323 /* End transaction on clone */
3324 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
3326 ONERROR((code ? code : rcode), cloneVolId,
3327 "Failed to end transaction on RW clone %u\n");
3329 if (rwcrdate > clcrdate)
3330 fullrelease = 2;/* Do a full release if RO clone older than RW */
3335 switch (fullrelease) {
3337 fprintf(STDOUT, "RW %lu changed, doing a complete release\n",
3338 (unsigned long)afromvol);
3341 fprintf(STDOUT, "This is a complete release of volume %lu\n",
3342 (unsigned long)afromvol);
3345 fprintf(STDOUT, "This is a completion of a previous release\n");
3351 /* If the RO clone exists, then if the clone is a temporary
3352 * clone, delete it. Or if the RO clone is marked RO_DONTUSE
3353 * (it was recently added), then also delete it. We do not
3354 * want to "reclone" a temporary RO clone.
3357 && (!roclone || (entry.serverFlags[roindex] & RO_DONTUSE))) {
3358 code = DelVol(fromconn, cloneVolId, afrompart, ITOffline);
3359 if (code && (code != VNOVOL))
3364 /* Mark all the ROs in the VLDB entry as RO_DONTUSE. We don't
3365 * write this entry out to the vlserver until after the first
3366 * RO volume is released (temp RO clones don't count).
3368 for (i = 0; i < entry.nServers; i++) {
3369 entry.serverFlags[i] &= ~NEW_REPSITE;
3370 entry.serverFlags[i] |= RO_DONTUSE;
3372 entry.serverFlags[rwindex] |= NEW_REPSITE;
3373 entry.serverFlags[rwindex] &= ~RO_DONTUSE;
3375 /* Begin transaction on RW and mark it busy while we clone it */
3377 AFSVolTransCreate(fromconn, afromvol, afrompart, ITBusy,
3379 ONERROR(code, afromvol, "Failed to start transaction on volume %u\n");
3381 /* Clone or reclone the volume */
3383 VPRINT1("Recloning RW volume %u...", cloneVolId);
3384 code = AFSVolReClone(fromconn, clonetid, cloneVolId);
3385 ONERROR(code, afromvol, "Failed to reclone the RW volume %u\n");
3389 strcpy(vname, entry.name);
3390 strcat(vname, ".readonly");
3391 VPRINT1("Cloning RW volume %u to permanent RO...", afromvol);
3393 strcpy(vname, "readonly-clone-temp");
3394 VPRINT1("Cloning RW volume %u to temporary RO...", afromvol);
3397 AFSVolClone(fromconn, clonetid, 0, readonlyVolume, vname,
3399 ONERROR(code, afromvol, "Failed to clone the RW volume %u\n");
3403 /* Get the time the RW was created for future information */
3404 VPRINT1("Getting status of RW volume %u...", afromvol);
3405 code = AFSVolGetStatus(fromconn, clonetid, &volstatus);
3406 ONERROR(code, afromvol,
3407 "Failed to get the status of the RW volume %u\n");
3409 rwcrdate = volstatus.creationDate;
3410 rwupdate = volstatus.updateDate;
3412 /* End the transaction on the RW volume */
3413 VPRINT1("Ending cloning transaction on RW volume %u...", afromvol);
3414 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
3416 ONERROR((code ? code : rcode), afromvol,
3417 "Failed to end cloning transaction on RW %u\n");
3420 /* Remember clone volume ID in case we fail or are interrupted */
3421 entry.cloneId = cloneVolId;
3424 /* Bring the RO clone online - though not if it's a temporary clone */
3425 VPRINT1("Starting transaction on RO clone volume %u...",
3428 AFSVolTransCreate(fromconn, cloneVolId, afrompart, ITOffline,
3430 ONERROR(code, cloneVolId,
3431 "Failed to start transaction on volume %u\n");
3434 VPRINT1("Setting volume flags for volume %u...", cloneVolId);
3435 tcode = AFSVolSetFlags(fromconn, onlinetid, 0);
3438 VPRINT1("Ending transaction on volume %u...", cloneVolId);
3439 code = AFSVolEndTrans(fromconn, onlinetid, &rcode);
3440 ONERROR((code ? code : rcode), cloneVolId,
3441 "Failed to end transaction on RO clone %u\n");
3444 ONERROR(tcode, cloneVolId, "Could not bring volume %u on line\n");
3446 /* Sleep so that a client searching for an online volume won't
3447 * find the clone offline and then the next RO offline while the
3448 * release brings the clone online and the next RO offline (race).
3449 * There is a fix in the 3.4 client that does not need this sleep
3450 * anymore, but we don't know what clients we have.
3452 if (entry.nServers > 2)
3455 /* Mark the RO clone in the VLDB as a good site (already released) */
3456 entry.serverFlags[roindex] |= NEW_REPSITE;
3457 entry.serverFlags[roindex] &= ~RO_DONTUSE;
3458 entry.flags |= RO_EXISTS;
3462 /* Write out the VLDB entry only if the clone is not a temporary
3463 * clone. If we did this to a temporary clone then we would end
3464 * up marking all the ROs as "old release" making the ROs
3465 * temporarily unavailable.
3467 MapNetworkToHost(&entry, &storeEntry);
3468 VPRINT1("Replacing VLDB entry for %s...", entry.name);
3469 vcode = VLDB_ReplaceEntry(afromvol, RWVOL, &storeEntry, 0);
3470 ONERROR(vcode, entry.name,
3471 "Could not update vldb entry for %s.\n");
3476 /* Now we will release from the clone to the remaining RO replicas.
3477 * The first 2 ROs (counting the non-temporary RO clone) are released
3478 * individually: releasecount. This is to reduce the race condition
3479 * of clients trying to find an on-line RO volume. The remaining ROs
3480 * are released in parallel but no more than half the number of ROs
3481 * (rounded up) at a time: nservers.
3484 strcpy(vname, entry.name);
3485 strcat(vname, ".readonly");
3486 memset(&cookie, 0, sizeof(cookie));
3487 strncpy(cookie.name, vname, VOLSER_OLDMAXVOLNAME);
3488 cookie.type = ROVOL;
3489 cookie.parent = entry.volumeId[RWVOL];
3492 nservers = entry.nServers / 2; /* how many to do at once, excluding clone */
/* NOTE(review): in the allocations and memsets below the "+ 1" is added
 * after the multiplication, so each size is nservers elements plus one
 * byte rather than nservers + 1 elements - confirm this is intended.
 * Also, "!!!results.manyResults_val" in the check below is equivalent
 * to a single "!".
 */
3494 (struct replica *)malloc(sizeof(struct replica) * nservers + 1);
3495 times = (struct release *)malloc(sizeof(struct release) * nservers + 1);
3497 (struct rx_connection **)malloc(sizeof(struct rx_connection *) *
3499 results.manyResults_val =
3500 (afs_int32 *) malloc(sizeof(afs_int32) * nservers + 1);
3501 if (!replicas || !times || !!!results.manyResults_val || !toconns)
3503 "Failed to create transaction on the release clone\n");
3505 memset(replicas, 0, (sizeof(struct replica) * nservers + 1));
3506 memset(times, 0, (sizeof(struct release) * nservers + 1));
3507 memset(toconns, 0, (sizeof(struct rx_connection *) * nservers + 1));
3508 memset(results.manyResults_val, 0, (sizeof(afs_int32) * nservers + 1));
3510 /* Create a transaction on the cloned volume */
3511 VPRINT1("Starting transaction on cloned volume %u...", cloneVolId);
3513 AFSVolTransCreate(fromconn, cloneVolId, afrompart, ITBusy, &fromtid);
3514 if (!fullrelease && code)
3515 ONERROR(VOLSERNOVOL, afromvol,
3516 "Old clone is inaccessible. Try vos release -f %u.\n");
3517 ONERROR(code, 0, "Failed to create transaction on the release clone\n");
3520 /* For each index in the VLDB */
3521 for (vldbindex = 0; vldbindex < entry.nServers;) {
3523 /* Get a transaction on the replicas. Pick replicas which have an old release. */
3525 ((volcount < nservers) && (vldbindex < entry.nServers));
3527 /* The first two RO volumes will be released individually.
3528 * The rest are then released in parallel. This is a hack
3529 * for clients not recognizing right away when a RO volume
3530 * comes back on-line.
3532 if ((volcount == 1) && (releasecount < 2))
3535 if (vldbindex == roindex)
3536 continue; /* the clone */
3537 if ((entry.serverFlags[vldbindex] & NEW_REPSITE)
3538 && !(entry.serverFlags[vldbindex] & RO_DONTUSE))
3540 if (!(entry.serverFlags[vldbindex] & ITSROVOL))
3541 continue; /* not a RO vol */
3544 /* Get a Transaction on this replica. Get a new connection if
3545 * necessary. Create the volume if necessary. Return the
3546 * time from which the dump should be made (0 if it's a new
3547 * volume). Each volume might have a different time.
3549 replicas[volcount].server.destHost =
3550 ntohl(entry.serverNumber[vldbindex]);
3551 replicas[volcount].server.destPort = AFSCONF_VOLUMEPORT;
3552 replicas[volcount].server.destSSID = 1;
3553 times[volcount].vldbEntryIndex = vldbindex;
3556 GetTrans(&entry, vldbindex, &(toconns[volcount]),
3557 &(replicas[volcount].trans),
3558 &(times[volcount].crtime),
3559 &(times[volcount].uptime));
3563 /* Thisdate is the date from which we want to pick up all changes */
3564 if (forceflag || !fullrelease
3565 || (rwcrdate > times[volcount].crtime)) {
3566 /* If the forceflag is set, then we want to do a full dump.
3567 * If it's not a full release, we can't be sure that the creation
3568 * date is good (so we also do a full dump).
3569 * If the RW volume was replaced (its creation date is newer than
3570 * the last release), then we can't be sure what has changed (so
3571 * we do a full dump).
3574 } else if (remembertime[vldbindex].validtime) {
3575 /* Trans was prev ended. Use the time from the prev trans
3576 * because, prev trans may have created the volume. In which
3577 * case time[volcount].time would be now instead of 0.
3580 (remembertime[vldbindex].uptime < times[volcount].uptime)
3581 ? remembertime[vldbindex].uptime
3582 : times[volcount].uptime;
3584 thisdate = times[volcount].uptime;
3586 remembertime[vldbindex].validtime = 1;
3587 remembertime[vldbindex].uptime = thisdate;
3589 if (volcount == 0) {
3590 fromdate = thisdate;
3592 /* Include this volume if it is within 15 minutes of the earliest */
3594 thisdate) ? (fromdate - thisdate) : (thisdate -
3596 AFSVolEndTrans(toconns[volcount],
3597 replicas[volcount].trans, &rcode);
3598 replicas[volcount].trans = 0;
3601 if (thisdate < fromdate)
3602 fromdate = thisdate;
3610 fprintf(STDOUT, "Starting ForwardMulti from %lu to %u on %s",
3611 (unsigned long)cloneVolId, entry.volumeId[ROVOL],
3612 noresolve ? afs_inet_ntoa_r(entry.serverNumber[times[0].
3613 vldbEntryIndex], hoststr) :
3614 hostutil_GetNameByINet(entry.
3615 serverNumber[times[0].
3618 for (s = 1; s < volcount; s++) {
3619 fprintf(STDOUT, " and %s",
3620 noresolve ? afs_inet_ntoa_r(entry.serverNumber[times[s].
3621 vldbEntryIndex], hoststr) :
3622 hostutil_GetNameByINet(entry.
3623 serverNumber[times[s].
3628 fprintf(STDOUT, " (full release)");
3631 fprintf(STDOUT, " (as of %.24s)", ctime(&tmv));
3633 fprintf(STDOUT, ".\n");
3637 /* Release the ones we have collected */
3638 tr.manyDests_val = &(replicas[0]);
3639 tr.manyDests_len = results.manyResults_len = volcount;
3641 AFSVolForwardMultiple(fromconn, fromtid, fromdate, &tr,
3642 0 /*spare */ , &cookie, &results);
3643 if (code == RXGEN_OPCODE) { /* RPC Interface Mismatch */
3645 SimulateForwardMultiple(fromconn, fromtid, fromdate, &tr,
3646 0 /*spare */ , &cookie, &results);
3651 PrintError("Release failed: ", code);
3653 for (m = 0; m < volcount; m++) {
3654 if (results.manyResults_val[m]) {
3655 if ((m == 0) || (results.manyResults_val[m] != ENOENT)) {
3656 /* we retry timed out transaction. When it is
3657 * not the first volume and the transaction wasn't found
3658 * (assume it timed out and was garbage collected by volser).
3661 ("Failed to dump volume from clone to a ro site: ",
3662 results.manyResults_val[m]);
3668 AFSVolSetIdsTypes(toconns[m], replicas[m].trans, vname,
3669 ROVOL, entry.volumeId[RWVOL], 0, 0);
3671 if ((m == 0) || (code != ENOENT)) {
3672 PrintError("Failed to set correct names and ids: ",
3678 /* have to clear dest. flags to ensure new vol goes online:
3679 * because the restore (forwarded) operation copied
3680 * the V_inService(=0) flag over to the destination.
3682 code = AFSVolSetFlags(toconns[m], replicas[m].trans, 0);
3684 if ((m == 0) || (code != ENOENT)) {
3685 PrintError("Failed to set flags on ro volume: ",
3691 entry.serverFlags[times[m].vldbEntryIndex] |= NEW_REPSITE;
3692 entry.serverFlags[times[m].vldbEntryIndex] &= ~RO_DONTUSE;
3693 entry.flags |= RO_EXISTS;
3698 /* End the transactions and destroy the connections */
3699 for (s = 0; s < volcount; s++) {
3700 if (replicas[s].trans)
3701 code = AFSVolEndTrans(toconns[s], replicas[s].trans, &rcode);
3702 replicas[s].trans = 0;
3706 if ((s == 0) || (code != ENOENT)) {
3707 PrintError("Could not end transaction on a ro volume: ",
3711 ("Transaction timed out on a ro volume. Will retry.\n",
3713 if (times[s].vldbEntryIndex < vldbindex)
3714 vldbindex = times[s].vldbEntryIndex;
3719 rx_DestroyConnection(toconns[s]);
3723 MapNetworkToHost(&entry, &storeEntry);
3724 vcode = VLDB_ReplaceEntry(afromvol, RWVOL, &storeEntry, 0);
3725 ONERROR(vcode, afromvol,
3726 " Could not update VLDB entry for volume %u\n");
3727 } /* for each index in the vldb */
3729 /* End the transaction on the cloned volume */
3730 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
3735 PrintError("Failed to end transaction on rw volume: ", code);
3737 /* Figure out if any volumes were not released and say so */
3738 for (failure = 0, i = 0; i < entry.nServers; i++) {
3739 if (!(entry.serverFlags[i] & NEW_REPSITE))
3745 "The volume %lu could not be released to the following %d sites:\n",
3746 (unsigned long)afromvol, failure);
3747 for (i = 0; i < entry.nServers; i++) {
3748 if (!(entry.serverFlags[i] & NEW_REPSITE)) {
3749 MapPartIdIntoName(entry.serverPartition[i], pname);
3750 fprintf(STDERR, "\t%35s %s\n",
3751 noresolve ? afs_inet_ntoa_r(entry.serverNumber[i], hoststr) :
3752 hostutil_GetNameByINet(entry.serverNumber[i]), pname);
3756 MapNetworkToHost(&entry, &storeEntry);
3758 VLDB_ReplaceEntry(afromvol, RWVOL, &storeEntry,
3760 ONERROR(vcode, afromvol,
3761 " Could not update VLDB entry for volume %u\n");
3763 ERROREXIT(VOLSERBADRELEASE);
3766 /* All the ROs were released successfully. Remove the temporary clone */
3769 fprintf(STDOUT, "Deleting the releaseClone %lu ...",
3770 (unsigned long)cloneVolId);
3773 code = DelVol(fromconn, cloneVolId, afrompart, ITOffline);
3774 ONERROR(code, cloneVolId, "Failed to delete volume %u.\n");
3779 for (i = 0; i < entry.nServers; i++)
3780 entry.serverFlags[i] &= ~NEW_REPSITE;
3782 /* Update the VLDB */
3783 VPRINT("updating VLDB ...");
3785 MapNetworkToHost(&entry, &storeEntry);
3787 VLDB_ReplaceEntry(afromvol, RWVOL, &storeEntry,
3788 LOCKREL_OPCODE | LOCKREL_AFSID | LOCKREL_TIMESTAMP);
3789 ONERROR(vcode, afromvol, " Could not update VLDB entry for volume %u\n");
/* Common exit path (presumably where the rfail label used by ONERROR and
 * ERROREXIT sits - the label line is not visible here): end transactions
 * that may still be open, destroy the connections, release the VLDB lock
 * and free the results array.
 */
3794 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
3798 "Failed to end cloning transaction on the RW volume %lu\n",
3799 (unsigned long)afromvol);
3805 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
3809 "Failed to end transaction on the release clone %lu\n",
3810 (unsigned long)cloneVolId);
3815 for (i = 0; i < nservers; i++) {
3816 if (replicas && replicas[i].trans) {
3817 code = AFSVolEndTrans(toconns[i], replicas[i].trans, &rcode);
3818 replicas[i].trans = 0;
3821 "Failed to end transaction on ro volume %u at server %s\n",
3822 entry.volumeId[ROVOL],
3823 noresolve ? afs_inet_ntoa_r(htonl(replicas[i].server.
3824 destHost), hoststr) :
3825 hostutil_GetNameByINet(htonl
3826 (replicas[i].server.destHost)));
3831 if (toconns && toconns[i]) {
3832 rx_DestroyConnection(toconns[i]);
3838 ubik_VL_ReleaseLock(cstruct, 0, afromvol, RWVOL,
3839 LOCKREL_OPCODE | LOCKREL_AFSID | LOCKREL_TIMESTAMP);
3842 "Could not release lock on the VLDB entry for volume %lu\n",
3843 (unsigned long)afromvol);
3849 PrintError("", error);
3852 rx_DestroyConnection(fromconn);
3853 if (results.manyResults_val)
3854 free(results.manyResults_val);
/* Signal handler that the dump routines in this file install with
 * signal() for SIGPIPE and SIGINT; it announces on STDERR that a signal
 * arrived during a vos dump operation. The signal number <x> is not used
 * by the visible code.
 */
3866 dump_sig_handler(int x)
3868 fprintf(STDERR, "\nSignal handler: vos dump operation\n");
3872 /* Dump the volume <afromvol> on <afromserver> and
3873 * <afrompart> to <afilename> starting from <fromdate>.
3874 * DumpFunction does the real work behind the scenes after
3875 * extracting parameters from the rock
 *
 * The dump runs inside an ITBusy transaction on <afromvol> and over a
 * new Rx call on the connection to <afromserver>. It is started with
 * StartAFSVolDumpV2() when VOLDUMPV2_OMITDIRS is set in the flags;
 * StartAFSVolDump() is the other start call used here. DumpFunction
 * is then called as DumpFunction(call, rock). dump_sig_handler is
 * installed for SIGPIPE and SIGINT before the dump begins.
3878 UV_DumpVolume(afs_int32 afromvol, afs_int32 afromserver, afs_int32 afrompart,
3879 afs_int32 fromdate, afs_int32(*DumpFunction) (), char *rock,
3882 struct rx_connection *fromconn = (struct rx_connection *)0;
3883 struct rx_call *fromcall = (struct rx_call *)0;
3884 afs_int32 fromtid = 0, rxError = 0, rcode = 0;
3885 afs_int32 code, error = 0, retry = 0;
3886 time_t tmv = fromdate;
3890 #ifndef AFS_NT40_ENV
3891 (void)signal(SIGPIPE, dump_sig_handler);
3893 (void)signal(SIGINT, dump_sig_handler);
3896 VEPRINT("Full Dump ...\n");
3898 VEPRINT1("Incremental Dump (as of %.24s)...\n",
3902 /* get connections to the servers */
3903 fromconn = UV_Bind(afromserver, AFSCONF_VOLUMEPORT);
3905 VEPRINT1("Starting transaction on volume %u...", afromvol);
3906 code = AFSVolTransCreate(fromconn, afromvol, afrompart, ITBusy, &fromtid);
3907 EGOTO1(error_exit, code,
3908 "Could not start transaction on the volume %u to be dumped\n",
3912 fromcall = rx_NewCall(fromconn);
3914 VEPRINT1("Starting volume dump on volume %u...", afromvol);
3915 if (flags & VOLDUMPV2_OMITDIRS)
3916 code = StartAFSVolDumpV2(fromcall, fromtid, fromdate, flags);
3919 code = StartAFSVolDump(fromcall, fromtid, fromdate);
3920 EGOTO(error_exit, code, "Could not start the dump process \n");
3923 VEPRINT1("Dumping volume %u...", afromvol);
3924 code = DumpFunction(fromcall, rock);
3925 if (code == RXGEN_OPCODE)
3927 EGOTO(error_exit, code, "Error while dumping volume \n");
/* Wind down: finish the Rx call, end the transaction on the volume and
 * destroy the connection. An error value of RXGEN_OPCODE is not passed
 * to PrintError().
 */
3932 code = rx_EndCall(fromcall, rxError);
3933 if (code && code != RXGEN_OPCODE)
3934 fprintf(STDERR, "Error in rx_EndCall\n");
3939 VEPRINT1("Ending transaction on volume %u...", afromvol);
3940 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
3941 if (code || rcode) {
3942 fprintf(STDERR, "Could not end transaction on the volume %lu\n",
3943 (unsigned long)afromvol);
3945 error = (code ? code : rcode);
3950 rx_DestroyConnection(fromconn);
3954 if (error != RXGEN_OPCODE)
3955 PrintError("", error);
3959 /* Clone the volume <afromvol> on <afromserver> and
3960 * <afrompart>, and then dump the clone volume to
3961 * <afilename> starting from <fromdate>.
3962 * DumpFunction does the real work behind the scenes after
3963 * extracting parameters from the rock
/*
 * UV_DumpClonedVolume -- dump a temporary clone of volume <afromvol>.
 *
 * Steps visible in this excerpt, all issued over one connection obtained
 * from UV_Bind(afromserver, AFSCONF_VOLUMEPORT):
 *   1. start an ITBusy transaction on <afromvol>;
 *   2. ask the VLDB for a new volume id to use for the clone;
 *   3. AFSVolClone the source as a readonlyVolume named "dump-clone-temp";
 *   4. end the transaction on the source volume;
 *   5. start an ITOffline transaction on the clone and set
 *      VTDeleteOnSalvage | VTOutOfService on it;
 *   6. start the dump RPC on a new rx call and pass that call, together
 *      with <rock>, to DumpFunction;
 *   7. delete the clone, end the rx call, end the clone transaction and
 *      destroy the connection.
 *
 * Parameters:
 *   afromvol     - id of the volume to clone and dump
 *   afromserver  - handed to UV_Bind to obtain the connection
 *   afrompart    - partition argument of both AFSVolTransCreate calls
 *   fromdate     - passed to the dump RPC; also copied into tmv for the
 *                  "Incremental Dump (as of ...)" message
 *   DumpFunction - callback invoked as DumpFunction(fromcall, rock)
 *   rock         - opaque pointer forwarded unchanged to DumpFunction
 *   flags        - when VOLDUMPV2_OMITDIRS is set, StartAFSVolDumpV2 is
 *                  used and receives these flags
 *
 * NOTE(review): a number of lines of this function (braces, labels,
 * else-branches, the return statement and some continuation arguments)
 * are not present in this excerpt.  The comments below describe only what
 * the visible lines do.  The function presumably returns <error>, which is
 * the value handed to PrintError at the end -- confirm against the full
 * file.
 *
 * NOTE(review): the EGOTO/EGOTO1 macros are assumed to report the message
 * and jump to error_exit when <code> is non-zero; their bodies are only
 * partly visible at the top of the file -- confirm.
 */
3966 UV_DumpClonedVolume(afs_int32 afromvol, afs_int32 afromserver,
3967 afs_int32 afrompart, afs_int32 fromdate,
3968 afs_int32(*DumpFunction) (), char *rock, afs_int32 flags)
/* Connection and call handles start out null; both are assigned below. */
3970 struct rx_connection *fromconn = (struct rx_connection *)0;
3971 struct rx_call *fromcall = (struct rx_call *)0;
/* fromtid: transaction on the source volume; rxError is passed to
 * rx_EndCall and is never changed from 0 in the visible lines. */
3972 afs_int32 fromtid = 0, rxError = 0, rcode = 0;
/* clonetid: transaction on the clone; stays 0 until the ITOffline
 * AFSVolTransCreate below fills it in. */
3973 afs_int32 clonetid = 0;
/* NOTE(review): vcode is not referenced in any visible line. */
3974 afs_int32 code = 0, vcode = 0, error = 0;
3975 afs_int32 clonevol = 0;
/* time_t copy of fromdate, used by the incremental-dump message below
 * (the argument line of that message is not visible here). */
3977 time_t tmv = fromdate;
/* Install dump_sig_handler for SIGPIPE (skipped when AFS_NT40_ENV is
 * defined) and for SIGINT. */
3981 #ifndef AFS_NT40_ENV
3982 (void)signal(SIGPIPE, dump_sig_handler);
3984 (void)signal(SIGINT, dump_sig_handler);
/* Announce the dump type.  The condition choosing between the two
 * messages is on a line not shown in this excerpt. */
3987 VEPRINT("Full Dump ...\n");
3989 VEPRINT1("Incremental Dump (as of %.24s)...\n",
3993 /* get connections to the servers */
3994 fromconn = UV_Bind(afromserver, AFSCONF_VOLUMEPORT);
/* Step 1: ITBusy transaction on the source volume; id lands in fromtid. */
3996 VEPRINT1("Starting transaction on volume %u...", afromvol);
3997 code = AFSVolTransCreate(fromconn, afromvol, afrompart, ITBusy, &fromtid);
3998 EGOTO1(error_exit, code,
3999 "Could not start transaction on the volume %u to be dumped\n",
4003 /* Get a clone id */
4004 VEPRINT1("Allocating new volume id for clone of volume %u ...", afromvol);
4005 code = ubik_VL_GetNewVolumeId(cstruct, 0, 1, &clonevol);
4006 EGOTO1(error_exit, code,
4007 "Could not get an ID for the clone of volume %u from the VLDB\n",
4011 /* Do the clone. Default flags on clone are set to delete on salvage and out of service */
4012 VEPRINT2("Cloning source volume %u to clone volume %u...", afromvol,
/* The clone is always given the fixed name "dump-clone-temp". */
4014 strcpy(vname, "dump-clone-temp");
4016 AFSVolClone(fromconn, fromtid, 0, readonlyVolume, vname, &clonevol);
4017 EGOTO1(error_exit, code, "Failed to clone the source volume %u\n",
/* Step 4: the source volume's transaction is ended as soon as the clone
 * exists; the dump itself runs against the clone. */
4021 VEPRINT1("Ending the transaction on the volume %u ...", afromvol);
4023 code = AFSVolEndTrans(fromconn, fromtid, &rcode);
4027 EGOTO1(error_exit, code,
4028 "Failed to end the transaction on the volume %u\n", afromvol);
/* Step 5: ITOffline transaction on the clone (the &clonetid argument is
 * presumably on the continuation line missing from this excerpt). */
4032 VEPRINT1("Starting transaction on the cloned volume %u ...", clonevol);
4034 AFSVolTransCreate(fromconn, clonevol, afrompart, ITOffline,
4036 EGOTO1(error_exit, code,
4037 "Failed to start a transaction on the cloned volume%u\n",
4041 VEPRINT1("Setting flags on cloned volume %u ...", clonevol);
4042 code = AFSVolSetFlags(fromconn, clonetid, VTDeleteOnSalvage | VTOutOfService); /*redundant */
4043 EGOTO1(error_exit, code, "Could not set falgs on the cloned volume %u\n",
/* Step 6: open an rx call on the connection and start the dump RPC on
 * the clone's transaction. */
4048 fromcall = rx_NewCall(fromconn);
4050 VEPRINT1("Starting volume dump from cloned volume %u...", clonevol);
/* V2 dump RPC when VOLDUMPV2_OMITDIRS is requested; the plain
 * StartAFSVolDump below is presumably the else-branch (the "else" line
 * is not visible). */
4051 if (flags & VOLDUMPV2_OMITDIRS)
4052 code = StartAFSVolDumpV2(fromcall, clonetid, fromdate, flags);
4054 code = StartAFSVolDump(fromcall, clonetid, fromdate);
4055 EGOTO(error_exit, code, "Could not start the dump process \n");
/* The caller-supplied callback consumes the dump stream from fromcall. */
4058 VEPRINT1("Dumping volume %u...", afromvol);
4059 code = DumpFunction(fromcall, rock);
4060 EGOTO(error_exit, code, "Error while dumping volume \n");
/* Cleanup section.  Presumably this is the error_exit target used by the
 * EGOTO* calls above (the label line is not visible in this excerpt).
 *
 * NOTE(review): no guard on clonetid is visible before the delete; if
 * control arrives here before the clone transaction was created,
 * clonetid is still 0 -- confirm whether that case is handled.
 * NOTE(review): no visible cleanup line ends fromtid, so a failure
 * between creating and ending the source transaction appears to leave
 * it open -- confirm against the full file. */
4064 /* now delete the clone */
4065 VEPRINT1("Deleting the cloned volume %u ...", clonevol);
4066 code = AFSVolDeleteVolume(fromconn, clonetid);
4068 fprintf(STDERR, "Failed to delete the cloned volume %lu\n",
4069 (unsigned long)clonevol);
/* Finish the rx call; the condition guarding the message below is on a
 * line not shown here. */
4075 code = rx_EndCall(fromcall, rxError);
4077 fprintf(STDERR, "Error in rx_EndCall\n");
/* End the clone's transaction; either the RPC status (code) or the
 * server-side result (rcode) being non-zero counts as failure, with
 * code taking precedence when recording the error. */
4083 VEPRINT1("Ending transaction on cloned volume %u...", clonevol);
4084 code = AFSVolEndTrans(fromconn, clonetid, &rcode);
4085 if (code || rcode) {
4087 "Could not end transaction on the cloned volume %lu\n",
4088 (unsigned long)clonevol);
4090 error = (code ? code : rcode);
4095 rx_DestroyConnection(fromconn);
/* Report the accumulated error value. */
4097 PrintError("", error);
4104 * Restore a volume <tovolid> <tovolname> on <toserver> <topart> from
4105 * a volume dump. There is no <afilename> parameter: WriteData does all
4106 * the real work after extracting its params from <rock>
4109 UV_RestoreVolume2(afs_int32 toserver, afs_int32 topart, afs_int32 tovolid,
4110 afs_int32 toparentid, char tovolname[], int flags,
4111 afs_int32(*WriteData) (), char *rock)
4113 struct rx_connection *toconn, *tempconn;
4114 struct rx_call *tocall;
4115 afs_int32 totid, code, rcode, vcode, terror = 0;
4116 afs_int32 rxError = 0;
4117 struct volser_status tstatus;
4118 struct volintInfo vinfo;
4120 char tovolreal[VOLSER_OLDMAXVOLNAME];
4121 afs_int32 pvolid, pparentid;
4124 struct nvldbentry entry, storeEntry;
4127 struct restoreCookie cookie;
4129 afs_int32 volflag, voltype, volsertype;
4130 afs_int32 oldCreateDate, oldUpdateDate, newCreateDate, newUpdateDate;
4131 int index, same, errcode;
4135 memset(&cookie, 0,&nb