/* * Copyright 2000, International Business Machines Corporation and others. * All Rights Reserved. * * This software has been released under the terms of the IBM Public * License. For details, see the LICENSE file in the top-level source * directory or online at http://www.openafs.org/dl/license10.html * * Portions Copyright (c) 2006-2008 Sine Nomine Associates */ /* System: VICE-TWO Module: fssync.c Institution: The Information Technology Center, Carnegie-Mellon University */ #ifdef notdef /* All this is going away in early 1989 */ int newVLDB; /* Compatibility flag */ #endif static int newVLDB = 1; #ifndef AFS_PTHREAD_ENV #define USUAL_PRIORITY (LWP_MAX_PRIORITY - 2) /* * stack size increased from 8K because the HP machine seemed to have trouble * with the smaller stack */ #define USUAL_STACK_SIZE (24 * 1024) #endif /* !AFS_PTHREAD_ENV */ /* fssync-server.c File server synchronization with external volume utilities. server-side implementation */ /* This controls the size of an fd_set; it must be defined early before * the system headers define that type and the macros that operate on it. * Its value should be as large as the maximum file descriptor limit we * are likely to run into on any platform. Right now, that is 65536 * which is the default hard fd limit on Solaris 9 */ #ifndef _WIN32 #define FD_SETSIZE 65536 #endif #include #include RCSID ("$Header$"); #include #include #ifdef AFS_NT40_ENV #include #include #else #include #include #include #include #include #endif #include #ifdef AFS_PTHREAD_ENV #include #else /* AFS_PTHREAD_ENV */ #include #endif /* AFS_PTHREAD_ENV */ #include #include #include #include #include "nfs.h" #include #include "daemon_com.h" #include "fssync.h" #include "lwp.h" #include "lock.h" #include #include "ihandle.h" #include "vnode.h" #include "volume.h" #include "volume_inline.h" #include "partition.h" #ifdef HAVE_POLL #include #endif /* HAVE_POLL */ #ifdef USE_UNIX_SOCKETS #include #include #endif /* USE_UNIX_SOCKETS */ #ifdef FSSYNC_BUILD_SERVER /*@printflike@*/ extern void Log(const char *format, ...); #ifdef osi_Assert #undef osi_Assert #endif #define osi_Assert(e) (void)(e) int (*V_BreakVolumeCallbacks) (); #define MAXHANDLERS 4 /* Up to 4 clients; must be at least 2, so that * move = dump+restore can run on single server */ #define MAXOFFLINEVOLUMES 128 /* This needs to be as big as the maximum * number that would be offline for 1 operation. * Current winner is salvage, which needs all * cloned read-only copies offline when salvaging * a single read-write volume */ static struct offlineInfo OfflineVolumes[MAXHANDLERS][MAXOFFLINEVOLUMES]; /** * fssync server socket handle. */ static SYNC_server_state_t fssync_server_state = { -1, /* file descriptor */ FSSYNC_ENDPOINT_DECL, /* server endpoint */ FSYNC_PROTO_VERSION, /* protocol version */ 5, /* bind() retry limit */ 100, /* listen() queue depth */ "FSSYNC", /* protocol name string */ }; /* Forward declarations */ static void * FSYNC_sync(void *); static void FSYNC_newconnection(); static void FSYNC_com(); static void FSYNC_Drop(); static void AcceptOn(); static void AcceptOff(); static void InitHandler(); static int AddHandler(); static int FindHandler(); static int FindHandler_r(); static int RemoveHandler(); #if defined(HAVE_POLL) && defined (AFS_PTHREAD_ENV) static void CallHandler(struct pollfd *fds, int nfds, int mask); static void GetHandler(struct pollfd *fds, int maxfds, int events, int *nfds); #else static void CallHandler(fd_set * fdsetp); static void GetHandler(fd_set * fdsetp, int *maxfdp); #endif extern int LogLevel; static afs_int32 FSYNC_com_VolOp(int fd, SYNC_command * com, SYNC_response * res); static afs_int32 FSYNC_com_VolError(FSSYNC_VolOp_command * com, SYNC_response * res); static afs_int32 FSYNC_com_VolOn(FSSYNC_VolOp_command * com, SYNC_response * res); static afs_int32 FSYNC_com_VolOff(FSSYNC_VolOp_command * com, SYNC_response * res); static afs_int32 FSYNC_com_VolMove(FSSYNC_VolOp_command * com, SYNC_response * res); static afs_int32 FSYNC_com_VolBreakCBKs(FSSYNC_VolOp_command * com, SYNC_response * res); static afs_int32 FSYNC_com_VolDone(FSSYNC_VolOp_command * com, SYNC_response * res); static afs_int32 FSYNC_com_VolQuery(FSSYNC_VolOp_command * com, SYNC_response * res); static afs_int32 FSYNC_com_VolHdrQuery(FSSYNC_VolOp_command * com, SYNC_response * res); #ifdef AFS_DEMAND_ATTACH_FS static afs_int32 FSYNC_com_VolOpQuery(FSSYNC_VolOp_command * com, SYNC_response * res); #endif /* AFS_DEMAND_ATTACH_FS */ static afs_int32 FSYNC_com_VnQry(int fd, SYNC_command * com, SYNC_response * res); static afs_int32 FSYNC_com_StatsOp(int fd, SYNC_command * com, SYNC_response * res); static afs_int32 FSYNC_com_StatsOpGeneral(FSSYNC_StatsOp_command * scom, SYNC_response * res); static afs_int32 FSYNC_com_StatsOpViceP(FSSYNC_StatsOp_command * scom, SYNC_response * res); static afs_int32 FSYNC_com_StatsOpHash(FSSYNC_StatsOp_command * scom, SYNC_response * res); static afs_int32 FSYNC_com_StatsOpHdr(FSSYNC_StatsOp_command * scom, SYNC_response * res); static afs_int32 FSYNC_com_StatsOpVLRU(FSSYNC_StatsOp_command * scom, SYNC_response * res); static void FSYNC_com_to_info(FSSYNC_VolOp_command * vcom, FSSYNC_VolOp_info * info); /* * This lock controls access to the handler array. The overhead * is minimal in non-preemptive environments. */ struct Lock FSYNC_handler_lock; void FSYNC_fsInit(void) { #ifdef AFS_PTHREAD_ENV pthread_t tid; pthread_attr_t tattr; #else /* AFS_PTHREAD_ENV */ PROCESS pid; #endif /* AFS_PTHREAD_ENV */ Lock_Init(&FSYNC_handler_lock); #ifdef AFS_PTHREAD_ENV assert(pthread_attr_init(&tattr) == 0); assert(pthread_attr_setdetachstate(&tattr, PTHREAD_CREATE_DETACHED) == 0); assert(pthread_create(&tid, &tattr, FSYNC_sync, NULL) == 0); #else /* AFS_PTHREAD_ENV */ assert(LWP_CreateProcess (FSYNC_sync, USUAL_STACK_SIZE, USUAL_PRIORITY, (void *)0, "FSYNC_sync", &pid) == LWP_SUCCESS); #endif /* AFS_PTHREAD_ENV */ } #if defined(HAVE_POLL) && defined(AFS_PTHREAD_ENV) static struct pollfd FSYNC_readfds[MAXHANDLERS]; #else static fd_set FSYNC_readfds; #endif static void * FSYNC_sync(void * args) { #ifdef USE_UNIX_SOCKETS char tbuffer[AFSDIR_PATH_MAX]; #endif /* USE_UNIX_SOCKETS */ int on = 1; extern int VInit; int code; int numTries; #ifdef AFS_PTHREAD_ENV int tid; #endif SYNC_server_state_t * state = &fssync_server_state; SYNC_getAddr(&state->endpoint, &state->addr); SYNC_cleanupSock(state); #ifndef AFS_NT40_ENV (void)signal(SIGPIPE, SIG_IGN); #endif #ifdef AFS_PTHREAD_ENV /* set our 'thread-id' so that the host hold table works */ MUTEX_ENTER(&rx_stats_mutex); /* protects rxi_pthread_hinum */ tid = ++rxi_pthread_hinum; MUTEX_EXIT(&rx_stats_mutex); pthread_setspecific(rx_thread_id_key, (void *)tid); Log("Set thread id %d for FSYNC_sync\n", tid); #endif /* AFS_PTHREAD_ENV */ while (!VInit) { /* Let somebody else run until level > 0. That doesn't mean that * all volumes have been attached. */ #ifdef AFS_PTHREAD_ENV pthread_yield(); #else /* AFS_PTHREAD_ENV */ LWP_DispatchProcess(); #endif /* AFS_PTHREAD_ENV */ } state->fd = SYNC_getSock(&state->endpoint); code = SYNC_bindSock(state); assert(!code); InitHandler(); AcceptOn(); for (;;) { #if defined(HAVE_POLL) && defined(AFS_PTHREAD_ENV) int nfds; GetHandler(FSYNC_readfds, MAXHANDLERS, POLLIN|POLLPRI, &nfds); if (poll(FSYNC_readfds, nfds, -1) >=1) CallHandler(FSYNC_readfds, nfds, POLLIN|POLLPRI); #else int maxfd; GetHandler(&FSYNC_readfds, &maxfd); /* Note: check for >= 1 below is essential since IOMGR_select * doesn't have exactly same semantics as select. */ #ifdef AFS_PTHREAD_ENV if (select(maxfd + 1, &FSYNC_readfds, NULL, NULL, NULL) >= 1) #else /* AFS_PTHREAD_ENV */ if (IOMGR_Select(maxfd + 1, &FSYNC_readfds, NULL, NULL, NULL) >= 1) #endif /* AFS_PTHREAD_ENV */ CallHandler(&FSYNC_readfds); #endif } } static void FSYNC_newconnection(int afd) { #ifdef USE_UNIX_SOCKETS struct sockaddr_un other; #else /* USE_UNIX_SOCKETS */ struct sockaddr_in other; #endif int junk, fd; junk = sizeof(other); fd = accept(afd, (struct sockaddr *)&other, &junk); if (fd == -1) { Log("FSYNC_newconnection: accept failed, errno==%d\n", errno); assert(1 == 2); } else if (!AddHandler(fd, FSYNC_com)) { AcceptOff(); assert(AddHandler(fd, FSYNC_com)); } } /* this function processes commands from an fssync file descriptor (fd) */ afs_int32 FS_cnt = 0; static void FSYNC_com(int fd) { SYNC_command com; SYNC_response res; SYNC_PROTO_BUF_DECL(com_buf); SYNC_PROTO_BUF_DECL(res_buf); memset(&res.hdr, 0, sizeof(res.hdr)); com.payload.buf = (void *)com_buf; com.payload.len = SYNC_PROTO_MAX_LEN; res.hdr.response_len = sizeof(res.hdr); res.hdr.proto_version = FSYNC_PROTO_VERSION; res.payload.len = SYNC_PROTO_MAX_LEN; res.payload.buf = (void *)res_buf; FS_cnt++; if (SYNC_getCom(fd, &com)) { Log("FSYNC_com: read failed; dropping connection (cnt=%d)\n", FS_cnt); FSYNC_Drop(fd); return; } if (com.recv_len < sizeof(com.hdr)) { Log("FSSYNC_com: invalid protocol message length (%u)\n", com.recv_len); res.hdr.response = SYNC_COM_ERROR; res.hdr.reason = SYNC_REASON_MALFORMED_PACKET; res.hdr.flags |= SYNC_FLAG_CHANNEL_SHUTDOWN; goto respond; } if (com.hdr.proto_version != FSYNC_PROTO_VERSION) { Log("FSYNC_com: invalid protocol version (%u)\n", com.hdr.proto_version); res.hdr.response = SYNC_COM_ERROR; res.hdr.flags |= SYNC_FLAG_CHANNEL_SHUTDOWN; goto respond; } if (com.hdr.command == SYNC_COM_CHANNEL_CLOSE) { res.hdr.response = SYNC_OK; res.hdr.flags |= SYNC_FLAG_CHANNEL_SHUTDOWN; goto respond; } VOL_LOCK; switch (com.hdr.command) { case FSYNC_VOL_ON: case FSYNC_VOL_ATTACH: case FSYNC_VOL_LEAVE_OFF: case FSYNC_VOL_OFF: case FSYNC_VOL_FORCE_ERROR: case FSYNC_VOL_LISTVOLUMES: case FSYNC_VOL_NEEDVOLUME: case FSYNC_VOL_MOVE: case FSYNC_VOL_BREAKCBKS: case FSYNC_VOL_DONE: case FSYNC_VOL_QUERY: case FSYNC_VOL_QUERY_HDR: case FSYNC_VOL_QUERY_VOP: res.hdr.response = FSYNC_com_VolOp(fd, &com, &res); break; case FSYNC_VOL_STATS_GENERAL: case FSYNC_VOL_STATS_VICEP: case FSYNC_VOL_STATS_HASH: case FSYNC_VOL_STATS_HDR: case FSYNC_VOL_STATS_VLRU: res.hdr.response = FSYNC_com_StatsOp(fd, &com, &res); break; case FSYNC_VOL_QUERY_VNODE: res.hdr.response = FSYNC_com_VnQry(fd, &com, &res); break; default: res.hdr.response = SYNC_BAD_COMMAND; break; } VOL_UNLOCK; respond: SYNC_putRes(fd, &res); if (res.hdr.flags & SYNC_FLAG_CHANNEL_SHUTDOWN) { FSYNC_Drop(fd); } } static afs_int32 FSYNC_com_VolOp(int fd, SYNC_command * com, SYNC_response * res) { int i; afs_int32 code = SYNC_OK; FSSYNC_VolOp_command vcom; if (com->recv_len != (sizeof(com->hdr) + sizeof(FSSYNC_VolOp_hdr))) { res->hdr.reason = SYNC_REASON_MALFORMED_PACKET; res->hdr.flags |= SYNC_FLAG_CHANNEL_SHUTDOWN; return SYNC_COM_ERROR; } vcom.hdr = &com->hdr; vcom.vop = (FSSYNC_VolOp_hdr *) com->payload.buf; vcom.com = com; vcom.volumes = OfflineVolumes[FindHandler(fd)]; for (vcom.v = NULL, i = 0; i < MAXOFFLINEVOLUMES; i++) { if ((vcom.volumes[i].volumeID == vcom.vop->volume) && (strncmp(vcom.volumes[i].partName, vcom.vop->partName, sizeof(vcom.volumes[i].partName)) == 0)) { vcom.v = &vcom.volumes[i]; break; } } switch (com->hdr.command) { case FSYNC_VOL_ON: case FSYNC_VOL_ATTACH: case FSYNC_VOL_LEAVE_OFF: code = FSYNC_com_VolOn(&vcom, res); break; case FSYNC_VOL_OFF: case FSYNC_VOL_NEEDVOLUME: code = FSYNC_com_VolOff(&vcom, res); break; case FSYNC_VOL_LISTVOLUMES: code = SYNC_OK; break; case FSYNC_VOL_MOVE: code = FSYNC_com_VolMove(&vcom, res); break; case FSYNC_VOL_BREAKCBKS: code = FSYNC_com_VolBreakCBKs(&vcom, res); break; case FSYNC_VOL_DONE: code = FSYNC_com_VolDone(&vcom, res); break; case FSYNC_VOL_QUERY: code = FSYNC_com_VolQuery(&vcom, res); break; case FSYNC_VOL_QUERY_HDR: code = FSYNC_com_VolHdrQuery(&vcom, res); break; #ifdef AFS_DEMAND_ATTACH_FS case FSYNC_VOL_FORCE_ERROR: code = FSYNC_com_VolError(&vcom, res); break; case FSYNC_VOL_QUERY_VOP: code = FSYNC_com_VolOpQuery(&vcom, res); break; #endif /* AFS_DEMAND_ATTACH_FS */ default: code = SYNC_BAD_COMMAND; } return code; } static afs_int32 FSYNC_com_VolOn(FSSYNC_VolOp_command * vcom, SYNC_response * res) { afs_int32 code = SYNC_OK; char tvolName[VMAXPATHLEN]; Volume * vp; Error error; if (SYNC_verifyProtocolString(vcom->vop->partName, sizeof(vcom->vop->partName))) { res->hdr.reason = SYNC_REASON_MALFORMED_PACKET; code = SYNC_FAILED; goto done; } /* This is where a detatched volume gets reattached. However in the special case where the volume is merely busy, it is already attatched and it is only necessary to clear the busy flag. See defect #2080 for details. */ /* is the volume already attatched? */ #ifdef notdef /* * XXX With the following enabled we had bizarre problems where the backup id would * be reset to 0; that was due to the interaction between fileserver/volserver in that they * both keep volumes in memory and the changes wouldn't be made to the fileserver. Some of * the problems were due to refcnt changes as result of VGetVolume/VPutVolume which would call * VOffline, etc. when we don't want to; someday the whole #2080 issue should be revisited to * be done right XXX */ vp = VGetVolume_r(&error, vcom->vop->volume); if (vp) { /* yep, is the BUSY flag set? */ if (vp->specialStatus == VBUSY) { /* yep, clear BUSY flag */ vp->specialStatus = 0; /* make sure vol is online */ if (vcom->v) { vcom->v->volumeID = 0; V_inUse(vp) = 1; /* online */ } VPutVolume_r(vp); break; } VPutVolume_r(vp); } #endif /* notdef */ /* so, we need to attach the volume */ #ifdef AFS_DEMAND_ATTACH_FS /* check DAFS permissions */ vp = VLookupVolume_r(&error, vcom->vop->volume, NULL); if (vp && !strcmp(VPartitionPath(V_partition(vp)), vcom->vop->partName) && vp->pending_vol_op && (vcom->hdr->programType != vp->pending_vol_op->com.programType)) { /* a different program has this volume checked out. deny. */ Log("FSYNC_VolOn: WARNING: program type %u has attempted to manipulate " "state for volume %u using command code %u while the volume is " "checked out by program type %u for command code %u.\n", vcom->hdr->programType, vcom->vop->volume, vcom->hdr->command, vp->pending_vol_op->com.programType, vp->pending_vol_op->com.command); code = SYNC_DENIED; res->hdr.reason = FSYNC_EXCLUSIVE; goto done; } #endif if (vcom->v) vcom->v->volumeID = 0; if (vcom->hdr->command == FSYNC_VOL_LEAVE_OFF) { /* nothing much to do if we're leaving the volume offline */ #ifdef AFS_DEMAND_ATTACH_FS if (vp && !strcmp(VPartitionPath(V_partition(vp)), vcom->vop->partName)) { VDeregisterVolOp_r(vp); VChangeState_r(vp, VOL_STATE_UNATTACHED); } #endif goto done; } #ifdef AFS_DEMAND_ATTACH_FS /* first, check to see whether we have such a volume defined */ vp = VPreAttachVolumeById_r(&error, vcom->vop->partName, vcom->vop->volume); if (vp) { VDeregisterVolOp_r(vp); } #else /* !AFS_DEMAND_ATTACH_FS */ tvolName[0] = '/'; snprintf(&tvolName[1], sizeof(tvolName)-1, VFORMAT, vcom->vop->volume); tvolName[sizeof(tvolName)-1] = '\0'; vp = VAttachVolumeByName_r(&error, vcom->vop->partName, tvolName, V_VOLUPD); if (vp) VPutVolume_r(vp); if (error) { code = SYNC_DENIED; res->hdr.reason = error; } #endif /* !AFS_DEMAND_ATTACH_FS */ done: return code; } static afs_int32 FSYNC_com_VolOff(FSSYNC_VolOp_command * vcom, SYNC_response * res) { FSSYNC_VolOp_info info; afs_int32 code = SYNC_OK; int i; Volume * vp, * nvp; Error error; if (SYNC_verifyProtocolString(vcom->vop->partName, sizeof(vcom->vop->partName))) { res->hdr.reason = SYNC_REASON_MALFORMED_PACKET; code = SYNC_FAILED; goto done; } /* not already offline, we need to find a slot for newly offline volume */ if (vcom->hdr->programType == debugUtility) { /* debug utilities do not have their operations tracked */ vcom->v = NULL; } else { if (!vcom->v) { for (i = 0; i < MAXOFFLINEVOLUMES; i++) { if (vcom->volumes[i].volumeID == 0) { vcom->v = &vcom->volumes[i]; break; } } } if (!vcom->v) { goto deny; } } FSYNC_com_to_info(vcom, &info); #ifdef AFS_DEMAND_ATTACH_FS vp = VLookupVolume_r(&error, vcom->vop->volume, NULL); #else vp = VGetVolume_r(&error, vcom->vop->volume); #endif if (vp) { if ((vcom->vop->partName[0] != 0) && (strncmp(vcom->vop->partName, vp->partition->name, sizeof(vcom->vop->partName)) != 0)) { /* volume on desired partition is not online, so we * should treat this as an offline volume. */ #ifndef AFS_DEMAND_ATTACH_FS VPutVolume_r(vp); #endif vp = NULL; goto done; } } #ifdef AFS_DEMAND_ATTACH_FS if (vp) { ProgramType type = (ProgramType) vcom->hdr->programType; /* do initial filtering of requests */ /* enforce mutual exclusion for volume ops */ if (vp->pending_vol_op) { if (vp->pending_vol_op->com.programType != type) { Log("volume %u already checked out\n", vp->hashid); /* XXX debug */ Log("vp->vop = { com = { ver=%u, prog=%d, com=%d, reason=%d, len=%u, flags=0x%x }, vop = { vol=%u, part='%s' } }\n", vp->pending_vol_op->com.proto_version, vp->pending_vol_op->com.programType, vp->pending_vol_op->com.command, vp->pending_vol_op->com.reason, vp->pending_vol_op->com.command_len, vp->pending_vol_op->com.flags, vp->pending_vol_op->vop.volume, vp->pending_vol_op->vop.partName ); Log("vcom = { com = { ver=%u, prog=%d, com=%d, reason=%d, len=%u, flags=0x%x } , vop = { vol=%u, part='%s' } }\n", vcom->hdr->proto_version, vcom->hdr->programType, vcom->hdr->command, vcom->hdr->reason, vcom->hdr->command_len, vcom->hdr->flags, vcom->vop->volume, vcom->vop->partName); res->hdr.reason = FSYNC_EXCLUSIVE; goto deny; } else { Log("warning: volume %u recursively checked out by programType id %d\n", vp->hashid, vcom->hdr->programType); } } /* filter based upon requestor * * volume utilities are not allowed to check out volumes * which are in an error state * * unknown utility programs will be denied on principal */ switch (type) { case salvageServer: case debugUtility: /* give the salvageserver lots of liberty */ break; case volumeUtility: if ((V_attachState(vp) == VOL_STATE_ERROR) || (V_attachState(vp) == VOL_STATE_SALVAGING)) { goto deny; } break; default: Log("bad program type passed to FSSYNC\n"); goto deny; } /* short circuit for offline volume states * so we can avoid I/O penalty of attachment */ switch (V_attachState(vp)) { case VOL_STATE_UNATTACHED: case VOL_STATE_PREATTACHED: case VOL_STATE_SALVAGING: case VOL_STATE_ERROR: /* register the volume operation metadata with the volume * * if the volume is currently pre-attached, attach2() * will evaluate the vol op metadata to determine whether * attaching the volume would be safe */ VRegisterVolOp_r(vp, &info); goto done; default: break; } /* convert to heavyweight ref */ nvp = VGetVolumeByVp_r(&error, vp); /* register the volume operation metadata with the volume */ VRegisterVolOp_r(vp, &info); if (!nvp) { Log("FSYNC_com_VolOff: failed to get heavyweight reference to volume %u\n", vcom->vop->volume); res->hdr.reason = FSYNC_VOL_PKG_ERROR; goto deny; } vp = nvp; } #endif /* AFS_DEMAND_ATTACH_FS */ if (vp) { if (VVolOpLeaveOnline_r(vp, &info)) { VUpdateVolume_r(&error, vp, VOL_UPDATE_WAIT); /* At least get volume stats right */ if (LogLevel) { Log("FSYNC: Volume %u (%s) was left on line for an external %s request\n", V_id(vp), V_name(vp), vcom->hdr->reason == V_CLONE ? "clone" : vcom->hdr->reason == V_READONLY ? "readonly" : vcom->hdr->reason == V_DUMP ? "dump" : "UNKNOWN"); } VPutVolume_r(vp); } else { if (VVolOpSetVBusy_r(vp, &info)) { vp->specialStatus = VBUSY; } /* remember what volume we got, so we can keep track of how * many volumes the volserver or whatever is using. Note that * vp is valid since leaveonline is only set when vp is valid. */ if (vcom->v) { vcom->v->volumeID = vcom->vop->volume; strlcpy(vcom->v->partName, vp->partition->name, sizeof(vcom->v->partName)); } VOffline_r(vp, "A volume utility is running."); vp = NULL; } } done: return code; deny: return SYNC_DENIED; } static afs_int32 FSYNC_com_VolMove(FSSYNC_VolOp_command * vcom, SYNC_response * res) { Error error; Volume * vp; /* Yuch: the "reason" for the move is the site it got moved to... */ /* still set specialStatus so we stop sending back VBUSY. * also should still break callbacks. Note that I don't know * how to tell if we should break all or not, so we just do it * since it doesn't matter much if we do an extra break * volume callbacks on a volume move within the same server */ #ifdef AFS_DEMAND_ATTACH_FS vp = VLookupVolume_r(&error, vcom->vop->volume, NULL); #else vp = VGetVolume_r(&error, vcom->vop->volume); #endif if (vp) { vp->specialStatus = VMOVED; #ifndef AFS_DEMAND_ATTACH_FS VPutVolume_r(vp); #endif } if (V_BreakVolumeCallbacks) { Log("fssync: volume %u moved to %x; breaking all call backs\n", vcom->vop->volume, vcom->hdr->reason); VOL_UNLOCK; (*V_BreakVolumeCallbacks) (vcom->vop->volume); VOL_LOCK; } return SYNC_OK; } static afs_int32 FSYNC_com_VolDone(FSSYNC_VolOp_command * vcom, SYNC_response * res) { #ifdef AFS_DEMAND_ATTACH_FS Error error; Volume * vp; #endif /* don't try to put online, this call is made only after deleting * a volume, in which case we want to remove the vol # from the * OfflineVolumes array only */ if (vcom->v) vcom->v->volumeID = 0; #ifdef AFS_DEMAND_ATTACH_FS vp = VLookupVolume_r(&error, vcom->vop->volume, NULL); if (vp) { VChangeState_r(vp, VOL_STATE_UNATTACHED); VDeregisterVolOp_r(vp); } #endif return SYNC_OK; } #ifdef AFS_DEMAND_ATTACH_FS /** * force a volume into the hard error state. */ static afs_int32 FSYNC_com_VolError(FSSYNC_VolOp_command * vcom, SYNC_response * res) { Error error; Volume * vp; afs_int32 code = SYNC_DENIED; vp = VLookupVolume_r(&error, vcom->vop->volume, NULL); if (vp && !strcmp(VPartitionPath(V_partition(vp)), vcom->vop->partName)) { memset(&vp->salvage, 0, sizeof(vp->salvage)); VChangeState_r(vp, VOL_STATE_ERROR); code = SYNC_OK; } else { res->hdr.reason = FSYNC_UNKNOWN_VOLID; } return code; } #endif static afs_int32 FSYNC_com_VolBreakCBKs(FSSYNC_VolOp_command * vcom, SYNC_response * res) { /* if the volume is being restored, break all callbacks on it */ if (V_BreakVolumeCallbacks) { Log("fssync: breaking all call backs for volume %u\n", vcom->vop->volume); VOL_UNLOCK; (*V_BreakVolumeCallbacks) (vcom->vop->volume); VOL_LOCK; } return SYNC_OK; } static afs_int32 FSYNC_com_VolQuery(FSSYNC_VolOp_command * vcom, SYNC_response * res) { afs_int32 code = SYNC_OK; Error error; Volume * vp; #ifdef AFS_DEMAND_ATTACH_FS vp = VLookupVolume_r(&error, vcom->vop->volume, NULL); #else /* !AFS_DEMAND_ATTACH_FS */ vp = VGetVolume_r(&error, vcom->vop->volume); #endif /* !AFS_DEMAND_ATTACH_FS */ if (vp) { assert(sizeof(Volume) <= res->payload.len); memcpy(res->payload.buf, vp, sizeof(Volume)); res->hdr.response_len += sizeof(Volume); #ifndef AFS_DEMAND_ATTACH_FS VPutVolume_r(vp); #endif } else { res->hdr.reason = FSYNC_UNKNOWN_VOLID; code = SYNC_FAILED; } return code; } static afs_int32 FSYNC_com_VolHdrQuery(FSSYNC_VolOp_command * vcom, SYNC_response * res) { afs_int32 code = SYNC_OK; Error error; Volume * vp; int hdr_ok = 0; #ifdef AFS_DEMAND_ATTACH_FS vp = VLookupVolume_r(&error, vcom->vop->volume, NULL); if (vp && (vp->header != NULL) && (V_attachFlags(vp) & VOL_HDR_ATTACHED) && (V_attachFlags(vp) & VOL_HDR_LOADED)) { hdr_ok = 1; } #else /* !AFS_DEMAND_ATTACH_FS */ vp = VGetVolume_r(&error, vcom->vop->volume); if (vp && vp->header) { hdr_ok = 1; } #endif /* !AFS_DEMAND_ATTACH_FS */ load_done: if (hdr_ok) { assert(sizeof(VolumeDiskData) <= res->payload.len); memcpy(res->payload.buf, &V_disk(vp), sizeof(VolumeDiskData)); res->hdr.response_len += sizeof(VolumeDiskData); #ifndef AFS_DEMAND_ATTACH_FS VPutVolume_r(vp); #endif } else { if (vp) { res->hdr.reason = FSYNC_HDR_NOT_ATTACHED; } else { res->hdr.reason = FSYNC_UNKNOWN_VOLID; } code = SYNC_FAILED; } return code; } #ifdef AFS_DEMAND_ATTACH_FS static afs_int32 FSYNC_com_VolOpQuery(FSSYNC_VolOp_command * vcom, SYNC_response * res) { afs_int32 code = SYNC_OK; Error error; Volume * vp; vp = VLookupVolume_r(&error, vcom->vop->volume, NULL); if (vp && vp->pending_vol_op) { assert(sizeof(FSSYNC_VolOp_info) <= res->payload.len); memcpy(res->payload.buf, vp->pending_vol_op, sizeof(FSSYNC_VolOp_info)); res->hdr.response_len += sizeof(FSSYNC_VolOp_info); } else { if (vp) { res->hdr.reason = FSYNC_NO_PENDING_VOL_OP; } else { res->hdr.reason = FSYNC_UNKNOWN_VOLID; } code = SYNC_FAILED; } return code; } #endif /* AFS_DEMAND_ATTACH_FS */ static afs_int32 FSYNC_com_VnQry(int fd, SYNC_command * com, SYNC_response * res) { afs_int32 code = SYNC_OK; FSSYNC_VnQry_hdr * qry = com->payload.buf; Volume * vp; Vnode * vnp; Error error; if (com->recv_len != (sizeof(com->hdr) + sizeof(FSSYNC_VnQry_hdr))) { res->hdr.reason = SYNC_REASON_MALFORMED_PACKET; res->hdr.flags |= SYNC_FLAG_CHANNEL_SHUTDOWN; return SYNC_COM_ERROR; } #ifdef AFS_DEMAND_ATTACH_FS vp = VLookupVolume_r(&error, qry->volume, NULL); #else /* !AFS_DEMAND_ATTACH_FS */ vp = VGetVolume_r(&error, qry->volume); #endif /* !AFS_DEMAND_ATTACH_FS */ if (!vp) { res->hdr.reason = FSYNC_UNKNOWN_VOLID; code = SYNC_FAILED; goto done; } vnp = VLookupVnode(vp, qry->vnode); if (!vnp) { res->hdr.reason = FSYNC_UNKNOWN_VNID; code = SYNC_FAILED; goto cleanup; } if (Vn_class(vnp)->residentSize > res->payload.len) { res->hdr.reason = SYNC_REASON_ENCODING_ERROR; code = SYNC_FAILED; goto cleanup; } memcpy(res->payload.buf, vnp, Vn_class(vnp)->residentSize); res->hdr.response_len += Vn_class(vnp)->residentSize; cleanup: #ifndef AFS_DEMAND_ATTACH_FS VPutVolume_r(vp); #endif done: return code; } static afs_int32 FSYNC_com_StatsOp(int fd, SYNC_command * com, SYNC_response * res) { afs_int32 code = SYNC_OK; FSSYNC_StatsOp_command scom; if (com->recv_len != (sizeof(com->hdr) + sizeof(FSSYNC_StatsOp_hdr))) { res->hdr.reason = SYNC_REASON_MALFORMED_PACKET; res->hdr.flags |= SYNC_FLAG_CHANNEL_SHUTDOWN; return SYNC_COM_ERROR; } scom.hdr = &com->hdr; scom.sop = (FSSYNC_StatsOp_hdr *) com->payload.buf; scom.com = com; switch (com->hdr.command) { case FSYNC_VOL_STATS_GENERAL: code = FSYNC_com_StatsOpGeneral(&scom, res); break; #ifdef AFS_DEMAND_ATTACH_FS /* statistics for the following subsystems are only tracked * for demand attach fileservers */ case FSYNC_VOL_STATS_VICEP: code = FSYNC_com_StatsOpViceP(&scom, res); break; case FSYNC_VOL_STATS_HASH: code = FSYNC_com_StatsOpHash(&scom, res); break; case FSYNC_VOL_STATS_HDR: code = FSYNC_com_StatsOpHdr(&scom, res); break; case FSYNC_VOL_STATS_VLRU: code = FSYNC_com_StatsOpVLRU(&scom, res); break; #endif /* AFS_DEMAND_ATTACH_FS */ default: code = SYNC_BAD_COMMAND; } return code; } static afs_int32 FSYNC_com_StatsOpGeneral(FSSYNC_StatsOp_command * scom, SYNC_response * res) { afs_int32 code = SYNC_OK; memcpy(res->payload.buf, &VStats, sizeof(VStats)); res->hdr.response_len += sizeof(VStats); return code; } #ifdef AFS_DEMAND_ATTACH_FS static afs_int32 FSYNC_com_StatsOpViceP(FSSYNC_StatsOp_command * scom, SYNC_response * res) { afs_int32 code = SYNC_OK; struct DiskPartition64 * dp; struct DiskPartitionStats64 * stats; if (SYNC_verifyProtocolString(scom->sop->args.partName, sizeof(scom->sop->args.partName))) { res->hdr.reason = SYNC_REASON_MALFORMED_PACKET; code = SYNC_FAILED; goto done; } dp = VGetPartition_r(scom->sop->args.partName, 0); if (!dp) { code = SYNC_FAILED; } else { stats = (struct DiskPartitionStats64 *) res->payload.buf; stats->free = dp->free; stats->totalUsable = dp->totalUsable; stats->minFree = dp->minFree; stats->f_files = dp->f_files; stats->vol_list_len = dp->vol_list.len; res->hdr.response_len += sizeof(struct DiskPartitionStats64); } done: return code; } static afs_int32 FSYNC_com_StatsOpHash(FSSYNC_StatsOp_command * scom, SYNC_response * res) { afs_int32 code = SYNC_OK; struct VolumeHashChainStats * stats; struct VolumeHashChainHead * head; if (scom->sop->args.hash_bucket >= VolumeHashTable.Size) { return SYNC_FAILED; } head = &VolumeHashTable.Table[scom->sop->args.hash_bucket]; stats = (struct VolumeHashChainStats *) res->payload.buf; stats->table_size = VolumeHashTable.Size; stats->chain_len = head->len; stats->chain_cacheCheck = head->cacheCheck; stats->chain_busy = head->busy; AssignInt64(head->looks, &stats->chain_looks); AssignInt64(head->gets, &stats->chain_gets); AssignInt64(head->reorders, &stats->chain_reorders); res->hdr.response_len += sizeof(struct VolumeHashChainStats); return code; } static afs_int32 FSYNC_com_StatsOpHdr(FSSYNC_StatsOp_command * scom, SYNC_response * res) { afs_int32 code = SYNC_OK; memcpy(res->payload.buf, &volume_hdr_LRU.stats, sizeof(volume_hdr_LRU.stats)); res->hdr.response_len += sizeof(volume_hdr_LRU.stats); return code; } static afs_int32 FSYNC_com_StatsOpVLRU(FSSYNC_StatsOp_command * scom, SYNC_response * res) { afs_int32 code = SYNC_OK; code = SYNC_BAD_COMMAND; return code; } #endif /* AFS_DEMAND_ATTACH_FS */ static void FSYNC_com_to_info(FSSYNC_VolOp_command * vcom, FSSYNC_VolOp_info * info) { memcpy(&info->com, vcom->hdr, sizeof(SYNC_command_hdr)); memcpy(&info->vop, vcom->vop, sizeof(FSSYNC_VolOp_hdr)); } static void FSYNC_Drop(int fd) { struct offlineInfo *p; int i; Error error; char tvolName[VMAXPATHLEN]; VOL_LOCK; p = OfflineVolumes[FindHandler(fd)]; for (i = 0; i < MAXOFFLINEVOLUMES; i++) { if (p[i].volumeID) { Volume *vp; tvolName[0] = '/'; sprintf(&tvolName[1], VFORMAT, p[i].volumeID); vp = VAttachVolumeByName_r(&error, p[i].partName, tvolName, V_VOLUPD); if (vp) VPutVolume_r(vp); p[i].volumeID = 0; } } VOL_UNLOCK; RemoveHandler(fd); #ifdef AFS_NT40_ENV closesocket(fd); #else close(fd); #endif AcceptOn(); } static int AcceptHandler = -1; /* handler id for accept, if turned on */ static void AcceptOn() { if (AcceptHandler == -1) { assert(AddHandler(fssync_server_state.fd, FSYNC_newconnection)); AcceptHandler = FindHandler(fssync_server_state.fd); } } static void AcceptOff() { if (AcceptHandler != -1) { assert(RemoveHandler(fssync_server_state.fd)); AcceptHandler = -1; } } /* The multiple FD handling code. */ static int HandlerFD[MAXHANDLERS]; static int (*HandlerProc[MAXHANDLERS]) (); static void InitHandler() { register int i; ObtainWriteLock(&FSYNC_handler_lock); for (i = 0; i < MAXHANDLERS; i++) { HandlerFD[i] = -1; HandlerProc[i] = 0; } ReleaseWriteLock(&FSYNC_handler_lock); } #if defined(HAVE_POLL) && defined(AFS_PTHREAD_ENV) static void CallHandler(struct pollfd *fds, int nfds, int mask) { int i; int handler; ObtainReadLock(&FSYNC_handler_lock); for (i = 0; i < nfds; i++) { if (fds[i].revents & mask) { handler = FindHandler_r(fds[i].fd); ReleaseReadLock(&FSYNC_handler_lock); (*HandlerProc[handler]) (fds[i].fd); ObtainReadLock(&FSYNC_handler_lock); } } ReleaseReadLock(&FSYNC_handler_lock); } #else static void CallHandler(fd_set * fdsetp) { register int i; ObtainReadLock(&FSYNC_handler_lock); for (i = 0; i < MAXHANDLERS; i++) { if (HandlerFD[i] >= 0 && FD_ISSET(HandlerFD[i], fdsetp)) { ReleaseReadLock(&FSYNC_handler_lock); (*HandlerProc[i]) (HandlerFD[i]); ObtainReadLock(&FSYNC_handler_lock); } } ReleaseReadLock(&FSYNC_handler_lock); } #endif static int AddHandler(int afd, int (*aproc) ()) { register int i; ObtainWriteLock(&FSYNC_handler_lock); for (i = 0; i < MAXHANDLERS; i++) if (HandlerFD[i] == -1) break; if (i >= MAXHANDLERS) { ReleaseWriteLock(&FSYNC_handler_lock); return 0; } HandlerFD[i] = afd; HandlerProc[i] = aproc; ReleaseWriteLock(&FSYNC_handler_lock); return 1; } static int FindHandler(register int afd) { register int i; ObtainReadLock(&FSYNC_handler_lock); for (i = 0; i < MAXHANDLERS; i++) if (HandlerFD[i] == afd) { ReleaseReadLock(&FSYNC_handler_lock); return i; } ReleaseReadLock(&FSYNC_handler_lock); /* just in case */ assert(1 == 2); return -1; /* satisfy compiler */ } static int FindHandler_r(register int afd) { register int i; for (i = 0; i < MAXHANDLERS; i++) if (HandlerFD[i] == afd) { return i; } assert(1 == 2); return -1; /* satisfy compiler */ } static int RemoveHandler(register int afd) { ObtainWriteLock(&FSYNC_handler_lock); HandlerFD[FindHandler_r(afd)] = -1; ReleaseWriteLock(&FSYNC_handler_lock); return 1; } #if defined(HAVE_POLL) && defined(AFS_PTHREAD_ENV) static void GetHandler(struct pollfd *fds, int maxfds, int events, int *nfds) { int i; int fdi = 0; ObtainReadLock(&FSYNC_handler_lock); for (i = 0; i < MAXHANDLERS; i++) if (HandlerFD[i] != -1) { assert(fdi