/*
 * Copyright 2000, International Business Machines Corporation and others.
 * All Rights Reserved.
 *
 * This software has been released under the terms of the IBM Public
 * License.  For details, see the LICENSE file in the top-level source
 * directory or online at http://www.openafs.org/dl/license10.html
 */

/*
 * Implements:
 *	afs_FlushVCache
 *	afs_AllocCBR
 *	afs_FreeCBR
 *	afs_FlushVCBs
 *	afs_QueueVCB
 *	afs_RemoveVCB
 *	afs_NewVCache
 *	afs_FlushActiveVcaches
 *	afs_VerifyVCache2
 *	afs_WriteVCache
 *	afs_SimpleVStat
 *	afs_ProcessFS
 *	TellALittleWhiteLie
 *	afs_RemoteLookup
 *	afs_GetVCache
 *	afs_LookupVCache
 *	afs_GetRootVCache
 *	afs_FetchStatus
 *	afs_StuffVcache
 *	afs_PutVCache
 *	afs_FindVCache
 *	afs_NFSFindVCache
 *	afs_vcacheInit
 *	shutdown_vcache
 *
 */

#include <afsconfig.h>
#include "../afs/param.h"

RCSID("$Header$");

#include "../afs/sysincludes.h"	/* Standard vendor system headers */
#include "../afs/afsincludes.h"	/* AFS-based standard headers */
#include "../afs/afs_stats.h"
#include "../afs/afs_cbqueue.h"
#include "../afs/afs_osidnlc.h"

#ifdef AFS_OSF_ENV
afs_int32 afs_maxvcount = 0;	/* max number of vcache entries */
afs_int32 afs_vcount = 0;	/* number of vcache in use now */
#if defined(AFS_OSF30_ENV)
extern int max_vnodes;		/* number of total system vnodes */
#else
extern int nvnode;		/* number of total system vnodes */
#endif
#ifndef AFS_OSF30_ENV
extern int numvnodes;		/* number vnodes in use now */
#endif
#endif /* AFS_OSF_ENV */

#ifdef AFS_SGI_ENV
int afsvnumbers = 0;
#endif

/* Imported variables */
extern struct server *afs_servers[NSERVERS];
extern afs_rwlock_t afs_xserver;
extern afs_rwlock_t afs_xcbhash;
extern struct vcache *afs_globalVp;
#ifdef AFS_OSF_ENV
extern struct mount *afs_globalVFS;
extern struct vnodeops Afs_vnodeops;
#elif defined(AFS_DARWIN_ENV) || defined(AFS_FBSD_ENV)
extern struct mount *afs_globalVFS;
#else
extern struct vfs *afs_globalVFS;
#endif /* AFS_OSF_ENV */
#if defined(AFS_DUX40_ENV)
extern struct vfs_ubcops afs_ubcops;
#endif
#ifdef AFS_SGI62_ENV
extern struct vnodeops Afs_vnodeops;
#endif
#ifdef AFS_SGI64_ENV
char *makesname();
#endif /* AFS_SGI64_ENV */

/* Exported variables */
afs_rwlock_t afs_xvcache;		/* Lock: alloc new stat cache entries */
afs_lock_t afs_xvcb;			/* Lock: fids on which there are callbacks */
struct vcache *freeVCList;		/* Free list for stat cache entries */
struct vcache *Initial_freeVCList;	/* Initial list for above */
struct afs_q VLRU;			/* vcache LRU */
afs_int32 vcachegen = 0;
unsigned int afs_paniconwarn = 0;
struct vcache *afs_vhashT[VCSIZE];
afs_int32 afs_bulkStatsLost;
int afs_norefpanic = 0;

/* Forward declarations */
static afs_int32 afs_QueueVCB(struct vcache *avc);

/*
 * afs_FlushVCache
 *
 * Description:
 *	Flush the given vcache entry.
 *
 * Parameters:
 *	avc : Pointer to vcache entry to flush.
 *	slept : Pointer to int to set 1 if we sleep/drop locks, 0 if we don't.
 *
 * Environment:
 *	afs_xvcache lock must be held for writing upon entry to
 *	prevent people from changing the vrefCount field, and to
 *	protect the lruq and hnext fields.
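 *
 *	A hedged usage sketch (modelled on the VLRU scan in afs_NewVCache
 *	below, not a complete recycler; "tvc", "slept" and "code" are the
 *	hypothetical caller's locals, and afs_xvcache is assumed to already
 *	be write-locked as required):
 *
 *	    int slept = 0;
 *	    if (VREFCOUNT(tvc) == 0 && tvc->opens == 0 &&
 *	        (tvc->states & CUnlinkedDel) == 0) {
 *	        code = afs_FlushVCache(tvc, &slept);
 *	        if (slept) {
 *	            (locks were dropped and reacquired; restart the VLRU scan)
 *	        }
 *	    }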
* LOCK: afs_FlushVCache afs_xvcache W * REFCNT: vcache ref count must be zero on entry except for osf1 * RACE: lock is dropped and reobtained, permitting race in caller */ int afs_FlushVCache(struct vcache *avc, int *slept) { /*afs_FlushVCache*/ register afs_int32 i, code; register struct vcache **uvc, *wvc, *tvc; *slept = 0; AFS_STATCNT(afs_FlushVCache); afs_Trace2(afs_iclSetp, CM_TRACE_FLUSHV, ICL_TYPE_POINTER, avc, ICL_TYPE_INT32, avc->states); #ifdef AFS_OSF_ENV AFS_GUNLOCK(); VN_LOCK((struct vnode *)avc); AFS_GLOCK(); #endif code = osi_VM_FlushVCache(avc, slept); if (code) goto bad; if (avc->states & CVFlushed) { code = EBUSY; goto bad; } if (avc->nextfree || !avc->vlruq.prev || !avc->vlruq.next) { /* qv afs.h */ refpanic ("LRU vs. Free inconsistency"); } avc->states |= CVFlushed; /* pull the entry out of the lruq and put it on the free list */ QRemove(&avc->vlruq); avc->vlruq.prev = avc->vlruq.next = (struct afs_q *) 0; /* keep track of # of files that we bulk stat'd, but never used * before they got recycled. */ if (avc->states & CBulkStat) afs_bulkStatsLost++; vcachegen++; /* remove entry from the hash chain */ i = VCHash(&avc->fid); uvc = &afs_vhashT[i]; for(wvc = *uvc; wvc; uvc = &wvc->hnext, wvc = *uvc) { if (avc == wvc) { *uvc = avc->hnext; avc->hnext = (struct vcache *) NULL; break; } } if (!wvc) osi_Panic("flushvcache"); /* not in correct hash bucket */ if (avc->mvid) osi_FreeSmallSpace(avc->mvid); avc->mvid = (struct VenusFid*)0; if (avc->linkData) { afs_osi_Free(avc->linkData, strlen(avc->linkData)+1); avc->linkData = NULL; } afs_FreeAllAxs(&(avc->Access)); /* we can't really give back callbacks on RO files, since the * server only tracks them on a per-volume basis, and we don't * know whether we still have some other files from the same * volume. */ if ((avc->states & CRO) == 0 && avc->callback) { afs_QueueVCB(avc); } ObtainWriteLock(&afs_xcbhash, 460); afs_DequeueCallback(avc); /* remove it from queued callbacks list */ avc->states &= ~(CStatd | CUnique); ReleaseWriteLock(&afs_xcbhash); afs_symhint_inval(avc); if ((avc->states & CForeign) || (avc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (avc); /* if it (could be) a directory */ else osi_dnlc_purgevp (avc); /* * Next, keep track of which vnodes we've deleted for create's * optimistic synchronization algorithm */ afs_allZaps++; if (avc->fid.Fid.Vnode & 1) afs_oddZaps++; else afs_evenZaps++; #if !defined(AFS_OSF_ENV) /* put the entry in the free list */ avc->nextfree = freeVCList; freeVCList = avc; if (avc->vlruq.prev || avc->vlruq.next) { refpanic ("LRU vs. Free inconsistency"); } #else /* This should put it back on the vnode free list since usecount is 1 */ afs_vcount--; vSetType(avc, VREG); if (VREFCOUNT(avc) > 0) { VN_UNLOCK((struct vnode *)avc); AFS_RELE((struct vnode *)avc); } else { if (afs_norefpanic) { printf ("flush vc refcnt < 1"); afs_norefpanic++; (void) vgone(avc, VX_NOSLEEP, (struct vnodeops *) 0); AFS_GLOCK(); VN_UNLOCK((struct vnode *)avc); } else osi_Panic ("flush vc refcnt < 1"); } #endif /* AFS_OSF_ENV */ avc->states |= CVFlushed; return 0; bad: #ifdef AFS_OSF_ENV VN_UNLOCK((struct vnode *)avc); #endif return code; } /*afs_FlushVCache*/ #ifndef AFS_SGI_ENV /* * afs_InactiveVCache * * The core of the inactive vnode op for all but IRIX. */ void afs_InactiveVCache(struct vcache *avc, struct AFS_UCRED *acred) { extern afs_rwlock_t afs_xdcache, afs_xvcache; AFS_STATCNT(afs_inactive); if (avc->states & CDirty) { /* we can't keep trying to push back dirty data forever. Give up. 
	 */
	afs_InvalidateAllSegments(avc);	/* turns off dirty bit */
    }

    avc->states &= ~CMAPPED;	/* mainly used by SunOS 4.0.x */
    avc->states &= ~CDirty;	/* Turn it off */
    if (avc->states & CUnlinked) {
	if (CheckLock(&afs_xvcache) || CheckLock(&afs_xdcache)) {
	    avc->states |= CUnlinkedDel;
	    return;
	}
	afs_remunlink(avc, 1);	/* ignore any return code */
    }
}
#endif

/*
 * afs_AllocCBR
 *
 * Description: allocate a callback return structure from the
 * free list and return it.
 *
 * Env: The alloc and free routines are both called with the afs_xvcb lock
 * held, so we don't have to worry about blocking in osi_Alloc.
 */
static struct afs_cbr *afs_cbrSpace = 0;
struct afs_cbr *afs_AllocCBR()
{
    register struct afs_cbr *tsp;
    int i;

    while (!afs_cbrSpace) {
	if (afs_stats_cmperf.CallBackAlloced >= 2) {
	    /* don't allocate more than 2 * AFS_NCBRS for now */
	    afs_FlushVCBs(0);
	    afs_stats_cmperf.CallBackFlushes++;
	} else {
	    /* try allocating */
	    tsp = (struct afs_cbr *) afs_osi_Alloc(AFS_NCBRS * sizeof(struct afs_cbr));
	    for(i=0; i < AFS_NCBRS-1; i++) {
		tsp[i].next = &tsp[i+1];
	    }
	    tsp[AFS_NCBRS-1].next = 0;
	    afs_cbrSpace = tsp;
	    afs_stats_cmperf.CallBackAlloced++;
	}
    }
    tsp = afs_cbrSpace;
    afs_cbrSpace = tsp->next;
    return tsp;
}

/*
 * afs_FreeCBR
 *
 * Description: free a callback return structure.
 *
 * Parameters:
 *	asp -- the address of the structure to free.
 *
 * Environment: the xvcb lock is held over these calls.
 */
afs_FreeCBR(asp)
register struct afs_cbr *asp;
{
    asp->next = afs_cbrSpace;
    afs_cbrSpace = asp;
    return 0;
}

/*
 * afs_FlushVCBs
 *
 * Description: flush all queued callbacks to all servers.
 *
 * Parameters: none.
 *
 * Environment: holds xvcb lock over RPC to guard against race conditions
 *	when a new callback is granted for the same file later on.
 */
afs_int32 afs_FlushVCBs (afs_int32 lockit)
{
    struct AFSFid tfids[AFS_MAXCBRSCALL];
    struct AFSCallBack callBacks[1];
    struct AFSCBFids fidArray;
    struct AFSCBs cbArray;
    afs_int32 code;
    struct afs_cbr *tcbrp;
    int tcount;
    struct server *tsp;
    int i;
    struct vrequest treq;
    struct conn *tc;
    int safety1, safety2, safety3;
    extern int afs_totalServers;
    XSTATS_DECLS

    if (code = afs_InitReq(&treq, &afs_osi_cred)) return code;
    treq.flags |= O_NONBLOCK;

    if (lockit) MObtainWriteLock(&afs_xvcb,273);
    ObtainReadLock(&afs_xserver);
    for(i=0; i<NSERVERS; i++) {
	for(safety1 = 0, tsp = afs_servers[i]; tsp; tsp = tsp->next, safety1++) {
	    /* don't have any */
	    if (tsp->cbrs == (struct afs_cbr *) 0) continue;

	    /* otherwise, grab a block of AFS_MAXCBRSCALL from the list
	     * and make an RPC, over and over again.
	     */
	    tcount = 0;	/* number found so far */
	    for (safety2 = 0; safety2 < afs_cacheStats ; safety2++) {
		if (tcount >= AFS_MAXCBRSCALL || !tsp->cbrs) {
		    /* if buffer is full, or we've queued all we're going
		     * to from this server, we should flush out the
		     * callbacks.
		     */
		    fidArray.AFSCBFids_len = tcount;
		    fidArray.AFSCBFids_val = (struct AFSFid *) tfids;
		    cbArray.AFSCBs_len = 1;
		    cbArray.AFSCBs_val = callBacks;
		    callBacks[0].CallBackType = CB_EXCLUSIVE;
		    for (safety3 = 0; safety3 < MAXHOSTS*2; safety3++) {
			tc = afs_ConnByHost(tsp, tsp->cell->fsport,
					    tsp->cell->cell, &treq, 0, SHARED_LOCK);
			if (tc) {
			    XSTATS_START_TIME(AFS_STATS_FS_RPCIDX_GIVEUPCALLBACKS);
			    RX_AFS_GUNLOCK();
			    code = RXAFS_GiveUpCallBacks(tc->id, &fidArray, &cbArray);
			    RX_AFS_GLOCK();
			    XSTATS_END_TIME;
			} else
			    code = -1;
			if (!afs_Analyze(tc, code, 0, &treq,
					 AFS_STATS_FS_RPCIDX_GIVEUPCALLBACKS,
					 SHARED_LOCK, tsp->cell)) {
			    break;
			}
		    }
		    /* ignore return code, since callbacks may have
		     * been returned anyway, we shouldn't leave them
		     * around to be returned again.
		     *
		     * Next, see if we are done with this server, and if so,
		     * break to deal with the next one.
		     */
		    if (!tsp->cbrs) break;
		    tcount = 0;
		}	/* if to flush full buffer */

		/* if we make it here, we have an entry at the head of cbrs,
		 * which we should copy to the file ID array and then free.
		 */
		tcbrp = tsp->cbrs;
		tfids[tcount++] = tcbrp->fid;
		tsp->cbrs = tcbrp->next;
		afs_FreeCBR(tcbrp);
	    }	/* while loop for this one server */
	    if (safety2 > afs_cacheStats) {
		afs_warn("possible internal error afs_flushVCBs (%d)\n", safety2);
	    }
	}	/* for loop for this hash chain */
    }	/* loop through all hash chains */
    if (safety1 > afs_totalServers+2) {
	afs_warn("AFS internal error (afs_flushVCBs) (%d > %d), continuing...\n",
		 safety1, afs_totalServers+2);
	if (afs_paniconwarn)
	    osi_Panic("afs_flushVCBS safety1");
    }

    ReleaseReadLock(&afs_xserver);
    if (lockit) MReleaseWriteLock(&afs_xvcb);
    return 0;
}

/*
 * afs_QueueVCB
 *
 * Description:
 *	Queue a callback on the given fid.
 *
 * Parameters:
 *	avc: vcache entry
 *
 * Environment:
 *	Locks the xvcb lock.
 *	Called when the xvcache lock is already held.
 */
static afs_int32 afs_QueueVCB(struct vcache *avc)
{
    register struct server *tsp;
    register struct afs_cbr *tcbp;

    AFS_STATCNT(afs_QueueVCB);
    /* The callback is really just a struct server ptr. */
    tsp = (struct server *)(avc->callback);

    /* we now have a pointer to the server, so we just allocate
     * a queue entry and queue it.
     */
    MObtainWriteLock(&afs_xvcb,274);
    tcbp = afs_AllocCBR();
    tcbp->fid = avc->fid.Fid;
    tcbp->next = tsp->cbrs;
    tsp->cbrs = tcbp;

    /* now release locks and return */
    MReleaseWriteLock(&afs_xvcb);
    return 0;
}

/*
 * afs_RemoveVCB
 *
 * Description:
 *	Remove a queued callback by looking through all the servers
 *	to see if any have this callback queued.
 *
 * Parameters:
 *	afid: The fid we want cleansed of queued callbacks.
 *
 * Environment:
 *	Locks xvcb and xserver locks.
 *	Typically called with xdcache, xvcache and/or individual vcache
 *	entries locked.
 */
afs_RemoveVCB(afid)
register struct VenusFid *afid;
{ /*afs_RemoveVCB*/
    register int i, j;
    register struct server *tsp;
    register struct afs_cbr *tcbrp;
    struct afs_cbr **lcbrpp;

    AFS_STATCNT(afs_RemoveVCB);
    MObtainWriteLock(&afs_xvcb,275);
    ObtainReadLock(&afs_xserver);
    for(i=0; i<NSERVERS; i++) {
	for(tsp = afs_servers[i]; tsp; tsp = tsp->next) {
	    /* if cell is known, and is wrong, then skip this server */
	    if (tsp->cell && tsp->cell->cell != afid->Cell) continue;

	    /*
	     * Otherwise, iterate through file IDs we're sending to the
	     * server.
	     */
	    lcbrpp = &tsp->cbrs;	/* first queued return callback */
	    for(tcbrp = *lcbrpp; tcbrp; lcbrpp = &tcbrp->next, tcbrp = *lcbrpp) {
		if (afid->Fid.Volume == tcbrp->fid.Volume &&
		    afid->Fid.Unique == tcbrp->fid.Unique &&
		    afid->Fid.Vnode == tcbrp->fid.Vnode) {
		    *lcbrpp = tcbrp->next;	/* unthread from list */
		    afs_FreeCBR(tcbrp);
		    goto done;
		}
	    }
	}
    }
  done:
    ReleaseReadLock(&afs_xserver);
    MReleaseWriteLock(&afs_xvcb);
    return 0;
} /*afs_RemoveVCB*/

/*
 * afs_NewVCache
 *
 * Description:
 *	This routine is responsible for allocating a new cache entry
 *	from the free list.  It formats the cache entry and inserts it
 *	into the appropriate hash tables.  It must be called with
 *	afs_xvcache write-locked so as to prevent several processes from
 *	trying to create a new cache entry simultaneously.
 *
 * Parameters:
 *	afid : The file id of the file whose cache entry is being
 *	       created.
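 *
 *	A minimal allocation sketch (it mirrors what afs_GetVCache does
 *	later in this file; the caller is assumed to hold afs_xvcache
 *	shared and to upgrade it around the call, and "afid" is the fid
 *	being instantiated):
 *
 *	    UpgradeSToWLock(&afs_xvcache, 21);
 *	    tvc = afs_NewVCache(afid, (struct server *)0, 1, WRITE_LOCK);
 *	    ConvertWToSLock(&afs_xvcache);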
*/ /* LOCK: afs_NewVCache afs_xvcache W */ struct vcache *afs_NewVCache(struct VenusFid *afid, struct server *serverp, afs_int32 lockit, afs_int32 locktype) { struct vcache *tvc; afs_int32 i; afs_int32 anumber = VCACHE_FREE; #ifdef AFS_AIX_ENV struct gnode *gnodepnt; #endif #ifdef AFS_MACH_ENV struct vm_info * vm_info_ptr; #endif /* AFS_MACH_ENV */ #ifdef AFS_OSF_ENV struct vcache *nvc; #endif /* AFS_OSF_ENV */ struct afs_q *tq, *uq; int code, fv_slept; AFS_STATCNT(afs_NewVCache); #ifdef AFS_LINUX22_ENV if (!freeVCList) { /* Free some if possible. */ struct afs_q *tq, *uq; int i; char *panicstr; int vmax = 2 * afs_cacheStats; int vn = VCACHE_FREE; i = 0; for(tq = VLRU.prev; tq != &VLRU && vn > 0; tq = uq) { tvc = QTOV(tq); uq = QPrev(tq); if (tvc->states & CVFlushed) refpanic ("CVFlushed on VLRU"); else if (i++ > vmax) refpanic ("Exceeded pool of AFS vnodes(VLRU cycle?)"); else if (QNext(uq) != tq) refpanic ("VLRU inconsistent"); if (tvc == afs_globalVp) continue; if ( VREFCOUNT(tvc) && tvc->opens == 0 ) { struct inode *ip = (struct inode*)tvc; if (list_empty(&ip->i_dentry)) { vn --; } else { struct list_head *cur; struct list_head *head = &ip->i_dentry; int all = 1; restart: DLOCK(); cur = head; while ((cur = cur->next) != head) { struct dentry *dentry = list_entry(cur, struct dentry, d_alias); if (!DCOUNT(dentry)) { AFS_GUNLOCK(); DGET(dentry); DUNLOCK(); d_drop(dentry); dput(dentry); AFS_GLOCK(); goto restart; } else { all = 0; } } DUNLOCK(); if (all) vn --; } } if (tq == uq) break; } } #endif /* AFS_LINUX22_ENV */ #ifdef AFS_OSF_ENV #ifdef AFS_OSF30_ENV if (afs_vcount >= afs_maxvcount) #else /* * If we are using > 33 % of the total system vnodes for AFS vcache * entries or we are using the maximum number of vcache entries, * then free some. (if our usage is > 33% we should free some, if * our usage is > afs_maxvcount, set elsewhere to 0.5*nvnode, * we _must_ free some -- no choice). */ if ( (( 3 * afs_vcount ) > nvnode) || ( afs_vcount >= afs_maxvcount )) #endif { struct afs_q *tq, *uq; int i; char *panicstr; i = 0; for(tq = VLRU.prev; tq != &VLRU && anumber > 0; tq = uq) { tvc = QTOV(tq); uq = QPrev(tq); if (tvc->states & CVFlushed) refpanic ("CVFlushed on VLRU"); else if (i++ > afs_maxvcount) refpanic ("Exceeded pool of AFS vnodes(VLRU cycle?)"); else if (QNext(uq) != tq) refpanic ("VLRU inconsistent"); else if (VREFCOUNT(tvc) < 1) refpanic ("refcnt 0 on VLRU"); if ( VREFCOUNT(tvc) == 1 && tvc->opens == 0 && (tvc->states & CUnlinkedDel) == 0) { code = afs_FlushVCache(tvc, &fv_slept); if (code == 0) { anumber--; } if (fv_slept) { uq = VLRU.prev; i = 0; continue; /* start over - may have raced. */ } } if (tq == uq) break; } if (anumber == VCACHE_FREE) { printf("NewVCache: warning none freed, using %d of %d\n", afs_vcount, afs_maxvcount); if (afs_vcount >= afs_maxvcount) { osi_Panic("NewVCache - none freed"); /* XXX instead of panicing, should do afs_maxvcount++ and magic up another one */ } } } AFS_GUNLOCK(); if (getnewvnode(MOUNT_AFS, &Afs_vnodeops, &nvc)) { /* What should we do ???? 
*/ osi_Panic("afs_NewVCache: no more vnodes"); } AFS_GLOCK(); tvc = nvc; tvc->nextfree = (struct vcache *)0; afs_vcount++; #else /* AFS_OSF_ENV */ /* pull out a free cache entry */ if (!freeVCList) { i = 0; for(tq = VLRU.prev; (anumber > 0) && (tq != &VLRU); tq = uq) { tvc = QTOV(tq); uq = QPrev(tq); if (tvc->states & CVFlushed) refpanic("CVFlushed on VLRU"); else if (i++ > 2*afs_cacheStats) /* even allowing for a few xallocs...*/ refpanic("Increase -stat parameter of afsd(VLRU cycle?)"); else if (QNext(uq) != tq) refpanic("VLRU inconsistent"); #ifdef AFS_DARWIN_ENV if (tvc->opens == 0 && ((tvc->states & CUnlinkedDel) == 0) && VREFCOUNT(tvc) == 1 && UBCINFOEXISTS(&tvc->v)) { osi_VM_TryReclaim(tvc, &fv_slept); if (fv_slept) { uq = VLRU.prev; i = 0; continue; /* start over - may have raced. */ } } #endif #if defined(AFS_FBSD_ENV) if (VREFCOUNT(tvc) == 1 && tvc->opens == 0 && (tvc->states & CUnlinkedDel) == 0) { if (!(VOP_LOCK(&tvc->v, LK_EXCLUSIVE, curproc))) { if (VREFCOUNT(tvc) == 1 && tvc->opens == 0 && (tvc->states & CUnlinkedDel) == 0) { VREFCOUNT_DEC(tvc); AFS_GUNLOCK(); /* perhaps inline inactive for locking */ VOP_INACTIVE(&tvc->v, curproc); AFS_GLOCK(); } else { VOP_UNLOCK(&tvc->v, 0, curproc); } } } #endif if (VREFCOUNT(tvc) == 0 && tvc->opens == 0 && (tvc->states & CUnlinkedDel) == 0) { code = afs_FlushVCache(tvc, &fv_slept); if (code == 0) { anumber--; } if (fv_slept) { uq = VLRU.prev; i = 0; continue; /* start over - may have raced. */ } } if (tq == uq ) break; } } if (!freeVCList) { /* none free, making one is better than a panic */ afs_stats_cmperf.vcacheXAllocs++; /* count in case we have a leak */ tvc = (struct vcache *) afs_osi_Alloc(sizeof (struct vcache)); #ifdef AFS_AIX32_ENV pin((char *)tvc, sizeof(struct vcache)); /* XXX */ #endif #ifdef AFS_MACH_ENV /* In case it still comes here we need to fill this */ tvc->v.v_vm_info = VM_INFO_NULL; vm_info_init(tvc->v.v_vm_info); /* perhaps we should also do close_flush on non-NeXT mach systems; * who knows; we don't currently have the sources. 
*/ #endif /* AFS_MACH_ENV */ #if defined(AFS_SGI_ENV) { char name[METER_NAMSZ]; memset(tvc, 0, sizeof(struct vcache)); tvc->v.v_number = ++afsvnumbers; tvc->vc_rwlockid = OSI_NO_LOCKID; initnsema(&tvc->vc_rwlock, 1, makesname(name, "vrw", tvc->v.v_number)); #ifndef AFS_SGI53_ENV initnsema(&tvc->v.v_sync, 0, makesname(name, "vsy", tvc->v.v_number)); #endif #ifndef AFS_SGI62_ENV initnlock(&tvc->v.v_lock, makesname(name, "vlk", tvc->v.v_number)); #endif } #endif /* AFS_SGI_ENV */ } else { tvc = freeVCList; /* take from free list */ freeVCList = tvc->nextfree; tvc->nextfree = (struct vcache *)0; } #endif /* AFS_OSF_ENV */ #ifdef AFS_MACH_ENV vm_info_ptr = tvc->v.v_vm_info; #endif /* AFS_MACH_ENV */ #if !defined(AFS_SGI_ENV) && !defined(AFS_OSF_ENV) memset((char *)tvc, 0, sizeof(struct vcache)); #else tvc->uncred = 0; #endif RWLOCK_INIT(&tvc->lock, "vcache lock"); #if defined(AFS_SUN5_ENV) RWLOCK_INIT(&tvc->vlock, "vcache vlock"); #endif /* defined(AFS_SUN5_ENV) */ #ifdef AFS_MACH_ENV tvc->v.v_vm_info = vm_info_ptr; tvc->v.v_vm_info->pager = MEMORY_OBJECT_NULL; #endif /* AFS_MACH_ENV */ tvc->parentVnode = 0; tvc->mvid = (struct VenusFid *) 0; tvc->linkData = (char *) 0; tvc->cbExpires = 0; tvc->opens = 0; tvc->execsOrWriters = 0; tvc->flockCount = 0; tvc->anyAccess = 0; tvc->states = 0; tvc->last_looker = 0; tvc->fid = *afid; tvc->asynchrony = -1; tvc->vc_error = 0; afs_symhint_inval(tvc); #ifdef AFS_TEXT_ENV tvc->flushDV.low = tvc->flushDV.high = AFS_MAXDV; #endif hzero(tvc->mapDV); tvc->truncPos = AFS_NOTRUNC; /* don't truncate until we need to */ hzero(tvc->m.DataVersion); /* in case we copy it into flushDV */ #ifdef AFS_OSF_ENV /* Hold it for the LRU (should make count 2) */ VN_HOLD((struct vnode *)tvc); #else /* AFS_OSF_ENV */ VREFCOUNT_SET(tvc, 1); /* us */ #endif /* AFS_OSF_ENV */ #ifdef AFS_AIX32_ENV LOCK_INIT(&tvc->pvmlock, "vcache pvmlock"); tvc->vmh = tvc->segid = NULL; tvc->credp = NULL; #endif #if defined(AFS_SUN_ENV) || defined(AFS_ALPHA_ENV) || defined(AFS_SUN5_ENV) #if defined(AFS_SUN5_ENV) rw_init(&tvc->rwlock, "vcache rwlock", RW_DEFAULT, NULL); #if defined(AFS_SUN55_ENV) /* This is required if the kaio (kernel aynchronous io) ** module is installed. Inside the kernel, the function ** check_vp( common/os/aio.c) checks to see if the kernel has ** to provide asynchronous io for this vnode. This ** function extracts the device number by following the ** v_data field of the vnode. If we do not set this field ** then the system panics. The value of the v_data field ** is not really important for AFS vnodes because the kernel ** does not do asynchronous io for regular files. Hence, ** for the time being, we fill up the v_data field with the ** vnode pointer itself. 
*/ tvc->v.v_data = (char *)tvc; #endif /* AFS_SUN55_ENV */ #endif afs_BozonInit(&tvc->pvnLock, tvc); #endif tvc->Access = NULL; tvc->callback = serverp; /* to minimize chance that clear request is lost */ /* initialize vnode data, note vrefCount is v.v_count */ #ifdef AFS_AIX_ENV /* Don't forget to free the gnode space */ tvc->v.v_gnode = gnodepnt = (struct gnode *) osi_AllocSmallSpace(sizeof(struct gnode)); memset((char *)gnodepnt, 0, sizeof(struct gnode)); #endif #ifdef AFS_SGI64_ENV memset((void*)&(tvc->vc_bhv_desc), 0, sizeof(tvc->vc_bhv_desc)); bhv_desc_init(&(tvc->vc_bhv_desc), tvc, tvc, &Afs_vnodeops); #ifdef AFS_SGI65_ENV vn_bhv_head_init(&(tvc->v.v_bh), "afsvp"); vn_bhv_insert_initial(&(tvc->v.v_bh), &(tvc->vc_bhv_desc)); #else bhv_head_init(&(tvc->v.v_bh)); bhv_insert_initial(&(tvc->v.v_bh), &(tvc->vc_bhv_desc)); #endif #ifdef AFS_SGI65_ENV tvc->v.v_mreg = tvc->v.v_mregb = (struct pregion*)tvc; #ifdef VNODE_TRACING tvc->v.v_trace = ktrace_alloc(VNODE_TRACE_SIZE, 0); #endif init_bitlock(&tvc->v.v_pcacheflag, VNODE_PCACHE_LOCKBIT, "afs_pcache", tvc->v.v_number); init_mutex(&tvc->v.v_filocksem, MUTEX_DEFAULT, "afsvfl", (long)tvc); init_mutex(&tvc->v.v_buf_lock, MUTEX_DEFAULT, "afsvnbuf", (long)tvc); #endif vnode_pcache_init(&tvc->v); #if defined(DEBUG) && defined(VNODE_INIT_BITLOCK) /* Above define is never true execpt in SGI test kernels. */ init_bitlock(&(tvc->v.v_flag, VLOCK, "vnode", tvc->v.v_number); #endif #ifdef INTR_KTHREADS AFS_VN_INIT_BUF_LOCK(&(tvc->v)); #endif #else SetAfsVnode((struct vnode *)tvc); #endif /* AFS_SGI64_ENV */ #ifdef AFS_DARWIN_ENV tvc->v.v_ubcinfo = UBC_INFO_NULL; lockinit(&tvc->rwlock, PINOD, "vcache rwlock", 0, 0); cache_purge((struct vnode *)tvc); tvc->v.v_data=tvc; tvc->v.v_tag=VT_AFS; /* VLISTNONE(&tvc->v); */ tvc->v.v_freelist.tqe_next=0; tvc->v.v_freelist.tqe_prev=(struct vnode **)0xdeadb; /*tvc->vrefCount++;*/ #endif #ifdef AFS_FBSD_ENV lockinit(&tvc->rwlock, PINOD, "vcache rwlock", 0, 0); cache_purge((struct vnode *)tvc); tvc->v.v_data=tvc; tvc->v.v_tag=VT_AFS; tvc->v.v_usecount++; /* steal an extra ref for now so vfree never happens */ /* This extra ref is dealt with above... */ #endif /* * The proper value for mvstat (for root fids) is setup by the caller. */ tvc->mvstat = 0; if (afid->Fid.Vnode == 1 && afid->Fid.Unique == 1) tvc->mvstat = 2; if (afs_globalVFS == 0) osi_Panic("afs globalvfs"); vSetVfsp(tvc, afs_globalVFS); vSetType(tvc, VREG); #ifdef AFS_AIX_ENV tvc->v.v_vfsnext = afs_globalVFS->vfs_vnodes; /* link off vfs */ tvc->v.v_vfsprev = NULL; afs_globalVFS->vfs_vnodes = &tvc->v; if (tvc->v.v_vfsnext != NULL) tvc->v.v_vfsnext->v_vfsprev = &tvc->v; tvc->v.v_next = gnodepnt->gn_vnode; /*Single vnode per gnode for us!*/ gnodepnt->gn_vnode = &tvc->v; #endif #ifdef AFS_DEC_ENV tvc->v.g_dev = ((struct mount *)afs_globalVFS->vfs_data)->m_dev; #endif #if defined(AFS_DUX40_ENV) insmntque(tvc, afs_globalVFS, &afs_ubcops); #else #ifdef AFS_OSF_ENV /* Is this needed??? 
*/ insmntque(tvc, afs_globalVFS); #endif /* AFS_OSF_ENV */ #endif /* AFS_DUX40_ENV */ #if defined(AFS_SGI_ENV) VN_SET_DPAGES(&(tvc->v), (struct pfdat*)NULL); osi_Assert((tvc->v.v_flag & VINACT) == 0); tvc->v.v_flag = 0; osi_Assert(VN_GET_PGCNT(&(tvc->v)) == 0); osi_Assert(tvc->mapcnt == 0 && tvc->vc_locktrips == 0); osi_Assert(tvc->vc_rwlockid == OSI_NO_LOCKID); osi_Assert(tvc->v.v_filocks == NULL); #if !defined(AFS_SGI65_ENV) osi_Assert(tvc->v.v_filocksem == NULL); #endif osi_Assert(tvc->cred == NULL); #ifdef AFS_SGI64_ENV vnode_pcache_reinit(&tvc->v); tvc->v.v_rdev = NODEV; #endif vn_initlist((struct vnlist *)&tvc->v); tvc->lastr = 0; #endif /* AFS_SGI_ENV */ #if defined(AFS_LINUX22_ENV) { struct inode *ip = (struct inode*)tvc; sema_init(&ip->i_sem, 1); #if defined(AFS_LINUX24_ENV) sema_init(&ip->i_zombie, 1); init_waitqueue_head(&ip->i_wait); spin_lock_init(&ip->i_data.i_shared_lock); #ifdef STRUCT_ADDRESS_SPACE_HAS_PAGE_LOCK spin_lock_init(&ip->i_data.page_lock); #endif INIT_LIST_HEAD(&ip->i_data.clean_pages); INIT_LIST_HEAD(&ip->i_data.dirty_pages); INIT_LIST_HEAD(&ip->i_data.locked_pages); INIT_LIST_HEAD(&ip->i_dirty_buffers); #ifdef STRUCT_INODE_HAS_I_DIRTY_DATA_BUFFERS INIT_LIST_HEAD(&ip->i_dirty_data_buffers); #endif #ifdef STRUCT_INODE_HAS_I_DEVICES INIT_LIST_HEAD(&ip->i_devices); #endif ip->i_data.host = (void*) ip; ip->i_mapping = &ip->i_data; #ifdef STRUCT_INODE_HAS_I_TRUNCATE_SEM init_rwsem(&ip->i_truncate_sem); #endif #else sema_init(&ip->i_atomic_write, 1); init_waitqueue(&ip->i_wait); #endif INIT_LIST_HEAD(&ip->i_hash); INIT_LIST_HEAD(&ip->i_dentry); if (afs_globalVFS) { ip->i_dev = afs_globalVFS->s_dev; ip->i_sb = afs_globalVFS; } } #endif tvc->h1.dchint = 0; osi_dnlc_purgedp(tvc); /* this may be overkill */ memset((char *)&(tvc->quick), 0, sizeof(struct vtodc)); memset((char *)&(tvc->callsort), 0, sizeof(struct afs_q)); tvc->slocks = (struct SimpleLocks *)0; i = VCHash(afid); tvc->hnext = afs_vhashT[i]; afs_vhashT[i] = tvc; if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) { refpanic ("NewVCache VLRU inconsistent"); } QAdd(&VLRU, &tvc->vlruq); /* put in lruq */ if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) { refpanic ("NewVCache VLRU inconsistent2"); } if (tvc->vlruq.next->prev != &(tvc->vlruq)) { refpanic ("NewVCache VLRU inconsistent3"); } if (tvc->vlruq.prev->next != &(tvc->vlruq)) { refpanic ("NewVCache VLRU inconsistent4"); } vcachegen++; return tvc; } /*afs_NewVCache*/ /* * afs_FlushActiveVcaches * * Description: * ??? * * Parameters: * doflocks : Do we handle flocks? 
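 *
 *	Illustrative invocations (a sketch only; the real caller is the
 *	cache manager's background maintenance code, which is not part of
 *	this file). The flag follows the doflocks handling in the body
 *	below:
 *
 *	    afs_FlushActiveVcaches(1);	(also send ExtendLock keep-alives
 *	                                 for entries holding flocks)
 *	    afs_FlushActiveVcaches(0);	(skip the flock keep-alive RPCs)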
 */
/* LOCK: afs_FlushActiveVcaches afs_xvcache N */
void afs_FlushActiveVcaches(doflocks)
register afs_int32 doflocks;
{ /*afs_FlushActiveVcaches*/
    register struct vcache *tvc;
    register int i;
    register struct conn *tc;
    register afs_int32 code;
    register struct AFS_UCRED *cred;
    struct vrequest treq, ureq;
    struct AFSVolSync tsync;
    int didCore;
    XSTATS_DECLS

    AFS_STATCNT(afs_FlushActiveVcaches);
    ObtainReadLock(&afs_xvcache);
    for(i=0; i<VCSIZE; i++) {
	for(tvc = afs_vhashT[i]; tvc; tvc = tvc->hnext) {
	    if (doflocks && tvc->flockCount != 0) {
		/* if this entry has a flock, send a keep-alive call out */
		osi_vnhold(tvc, 0);
		ReleaseReadLock(&afs_xvcache);
		ObtainWriteLock(&tvc->lock,51);
		do {
		    afs_InitReq(&treq, &afs_osi_cred);
		    treq.flags |= O_NONBLOCK;
		    tc = afs_Conn(&tvc->fid, &treq, SHARED_LOCK);
		    if (tc) {
			XSTATS_START_TIME(AFS_STATS_FS_RPCIDX_EXTENDLOCK);
			RX_AFS_GUNLOCK();
			code = RXAFS_ExtendLock(tc->id,
						(struct AFSFid *) &tvc->fid.Fid, &tsync);
			RX_AFS_GLOCK();
			XSTATS_END_TIME;
		    } else
			code = -1;
		} while (afs_Analyze(tc, code, &tvc->fid, &treq,
				     AFS_STATS_FS_RPCIDX_EXTENDLOCK,
				     SHARED_LOCK, (struct cell *)0));
		ReleaseWriteLock(&tvc->lock);
		ObtainReadLock(&afs_xvcache);
		AFS_FAST_RELE(tvc);
	    }
	    didCore = 0;
	    if ((tvc->states & CCore) || (tvc->states & CUnlinkedDel)) {
		/*
		 * Don't let it evaporate in case someone else is in
		 * this code.  Also, drop the afs_xvcache lock while
		 * getting vcache locks.
		 */
		osi_vnhold(tvc,0);
		ReleaseReadLock(&afs_xvcache);
#if defined(AFS_SUN_ENV) || defined(AFS_ALPHA_ENV)
		afs_BozonLock(&tvc->pvnLock, tvc);
#endif
#if defined(AFS_SGI_ENV)
		/*
		 * That's because if we come in via the CUnlinkedDel bit
		 * state path we'll have 0 refcnt.
		 */
		osi_Assert(VREFCOUNT(tvc) > 0);
		AFS_RWLOCK((vnode_t *)tvc, VRWLOCK_WRITE);
#endif
		ObtainWriteLock(&tvc->lock,52);
		if (tvc->states & CCore) {
		    tvc->states &= ~CCore;
		    /* XXXX Find better place-holder for cred XXXX */
		    cred = (struct AFS_UCRED *) tvc->linkData;
		    tvc->linkData = (char *) 0;	/* XXX */
		    afs_InitReq(&ureq, cred);
		    afs_Trace2(afs_iclSetp, CM_TRACE_ACTCCORE,
			       ICL_TYPE_POINTER, tvc,
			       ICL_TYPE_INT32, tvc->execsOrWriters);
		    code = afs_StoreOnLastReference(tvc, &ureq);
		    ReleaseWriteLock(&tvc->lock);
#if defined(AFS_SUN_ENV) || defined(AFS_ALPHA_ENV)
		    afs_BozonUnlock(&tvc->pvnLock, tvc);
#endif
		    hzero(tvc->flushDV);
		    osi_FlushText(tvc);
		    didCore = 1;
		    if (code && code != VNOVNODE) {
			afs_StoreWarn(code, tvc->fid.Fid.Volume,
				      /* /dev/console */ 1);
		    }
		} else if (tvc->states & CUnlinkedDel) {
		    /*
		     * Ignore errors
		     */
		    ReleaseWriteLock(&tvc->lock);
#if defined(AFS_SUN_ENV) || defined(AFS_ALPHA_ENV)
		    afs_BozonUnlock(&tvc->pvnLock, tvc);
#endif
#if defined(AFS_SGI_ENV)
		    AFS_RWUNLOCK((vnode_t *)tvc, VRWLOCK_WRITE);
#endif
		    afs_remunlink(tvc, 0);
#if defined(AFS_SGI_ENV)
		    AFS_RWLOCK((vnode_t *)tvc, VRWLOCK_WRITE);
#endif
		} else {
		    /* lost (or won, perhaps) the race condition */
		    ReleaseWriteLock(&tvc->lock);
#if defined(AFS_SUN_ENV) || defined(AFS_ALPHA_ENV)
		    afs_BozonUnlock(&tvc->pvnLock, tvc);
#endif
		}
#if defined(AFS_SGI_ENV)
		AFS_RWUNLOCK((vnode_t *)tvc, VRWLOCK_WRITE);
#endif
		ObtainReadLock(&afs_xvcache);
		AFS_FAST_RELE(tvc);
		if (didCore) {
#ifdef AFS_GFS_ENV
		    VREFCOUNT_DEC(tvc);
#else
		    AFS_RELE((struct vnode *)tvc);
#endif
		    /* Matches write code setting CCore flag */
		    crfree(cred);
		}
	    }
#ifdef AFS_DARWIN_ENV
	    if (VREFCOUNT(tvc) == 1 && UBCINFOEXISTS(&tvc->v)) {
		if (tvc->opens) panic("flushactive open, hasubc, but refcnt 1");
		osi_VM_TryReclaim(tvc,0);
	    }
#endif
	}
    }
    ReleaseReadLock(&afs_xvcache);
} /*afs_FlushActiveVcaches*/

/*
 * afs_VerifyVCache
 *
 * Description:
 *	Make sure a cache entry is up-to-date status-wise.
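 *
 *	A hedged sketch of the cheap fast path described in the NOTE
 *	below (hypothetical caller; "areq" is assumed to be an
 *	already-initialized vrequest):
 *
 *	    if (avc->states & CStatd)
 *	        return 0;			(status already valid)
 *	    return afs_VerifyVCache2(avc, areq);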
* * NOTE: everywhere that calls this can potentially be sped up * by checking CStatd first, and avoiding doing the InitReq * if this is up-to-date. * * Anymore, the only places that call this KNOW already that the * vcache is not up-to-date, so we don't screw around. * * Parameters: * avc : Ptr to vcache entry to verify. * areq : ??? */ int afs_VerifyVCache2(struct vcache *avc, struct vrequest *areq) { register struct vcache *tvc; AFS_STATCNT(afs_VerifyVCache); #if defined(AFS_OSF_ENV) ObtainReadLock(&avc->lock); if (afs_IsWired(avc)) { ReleaseReadLock(&avc->lock); return 0; } ReleaseReadLock(&avc->lock); #endif /* AFS_OSF_ENV */ /* otherwise we must fetch the status info */ ObtainWriteLock(&avc->lock,53); if (avc->states & CStatd) { ReleaseWriteLock(&avc->lock); return 0; } ObtainWriteLock(&afs_xcbhash, 461); avc->states &= ~( CStatd | CUnique ); avc->callback = (struct server *)0; afs_DequeueCallback(avc); ReleaseWriteLock(&afs_xcbhash); ReleaseWriteLock(&avc->lock); /* since we've been called back, or the callback has expired, * it's possible that the contents of this directory, or this * file's name have changed, thus invalidating the dnlc contents. */ if ((avc->states & CForeign) || (avc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (avc); else osi_dnlc_purgevp (avc); /* fetch the status info */ tvc = afs_GetVCache(&avc->fid, areq, (afs_int32*)0, avc, READ_LOCK); if (!tvc) return ENOENT; /* Put it back; caller has already incremented vrefCount */ afs_PutVCache(tvc, READ_LOCK); return 0; } /*afs_VerifyVCache*/ /* * afs_SimpleVStat * * Description: * Simple copy of stat info into cache. * * Parameters: * avc : Ptr to vcache entry involved. * astat : Ptr to stat info to copy. * * Environment: * Nothing interesting. * * Callers: as of 1992-04-29, only called by WriteVCache */ static void afs_SimpleVStat(avc, astat, areq) register struct vcache *avc; register struct AFSFetchStatus *astat; struct vrequest *areq; { /*afs_SimpleVStat*/ afs_size_t length; AFS_STATCNT(afs_SimpleVStat); #ifdef AFS_SGI_ENV if ((avc->execsOrWriters <= 0) && !afs_DirtyPages(avc) && !AFS_VN_MAPPED((vnode_t*)avc)) #else if ((avc->execsOrWriters <= 0) && !afs_DirtyPages(avc)) #endif { #ifdef AFS_64BIT_ClIENT FillInt64(length, astat->Length_hi, astat->Length); #else /* AFS_64BIT_CLIENT */ length = astat->Length; #endif /* AFS_64BIT_CLIENT */ #if defined(AFS_SGI_ENV) osi_Assert((valusema(&avc->vc_rwlock) <= 0) && (OSI_GET_LOCKID() == avc->vc_rwlockid)); if (length < avc->m.Length) { vnode_t *vp = (vnode_t *)avc; osi_Assert(WriteLocked(&avc->lock)); ReleaseWriteLock(&avc->lock); AFS_GUNLOCK(); PTOSSVP(vp, (off_t)length, (off_t)MAXLONG); AFS_GLOCK(); ObtainWriteLock(&avc->lock,67); } #endif /* if writing the file, don't fetch over this value */ afs_Trace3(afs_iclSetp, CM_TRACE_SIMPLEVSTAT, ICL_TYPE_POINTER, avc, ICL_TYPE_OFFSET, ICL_HANDLE_OFFSET(avc->m.Length), ICL_TYPE_OFFSET, ICL_HANDLE_OFFSET(length)); avc->m.Length = length; avc->m.Date = astat->ClientModTime; } avc->m.Owner = astat->Owner; avc->m.Group = astat->Group; avc->m.Mode = astat->UnixModeBits; if (vType(avc) == VREG) { avc->m.Mode |= S_IFREG; } else if (vType(avc) == VDIR) { avc->m.Mode |= S_IFDIR; } else if (vType(avc) == VLNK) { avc->m.Mode |= S_IFLNK; if ((avc->m.Mode & 0111) == 0) avc->mvstat = 1; } if (avc->states & CForeign) { struct axscache *ac; avc->anyAccess = astat->AnonymousAccess; #ifdef badidea if ((astat->CallerAccess & ~astat->AnonymousAccess)) /* USED TO SAY : * Caller has at least one bit not covered by anonymous, and * thus may have interesting 
rights. * * HOWEVER, this is a really bad idea, because any access query * for bits which aren't covered by anonymous, on behalf of a user * who doesn't have any special rights, will result in an answer of * the form "I don't know, lets make a FetchStatus RPC and find out!" * It's an especially bad idea under Ultrix, since (due to the lack of * a proper access() call) it must perform several afs_access() calls * in order to create magic mode bits that vary according to who makes * the call. In other words, _every_ stat() generates a test for * writeability... */ #endif /* badidea */ if (avc->Access && (ac = afs_FindAxs(avc->Access, areq->uid))) ac->axess = astat->CallerAccess; else /* not found, add a new one if possible */ afs_AddAxs(avc->Access, areq->uid, astat->CallerAccess); } } /*afs_SimpleVStat*/ /* * afs_WriteVCache * * Description: * Store the status info *only* back to the server for a * fid/vrequest. * * Parameters: * avc : Ptr to the vcache entry. * astatus : Ptr to the status info to store. * areq : Ptr to the associated vrequest. * * Environment: * Must be called with a shared lock held on the vnode. */ afs_WriteVCache(avc, astatus, areq) register struct vcache *avc; register struct AFSStoreStatus *astatus; struct vrequest *areq; { /*afs_WriteVCache*/ afs_int32 code; struct conn *tc; struct AFSFetchStatus OutStatus; struct AFSVolSync tsync; XSTATS_DECLS AFS_STATCNT(afs_WriteVCache); afs_Trace2(afs_iclSetp, CM_TRACE_WVCACHE, ICL_TYPE_POINTER, avc, ICL_TYPE_OFFSET, ICL_HANDLE_OFFSET(avc->m.Length)); do { tc = afs_Conn(&avc->fid, areq, SHARED_LOCK); if (tc) { XSTATS_START_TIME(AFS_STATS_FS_RPCIDX_STORESTATUS); RX_AFS_GUNLOCK(); code = RXAFS_StoreStatus(tc->id, (struct AFSFid *) &avc->fid.Fid, astatus, &OutStatus, &tsync); RX_AFS_GLOCK(); XSTATS_END_TIME; } else code = -1; } while (afs_Analyze(tc, code, &avc->fid, areq, AFS_STATS_FS_RPCIDX_STORESTATUS, SHARED_LOCK, (struct cell *)0)); UpgradeSToWLock(&avc->lock,20); if (code == 0) { /* success, do the changes locally */ afs_SimpleVStat(avc, &OutStatus, areq); /* * Update the date, too. SimpleVStat didn't do this, since * it thought we were doing this after fetching new status * over a file being written. */ avc->m.Date = OutStatus.ClientModTime; } else { /* failure, set up to check with server next time */ ObtainWriteLock(&afs_xcbhash, 462); afs_DequeueCallback(avc); avc->states &= ~( CStatd | CUnique); /* turn off stat valid flag */ ReleaseWriteLock(&afs_xcbhash); if ((avc->states & CForeign) || (avc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (avc); /* if it (could be) a directory */ } ConvertWToSLock(&avc->lock); return code; } /*afs_WriteVCache*/ /* * afs_ProcessFS * * Description: * Copy astat block into vcache info * * Parameters: * avc : Ptr to vcache entry. * astat : Ptr to stat block to copy in. * areq : Ptr to associated request. * * Environment: * Must be called under a write lock * * Note: this code may get dataversion and length out of sync if the file has * been modified. This is less than ideal. I haven't thought about * it sufficiently to be certain that it is adequate. 
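 *
 *	Typical sequence (a sketch of the pattern used by afs_GetVCache and
 *	afs_FetchStatus later in this file; the RPC and its error handling
 *	are elided, and the lock id 54 is simply the one afs_GetVCache uses):
 *
 *	    struct AFSFetchStatus OutStatus;
 *	    ... an RXAFS_FetchStatus call fills in OutStatus ...
 *	    ObtainWriteLock(&avc->lock, 54);
 *	    afs_ProcessFS(avc, &OutStatus, areq);
 *	    ReleaseWriteLock(&avc->lock);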
*/ void afs_ProcessFS(avc, astat, areq) register struct vcache *avc; struct vrequest *areq; register struct AFSFetchStatus *astat; { /*afs_ProcessFS*/ register int i; afs_size_t length; AFS_STATCNT(afs_ProcessFS); #ifdef AFS_64BIT_CLIENT FillInt64(length, astat->Length_hi, astat->Length); #else /* AFS_64BIT_CLIENT */ length = astat->Length; #endif /* AFS_64BIT_CLIENT */ /* WARNING: afs_DoBulkStat uses the Length field to store a sequence * number for each bulk status request. Under no circumstances * should afs_DoBulkStat store a sequence number if the new * length will be ignored when afs_ProcessFS is called with * new stats. If you change the following conditional then you * also need to change the conditional in afs_DoBulkStat. */ #ifdef AFS_SGI_ENV if ((avc->execsOrWriters <= 0) && !afs_DirtyPages(avc) && !AFS_VN_MAPPED((vnode_t*)avc)) #else if ((avc->execsOrWriters <= 0) && !afs_DirtyPages(avc)) #endif { /* if we're writing or mapping this file, don't fetch over these * values. */ afs_Trace3(afs_iclSetp, CM_TRACE_PROCESSFS, ICL_TYPE_POINTER, avc, ICL_TYPE_OFFSET, ICL_HANDLE_OFFSET(avc->m.Length), ICL_TYPE_OFFSET, ICL_HANDLE_OFFSET(length)); avc->m.Length = length; avc->m.Date = astat->ClientModTime; } hset64(avc->m.DataVersion, astat->dataVersionHigh, astat->DataVersion); avc->m.Owner = astat->Owner; avc->m.Mode = astat->UnixModeBits; avc->m.Group = astat->Group; avc->m.LinkCount = astat->LinkCount; if (astat->FileType == File) { vSetType(avc, VREG); avc->m.Mode |= S_IFREG; } else if (astat->FileType == Directory) { vSetType(avc, VDIR); avc->m.Mode |= S_IFDIR; } else if (astat->FileType == SymbolicLink) { vSetType(avc, VLNK); avc->m.Mode |= S_IFLNK; if ((avc->m.Mode & 0111) == 0) avc->mvstat = 1; } avc->anyAccess = astat->AnonymousAccess; #ifdef badidea if ((astat->CallerAccess & ~astat->AnonymousAccess)) /* USED TO SAY : * Caller has at least one bit not covered by anonymous, and * thus may have interesting rights. * * HOWEVER, this is a really bad idea, because any access query * for bits which aren't covered by anonymous, on behalf of a user * who doesn't have any special rights, will result in an answer of * the form "I don't know, lets make a FetchStatus RPC and find out!" * It's an especially bad idea under Ultrix, since (due to the lack of * a proper access() call) it must perform several afs_access() calls * in order to create magic mode bits that vary according to who makes * the call. In other words, _every_ stat() generates a test for * writeability... 
*/ #endif /* badidea */ { struct axscache *ac; if (avc->Access && (ac = afs_FindAxs(avc->Access, areq->uid))) ac->axess = astat->CallerAccess; else /* not found, add a new one if possible */ afs_AddAxs(avc->Access, areq->uid, astat->CallerAccess); } #ifdef AFS_LINUX22_ENV vcache2inode(avc); /* Set the inode attr cache */ #endif } /*afs_ProcessFS*/ afs_RemoteLookup(afid, areq, name, nfid, OutStatusp, CallBackp, serverp, tsyncp) register struct VenusFid *afid; struct vrequest *areq; char *name; struct VenusFid *nfid; struct AFSFetchStatus *OutStatusp; struct AFSCallBack *CallBackp; struct server **serverp; struct AFSVolSync *tsyncp; { afs_int32 code, i; register struct vcache *tvc; struct volume *tvp; afs_uint32 start; register struct conn *tc; struct AFSFetchStatus OutDirStatus; XSTATS_DECLS if (!name) name = ""; /* XXX */ do { tc = afs_Conn(afid, areq, SHARED_LOCK); if (tc) { if (serverp) *serverp = tc->srvr->server; start = osi_Time(); XSTATS_START_TIME(AFS_STATS_FS_RPCIDX_XLOOKUP); RX_AFS_GUNLOCK(); code = RXAFS_Lookup(tc->id, (struct AFSFid *) &afid->Fid, name, (struct AFSFid *) &nfid->Fid, OutStatusp, &OutDirStatus, CallBackp, tsyncp); RX_AFS_GLOCK(); XSTATS_END_TIME; } else code = -1; } while (afs_Analyze(tc, code, afid, areq, AFS_STATS_FS_RPCIDX_XLOOKUP, SHARED_LOCK, (struct cell *)0)); return code; } /* * afs_GetVCache * * Description: * Given a file id and a vrequest structure, fetch the status * information associated with the file. * * Parameters: * afid : File ID. * areq : Ptr to associated vrequest structure, specifying the * user whose authentication tokens will be used. * avc : caller may already have a vcache for this file, which is * already held. * * Environment: * The cache entry is returned with an increased vrefCount field. * The entry must be discarded by calling afs_PutVCache when you * are through using the pointer to the cache entry. * * You should not hold any locks when calling this function, except * locks on other vcache entries. If you lock more than one vcache * entry simultaneously, you should lock them in this order: * * 1. Lock all files first, then directories. * 2. Within a particular type, lock entries in Fid.Vnode order. * * This locking hierarchy is convenient because it allows locking * of a parent dir cache entry, given a file (to check its access * control list). It also allows renames to be handled easily by * locking directories in a constant order. * NB. NewVCache -> FlushVCache presently (4/10/95) drops the xvcache lock. 
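 *
 *	Reference-counting sketch (modelled on afs_VerifyVCache2 above;
 *	"areq" is assumed to be an initialized vrequest for the calling
 *	user):
 *
 *	    tvc = afs_GetVCache(&avc->fid, areq, (afs_int32 *)0, avc, READ_LOCK);
 *	    if (!tvc)
 *	        return ENOENT;
 *	    ... use tvc; its vrefCount has been incremented ...
 *	    afs_PutVCache(tvc, READ_LOCK);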
*/ struct vcache *afs_GetVCache(afid, areq, cached, avc, locktype) register struct VenusFid *afid; struct vrequest *areq; afs_int32 *cached; afs_int32 locktype; struct vcache *avc; /* might have a vcache structure already, which must * already be held by the caller */ { /*afs_GetVCache*/ afs_int32 code, i, newvcache=0; register struct vcache *tvc; struct volume *tvp; afs_int32 retry; AFS_STATCNT(afs_GetVCache); if (cached) *cached = 0; /* Init just in case */ loop: ObtainSharedLock(&afs_xvcache,5); tvc = afs_FindVCache(afid, 0, 0, &retry, DO_STATS | DO_VLRU ); if (tvc && retry) { #if defined(AFS_SGI_ENV) && !defined(AFS_SGI53_ENV) ReleaseSharedLock(&afs_xvcache); spunlock_psema(tvc->v.v_lock, retry, &tvc->v.v_sync, PINOD); goto loop; #endif } if (tvc) { if (cached) *cached = 1; if (tvc->states & CStatd) { ReleaseSharedLock(&afs_xvcache); return tvc; } } else { UpgradeSToWLock(&afs_xvcache,21); /* no cache entry, better grab one */ tvc = afs_NewVCache(afid, (struct server *)0, 1, WRITE_LOCK); newvcache = 1; ConvertWToSLock(&afs_xvcache); afs_stats_cmperf.vcacheMisses++; } ReleaseSharedLock(&afs_xvcache); ObtainWriteLock(&tvc->lock,54); if (tvc->states & CStatd) { #ifdef AFS_LINUX22_ENV vcache2inode(tvc); #endif ReleaseWriteLock(&tvc->lock); #ifdef AFS_DARWIN_ENV osi_VM_Setup(tvc); #endif return tvc; } #if defined(AFS_OSF_ENV) if (afs_IsWired(tvc)) { ReleaseWriteLock(&tvc->lock); return tvc; } #endif /* AFS_OSF_ENV */ ObtainWriteLock(&afs_xcbhash, 464); tvc->states &= ~CUnique; tvc->callback = 0; afs_DequeueCallback(tvc); ReleaseWriteLock(&afs_xcbhash); /* It is always appropriate to throw away all the access rights? */ afs_FreeAllAxs(&(tvc->Access)); tvp = afs_GetVolume(afid, areq, READ_LOCK); /* copy useful per-volume info */ if (tvp) { if ((tvp->states & VForeign)) { if (newvcache) tvc->states |= CForeign; if (newvcache && (tvp->rootVnode == afid->Fid.Vnode) && (tvp->rootUnique == afid->Fid.Unique)) { tvc->mvstat = 2; } } if (tvp->states & VRO) tvc->states |= CRO; if (tvp->states & VBackup) tvc->states |= CBackup; /* now copy ".." 
entry back out of volume structure, if necessary */ if (tvc->mvstat == 2 && tvp->dotdot.Fid.Volume != 0) { if (!tvc->mvid) tvc->mvid = (struct VenusFid *) osi_AllocSmallSpace(sizeof(struct VenusFid)); *tvc->mvid = tvp->dotdot; } afs_PutVolume(tvp, READ_LOCK); } /* stat the file */ afs_RemoveVCB(afid); { struct AFSFetchStatus OutStatus; if (afs_DynrootNewVnode(tvc, &OutStatus)) { afs_ProcessFS(tvc, &OutStatus, areq); tvc->states |= CStatd | CUnique; code = 0; } else { code = afs_FetchStatus(tvc, afid, areq, &OutStatus); } } if (code) { ReleaseWriteLock(&tvc->lock); ObtainReadLock(&afs_xvcache); AFS_FAST_RELE(tvc); ReleaseReadLock(&afs_xvcache); return (struct vcache *) 0; } ReleaseWriteLock(&tvc->lock); #ifdef AFS_DARWIN_ENV osi_VM_Setup(avc); #endif return tvc; } /*afs_GetVCache*/ struct vcache *afs_LookupVCache(struct VenusFid *afid, struct vrequest *areq, afs_int32 *cached, afs_int32 locktype, struct vcache *adp, char *aname) { afs_int32 code, now, newvcache=0, hash; struct VenusFid nfid; register struct vcache *tvc; struct volume *tvp; struct AFSFetchStatus OutStatus; struct AFSCallBack CallBack; struct AFSVolSync tsync; struct server *serverp = 0; afs_int32 origCBs; afs_int32 retry; AFS_STATCNT(afs_GetVCache); if (cached) *cached = 0; /* Init just in case */ loop1: ObtainReadLock(&afs_xvcache); tvc = afs_FindVCache(afid, 0, 0, &retry, DO_STATS /* no vlru */); if (tvc) { ReleaseReadLock(&afs_xvcache); if (retry) { #if defined(AFS_SGI_ENV) && !defined(AFS_SGI53_ENV) spunlock_psema(tvc->v.v_lock, retry, &tvc->v.v_sync, PINOD); goto loop1; #endif } ObtainReadLock(&tvc->lock); if (tvc->states & CStatd) { if (cached) { *cached = 1; } ReleaseReadLock(&tvc->lock); return tvc; } tvc->states &= ~CUnique; ReleaseReadLock(&tvc->lock); ObtainReadLock(&afs_xvcache); AFS_FAST_RELE(tvc); } /* if (tvc) */ ReleaseReadLock(&afs_xvcache); /* lookup the file */ nfid = *afid; now = osi_Time(); origCBs = afs_allCBs; /* if anything changes, we don't have a cb */ code = afs_RemoteLookup(&adp->fid, areq, aname, &nfid, &OutStatus, &CallBack, &serverp, &tsync); loop2: ObtainSharedLock(&afs_xvcache,6); tvc = afs_FindVCache(&nfid, 0, 0, &retry, DO_VLRU /* no xstats now*/); if (tvc && retry) { #if defined(AFS_SGI_ENV) && !defined(AFS_SGI53_ENV) ReleaseSharedLock(&afs_xvcache); spunlock_psema(tvc->v.v_lock, retry, &tvc->v.v_sync, PINOD); goto loop2; #endif } if (!tvc) { /* no cache entry, better grab one */ UpgradeSToWLock(&afs_xvcache,22); tvc = afs_NewVCache(&nfid, (struct server *)0, 1, WRITE_LOCK); newvcache = 1; ConvertWToSLock(&afs_xvcache); } ReleaseSharedLock(&afs_xvcache); ObtainWriteLock(&tvc->lock,55); /* It is always appropriate to throw away all the access rights? */ afs_FreeAllAxs(&(tvc->Access)); tvp = afs_GetVolume(afid, areq, READ_LOCK); /* copy useful per-vol info */ if (tvp) { if ((tvp->states & VForeign)) { if (newvcache) tvc->states |= CForeign; if (newvcache && (tvp->rootVnode == afid->Fid.Vnode) && (tvp->rootUnique == afid->Fid.Unique)) tvc->mvstat = 2; } if (tvp->states & VRO) tvc->states |= CRO; if (tvp->states & VBackup) tvc->states |= CBackup; /* now copy ".." 
entry back out of volume structure, if necessary */ if (tvc->mvstat == 2 && tvp->dotdot.Fid.Volume != 0) { if (!tvc->mvid) tvc->mvid = (struct VenusFid *) osi_AllocSmallSpace(sizeof(struct VenusFid)); *tvc->mvid = tvp->dotdot; } } if (code) { ObtainWriteLock(&afs_xcbhash, 465); afs_DequeueCallback(tvc); tvc->states &= ~( CStatd | CUnique ); ReleaseWriteLock(&afs_xcbhash); if ((tvc->states & CForeign) || (tvc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (tvc); /* if it (could be) a directory */ if ( tvp ) afs_PutVolume(tvp, READ_LOCK); ReleaseWriteLock(&tvc->lock); ObtainReadLock(&afs_xvcache); AFS_FAST_RELE(tvc); ReleaseReadLock(&afs_xvcache); return (struct vcache *) 0; } ObtainWriteLock(&afs_xcbhash, 466); if (origCBs == afs_allCBs) { if (CallBack.ExpirationTime) { tvc->callback = serverp; tvc->cbExpires = CallBack.ExpirationTime+now; tvc->states |= CStatd | CUnique; tvc->states &= ~CBulkFetching; afs_QueueCallback(tvc, CBHash(CallBack.ExpirationTime), tvp); } else if (tvc->states & CRO) { /* adapt gives us an hour. */ tvc->cbExpires = 3600+osi_Time(); /*XXX*/ tvc->states |= CStatd | CUnique; tvc->states &= ~CBulkFetching; afs_QueueCallback(tvc, CBHash(3600), tvp); } else { tvc->callback = (struct server *)0; afs_DequeueCallback(tvc); tvc->states &= ~(CStatd | CUnique); if ((tvc->states & CForeign) || (tvc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (tvc); /* if it (could be) a directory */ } } else { afs_DequeueCallback(tvc); tvc->states &= ~CStatd; tvc->states &= ~CUnique; tvc->callback = (struct server *)0; if ((tvc->states & CForeign) || (tvc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (tvc); /* if it (could be) a directory */ } ReleaseWriteLock(&afs_xcbhash); if ( tvp ) afs_PutVolume(tvp, READ_LOCK); afs_ProcessFS(tvc, &OutStatus, areq); ReleaseWriteLock(&tvc->lock); #ifdef AFS_DARWIN_ENV osi_VM_Setup(tvc); #endif return tvc; } struct vcache *afs_GetRootVCache(struct VenusFid *afid, struct vrequest *areq, afs_int32 *cached, struct volume *tvolp, afs_int32 locktype) { afs_int32 code, i, newvcache = 0, haveStatus = 0; afs_int32 getNewFid = 0; afs_uint32 start; struct VenusFid nfid; register struct vcache *tvc; struct server *serverp = 0; struct AFSFetchStatus OutStatus; struct AFSCallBack CallBack; struct AFSVolSync tsync; int origCBs; start = osi_Time(); newmtpt: if (!tvolp->rootVnode || getNewFid) { struct VenusFid tfid; tfid = *afid; tfid.Fid.Vnode = 0; /* Means get rootfid of volume */ origCBs = afs_allCBs; /* ignore InitCallBackState */ code = afs_RemoteLookup(&tfid, areq, (char *)0, &nfid, &OutStatus, &CallBack, &serverp, &tsync); if (code) { return (struct vcache *)0; } /* ReleaseReadLock(&tvolp->lock); */ ObtainWriteLock(&tvolp->lock,56); tvolp->rootVnode = afid->Fid.Vnode = nfid.Fid.Vnode; tvolp->rootUnique = afid->Fid.Unique = nfid.Fid.Unique; ReleaseWriteLock(&tvolp->lock); /* ObtainReadLock(&tvolp->lock);*/ haveStatus = 1; } else { afid->Fid.Vnode = tvolp->rootVnode; afid->Fid.Unique = tvolp->rootUnique; } ObtainSharedLock(&afs_xvcache,7); i = VCHash(afid); for (tvc = afs_vhashT[i]; tvc; tvc = tvc->hnext) { if (!FidCmp(&(tvc->fid), afid)) { #ifdef AFS_OSF_ENV /* Grab this vnode, possibly reactivating from the free list */ /* for the present (95.05.25) everything on the hash table is * definitively NOT in the free list -- at least until afs_reclaim * can be safely implemented */ int vg; AFS_GUNLOCK(); vg = vget((struct vnode *)tvc); /* this bumps ref count */ AFS_GLOCK(); if (vg) continue; #endif /* AFS_OSF_ENV */ break; } } if (!haveStatus && (!tvc || !(tvc->states & CStatd))) { /* Mount 
point no longer stat'd or unknown. FID may have changed. */ #ifdef AFS_OSF_ENV if (tvc) AFS_RELE(tvc); #endif tvc = (struct vcache*)0; getNewFid = 1; ReleaseSharedLock(&afs_xvcache); goto newmtpt; } if (!tvc) { UpgradeSToWLock(&afs_xvcache,23); /* no cache entry, better grab one */ tvc = afs_NewVCache(afid, (struct server *)0, 1, WRITE_LOCK); newvcache = 1; afs_stats_cmperf.vcacheMisses++; } else { if (cached) *cached = 1; afs_stats_cmperf.vcacheHits++; #ifdef AFS_OSF_ENV /* we already bumped the ref count in the for loop above */ #else /* AFS_OSF_ENV */ osi_vnhold(tvc,0); #endif UpgradeSToWLock(&afs_xvcache,24); if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) { refpanic ("GRVC VLRU inconsistent0"); } if (tvc->vlruq.next->prev != &(tvc->vlruq)) { refpanic ("GRVC VLRU inconsistent1"); } if (tvc->vlruq.prev->next != &(tvc->vlruq)) { refpanic ("GRVC VLRU inconsistent2"); } QRemove(&tvc->vlruq); /* move to lruq head */ QAdd(&VLRU, &tvc->vlruq); if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) { refpanic ("GRVC VLRU inconsistent3"); } if (tvc->vlruq.next->prev != &(tvc->vlruq)) { refpanic ("GRVC VLRU inconsistent4"); } if (tvc->vlruq.prev->next != &(tvc->vlruq)) { refpanic ("GRVC VLRU inconsistent5"); } vcachegen++; } ReleaseWriteLock(&afs_xvcache); if (tvc->states & CStatd) { return tvc; } else { ObtainReadLock(&tvc->lock); tvc->states &= ~CUnique; tvc->callback = (struct server *)0; /* redundant, perhaps */ ReleaseReadLock(&tvc->lock); } ObtainWriteLock(&tvc->lock,57); /* It is always appropriate to throw away all the access rights? */ afs_FreeAllAxs(&(tvc->Access)); if (newvcache) tvc->states |= CForeign; if (tvolp->states & VRO) tvc->states |= CRO; if (tvolp->states & VBackup) tvc->states |= CBackup; /* now copy ".." entry back out of volume structure, if necessary */ if (newvcache && (tvolp->rootVnode == afid->Fid.Vnode) && (tvolp->rootUnique == afid->Fid.Unique)) { tvc->mvstat = 2; } if (tvc->mvstat == 2 && tvolp->dotdot.Fid.Volume != 0) { if (!tvc->mvid) tvc->mvid = (struct VenusFid *)osi_AllocSmallSpace(sizeof(struct VenusFid)); *tvc->mvid = tvolp->dotdot; } /* stat the file */ afs_RemoveVCB(afid); if (!haveStatus) { struct VenusFid tfid; tfid = *afid; tfid.Fid.Vnode = 0; /* Means get rootfid of volume */ origCBs = afs_allCBs; /* ignore InitCallBackState */ code = afs_RemoteLookup(&tfid, areq, (char *)0, &nfid, &OutStatus, &CallBack, &serverp, &tsync); } if (code) { ObtainWriteLock(&afs_xcbhash, 467); afs_DequeueCallback(tvc); tvc->callback = (struct server *)0; tvc->states &= ~(CStatd|CUnique); ReleaseWriteLock(&afs_xcbhash); if ((tvc->states & CForeign) || (tvc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (tvc); /* if it (could be) a directory */ ReleaseWriteLock(&tvc->lock); ObtainReadLock(&afs_xvcache); AFS_FAST_RELE(tvc); ReleaseReadLock(&afs_xvcache); return (struct vcache *) 0; } ObtainWriteLock(&afs_xcbhash, 468); if (origCBs == afs_allCBs) { tvc->states |= CTruth; tvc->callback = serverp; if (CallBack.ExpirationTime != 0) { tvc->cbExpires = CallBack.ExpirationTime+start; tvc->states |= CStatd; tvc->states &= ~CBulkFetching; afs_QueueCallback(tvc, CBHash(CallBack.ExpirationTime), tvolp); } else if (tvc->states & CRO) { /* adapt gives us an hour. 
*/ tvc->cbExpires = 3600+osi_Time(); /*XXX*/ tvc->states |= CStatd; tvc->states &= ~CBulkFetching; afs_QueueCallback(tvc, CBHash(3600), tvolp); } } else { afs_DequeueCallback(tvc); tvc->callback = (struct server *)0; tvc->states &= ~(CStatd | CUnique); if ((tvc->states & CForeign) || (tvc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (tvc); /* if it (could be) a directory */ } ReleaseWriteLock(&afs_xcbhash); afs_ProcessFS(tvc, &OutStatus, areq); ReleaseWriteLock(&tvc->lock); return tvc; } /* * must be called with avc write-locked * don't absolutely have to invalidate the hint unless the dv has * changed, but be sure to get it right else there will be consistency bugs. */ afs_int32 afs_FetchStatus(struct vcache *avc, struct VenusFid *afid, struct vrequest *areq, struct AFSFetchStatus *Outsp) { int code; afs_uint32 start; register struct conn *tc; struct AFSCallBack CallBack; struct AFSVolSync tsync; struct volume* volp; XSTATS_DECLS do { tc = afs_Conn(afid, areq, SHARED_LOCK); avc->quick.stamp = 0; avc->h1.dchint = NULL; /* invalidate hints */ if (tc) { avc->callback = tc->srvr->server; start = osi_Time(); XSTATS_START_TIME(AFS_STATS_FS_RPCIDX_FETCHSTATUS); RX_AFS_GUNLOCK(); code = RXAFS_FetchStatus(tc->id, (struct AFSFid *) &afid->Fid, Outsp, &CallBack, &tsync); RX_AFS_GLOCK(); XSTATS_END_TIME; } else code = -1; } while (afs_Analyze(tc, code, afid, areq, AFS_STATS_FS_RPCIDX_FETCHSTATUS, SHARED_LOCK, (struct cell *)0)); if (!code) { afs_ProcessFS(avc, Outsp, areq); volp = afs_GetVolume(afid, areq, READ_LOCK); ObtainWriteLock(&afs_xcbhash, 469); avc->states |= CTruth; if (avc->callback /* check for race */) { if (CallBack.ExpirationTime != 0) { avc->cbExpires = CallBack.ExpirationTime+start; avc->states |= CStatd; avc->states &= ~CBulkFetching; afs_QueueCallback(avc, CBHash(CallBack.ExpirationTime), volp); } else if (avc->states & CRO) { /* ordinary callback on a read-only volume -- AFS 3.2 style */ avc->cbExpires = 3600+start; avc->states |= CStatd; avc->states &= ~CBulkFetching; afs_QueueCallback(avc, CBHash(3600), volp); } else { afs_DequeueCallback(avc); avc->callback = (struct server *)0; avc->states &= ~(CStatd|CUnique); if ((avc->states & CForeign) || (avc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (avc); /* if it (could be) a directory */ } } else { afs_DequeueCallback(avc); avc->callback = (struct server *)0; avc->states &= ~(CStatd|CUnique); if ((avc->states & CForeign) || (avc->fid.Fid.Vnode & 1)) osi_dnlc_purgedp (avc); /* if it (could be) a directory */ } ReleaseWriteLock(&afs_xcbhash); if ( volp ) afs_PutVolume(volp, READ_LOCK); } else { /* used to undo the local callback, but that's too extreme. * There are plenty of good reasons that fetchstatus might return * an error, such as EPERM. If we have the vnode cached, statd, * with callback, might as well keep track of the fact that we * don't have access... */ if (code == EPERM || code == EACCES) { struct axscache *ac; if (avc->Access && (ac = afs_FindAxs(avc->Access, areq->uid))) ac->axess = 0; else /* not found, add a new one if possible */ afs_AddAxs(avc->Access, areq->uid, 0); } } return code; } #if 0 /* * afs_StuffVcache * * Description: * Stuff some information into the vcache for the given file. * * Parameters: * afid : File in question. * OutStatus : Fetch status on the file. * CallBack : Callback info. * tc : RPC connection involved. * areq : vrequest involved. * * Environment: * Nothing interesting. 
#if 0
/*
 * afs_StuffVcache
 *
 * Description:
 *      Stuff some information into the vcache for the given file.
 *
 * Parameters:
 *      afid : File in question.
 *      OutStatus : Fetch status on the file.
 *      CallBack : Callback info.
 *      tc : RPC connection involved.
 *      areq : vrequest involved.
 *
 * Environment:
 *      Nothing interesting.
 */
void afs_StuffVcache(afid, OutStatus, CallBack, tc, areq)
    register struct VenusFid *afid;
    struct AFSFetchStatus *OutStatus;
    struct AFSCallBack *CallBack;
    register struct conn *tc;
    struct vrequest *areq;
{ /*afs_StuffVcache*/
    register afs_int32 code, i, newvcache = 0;
    register struct vcache *tvc;
    struct AFSVolSync tsync;
    struct volume *tvp;
    struct axscache *ac;
    afs_int32 retry;

    AFS_STATCNT(afs_StuffVcache);
#ifdef IFS_VCACHECOUNT
    ifs_gvcachecall++;
#endif

  loop:
    ObtainSharedLock(&afs_xvcache, 8);

    tvc = afs_FindVCache(afid, 0, 0, &retry, DO_VLRU /* no stats */);
    if (tvc && retry) {
#if defined(AFS_SGI_ENV) && !defined(AFS_SGI53_ENV)
        ReleaseSharedLock(&afs_xvcache);
        spunlock_psema(tvc->v.v_lock, retry, &tvc->v.v_sync, PINOD);
        goto loop;
#endif
    }

    if (!tvc) {
        /* no cache entry, better grab one */
        UpgradeSToWLock(&afs_xvcache, 25);
        tvc = afs_NewVCache(afid, (struct server *)0, 1, WRITE_LOCK);
        newvcache = 1;
        ConvertWToSLock(&afs_xvcache);
    }
    ReleaseSharedLock(&afs_xvcache);

    ObtainWriteLock(&tvc->lock, 58);

    tvc->states &= ~CStatd;
    if ((tvc->states & CForeign) || (tvc->fid.Fid.Vnode & 1))
        osi_dnlc_purgedp(tvc);  /* if it (could be) a directory */

    /* Is it always appropriate to throw away all the access rights? */
    afs_FreeAllAxs(&(tvc->Access));

    /* Copy useful per-volume info */
    tvp = afs_GetVolume(afid, areq, READ_LOCK);
    if (tvp) {
        if (newvcache && (tvp->states & VForeign)) tvc->states |= CForeign;
        if (tvp->states & VRO) tvc->states |= CRO;
        if (tvp->states & VBackup) tvc->states |= CBackup;
        /*
         * Now, copy ".." entry back out of volume structure, if
         * necessary
         */
        if (tvc->mvstat == 2 && tvp->dotdot.Fid.Volume != 0) {
            if (!tvc->mvid)
                tvc->mvid = (struct VenusFid *)osi_AllocSmallSpace(sizeof(struct VenusFid));
            *tvc->mvid = tvp->dotdot;
        }
    }

    /* store the stat on the file */
    afs_RemoveVCB(afid);
    afs_ProcessFS(tvc, OutStatus, areq);

    tvc->callback = tc->srvr->server;

    /* we use osi_Time twice below.  Ideally, we would use the time at which
     * the FetchStatus call began, instead, but we don't have it here.  So we
     * make do with "now".  In the CRO case, it doesn't really matter.  In
     * the other case, we hope that the difference between "now" and when the
     * call actually began execution on the server won't be larger than the
     * padding which the server keeps.  Subtract 1 second anyway, to be on
     * the safe side.  Can't subtract more because we don't know how big
     * ExpirationTime is.  Possible consistency problems may arise if the call
     * timeout period becomes longer than the server's expiration padding.
     */
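    /*
     * Illustrative arithmetic (added note, not in the original): suppose the
     * server granted ExpirationTime = 3600 and the RPC was issued 2 seconds
     * before we reach this point.  The callback really lapses at start+3600,
     * but we record now+3600-1 = start+3601, one second too late; the
     * subtraction narrows the overshoot from 2 seconds to 1, and the
     * server's expiration padding is expected to absorb the remainder.
     */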
    ObtainWriteLock(&afs_xcbhash, 470);
    if (CallBack->ExpirationTime != 0) {
        tvc->cbExpires = CallBack->ExpirationTime + osi_Time() - 1;
        tvc->states |= CStatd;
        tvc->states &= ~CBulkFetching;
        afs_QueueCallback(tvc, CBHash(CallBack->ExpirationTime), tvp);
    } else if (tvc->states & CRO) {
        /* old-fashioned AFS 3.2 style */
        tvc->cbExpires = 3600 + osi_Time();     /*XXX*/
        tvc->states |= CStatd;
        tvc->states &= ~CBulkFetching;
        afs_QueueCallback(tvc, CBHash(3600), tvp);
    } else {
        afs_DequeueCallback(tvc);
        tvc->callback = (struct server *)0;
        tvc->states &= ~(CStatd | CUnique);
        if ((tvc->states & CForeign) || (tvc->fid.Fid.Vnode & 1))
            osi_dnlc_purgedp(tvc);      /* if it (could be) a directory */
    }
    ReleaseWriteLock(&afs_xcbhash);
    if (tvp)
        afs_PutVolume(tvp, READ_LOCK);

    /* look in per-pag cache */
    if (tvc->Access && (ac = afs_FindAxs(tvc->Access, areq->uid)))
        ac->axess = OutStatus->CallerAccess;    /* substitute pags */
    else        /* not found, add a new one if possible */
        afs_AddAxs(tvc->Access, areq->uid, OutStatus->CallerAccess);

    ReleaseWriteLock(&tvc->lock);

    afs_Trace4(afs_iclSetp, CM_TRACE_STUFFVCACHE, ICL_TYPE_POINTER, tvc,
               ICL_TYPE_POINTER, tvc->callback, ICL_TYPE_INT32, tvc->cbExpires,
               ICL_TYPE_INT32, tvc->cbExpires - osi_Time());
    /*
     * Release ref count... hope this guy stays around...
     */
    afs_PutVCache(tvc, WRITE_LOCK);
} /*afs_StuffVcache*/
#endif


/*
 * afs_PutVCache
 *
 * Description:
 *      Decrements the reference count on a cache entry.
 *
 * Parameters:
 *      avc : Pointer to the cache entry to decrement.
 *
 * Environment:
 *      Nothing interesting.
 */
void afs_PutVCache(avc, locktype)
    register struct vcache *avc;
    afs_int32 locktype;
{ /*afs_PutVCache*/

    AFS_STATCNT(afs_PutVCache);

    /*
     * Can we use a read lock here?
     */
    ObtainReadLock(&afs_xvcache);
    AFS_FAST_RELE(avc);
    ReleaseReadLock(&afs_xvcache);
} /*afs_PutVCache*/
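
/*
 * Illustrative sketch only (not part of the original code): afs_PutVCache
 * releases the reference that afs_FindVCache/afs_GetVCache obtain, so the
 * two are used in pairs.  The helper name example_WithVCache is made up;
 * a flag value of 0 asks afs_FindVCache for no statistics and no VLRU
 * adjustment, so a read lock on afs_xvcache suffices.
 */
#if 0
static void example_WithVCache(struct VenusFid *afid)
{
    struct vcache *tvc;
    afs_int32 retry = 0;

    ObtainReadLock(&afs_xvcache);
    tvc = afs_FindVCache(afid, 0, 0, &retry, 0 /* no stats, no VLRU move */);
    ReleaseReadLock(&afs_xvcache);
    if (!tvc)
        return;
    /* ... examine tvc->states, tvc->fid, and so on ... */
    afs_PutVCache(tvc, READ_LOCK);      /* drop the reference taken by the lookup */
}
#endif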
/*
 * afs_FindVCache
 *
 * Description:
 *      Find a vcache entry given a fid.
 *
 * Parameters:
 *      afid : Pointer to the fid whose cache entry we desire.
 *      retry: (SGI-specific) tell the caller to drop the lock on xvcache,
 *             unlock the vnode, and try again.
 *      flag : bit 1 to specify whether to compute hit statistics.  Not
 *             set if FindVCache is called as part of internal bookkeeping.
 *
 * Environment:
 *      Must be called with the afs_xvcache lock at least held at
 *      the read level.  In order to do the VLRU adjustment, the xvcache lock
 *      must be shared-- we upgrade it here.
 */
struct vcache *afs_FindVCache(struct VenusFid *afid, afs_int32 lockit,
                              afs_int32 locktype, afs_int32 *retry, afs_int32 flag)
{
    register struct vcache *tvc;
    afs_int32 i;

    AFS_STATCNT(afs_FindVCache);

    i = VCHash(afid);
    for (tvc = afs_vhashT[i]; tvc; tvc = tvc->hnext) {
        if (FidMatches(afid, tvc)) {
#ifdef AFS_OSF_ENV
            /* Grab this vnode, possibly reactivating from the free list */
            int vg;
            AFS_GUNLOCK();
            vg = vget((struct vnode *)tvc);
            AFS_GLOCK();
            if (vg)
                continue;
#endif /* AFS_OSF_ENV */
            break;
        }
    }

    /* should I have a read lock on the vnode here? */
    if (tvc) {
        if (retry) *retry = 0;
#if !defined(AFS_OSF_ENV)
        osi_vnhold(tvc, retry); /* already held, above */
        if (retry && *retry)
            return 0;
#endif
        /*
         * only move to front of vlru if we have proper vcache locking
         */
        if (flag & DO_VLRU) {
            if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
                refpanic("FindVC VLRU inconsistent1");
            }
            if (tvc->vlruq.next->prev != &(tvc->vlruq)) {
                refpanic("FindVC VLRU inconsistent1");
            }
            if (tvc->vlruq.prev->next != &(tvc->vlruq)) {
                refpanic("FindVC VLRU inconsistent2");
            }
            UpgradeSToWLock(&afs_xvcache, 26);
            QRemove(&tvc->vlruq);
            QAdd(&VLRU, &tvc->vlruq);
            ConvertWToSLock(&afs_xvcache);
            if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
                refpanic("FindVC VLRU inconsistent1");
            }
            if (tvc->vlruq.next->prev != &(tvc->vlruq)) {
                refpanic("FindVC VLRU inconsistent2");
            }
            if (tvc->vlruq.prev->next != &(tvc->vlruq)) {
                refpanic("FindVC VLRU inconsistent3");
            }
        }
        vcachegen++;
    }

    if (flag & DO_STATS) {
        if (tvc)
            afs_stats_cmperf.vcacheHits++;
        else
            afs_stats_cmperf.vcacheMisses++;
        if (afid->Cell == LOCALCELL)
            afs_stats_cmperf.vlocalAccesses++;
        else
            afs_stats_cmperf.vremoteAccesses++;
    }

#ifdef AFS_LINUX22_ENV
    if (tvc && (tvc->states & CStatd))
        vcache2inode(tvc);      /* mainly to reset i_nlink */
#endif
#ifdef AFS_DARWIN_ENV
    if (tvc)
        osi_VM_Setup(tvc);
#endif
    return tvc;
} /*afs_FindVCache*/
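
/*
 * Illustrative sketch only (not part of the original code): the flag
 * argument to afs_FindVCache is a bit mask.  DO_STATS records a hit or
 * miss in afs_stats_cmperf, and DO_VLRU moves a found entry to the head of
 * the VLRU, which requires afs_xvcache to be held shared so the routine
 * can upgrade it.  The helper name and the lock id 999 are made up.
 */
#if 0
static struct vcache *example_LookupWithLRU(struct VenusFid *afid)
{
    struct vcache *tvc;
    afs_int32 retry = 0;

    ObtainSharedLock(&afs_xvcache, 999);
    tvc = afs_FindVCache(afid, 0, 0, &retry, DO_STATS | DO_VLRU);
    ReleaseSharedLock(&afs_xvcache);
    return tvc;         /* caller eventually drops the ref with afs_PutVCache */
}
#endif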
/*
 * afs_NFSFindVCache
 *
 * Description:
 *      Find a vcache entry given a fid.  Does a wildcard match on what we
 *      have for the fid.  If more than one entry, don't return anything.
 *
 * Parameters:
 *      avcp : Fill in pointer if we found one and only one.
 *      afid : Pointer to the fid whose cache entry we desire.
 *      retry: (SGI-specific) tell the caller to drop the lock on xvcache,
 *             unlock the vnode, and try again.
 *      flags: bit 1 to specify whether to compute hit statistics.  Not
 *             set if FindVCache is called as part of internal bookkeeping.
 *
 * Environment:
 *      Must be called with the afs_xvcache lock at least held at
 *      the read level.  In order to do the VLRU adjustment, the xvcache lock
 *      must be shared-- we upgrade it here.
 *
 * Return value:
 *      number of matches found.
 */

int afs_duplicate_nfs_fids = 0;

afs_int32 afs_NFSFindVCache(avcp, afid, lockit)
    struct vcache **avcp;
    struct VenusFid *afid;
    afs_int32 lockit;
{ /*afs_NFSFindVCache*/
    register struct vcache *tvc;
    afs_int32 i;
    afs_int32 retry = 0;
    afs_int32 count = 0;
    struct vcache *found_tvc = NULL;

    AFS_STATCNT(afs_FindVCache);

  loop:
    ObtainSharedLock(&afs_xvcache, 331);

    i = VCHash(afid);
    for (tvc = afs_vhashT[i]; tvc; tvc = tvc->hnext) {
        /* Match only on what we have.... */
        if (((tvc->fid.Fid.Vnode & 0xffff) == afid->Fid.Vnode)
            && (tvc->fid.Fid.Volume == afid->Fid.Volume)
            && ((tvc->fid.Fid.Unique & 0xffffff) == afid->Fid.Unique)
            && (tvc->fid.Cell == afid->Cell)) {
#ifdef AFS_OSF_ENV
            /* Grab this vnode, possibly reactivating from the free list */
            int vg;
            AFS_GUNLOCK();
            vg = vget((struct vnode *)tvc);
            AFS_GLOCK();
            if (vg) {
                /* This vnode no longer exists. */
                continue;
            }
#endif /* AFS_OSF_ENV */
            count++;
            if (found_tvc) {
                /* Duplicates */
#ifdef AFS_OSF_ENV
                /* Drop our reference counts. */
                vrele((struct vnode *)tvc);
                vrele((struct vnode *)found_tvc);
#endif
                afs_duplicate_nfs_fids++;
                ReleaseSharedLock(&afs_xvcache);
                return count;
            }
            found_tvc = tvc;
        }
    }

    tvc = found_tvc;
    /* should I have a read lock on the vnode here? */
    if (tvc) {
#if defined(AFS_SGI_ENV) && !defined(AFS_SGI53_ENV)
        osi_vnhold(tvc, &retry);
        if (retry) {
            count = 0;
            found_tvc = (struct vcache *)0;
            ReleaseSharedLock(&afs_xvcache);
            spunlock_psema(tvc->v.v_lock, retry, &tvc->v.v_sync, PINOD);
            goto loop;
        }
#else
#if !defined(AFS_OSF_ENV)
        osi_vnhold(tvc, (int *)0);      /* already held, above */
#endif
#endif
        /*
         * We obtained the xvcache lock above.
         */
        if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
            refpanic("FindVC VLRU inconsistent1");
        }
        if (tvc->vlruq.next->prev != &(tvc->vlruq)) {
            refpanic("FindVC VLRU inconsistent1");
        }
        if (tvc->vlruq.prev->next != &(tvc->vlruq)) {
            refpanic("FindVC VLRU inconsistent2");
        }
        UpgradeSToWLock(&afs_xvcache, 568);
        QRemove(&tvc->vlruq);
        QAdd(&VLRU, &tvc->vlruq);
        ConvertWToSLock(&afs_xvcache);
        if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
            refpanic("FindVC VLRU inconsistent1");
        }
        if (tvc->vlruq.next->prev != &(tvc->vlruq)) {
            refpanic("FindVC VLRU inconsistent2");
        }
        if (tvc->vlruq.prev->next != &(tvc->vlruq)) {
            refpanic("FindVC VLRU inconsistent3");
        }
    }
    vcachegen++;

    if (tvc)
        afs_stats_cmperf.vcacheHits++;
    else
        afs_stats_cmperf.vcacheMisses++;
    if (afid->Cell == LOCALCELL)
        afs_stats_cmperf.vlocalAccesses++;
    else
        afs_stats_cmperf.vremoteAccesses++;

    *avcp = tvc;        /* May be null */

    ReleaseSharedLock(&afs_xvcache);
    return (tvc ? 1 : 0);
} /*afs_NFSFindVCache*/


/*
 * afs_vcacheInit
 *
 * Initialize vcache related variables
 */
void afs_vcacheInit(int astatSize)
{
    register struct vcache *tvp;
    int i;

#if defined(AFS_OSF_ENV)
    if (!afs_maxvcount) {
#if defined(AFS_OSF30_ENV)
        afs_maxvcount = max_vnodes / 2; /* limit ourselves to half the total */
#else
        afs_maxvcount = nvnode / 2;     /* limit ourselves to half the total */
#endif
        if (astatSize < afs_maxvcount) {
            afs_maxvcount = astatSize;
        }
    }
#else /* AFS_OSF_ENV */
    freeVCList = (struct vcache *)0;
#endif

    RWLOCK_INIT(&afs_xvcache, "afs_xvcache");
    LOCK_INIT(&afs_xvcb, "afs_xvcb");

#if !defined(AFS_OSF_ENV)
    /* Allocate and thread the struct vcache entries */
    tvp = (struct vcache *)afs_osi_Alloc(astatSize * sizeof(struct vcache));
    memset((char *)tvp, 0, sizeof(struct vcache) * astatSize);

    Initial_freeVCList = tvp;
    freeVCList = &(tvp[0]);
    for (i = 0; i < astatSize - 1; i++) {
        tvp[i].nextfree = &(tvp[i + 1]);
    }
    tvp[astatSize - 1].nextfree = (struct vcache *)0;
#ifdef AFS_AIX32_ENV
    pin((char *)tvp, astatSize * sizeof(struct vcache));        /* XXX */
#endif
#endif

#if defined(AFS_SGI_ENV)
    for (i = 0; i < astatSize; i++) {
        char name[METER_NAMSZ];
        struct vcache *tvc = &tvp[i];

        tvc->v.v_number = ++afsvnumbers;
        tvc->vc_rwlockid = OSI_NO_LOCKID;
        initnsema(&tvc->vc_rwlock, 1, makesname(name, "vrw", tvc->v.v_number));
#ifndef AFS_SGI53_ENV
        initnsema(&tvc->v.v_sync, 0, makesname(name, "vsy", tvc->v.v_number));
#endif
#ifndef AFS_SGI62_ENV
        initnlock(&tvc->v.v_lock, makesname(name, "vlk", tvc->v.v_number));
#endif /* AFS_SGI62_ENV */
    }
#endif

    QInit(&VLRU);
}
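
/*
 * Illustrative note (not part of the original code): on non-OSF platforms
 * afs_vcacheInit leaves the statically allocated entries threaded through
 * their nextfree pointers, e.g. for astatSize == 4:
 *
 *      freeVCList -> tvp[0] -> tvp[1] -> tvp[2] -> tvp[3] -> NULL
 *
 * A consumer (presumably afs_NewVCache) takes an entry by popping the head,
 * roughly as sketched below; the helper name is made up.
 */
#if 0
static struct vcache *example_PopFreeVCache(void)
{
    struct vcache *tvc = freeVCList;    /* assumes caller write-locks afs_xvcache */

    if (tvc) {
        freeVCList = tvc->nextfree;
        tvc->nextfree = (struct vcache *)0;
    }
    return tvc;
}
#endif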
/*
 * shutdown_vcache
 *
 */
void shutdown_vcache(void)
{
    int i;
    struct afs_cbr *tsp, *nsp;

    /*
     * XXX We may potentially miss some of the vcaches because when there are
     * no free vcache entries and all the vcache entries are active ones, we
     * allocate an additional one - admittedly we almost never see that occur.
     */
#if !defined(AFS_OSF_ENV)
    afs_osi_Free(Initial_freeVCList, afs_cacheStats * sizeof(struct vcache));
#endif
#ifdef AFS_AIX32_ENV
    unpin(Initial_freeVCList, afs_cacheStats * sizeof(struct vcache));
#endif

    {
        register struct afs_q *tq, *uq;
        register struct vcache *tvc;

        for (tq = VLRU.prev; tq != &VLRU; tq = uq) {
            tvc = QTOV(tq);
            uq = QPrev(tq);

            if (tvc->mvid) {
                osi_FreeSmallSpace(tvc->mvid);
                tvc->mvid = (struct VenusFid *)0;
            }
#ifdef AFS_AIX_ENV
            aix_gnode_rele((struct vnode *)tvc);
#endif
            if (tvc->linkData) {
                afs_osi_Free(tvc->linkData, strlen(tvc->linkData) + 1);
                tvc->linkData = 0;
            }
        }
        /*
         * Also free the remaining ones in the Cache
         */
        for (i = 0; i < VCSIZE; i++) {
            for (tvc = afs_vhashT[i]; tvc; tvc = tvc->hnext) {
                if (tvc->mvid) {
                    osi_FreeSmallSpace(tvc->mvid);
                    tvc->mvid = (struct VenusFid *)0;
                }
#ifdef AFS_AIX_ENV
                if (tvc->v.v_gnode)
                    afs_osi_Free(tvc->v.v_gnode, sizeof(struct gnode));
#ifdef AFS_AIX32_ENV
                if (tvc->segid) {
                    AFS_GUNLOCK();
                    vms_delete(tvc->segid);
                    AFS_GLOCK();
                    tvc->segid = tvc->vmh = NULL;
                    if (VREFCOUNT(tvc))
                        osi_Panic("flushVcache: vm race");
                }
                if (tvc->credp) {
                    crfree(tvc->credp);
                    tvc->credp = NULL;
                }
#endif
#endif
#if defined(AFS_SUN5_ENV)
                if (tvc->credp) {
                    crfree(tvc->credp);
                    tvc->credp = NULL;
                }
#endif
                if (tvc->linkData) {
                    afs_osi_Free(tvc->linkData, strlen(tvc->linkData) + 1);
                    tvc->linkData = 0;
                }

                afs_FreeAllAxs(&(tvc->Access));
            }
            afs_vhashT[i] = 0;
        }
    }
    /*
     * Free any leftover callback queue
     */
    for (tsp = afs_cbrSpace; tsp; tsp = nsp) {
        nsp = tsp->next;
        afs_osi_Free((char *)tsp, AFS_NCBRS * sizeof(struct afs_cbr));
    }
    afs_cbrSpace = 0;

#if !defined(AFS_OSF_ENV)
    freeVCList = Initial_freeVCList = 0;
#endif

    RWLOCK_INIT(&afs_xvcache, "afs_xvcache");
    LOCK_INIT(&afs_xvcb, "afs_xvcb");
    QInit(&VLRU);
}