 * Copyright 2000, International Business Machines Corporation and others.
 * This software has been released under the terms of the IBM Public
 * License.  For details, see the LICENSE file in the top-level source
 * directory or online at http://www.openafs.org/dl/license10.html
 * AFS_EQ_ATSYS (macro)
#include "../afs/param.h"       /* Should always be first */
#include "../afs/sysincludes.h" /* Standard vendor system headers */
#include "../afs/afsincludes.h" /* AFS-based standard headers */
#include "../afs/afs_stats.h"   /* statistics */
#include "../afs/afs_cbqueue.h"
#include "../afs/nfsclient.h"
#include "../afs/exporter.h"
#include "../afs/afs_osidnlc.h"
 * A few definitions.  This is until we have a proper header file
 * which has prototypes for all functions.
extern struct DirEntry * afs_dir_GetBlob();

extern afs_rwlock_t afs_xvcache;
extern afs_rwlock_t afs_xcbhash;
extern struct afs_exporter *afs_nfsexporter;
extern char *afs_sysname;
extern struct afs_q VLRU;               /* vcache LRU */
#ifdef AFS_LINUX22_ENV
extern struct inode_operations afs_symlink_iops, afs_dir_iops;
#endif

afs_int32 afs_bulkStatsDone;
static int bulkStatCounter = 0;         /* counter for bulk stat seq. numbers */
/* this would be faster if it did the comparison as an int32 word, but would be
 * dependent on byte-order and alignment, and I haven't figured out
 * what "@sys" is in binary... */
#define AFS_EQ_ATSYS(name) (((name)[0]=='@')&&((name)[1]=='s')&&((name)[2]=='y')&&((name)[3]=='s')&&(!(name)[4]))
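/* For illustration: the macro matches the literal string "@sys" and nothing
 * longer or shorter, since it also checks the terminating NUL:
 *   AFS_EQ_ATSYS("@sys")     -> true
 *   AFS_EQ_ATSYS("@sys.old") -> false ((name)[4] != '\0')
 *   AFS_EQ_ATSYS("@sy")      -> false ((name)[3] != 's')
 */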
    register char *s1, *s2;

    register char *a, c; {
    AFS_STATCNT(afs_index);
        if (tc == c) return a;
/* call under write lock, evaluate mvid field from a mt pt.
 * avc is the vnode of the mount point object.
 * advc is the vnode of the containing directory.
 * avolpp is where we return a pointer to the volume named by the mount pt, on success.
 * areq is the identity of the caller.
 *
 * NOTE: this function returns a held volume structure in *avolpp if it returns 0!
 */
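/* A mount point's link data, as read by afs_HandleLink below, has the form
 * "#cellname:volumename." for a regular mount point, or "%volumename." for
 * one that forces the read-write volume.  The names here are illustrative,
 * not from any real cell:
 *   "#athena.mit.edu:user.foo."  -> cross-cell, regular ('#')
 *   "%root.cell."                -> same cell, force RW ('%')
 */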
EvalMountPoint(avc, advc, avolpp, areq)
    register struct vcache *avc;
    struct volume **avolpp;
    struct vcache *advc;                /* the containing dir */
    register struct vrequest *areq;

    struct volume *tvp = 0;
    struct VenusFid tfid;
    char *cpos, *volnamep;
    afs_int32 prefetchRO;               /* 1=>No 2=>Yes */
    afs_int32 mtptCell, assocCell, hac = 0;
    afs_int32 samecell, roname, len;

    AFS_STATCNT(EvalMountPoint);

    if (avc->mvid && (avc->states & CMValid)) return 0; /* done while racing */

    *avolpp = (struct volume *)0;
    code = afs_HandleLink(avc, areq);
    if (code) return code;
    /* Determine which cell and volume the mountpoint goes to */
    type = avc->linkData[0];            /* '#'=>Regular '%'=>RW */
    cpos = afs_index(&avc->linkData[1], ':');   /* if cell name present */
        tcell = afs_GetCellByName(&avc->linkData[1], READ_LOCK);
        volnamep = &avc->linkData[1];
        tcell = afs_GetCell(avc->fid.Cell, READ_LOCK);
    if (!tcell) return ENODEV;

    mtptCell = tcell->cell;             /* The cell for the mountpoint */
        hac = 1;                        /* has associated cell */
        assocCell = tcell->lcellp->cell;        /* The associated cell */
    afs_PutCell(tcell, READ_LOCK);
    /* Is the volume name a "<n>.backup" or "<n>.readonly" name? */
    len = strlen(volnamep);
    roname = ((len > 9) && (strcmp(&volnamep[len - 9], ".readonly") == 0)) ||
             ((len > 7) && (strcmp(&volnamep[len - 7], ".backup") == 0));
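    /* e.g. volnamep = "user.foo.readonly" (an illustrative name, len 17):
     * strcmp(&volnamep[8], ".readonly") matches, so roname is set;
     * a plain "user.foo" leaves roname 0. */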
    /* When we cross a mountpoint, do we stay in the same cell? */
    samecell = (avc->fid.Cell == mtptCell) || (hac && (avc->fid.Cell == assocCell));

    /* Decide whether to prefetch the RO.  Also means we want the RO.
     * If this is a regular mountpoint with a RW volume name and
     * we cross a cell boundary -or- start from a RO volume, then we will
     * want to prefetch the RO volume when we get the RW below.
     */
    if ((type == '#') && !roname && (!samecell || (avc->states & CRO))) {
        prefetchRO = 2;         /* Yes, prefetch the RO */
        prefetchRO = 1;         /* No prefetch of the RO */
    /* Get the volume struct.  Unless this volume name has ".readonly" or
     * ".backup" in it, this will get the volume struct for the RW volume.
     * The RO volume will be prefetched if requested (but not returned).
     */
    tvp = afs_GetVolumeByName(volnamep, mtptCell, prefetchRO, areq, WRITE_LOCK);

    /* If no volume was found in this cell, try the associated linked cell */
    if (!tvp && hac && areq->volumeError) {
        tvp = afs_GetVolumeByName(volnamep, assocCell, prefetchRO, areq, WRITE_LOCK);

    /* Still not found.  If we are looking for the RO, then perhaps the RW
     * doesn't exist?  Try adding ".readonly" to volname and look for that.
     * Don't know why we do this.  Would have still found it in above call - jpm.
     */
    if (!tvp && (prefetchRO == 2)) {
        strcpy(buf, volnamep);
        afs_strcat(buf, ".readonly");

        tvp = afs_GetVolumeByName(buf, mtptCell, 1, areq, WRITE_LOCK);

        /* Try the associated linked cell if failed */
        if (!tvp && hac && areq->volumeError) {
            tvp = afs_GetVolumeByName(buf, assocCell, 1, areq, WRITE_LOCK);

    if (!tvp) return ENOENT;    /* Couldn't find the volume */

    /* Don't cross mountpoint from a BK to a BK volume */
    if ((avc->states & CBackup) && (tvp->states & VBackup)) {
        afs_PutVolume(tvp, WRITE_LOCK);

    /* If we want (prefetched) the RO and it exists, then drop the
     * RW volume and get the RO.  Otherwise, go with the RW.
     */
    if ((prefetchRO == 2) && tvp->roVol) {
        tfid.Fid.Volume = tvp->roVol;   /* remember RO volume */
        tfid.Cell = tvp->cell;
        afs_PutVolume(tvp, WRITE_LOCK); /* release old volume */
        tvp = afs_GetVolume(&tfid, areq, WRITE_LOCK);   /* get the new one */
        if (!tvp) return ENOENT;        /* oops, can't do it */

    avc->mvid = (struct VenusFid *) osi_AllocSmallSpace(sizeof(struct VenusFid));
    avc->mvid->Cell = tvp->cell;
    avc->mvid->Fid.Volume = tvp->volume;
    avc->mvid->Fid.Vnode = 1;
    avc->mvid->Fid.Unique = 1;
    avc->states |= CMValid;

    /* Used to: if the mount point is stored within a backup volume,
     * then we should only update the parent pointer information if
     * there's none already set, so as to avoid updating a volume's ..
     * info with something in an OldFiles directory.
     *
     * Next two lines used to be under this if:
     *
     *   if (!(avc->states & CBackup) || tvp->dotdot.Fid.Volume == 0)
     *
     * Now: update mount point back pointer on every call, so that we handle
     * multiple mount points better.  This way, when du tries to go back
     * via chdir(".."), it will end up exactly where it started, yet
     * cd'ing via a new path to a volume will reset the ".." pointer
     */
    tvp->mtpoint = avc->fid;    /* setup back pointer to mtpoint */
    tvp->dotdot  = advc->fid;
    register char *aname; {

    AFS_STATCNT(ENameOK);
    tlen = strlen(aname);
    if (tlen >= 4 && strcmp(aname+tlen-4, "@sys") == 0) return 0;

Check_AtSys(avc, aname, outb, areq)
    register struct vcache *avc;
    struct vrequest *areq;

    register char *tname;
    register int error = 0, offset = -1;

    for (tname = aname; *tname; tname++)        /* Move to the end of the string */;

    /*
     * If the current string is 4 chars long or more, check to see if the
     * tail end is "@sys".
     */
    if ((tname >= aname + 4) && (AFS_EQ_ATSYS(tname - 4)))
        offset = (tname - 4) - aname;
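    /* e.g. aname = "foo@sys" (7 chars): the loop leaves tname at aname+7,
     * tname-4 points at "@sys", so offset becomes 3, the length of the
     * prefix kept when the suffix is expanded below. */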
        tname = (char *) osi_AllocLargeSpace(AFS_LRALLOCSIZ);
        strncpy(tname, aname, offset);
        if (!afs_nfsexporter)
            strcpy(tname+offset, (afs_sysname ? afs_sysname : SYS_NAME));
            register struct unixuser *au;
            register afs_int32 error;
            au = afs_GetUser(areq->uid, avc->fid.Cell, 0); afs_PutUser(au, 0);
                error = EXP_SYSNAME(au->exporter, (char *)0, tname+offset);
                    strcpy(tname+offset, "@sys");
                strcpy(tname+offset, (afs_sysname ? afs_sysname : SYS_NAME));
char *afs_getsysname(areq, adp)
    register struct vrequest *areq;
    register struct vcache *adp; {
    static char sysname[MAXSYSNAME];
    register struct unixuser *au;
    register afs_int32 error;

    AFS_STATCNT(getsysname);
    /* this whole interface is wrong, it should take a buffer ptr and copy
     * the result into it */
    au = afs_GetUser(areq->uid, adp->fid.Cell, 0);
        error = EXP_SYSNAME(au->exporter, (char *)0, sysname);
        if (error) return "@sys";
    return (afs_sysname == 0 ? SYS_NAME : afs_sysname);
void afs_HandleAtName(aname, aresult, areq, adp)
    register char *aname;
    register char *aresult;
    register struct vrequest *areq;
    register struct vcache *adp; {

    AFS_STATCNT(HandleAtName);
    tlen = strlen(aname);
    if (tlen >= 4 && strcmp(aname+tlen-4, "@sys") == 0) {
        strncpy(aresult, aname, tlen-4);
        strcpy(aresult+tlen-4, afs_getsysname(areq, adp));
    }
    else strcpy(aresult, aname);
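    /* e.g. with a sysname of "sun4x_57" (illustrative), aname "bin@sys"
     * yields aresult "binsun4x_57"; a name without a trailing "@sys" is
     * copied through unchanged. */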
#if (defined(AFS_SGI62_ENV) || defined(AFS_SUN57_64BIT_ENV))
extern int BlobScan(ino64_t *afile, afs_int32 ablob);
#else
extern int BlobScan(afs_int32 *afile, afs_int32 ablob);
#endif
/* called with an unlocked directory and directory cookie.  Areqp
 * describes who is making the call.
 * Scans the next N (about 30, typically) directory entries, and does
 * a bulk stat call to stat them all.
 *
 * Must be very careful when merging in RPC responses, since we don't
 * want to overwrite newer info that was added by a file system mutating
 * call that ran concurrently with our bulk stat call.
 *
 * We do that, as described below, by not merging in our info (always
 * safe to skip the merge) if the status info is valid in the vcache entry.
 *
 * If adapt ever implements the bulk stat RPC, then this code will need to
 * ensure that vcaches created for failed RPC's to older servers have the
struct vcache * BStvc = (struct vcache *) 0;

void afs_DoBulkStat(adp, dirCookie, areqp)
    struct vrequest *areqp;

    int nentries;                       /* # of entries to prefetch */
    int nskip;                          /* # of slots in the LRU queue to skip */
    struct vcache *lruvcp;              /* vcache ptr of our goal pos in LRU queue */
    struct dcache *dcp;                 /* chunk containing the dir block */
    char *statMemp;                     /* status memory block */
    char *cbfMemp;                      /* callback and fid memory block */
    long temp;                          /* temp for holding chunk length, &c. */
    struct AFSFid *fidsp;               /* file IDs we're collecting */
    struct AFSCallBack *cbsp;           /* call back pointers */
    struct AFSCallBack *tcbp;           /* temp callback ptr */
    struct AFSFetchStatus *statsp;      /* file status info */
    struct AFSVolSync volSync;          /* vol sync return info */
    struct vcache *tvcp;                /* temp vcp */
    struct afs_q *tq;                   /* temp queue variable */
    AFSCBFids fidParm;                  /* file ID parm for bulk stat */
    AFSBulkStats statParm;              /* stat info parm for bulk stat */
    int fidIndex;                       /* which file we're stating */
    struct conn *tcp;                   /* conn for call */
    AFSCBs cbParm;                      /* callback parm for bulk stat */
    struct server *hostp = 0;           /* host we got callback from */
    long origEvenCBs;                   /* original # of callbacks for even-fid files */
    long origOddCBs;                    /* original # of callbacks for odd-fid files */
    long origEvenZaps;                  /* original # of recycles for even-fid files */
    long origOddZaps;                   /* original # of recycles for odd-fid files */
    long startTime;                     /* time we started the call,
                                         * for callback expiration base
                                         */
    int statSeqNo;                      /* value stored in the file size to detect races */
    int code;                           /* error code */
    long newIndex;                      /* new index in the dir */
    struct DirEntry *dirEntryp;         /* dir entry we are examining */
    struct VenusFid afid;               /* file ID we are using now */
    struct VenusFid tfid;               /* another temp. file ID */
    afs_int32 retry;                    /* handle low-level SGI MP race conditions */
    long volStates;                     /* flags from vol structure */
    struct volume *volp = 0;            /* volume ptr */
    struct VenusFid dotdot;
    int flagIndex;                      /* First file with bulk fetch flag set */
    /* first compute some basic parameters.  We don't want to prefetch more
     * than a fraction of the cache in any given call, and we want to preserve
     * a portion of the LRU queue in any event, so as to avoid thrashing
     * the entire stat cache (we will at least leave some of it alone).
     * presently don't stat more than 1/8 the cache in any one call. */
    nentries = afs_cacheStats / 8;

    /* don't bother prefetching more than one call's worth of info */
    if (nentries > AFSCBMAX) nentries = AFSCBMAX;

    /* heuristic to make sure that things fit in 4K.  This means that
     * we shouldn't make it any bigger than 47 entries.  I am typically
     * going to keep it a little lower, since we don't want to load
     * too much of the stat cache.
     */
    if (nentries > 30) nentries = 30;
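    /* (Rough arithmetic behind the 47: an AFS 3 AFSFetchStatus is 21 32-bit
     * fields, about 84 bytes, so a 4K block holds floor(4096/84) = 48 of
     * them and 47 leaves a little headroom.  The fid+callback block is
     * roomier: an AFSFid plus an AFSCallBack is 24 bytes, about 170 per 4K.
     * The cap of 30 above stays well inside both.) */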
    /* now, to reduce the stack size, we'll allocate two 4K blocks,
     * one for fids and callbacks, and one for stat info.  We'll set
     * up our pointers to the memory from there, too.
     */
    statMemp = osi_AllocLargeSpace(nentries * sizeof(AFSFetchStatus));
    statsp = (struct AFSFetchStatus *) statMemp;
    cbfMemp = osi_AllocLargeSpace(nentries *
                                  (sizeof(AFSCallBack) + sizeof(AFSFid)));
    fidsp = (AFSFid *) cbfMemp;
    cbsp = (AFSCallBack *) (cbfMemp + nentries * sizeof(AFSFid));
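    /* Sketch of the second block's layout (all fids first, then all
     * callbacks), which is what the pointer arithmetic above sets up:
     *
     *   cbfMemp: [ AFSFid 0 | ... | AFSFid n-1 | AFSCallBack 0 | ... ]
     *             ^fidsp                        ^cbsp
     */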
    /* next, we must iterate over the directory, starting from the specified
     * cookie offset (dirCookie), and counting out nentries file entries.
     * We skip files that already have stat cache entries, since we
     * don't want to bulk stat files that are already in the cache.
     */
    code = afs_VerifyVCache(adp, areqp);

    dcp = afs_GetDCache(adp, 0, areqp, &temp, &temp, 1);

    /* lock the directory cache entry */
    ObtainReadLock(&adp->lock);

    /*
     * Make sure that the data in the cache is current.  There are two
     * cases we need to worry about:
     * 1. The cache data is being fetched by another process.
     * 2. The cache data is no longer valid
     */
    while ((adp->states & CStatd)
           && (dcp->flags & DFFetching)
           && hsame(adp->m.DataVersion, dcp->f.versionNo)) {
        dcp->flags |= DFWaiting;
        ReleaseReadLock(&adp->lock);
        afs_osi_Sleep(&dcp->validPos);
        ObtainReadLock(&adp->lock);
    }
    if (!(adp->states & CStatd)
        || !hsame(adp->m.DataVersion, dcp->f.versionNo)) {
        ReleaseReadLock(&adp->lock);

    /* Generate a sequence number so we can tell whether we should
     * store the attributes when processing the response.  This number is
     * stored in the file size when we set the CBulkFetching bit.  If the
     * CBulkFetching bit is still set and this value hasn't changed, then
     * we know we were the last to set the CBulkFetching bit for this file,
     * and it is safe to set the status information for this file.
     */
    statSeqNo = bulkStatCounter++;
    /* now we have dir data in the cache, so scan the dir page */
    while (1) {                 /* Should probably have some constant bound */
        /* look for the first safe entry to examine in the directory.  BlobScan
         * looks for the first allocated dir entry after the dirCookie slot.
         */
        newIndex = BlobScan(&dcp->f.inode, (dirCookie >> 5));
        if (newIndex == 0) break;

        /* remember the updated directory cookie */
        dirCookie = newIndex << 5;
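        /* Directory entries live in 32-byte "blobs", so a blob index and a
         * byte-offset cookie differ by a factor of 32: the << 5 here turns
         * the blob index back into a byte cookie, and the >> 5 above turned
         * the caller's cookie into a blob slot for BlobScan. */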
        /* get a ptr to the dir entry */
        dirEntryp = (struct DirEntry *)afs_dir_GetBlob(&dcp->f.inode, newIndex);
        if (!dirEntryp) break;

        /* don't copy more than we have room for */
        if (fidIndex >= nentries) {
            DRelease((char *) dirEntryp, 0);

        /* now, if the dir entry looks good, copy it out to our list.  Vnode
         * 0 means deleted, although it should also be free were it deleted.
         */
        if (dirEntryp->fid.vnode != 0) {
            /* don't copy entries we have in our cache.  This check will
             * also make us skip "." and probably "..", unless it has
             * disappeared from the cache since we did our namei call.
             */
            tfid.Cell = adp->fid.Cell;
            tfid.Fid.Volume = adp->fid.Fid.Volume;
            tfid.Fid.Vnode = ntohl(dirEntryp->fid.vnode);
            tfid.Fid.Unique = ntohl(dirEntryp->fid.vunique);
                ObtainWriteLock(&afs_xvcache, 130);
                tvcp = afs_FindVCache(&tfid, 0, 0, &retry, 0 /* no stats | LRU */);
                    ReleaseWriteLock(&afs_xvcache);
            } while (tvcp && retry);
            if (!tvcp) {        /* otherwise, create manually */
                tvcp = afs_NewVCache(&tfid, hostp, 0, 0);
                ObtainWriteLock(&tvcp->lock, 505);
                ReleaseWriteLock(&afs_xvcache);
                afs_RemoveVCB(&tfid);
                ReleaseWriteLock(&tvcp->lock);
                ReleaseWriteLock(&afs_xvcache);
                goto done;      /* can't happen at present, more's the pity */
            /* WARNING: afs_DoBulkStat uses the Length field to store a
             * sequence number for each bulk status request.  Under no
             * circumstances should afs_DoBulkStat store a sequence number
             * if the new length will be ignored when afs_ProcessFS is
             * called with new stats. */
            if (!(tvcp->states & (CStatd|CBulkFetching))
                && (tvcp->execsOrWriters <= 0)
                && !afs_DirtyPages(tvcp)
                && !AFS_VN_MAPPED((vnode_t *)tvcp))
            if (!(tvcp->states & (CStatd|CBulkFetching))
                && (tvcp->execsOrWriters <= 0)
                && !afs_DirtyPages(tvcp))

                /* this entry doesn't exist in the cache, and is not
                 * already being fetched by someone else, so add it to the
                 * list of file IDs to obtain.
                 *
                 * We detect a callback breaking race condition by checking the
                 * CBulkFetching state bit and the value in the file size.
                 * It is safe to set the status only if the CBulkFetching
                 * flag is still set and the value in the file size does
                 * not change.
                 *
                 * Don't fetch status for dirty files.  We need to
                 * preserve the value of the file size.  We could
                 * flush the pages, but it wouldn't be worthwhile.
                 */
                bcopy((char *) &tfid.Fid, (char *)(fidsp+fidIndex),
                      sizeof(struct AFSFid));
                tvcp->states |= CBulkFetching;
                tvcp->m.Length = statSeqNo;
        }       /* if dir vnode has non-zero entry */

        /* move to the next dir entry by adding in the # of entries
         * used by this dir entry.
         */
        temp = afs_dir_NameBlobs(dirEntryp->name) << 5;
        DRelease((char *) dirEntryp, 0);
        if (temp <= 0) break;
    }   /* while loop over all dir entries */

    /* now release the dir lock and prepare to make the bulk RPC */
    ReleaseReadLock(&adp->lock);

    /* release the chunk */

    /* don't make a null call */
    if (fidIndex == 0) goto done;
    /* setup the RPC parm structures */
    fidParm.AFSCBFids_len = fidIndex;
    fidParm.AFSCBFids_val = fidsp;
    statParm.AFSBulkStats_len = fidIndex;
    statParm.AFSBulkStats_val = statsp;
    cbParm.AFSCBs_len = fidIndex;
    cbParm.AFSCBs_val = cbsp;

    /* start the timer; callback expirations are relative to this */
    startTime = osi_Time();

        tcp = afs_Conn(&adp->fid, areqp, SHARED_LOCK);
            hostp = tcp->srvr->server;
            XSTATS_START_TIME(AFS_STATS_FS_RPCIDX_BULKSTATUS);
#ifdef RX_ENABLE_LOCKS
#endif /* RX_ENABLE_LOCKS */
            code = RXAFS_BulkStatus(tcp->id, &fidParm, &statParm, &cbParm,
                                    &volSync);
#ifdef RX_ENABLE_LOCKS
#endif /* RX_ENABLE_LOCKS */
    } while (afs_Analyze(tcp, code, &adp->fid, areqp,
                         AFS_STATS_FS_RPCIDX_BULKSTATUS, SHARED_LOCK, (struct cell *)0));

    /* now, if we didn't get the info, bail out. */
    /* we need vol flags to create the entries properly */
    dotdot.Fid.Volume = 0;
    volp = afs_GetVolume(&adp->fid, areqp, READ_LOCK);
        volStates = volp->states;
        if (volp->dotdot.Fid.Volume != 0)
            dotdot = volp->dotdot;

    /* find the place to merge the info into.  We do this by skipping
     * nskip entries in the LRU queue.  The more we skip, the more
     * we preserve, since the head of the VLRU queue is the most recently
     * referenced.
     */
    nskip = afs_cacheStats / 2;         /* preserved fraction of the cache */
    ObtainReadLock(&afs_xvcache);
        /* actually a serious error, probably should panic.  Probably will
         * panic soon, oh well. */
        ReleaseReadLock(&afs_xvcache);
        afs_warnuser("afs_DoBulkStat: VLRU empty!");
    if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
        refpanic("Bulkstat VLRU inconsistent");
    for (tq = VLRU.next; tq != &VLRU; tq = QNext(tq)) {
        if (--nskip <= 0) break;
        else if (QNext(QPrev(tq)) != tq) {
            refpanic("BulkStat VLRU inconsistent");
    if (tq != &VLRU) lruvcp = QTOV(tq);
    else lruvcp = QTOV(VLRU.next);

    /* now we have to hold this entry, so that it does not get moved
     * into the free list while we're running.  It could still get
     * moved within the lru queue, but hopefully that will be rare; it
     * doesn't hurt nearly as much.
     */
    osi_vnhold(lruvcp, &retry);
    ReleaseReadLock(&afs_xvcache);      /* could be read lock */
    /* otherwise, merge in the info.  We have to be quite careful here,
     * since we need to ensure that we don't merge old info over newer
     * stuff in a stat cache entry.  We're very conservative here: we don't
     * do the merge at all unless we ourselves create the stat cache
     * entry.  That's pretty safe, and should work pretty well, since we
     * typically expect to do the stat cache creation ourselves.
     *
     * We also have to take into account racing token revocations.
     */
    for (i = 0; i < fidIndex; i++) {
        afid.Cell = adp->fid.Cell;
        afid.Fid.Volume = adp->fid.Fid.Volume;
        afid.Fid.Vnode = fidsp[i].Vnode;
        afid.Fid.Unique = fidsp[i].Unique;
            ObtainReadLock(&afs_xvcache);
            tvcp = afs_FindVCache(&afid, 1, 0, &retry, 0 /* !stats&!lru */);
            ReleaseReadLock(&afs_xvcache);
        } while (tvcp && retry);
        /* The entry may no longer exist */

        /* now we have the entry held, but we need to fill it in */
        ObtainWriteLock(&tvcp->lock, 131);

        /* if CBulkFetching is not set, or if the file size no longer
         * matches the value we placed there when we set the CBulkFetching
         * flag, then someone else has done something with this node,
         * and we may not have the latest status information for this
         * file.  Leave the entry alone.
         */
        if (!(tvcp->states & CBulkFetching) || (tvcp->m.Length != statSeqNo)) {
            ReleaseWriteLock(&tvcp->lock);

        /* now copy ".." entry back out of volume structure, if necessary */
        if (tvcp->mvstat == 2 && (dotdot.Fid.Volume != 0)) {
            tvcp->mvid = (struct VenusFid *) osi_AllocSmallSpace(sizeof(struct VenusFid));
            *tvcp->mvid = dotdot;
        ObtainWriteLock(&afs_xvcache, 132);
        if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
            refpanic("Bulkstat VLRU inconsistent2");
        if ((QNext(QPrev(&tvcp->vlruq)) != &tvcp->vlruq)
            || (QPrev(QNext(&tvcp->vlruq)) != &tvcp->vlruq))
            refpanic("Bulkstat VLRU inconsistent4");
        if ((QNext(QPrev(&lruvcp->vlruq)) != &lruvcp->vlruq)
            || (QPrev(QNext(&lruvcp->vlruq)) != &lruvcp->vlruq))
            refpanic("Bulkstat VLRU inconsistent5");

        if (tvcp != lruvcp) {   /* if they are == don't move it, don't corrupt vlru */
            QRemove(&tvcp->vlruq);
            QAdd(&lruvcp->vlruq, &tvcp->vlruq);

        if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
            refpanic("Bulkstat VLRU inconsistent3");
        if ((QNext(QPrev(&tvcp->vlruq)) != &tvcp->vlruq)
            || (QPrev(QNext(&tvcp->vlruq)) != &tvcp->vlruq))
            refpanic("Bulkstat VLRU inconsistent5");
        if ((QNext(QPrev(&lruvcp->vlruq)) != &lruvcp->vlruq)
            || (QPrev(QNext(&lruvcp->vlruq)) != &lruvcp->vlruq))
            refpanic("Bulkstat VLRU inconsistent6");
        ReleaseWriteLock(&afs_xvcache);
        ObtainWriteLock(&afs_xcbhash, 494);

        /* We need to check the flags again.  We may have missed
         * something while we were waiting for a lock.
         */
        if (!(tvcp->states & CBulkFetching) || (tvcp->m.Length != statSeqNo)) {
            ReleaseWriteLock(&tvcp->lock);
            ReleaseWriteLock(&afs_xcbhash);

        /* now merge in the resulting status back into the vnode.
         * We only do this if the entry looks clear.
         */
        afs_ProcessFS(tvcp, &statsp[i], areqp);
#ifdef AFS_LINUX22_ENV
        /* overwrite the ops if it's a directory or symlink. */
        if (vType(tvcp) == VDIR)
            tvcp->v.v_op = &afs_dir_iops;
        else if (vType(tvcp) == VLNK)
            tvcp->v.v_op = &afs_symlink_iops;
#endif /* AFS_LINUX22_ENV */

        /* do some accounting for bulk stats: mark this entry as
         * loaded, so we can tell if we use it before it gets
         * recycled.
         */
        tvcp->states |= CBulkStat;
        tvcp->states &= ~CBulkFetching;
        /* merge in vol info */
        if (volStates & VRO) tvcp->states |= CRO;
        if (volStates & VBackup) tvcp->states |= CBackup;
        if (volStates & VForeign) tvcp->states |= CForeign;

        /* merge in the callback info */
        tvcp->states |= CTruth;

        /* get ptr to the callback we are interested in */
        tcbp = cbsp + i;

        if (tcbp->ExpirationTime != 0) {
            tvcp->cbExpires = tcbp->ExpirationTime + startTime;
            tvcp->callback = hostp;
            tvcp->states |= CStatd;
            afs_QueueCallback(tvcp, CBHash(tcbp->ExpirationTime), volp);
        }
        else if (tvcp->states & CRO) {
            /* ordinary callback on a read-only volume -- AFS 3.2 style */
            tvcp->cbExpires = 3600 + startTime;
            tvcp->callback = hostp;
            tvcp->states |= CStatd;
            afs_QueueCallback(tvcp, CBHash(3600), volp);
        }
        else {
            tvcp->states &= ~(CStatd|CUnique);
            afs_DequeueCallback(tvcp);
            if ((tvcp->states & CForeign) || (vType(tvcp) == VDIR))
                osi_dnlc_purgedp(tvcp); /* if it (could be) a directory */
        }
        ReleaseWriteLock(&afs_xcbhash);

        ReleaseWriteLock(&tvcp->lock);
        /* finally, we're done with the entry */
    }   /* for all files we got back */

    /* finally return the pointer into the LRU queue */
    afs_PutVCache(lruvcp);
    /* Be sure to turn off the CBulkFetching flags */
    for (i = flagIndex; i < fidIndex; i++) {
        afid.Cell = adp->fid.Cell;
        afid.Fid.Volume = adp->fid.Fid.Volume;
        afid.Fid.Vnode = fidsp[i].Vnode;
        afid.Fid.Unique = fidsp[i].Unique;
            ObtainReadLock(&afs_xvcache);
            tvcp = afs_FindVCache(&afid, 1, 0, &retry, 0 /* !stats&!lru */);
            ReleaseReadLock(&afs_xvcache);
        } while (tvcp && retry);
            && (tvcp->states & CBulkFetching)
            && (tvcp->m.Length == statSeqNo)) {
            tvcp->states &= ~CBulkFetching;

    afs_PutVolume(volp, READ_LOCK);

    osi_FreeLargeSpace(statMemp);
    osi_FreeLargeSpace(cbfMemp);
/* was: (AFS_DEC_ENV) || defined(AFS_OSF30_ENV) || defined(AFS_NCR_ENV) */

    struct nameidata *ndp; {
    char aname[MAXNAMLEN+1];            /* XXX */
    struct vcache **avcp = (struct vcache **)&(ndp->ni_vp);
    struct ucred *acred = ndp->ni_cred;
    int wantparent = ndp->ni_nameiop & WANTPARENT;
    int opflag = ndp->ni_nameiop & OPFLAG;
#else /* AFS_OSF_ENV */
#if defined(AFS_SUN5_ENV) || defined(AFS_SGI_ENV)
afs_lookup(OSI_VC_ARG(adp), aname, avcp, pnp, flags, rdir, acred)
    struct pathname *pnp;
afs_lookup(adp, aname, avcp, acred)
    struct vcache **avcp;
    struct AFS_UCRED *acred; {
    struct vrequest treq;
    char *tname = (char *)0;
    register struct vcache *tvc = 0;
    register afs_int32 code;
    int pass = 0, hit = 0;
    extern afs_int32 afs_mariner;       /* Writing activity to log? */
    afs_hyper_t versionNo;

    AFS_STATCNT(afs_lookup);
    ndp->ni_dvp = (struct vnode *)adp;
    bcopy(ndp->ni_ptr, aname, ndp->ni_namelen);
    aname[ndp->ni_namelen] = '\0';
#endif /* AFS_OSF_ENV */

    *avcp = (struct vcache *) 0;        /* Since some callers don't initialize it */

    if (code = afs_InitReq(&treq, acred)) {
    /* lookup the name aname in the appropriate dir, and return a cache entry
       on the resulting fid */

    /*
     * check for, and handle, "@sys" if it's there.  We should be able
     * to avoid the alloc and the strcpy with a little work, but it's
     * not pressing.  If there aren't any remote users (i.e., via the
     * NFS translator), we have a slightly easier job.
     * the faster way to do this is to check for *aname == '@' and if
     * it's there, check for @sys, otherwise, assume there's no @sys
     * then, if the lookup fails, check for .*@sys...
     */
    if (!AFS_EQ_ATSYS(aname)) {
        tname = (char *) osi_AllocLargeSpace(AFS_SMALLOCSIZ);
        if (!afs_nfsexporter)
            strcpy(tname, (afs_sysname ? afs_sysname : SYS_NAME));
            register struct unixuser *au;
            register afs_int32 error;
            au = afs_GetUser(treq.uid, adp->fid.Cell, 0); afs_PutUser(au, 0);
            error = EXP_SYSNAME(au->exporter, (char *)0, tname);
                strcpy(tname, "@sys");
                strcpy(tname, (afs_sysname ? afs_sysname : SYS_NAME));
    /* come back to here if we encounter a non-existent object in a read-only
       volume's directory */

    *avcp = (struct vcache *) 0;        /* Since some callers don't initialize it */

    if (!(adp->states & CStatd)) {
        if (code = afs_VerifyVCache2(adp, &treq))

    /* watch for ".." in a volume root */
    if (adp->mvstat == 2 && tname[0] == '.' && tname[1] == '.' && !tname[2]) {
        /* looking up ".." in root via special hacks */
        if (adp->mvid == (struct VenusFid *) 0 || adp->mvid->Fid.Volume == 0) {
            extern struct vcache *afs_globalVp;
            if (adp == afs_globalVp) {
                struct vnode *rvp = (struct vnode *)adp;
                ndp->ni_vp = rvp->v_vfsp->vfs_vnodecovered;
                ndp->ni_dvp = ndp->ni_vp;

        /* otherwise we have the fid here, so we use it */
        tvc = afs_GetVCache(adp->mvid, &treq, (afs_int32 *)0,
                            (struct vcache *)0, 0);
        afs_Trace3(afs_iclSetp, CM_TRACE_GETVCDOTDOT,
                   ICL_TYPE_FID, adp->mvid, ICL_TYPE_POINTER, tvc,
                   ICL_TYPE_INT32, code);
        code = (tvc ? 0 : ENOENT);
        if (tvc && !tvc->vrefCount) {
        /*printf("LOOKUP GETVCDOTDOT -> %d\n", code);*/
    /* now check the access */
    if (treq.uid != adp->last_looker) {
        if (!afs_AccessOK(adp, PRSFS_LOOKUP, &treq, CHECK_MODE_BITS)) {
            *avcp = (struct vcache *)0;
    else adp->last_looker = treq.uid;

    /* special case lookup of ".".  Can we check for it sooner in this code,
     * for instance, way up before "redo:" ??
     * I'm not fiddling with the LRUQ here, either, perhaps I should, or else
     * invent a lightweight version of GetVCache.
     */
    if (tname[0] == '.' && !tname[1]) { /* special case */
        ObtainReadLock(&afs_xvcache);
        ReleaseReadLock(&afs_xvcache);
        if (adp && !adp->vrefCount) {
    tvc = osi_dnlc_lookup(adp, tname, WRITE_LOCK);
    *avcp = tvc;        /* maybe wasn't initialized, but it is now */
#ifdef AFS_LINUX22_ENV
        if (tvc->mvstat == 2) { /* we don't trust the dnlc for root vcaches */
#else /* non-LINUX */
#endif /* linux22 */

        register struct dcache *tdc;
        afs_int32 dirOffset, dirLen;
        struct VenusFid tfid;

        /* now we have to lookup the next fid */
        tdc = afs_GetDCache(adp, 0, &treq, &dirOffset, &dirLen, 1);
            *avcp = (struct vcache *)0; /* redundant, but harmless */

        /* now we will just call the dir package with the appropriate inode.
           Dirs are always fetched in their entirety for now */
        /* If the first lookup doesn't succeed, maybe it's got @sys in the name */
        ObtainReadLock(&adp->lock);

        /*
         * Make sure that the data in the cache is current.  There are two
         * cases we need to worry about:
         * 1. The cache data is being fetched by another process.
         * 2. The cache data is no longer valid
         */
        while ((adp->states & CStatd)
               && (tdc->flags & DFFetching)
               && hsame(adp->m.DataVersion, tdc->f.versionNo)) {
            tdc->flags |= DFWaiting;
            ReleaseReadLock(&adp->lock);
            afs_osi_Sleep(&tdc->validPos);
            ObtainReadLock(&adp->lock);
        }
        if (!(adp->states & CStatd)
            || !hsame(adp->m.DataVersion, tdc->f.versionNo)) {
            ReleaseReadLock(&adp->lock);

        /* Save the version number for when we call osi_dnlc_enter */
        hset(versionNo, tdc->f.versionNo);

        theDir = tdc->f.inode;
        code = afs_dir_LookupOffset(&theDir, tname, &tfid.Fid, &dirCookie);
        if (code == ENOENT && tname == aname) {
            len = strlen(aname);
            if (len >= 4 && AFS_EQ_ATSYS(aname+len-4)) {
                tname = (char *) osi_AllocLargeSpace(AFS_LRALLOCSIZ);
                afs_HandleAtName(aname, tname, &treq, adp);
                code = afs_dir_LookupOffset(&theDir, tname, &tfid.Fid, &dirCookie);
        ReleaseReadLock(&adp->lock);

        /* new fid has same cell and volume */
        tfid.Cell = adp->fid.Cell;
        tfid.Fid.Volume = adp->fid.Fid.Volume;
        afs_Trace4(afs_iclSetp, CM_TRACE_LOOKUP, ICL_TYPE_POINTER, adp,
                   ICL_TYPE_STRING, tname,
                   ICL_TYPE_FID, &tfid, ICL_TYPE_INT32, code);

        if (code != ENOENT) {
            printf("LOOKUP dirLookupOff -> %d\n", code);
        /* prefetch some entries, if the dir is currently open.  The variable
         * dirCookie tells us where to start prefetching from.
         */
        if (AFSDOBULK && adp->opens > 0 && !(adp->states & CForeign)) {
            /* if the entry is not in the cache, or is in the cache,
             * but hasn't been statd, then do a bulk stat operation.
             */
                ObtainReadLock(&afs_xvcache);
                tvc = afs_FindVCache(&tfid, 1, 0, &retry, 0 /* !stats,!lru */);
                ReleaseReadLock(&afs_xvcache);
            } while (tvc && retry);

            if (!tvc || !(tvc->states & CStatd)) {
                afs_DoBulkStat(adp, dirCookie, &treq);

            /* if the vcache isn't usable, release it */
            if (tvc && !(tvc->states & CStatd)) {
                tvc = (struct vcache *) 0;
        }
        else tvc = (struct vcache *) 0;
        /* now get the status info, if we don't already have it */
        /* This is kind of weird, but we might wind up accidentally calling
         * RXAFS_Lookup because we happened upon a file which legitimately
         * has a 0 uniquifier.  That is the result of allowing unique to wrap
         * to 0.  This was fixed in AFS 3.4.  For CForeign, Unique == 0 means
         * that the file has not yet been looked up.
         */
            afs_int32 cached = 0;
            if (!tfid.Fid.Unique && (adp->states & CForeign)) {
                tvc = afs_LookupVCache(&tfid, &treq, &cached, WRITE_LOCK,
            if (!tvc) {         /* lookup failed or wasn't called */
                tvc = afs_GetVCache(&tfid, &treq, &cached, (struct vcache *)0,
        }       /* sub-block just to reduce stack usage */
            if (adp->states & CForeign)
                tvc->states |= CForeign;
            tvc->parentVnode = adp->fid.Fid.Vnode;
            tvc->parentUnique = adp->fid.Fid.Unique;
            tvc->states &= ~CBulkStat;
            if (tvc->mvstat == 1) {
                /* a mt point, possibly unevaluated */
                struct volume *tvolp;

                ObtainWriteLock(&tvc->lock, 133);
                code = EvalMountPoint(tvc, adp, &tvolp, &treq);
                ReleaseWriteLock(&tvc->lock);

                /* next, we want to continue using the target of the mt point */
                if (tvc->mvid && (tvc->states & CMValid)) {
                    /* now lookup target, to set .. pointer */
                    afs_Trace2(afs_iclSetp, CM_TRACE_LOOKUP1,
                               ICL_TYPE_POINTER, tvc, ICL_TYPE_FID, &tvc->fid);
                    uvc = tvc;  /* remember for later */

                    if (tvolp && (tvolp->states & VForeign)) {
                        /* XXXX tvolp has ref cnt on but not locked! XXX */
                        tvc = afs_GetRootVCache(tvc->mvid, &treq, (afs_int32 *)0, tvolp, WRITE_LOCK);
                        tvc = afs_GetVCache(tvc->mvid, &treq, (afs_int32 *)0,
                                            (struct vcache *)0, WRITE_LOCK);
                    afs_PutVCache(uvc, WRITE_LOCK);     /* we're done with it */

                        afs_PutVolume(tvolp, WRITE_LOCK);
            /* now, if we came via a new mt pt (say because of a new
             * release of a R/O volume), we must reevaluate the ..
             * ptr to point back to the appropriate place */
                ObtainWriteLock(&tvc->lock, 134);
                if (tvc->mvid == (struct VenusFid *) 0) {
                    tvc->mvid = (struct VenusFid *) osi_AllocSmallSpace(sizeof(struct VenusFid));
                /* setup backpointer */
                *tvc->mvid = tvolp->dotdot;
                ReleaseWriteLock(&tvc->lock);
                afs_PutVolume(tvolp, WRITE_LOCK);

            afs_PutVCache(tvc, WRITE_LOCK);
            if (tvolp) afs_PutVolume(tvolp, WRITE_LOCK);
    if (tvc && !tvc->vrefCount) {

    /* if we get here, we found something in a directory that couldn't
       be located (a Multics "connection failure").  If the volume is
       read-only, we try flushing this entry from the cache and trying
       again. */
    tv = afs_GetVolume(&adp->fid, &treq, READ_LOCK);
        if (tv->states & VRO) {
            pass = 1;           /* try this *once* */
            ObtainWriteLock(&afs_xcbhash, 495);
            afs_DequeueCallback(adp);
            /* re-stat to get later version */
            adp->states &= ~CStatd;
            ReleaseWriteLock(&afs_xcbhash);
            osi_dnlc_purgedp(adp);
            afs_PutVolume(tv, READ_LOCK);
        afs_PutVolume(tv, READ_LOCK);
    /* put the network buffer back, if need be */
    if (tname != aname && tname) osi_FreeLargeSpace(tname);

    /* Handle RENAME; only need to check rename "." */
    if (opflag == RENAME && wantparent && *ndp->ni_next == 0) {
        if (!FidCmp(&(tvc->fid), &(adp->fid))) {
            afs_PutVCache(*avcp, WRITE_LOCK);
            return afs_CheckCode(EISDIR, &treq, 18);
#endif /* AFS_OSF_ENV */

        afs_AddMarinerName(aname, tvc);
        osi_dnlc_enter(adp, aname, tvc, &versionNo);

#ifdef AFS_LINUX20_ENV
        /* So the Linux inode cache is up to date. */
        code = afs_VerifyVCache(tvc, &treq);
        return 0;       /* can't have been any errors if hit and !code */

    code = afs_CheckCode(code, &treq, 19);

    /* If there is an error, make sure *avcp is null.
     * Alphas panic otherwise - defect 10719.
     */
    *avcp = (struct vcache *)0;