2 * Copyright 2000, International Business Machines Corporation and others.
5 * This software has been released under the terms of the IBM Public
6 * License. For details, see the LICENSE file in the top-level source
7 * directory or online at http://www.openafs.org/dl/license10.html
18 * AFS_EQ_ATSYS (macro)
22 #include "../afs/param.h" /* Should be always first */
23 #include "../afs/sysincludes.h" /* Standard vendor system headers */
24 #include "../afs/afsincludes.h" /* Afs-based standard headers */
25 #include "../afs/afs_stats.h" /* statistics */
26 #include "../afs/afs_cbqueue.h"
27 #include "../afs/nfsclient.h"
28 #include "../afs/exporter.h"
29 #include "../afs/afs_osidnlc.h"
33 * A few definitions. This is until we have a proper header file
34 * which has prototypes for all functions
37 extern struct DirEntry * afs_dir_GetBlob();
39 extern afs_rwlock_t afs_xvcache;
40 extern afs_rwlock_t afs_xcbhash;
41 extern struct afs_exporter *afs_nfsexporter;
42 extern char *afs_sysname;
43 extern struct afs_q VLRU; /*vcache LRU*/
44 #ifdef AFS_LINUX22_ENV
45 extern struct inode_operations afs_symlink_iops, afs_dir_iops;
49 afs_int32 afs_bulkStatsDone;
50 static int bulkStatCounter = 0; /* counter for bulk stat seq. numbers */
53 /* this would be faster if it did comparison as int32word, but would be
54 * dependent on byte-order and alignment, and I haven't figured out
55 * what "@sys" is in binary... */
56 #define AFS_EQ_ATSYS(name) (((name)[0]=='@')&&((name)[1]=='s')&&((name)[2]=='y')&&((name)[3]=='s')&&(!(name)[4]))
60 register char *s1, *s2;
76 register char *a, c; {
78 AFS_STATCNT(afs_index);
80 if (tc == c) return a;
86 /* call under write lock, evaluate mvid field from a mt pt.
87 * avc is the vnode of the mount point object.
88 * advc is the vnode of the containing directory
89 * avolpp is where we return a pointer to the volume named by the mount pt, if success
90 * areq is the identity of the caller.
92 * NOTE: this function returns a held volume structure in *volpp if it returns 0!
94 EvalMountPoint(avc, advc, avolpp, areq)
95 register struct vcache *avc;
96 struct volume **avolpp;
97 struct vcache *advc; /* the containing dir */
98 register struct vrequest *areq;
101 struct volume *tvp = 0;
102 struct VenusFid tfid;
104 char *cpos, *volnamep;
106 afs_int32 prefetchRO; /* 1=>No 2=>Yes */
107 afs_int32 mtptCell, assocCell, hac=0;
108 afs_int32 samecell, roname, len;
110 AFS_STATCNT(EvalMountPoint);
112 if (avc->mvid && (avc->states & CMValid)) return 0; /* done while racing */
114 *avolpp = (struct volume *)0;
115 code = afs_HandleLink(avc, areq);
116 if (code) return code;
118 /* Determine which cell and volume the mountpoint goes to */
119 type = avc->linkData[0]; /* '#'=>Regular '%'=>RW */
120 cpos = afs_index(&avc->linkData[1], ':'); /* if cell name present */
124 tcell = afs_GetCellByName(&avc->linkData[1], READ_LOCK);
127 volnamep = &avc->linkData[1];
128 tcell = afs_GetCell(avc->fid.Cell, READ_LOCK);
130 if (!tcell) return ENODEV;
132 mtptCell = tcell->cell; /* The cell for the mountpoint */
134 hac = 1; /* has associated cell */
135 assocCell = tcell->lcellp->cell; /* The associated cell */
137 afs_PutCell(tcell, READ_LOCK);
139 /* Is volume name a "<n>.backup" or "<n>.readonly" name */
140 len = strlen(volnamep);
141 roname = ((len > 9) && (strcmp(&volnamep[len - 9],".readonly") == 0)) ||
142 ((len > 7) && (strcmp(&volnamep[len - 7],".backup") == 0));
144 /* When we cross mountpoint, do we stay in the same cell */
145 samecell = (avc->fid.Cell == mtptCell) || (hac && (avc->fid.Cell == assocCell));
147 /* Decide whether to prefetch the RO. Also means we want the RO.
148 * If this is a regular mountpoint with a RW volume name and
149 * we cross a cell boundary -or- start from a RO volume, then we will
150 * want to prefetch the RO volume when we get the RW below.
152 if ( (type == '#') && !roname && (!samecell || (avc->states & CRO)) ) {
153 prefetchRO = 2; /* Yes, prefetch the RO */
155 prefetchRO = 1; /* No prefetch of the RO */
158 /* Get the volume struct. Unless this volume name has ".readonly" or
159 * ".backup" in it, this will get the volume struct for the RW volume.
160 * The RO volume will be prefetched if requested (but not returned).
162 tvp = afs_GetVolumeByName(volnamep, mtptCell, prefetchRO, areq, WRITE_LOCK);
164 /* If no volume was found in this cell, try the associated linked cell */
165 if (!tvp && hac && areq->volumeError) {
166 tvp = afs_GetVolumeByName(volnamep, assocCell, prefetchRO, areq, WRITE_LOCK);
169 /* Still not found. If we are looking for the RO, then perhaps the RW
170 * doesn't exist? Try adding ".readonly" to volname and look for that.
171 * Don't know why we do this. Would have still found it in above call - jpm.
173 if (!tvp && (prefetchRO == 2)) {
174 strcpy(buf, volnamep);
175 afs_strcat(buf, ".readonly");
177 tvp = afs_GetVolumeByName(buf, mtptCell, 1, areq, WRITE_LOCK);
179 /* Try the associated linked cell if failed */
180 if (!tvp && hac && areq->volumeError) {
181 tvp = afs_GetVolumeByName(buf, assocCell, 1, areq, WRITE_LOCK);
185 if (!tvp) return ENOENT; /* Couldn't find the volume */
187 /* Don't cross mountpoint from a BK to a BK volume */
188 if ((avc->states & CBackup) && (tvp->states & VBackup)) {
189 afs_PutVolume(tvp, WRITE_LOCK);
193 /* If we want (prefetched) the RO and it exists, then drop the
194 * RW volume and get the RO. Otherwise, go with the RW.
196 if ((prefetchRO == 2) && tvp->roVol) {
197 tfid.Fid.Volume = tvp->roVol; /* remember RO volume */
198 tfid.Cell = tvp->cell;
199 afs_PutVolume(tvp, WRITE_LOCK); /* release old volume */
200 tvp = afs_GetVolume(&tfid, areq, WRITE_LOCK); /* get the new one */
201 if (!tvp) return ENOENT; /* oops, can't do it */
205 avc->mvid = (struct VenusFid *) osi_AllocSmallSpace(sizeof(struct VenusFid));
206 avc->mvid->Cell = tvp->cell;
207 avc->mvid->Fid.Volume = tvp->volume;
208 avc->mvid->Fid.Vnode = 1;
209 avc->mvid->Fid.Unique = 1;
210 avc->states |= CMValid;
212 /* Used to: if the mount point is stored within a backup volume,
213 * then we should only update the parent pointer information if
214 * there's none already set, so as to avoid updating a volume's ..
215 * info with something in an OldFiles directory.
217 * Next two lines used to be under this if:
219 * if (!(avc->states & CBackup) || tvp->dotdot.Fid.Volume == 0)
221 * Now: update mount point back pointer on every call, so that we handle
222 * multiple mount points better. This way, when du tries to go back
223 * via chdir(".."), it will end up exactly where it started, yet
224 * cd'ing via a new path to a volume will reset the ".." pointer
227 tvp->mtpoint = avc->fid; /* setup back pointer to mtpoint */
228 tvp->dotdot = advc->fid;
235 register char *aname; {
239 AFS_STATCNT(ENameOK);
240 tlen = strlen(aname);
241 if (tlen >= 4 && strcmp(aname+tlen-4, "@sys") == 0) return 0;
245 Check_AtSys(avc, aname, outb, areq)
246 register struct vcache *avc;
248 struct vrequest *areq;
250 register char *tname;
251 register int error = 0, offset = -1;
253 for (tname=aname; *tname; tname++) /*Move to the end of the string*/;
256 * If the current string is 4 chars long or more, check to see if the
257 * tail end is "@sys".
259 if ((tname >= aname + 4) && (AFS_EQ_ATSYS(tname-4)))
260 offset = (tname - 4) - aname;
264 tname = (char *) osi_AllocLargeSpace(AFS_LRALLOCSIZ);
266 strncpy(tname, aname, offset);
267 if (!afs_nfsexporter)
268 strcpy(tname+offset, (afs_sysname ? afs_sysname : SYS_NAME ));
270 register struct unixuser *au;
271 register afs_int32 error;
272 au = afs_GetUser(areq->uid, avc->fid.Cell, 0); afs_PutUser(au, 0);
274 error = EXP_SYSNAME(au->exporter, (char *)0, tname+offset);
276 strcpy(tname+offset, "@sys");
278 strcpy(tname+offset, (afs_sysname ? afs_sysname : SYS_NAME ));
288 char *afs_getsysname(areq, adp)
289 register struct vrequest *areq;
290 register struct vcache *adp; {
291 static char sysname[MAXSYSNAME];
292 register struct unixuser *au;
293 register afs_int32 error;
295 AFS_STATCNT(getsysname);
296 /* this whole interface is wrong, it should take a buffer ptr and copy
299 au = afs_GetUser(areq->uid, adp->fid.Cell, 0);
302 error = EXP_SYSNAME(au->exporter, (char *)0, sysname);
303 if (error) return "@sys";
306 return (afs_sysname == 0? SYS_NAME : afs_sysname);
310 void afs_HandleAtName(aname, aresult, areq, adp)
311 register char *aname;
312 register char *aresult;
313 register struct vrequest *areq;
314 register struct vcache *adp; {
316 AFS_STATCNT(HandleAtName);
317 tlen = strlen(aname);
318 if (tlen >= 4 && strcmp(aname+tlen-4, "@sys")==0) {
319 strncpy(aresult, aname, tlen-4);
320 strcpy(aresult+tlen-4, afs_getsysname(areq, adp));
322 else strcpy(aresult, aname);
325 #if (defined(AFS_SGI62_ENV) || defined(AFS_SUN57_64BIT_ENV))
326 extern int BlobScan(ino64_t *afile, afs_int32 ablob);
328 extern int BlobScan(afs_int32 *afile, afs_int32 ablob);
332 /* called with an unlocked directory and directory cookie. Areqp
333 * describes who is making the call.
334 * Scans the next N (about 30, typically) directory entries, and does
335 * a bulk stat call to stat them all.
337 * Must be very careful when merging in RPC responses, since we don't
338 * want to overwrite newer info that was added by a file system mutating
339 * call that ran concurrently with our bulk stat call.
341 * We do that, as described below, by not merging in our info (always
342 * safe to skip the merge) if the status info is valid in the vcache entry.
344 * If adapt ever implements the bulk stat RPC, then this code will need to
345 * ensure that vcaches created for failed RPC's to older servers have the
348 struct vcache * BStvc = (struct vcache *) 0;
349 void afs_DoBulkStat(adp, dirCookie, areqp)
352 struct vrequest *areqp;
354 int nentries; /* # of entries to prefetch */
355 int nskip; /* # of slots in the LRU queue to skip */
356 struct vcache *lruvcp; /* vcache ptr of our goal pos in LRU queue */
357 struct dcache *dcp; /* chunk containing the dir block */
358 char *statMemp; /* status memory block */
359 char *cbfMemp; /* callback and fid memory block */
360 long temp; /* temp for holding chunk length, &c. */
361 struct AFSFid *fidsp; /* file IDs were collecting */
362 struct AFSCallBack *cbsp; /* call back pointers */
363 struct AFSCallBack *tcbp; /* temp callback ptr */
364 struct AFSFetchStatus *statsp; /* file status info */
365 struct AFSVolSync volSync; /* vol sync return info */
366 struct vcache *tvcp; /* temp vcp */
367 struct afs_q *tq; /* temp queue variable */
368 AFSCBFids fidParm; /* file ID parm for bulk stat */
369 AFSBulkStats statParm; /* stat info parm for bulk stat */
370 int fidIndex; /* which file were stating */
371 struct conn *tcp; /* conn for call */
372 AFSCBs cbParm; /* callback parm for bulk stat */
373 struct server *hostp = 0; /* host we got callback from */
374 long origEvenCBs; /* original # of callbacks for even-fid files */
375 long origOddCBs; /* original # of callbacks for odd-fid files */
376 long origEvenZaps; /* original # of recycles for even-fid files */
377 long origOddZaps; /* original # of recycles for odd-fid files */
378 long startTime; /* time we started the call,
379 * for callback expiration base
381 int statSeqNo; /* Valued of file size to detect races */
382 int code; /* error code */
383 long newIndex; /* new index in the dir */
384 struct DirEntry *dirEntryp; /* dir entry we are examining */
386 struct VenusFid afid; /* file ID we are using now */
387 struct VenusFid tfid; /* another temp. file ID */
388 afs_int32 retry; /* handle low-level SGI MP race conditions */
389 long volStates; /* flags from vol structure */
390 struct volume *volp=0; /* volume ptr */
391 struct VenusFid dotdot;
392 int flagIndex; /* First file with bulk fetch flag set */
395 /* first compute some basic parameters. We don't want to prefetch more
396 * than a fraction of the cache in any given call, and we want to preserve
397 * a portion of the LRU queue in any event, so as to avoid thrashing
398 * the entire stat cache (we will at least leave some of it alone).
399 * Presently we don't stat more than 1/8 of the cache in any one call. */
400 nentries = afs_cacheStats / 8;
402 /* don't bother prefetching more than one call's worth of info */
403 if (nentries > AFSCBMAX) nentries = AFSCBMAX;
405 /* heuristic to make sure that things fit in 4K. This means that
406 * we shouldn't make it any bigger than 47 entries. I am typically
407 * going to keep it a little lower, since we don't want to load
408 * too much of the stat cache.
410 if (nentries > 30) nentries = 30;
412 /* now, to reduce the stack size, we'll allocate two 4K blocks,
413 * one for fids and callbacks, and one for stat info. We'll set
414 * up our pointers to the memory from there, too.
416 statMemp = osi_AllocLargeSpace(nentries * sizeof(AFSFetchStatus));
417 statsp = (struct AFSFetchStatus *) statMemp;
418 cbfMemp = osi_AllocLargeSpace(nentries *
419 (sizeof(AFSCallBack) + sizeof(AFSFid)));
420 fidsp = (AFSFid *) cbfMemp;
421 cbsp = (AFSCallBack *) (cbfMemp + nentries * sizeof(AFSFid));
423 /* next, we must iterate over the directory, starting from the specified
424 * cookie offset (dirCookie), and counting out nentries file entries.
425 * We skip files that already have stat cache entries, since we
426 * don't want to bulk stat files that are already in the cache.
429 code = afs_VerifyVCache(adp, areqp);
432 dcp = afs_GetDCache(adp, 0, areqp, &temp, &temp, 1);
438 /* lock the directory cache entry */
439 ObtainReadLock(&adp->lock);
442 * Make sure that the data in the cache is current. There are two
443 * cases we need to worry about:
444 * 1. The cache data is being fetched by another process.
445 * 2. The cache data is no longer valid
447 while ((adp->states & CStatd)
448 && (dcp->flags & DFFetching)
449 && hsame(adp->m.DataVersion, dcp->f.versionNo)) {
450 dcp->flags |= DFWaiting;
451 ReleaseReadLock(&adp->lock);
452 afs_osi_Sleep(&dcp->validPos);
453 ObtainReadLock(&adp->lock);
455 if (!(adp->states & CStatd)
456 || !hsame(adp->m.DataVersion, dcp->f.versionNo)) {
457 ReleaseReadLock(&adp->lock);
462 /* Generate a sequence number so we can tell whether we should
463 * store the attributes when processing the response. This number is
464 * stored in the file size when we set the CBulkFetching bit. If the
465 * CBulkFetching is still set and this value hasn't changed, then
466 * we know we were the last to set CBulkFetching bit for this file,
467 * and it is safe to set the status information for this file.
469 statSeqNo = bulkStatCounter++;
471 /* now we have dir data in the cache, so scan the dir page */
474 while (1) { /* Should probably have some constant bound */
475 /* look for the first safe entry to examine in the directory. BlobScan
476 * looks for the 1st allocated dir entry after the dirCookie slot.
478 newIndex = BlobScan(&dcp->f.inode, (dirCookie>>5));
479 if (newIndex == 0) break;
481 /* remember the updated directory cookie */
482 dirCookie = newIndex << 5;
484 /* get a ptr to the dir entry */
485 dirEntryp =(struct DirEntry *)afs_dir_GetBlob(&dcp->f.inode, newIndex);
486 if (!dirEntryp) break;
488 /* don't copy more than we have room for */
489 if (fidIndex >= nentries) {
490 DRelease((char *) dirEntryp, 0);
494 /* now, if the dir entry looks good, copy it out to our list. Vnode
495 * 0 means deleted, although it should also be free were it deleted.
497 if (dirEntryp->fid.vnode != 0) {
498 /* don't copy entries we have in our cache. This check will
499 * also make us skip "." and probably "..", unless it has
500 * disappeared from the cache since we did our namei call.
502 tfid.Cell = adp->fid.Cell;
503 tfid.Fid.Volume = adp->fid.Fid.Volume;
504 tfid.Fid.Vnode = ntohl(dirEntryp->fid.vnode);
505 tfid.Fid.Unique = ntohl(dirEntryp->fid.vunique);
508 ObtainWriteLock(&afs_xvcache, 130);
509 tvcp = afs_FindVCache(&tfid, 0, 0, &retry, 0 /* no stats | LRU */);
511 ReleaseWriteLock(&afs_xvcache);
514 } while (tvcp && retry);
515 if (!tvcp) { /* otherwise, create manually */
516 tvcp = afs_NewVCache(&tfid, hostp, 0, 0);
517 ObtainWriteLock(&tvcp->lock, 505);
518 ReleaseWriteLock(&afs_xvcache);
519 afs_RemoveVCB(&tfid);
520 ReleaseWriteLock(&tvcp->lock);
522 ReleaseWriteLock(&afs_xvcache);
525 goto done; /* can't happen at present, more's the pity */
527 /* WARNING: afs_DoBulkStat uses the Length field to store a
528 * sequence number for each bulk status request. Under no
529 * circumstances should afs_DoBulkStat store a sequence number
530 * if the new length will be ignored when afs_ProcessFS is
531 * called with new stats. */
533 if (!(tvcp->states & (CStatd|CBulkFetching))
534 && (tvcp->execsOrWriters <= 0)
535 && !afs_DirtyPages(tvcp)
536 && !AFS_VN_MAPPED((vnode_t*)tvcp))
538 if (!(tvcp->states & (CStatd|CBulkFetching))
539 && (tvcp->execsOrWriters <= 0)
540 && !afs_DirtyPages(tvcp))
544 /* this entry doesn't exist in the cache, and is not
545 * already being fetched by someone else, so add it to the
546 * list of file IDs to obtain.
548 * We detect a callback breaking race condition by checking the
549 * CBulkFetching state bit and the value in the file size.
550 * It is safe to set the status only if the CBulkFetching
551 * flag is still set and the value in the file size does
554 * Don't fetch status for dirty files. We need to
555 * preserve the value of the file size. We could
556 * flush the pages, but it wouldn't be worthwhile.
558 bcopy((char *) &tfid.Fid, (char *)(fidsp+fidIndex),
560 tvcp->states |= CBulkFetching;
561 tvcp->m.Length = statSeqNo;
565 } /* if dir vnode has non-zero entry */
567 /* move to the next dir entry by adding in the # of entries
568 * used by this dir entry.
570 temp = afs_dir_NameBlobs(dirEntryp->name) << 5;
571 DRelease((char *) dirEntryp, 0);
572 if (temp <= 0) break;
574 } /* while loop over all dir entries */
576 /* now release the dir lock and prepare to make the bulk RPC */
577 ReleaseReadLock(&adp->lock);
579 /* release the chunk */
582 /* don't make a null call */
583 if (fidIndex == 0) goto done;
586 /* setup the RPC parm structures */
587 fidParm.AFSCBFids_len = fidIndex;
588 fidParm.AFSCBFids_val = fidsp;
589 statParm.AFSBulkStats_len = fidIndex;
590 statParm.AFSBulkStats_val = statsp;
591 cbParm.AFSCBs_len = fidIndex;
592 cbParm.AFSCBs_val = cbsp;
594 /* start the timer; callback expirations are relative to this */
595 startTime = osi_Time();
597 tcp = afs_Conn(&adp->fid, areqp, SHARED_LOCK);
599 hostp = tcp->srvr->server;
600 XSTATS_START_TIME(AFS_STATS_FS_RPCIDX_BULKSTATUS);
601 #ifdef RX_ENABLE_LOCKS
603 #endif /* RX_ENABLE_LOCKS */
604 code = RXAFS_BulkStatus(tcp->id, &fidParm, &statParm, &cbParm,
606 #ifdef RX_ENABLE_LOCKS
608 #endif /* RX_ENABLE_LOCKS */
612 } while (afs_Analyze(tcp, code, &adp->fid, areqp,
613 AFS_STATS_FS_RPCIDX_BULKSTATUS, SHARED_LOCK, (struct cell *)0));
615 /* now, if we didn't get the info, bail out. */
618 /* we need vol flags to create the entries properly */
619 dotdot.Fid.Volume = 0;
620 volp = afs_GetVolume(&adp->fid, areqp, READ_LOCK);
622 volStates = volp->states;
623 if (volp->dotdot.Fid.Volume != 0)
624 dotdot = volp->dotdot;
628 /* find the place to merge the info into. We do this by skipping
629 * nskip entries in the LRU queue. The more we skip, the more
630 * we preserve, since the head of the VLRU queue is the most recently
634 nskip = afs_cacheStats / 2; /* preserved fraction of the cache */
635 ObtainReadLock(&afs_xvcache);
637 /* actually a serious error, probably should panic. Probably will
638 * panic soon, oh well. */
639 ReleaseReadLock(&afs_xvcache);
642 if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
643 refpanic ("Bulkstat VLRU inconsistent");
645 for(tq = VLRU.next; tq != &VLRU; tq = QNext(tq)) {
646 if (--nskip <= 0) break;
647 else if (QNext(QPrev(tq)) != tq) {
649 refpanic ("BulkStat VLRU inconsistent");
652 if (tq != &VLRU) lruvcp = QTOV(tq);
653 else lruvcp = QTOV(VLRU.next);
655 /* now we have to hold this entry, so that it does not get moved
656 * into the free list while we're running. It could still get
657 * moved within the lru queue, but hopefully that will be rare; it
658 * doesn't hurt nearly as much.
661 osi_vnhold(lruvcp, &retry);
662 ReleaseReadLock(&afs_xvcache); /* could be read lock */
666 /* otherwise, merge in the info. We have to be quite careful here,
667 * since we need to ensure that we don't merge old info over newer
668 * stuff in a stat cache entry. We're very conservative here: we don't
669 * do the merge at all unless we ourselves create the stat cache
670 * entry. That's pretty safe, and should work pretty well, since we
671 * typically expect to do the stat cache creation ourselves.
673 * We also have to take into account racing token revocations.
675 for(i=0; i<fidIndex; i++) {
676 afid.Cell = adp->fid.Cell;
677 afid.Fid.Volume = adp->fid.Fid.Volume;
678 afid.Fid.Vnode = fidsp[i].Vnode;
679 afid.Fid.Unique = fidsp[i].Unique;
682 ObtainReadLock(&afs_xvcache);
683 tvcp = afs_FindVCache(&afid, 1, 0, &retry, 0/* !stats&!lru*/);
684 ReleaseReadLock(&afs_xvcache);
685 } while (tvcp && retry);
687 /* The entry may no longer exist */
692 /* now we have the entry held, but we need to fill it in */
693 ObtainWriteLock(&tvcp->lock,131);
695 /* if CBulkFetching is not set, or if the file size no longer
696 * matches the value we placed there when we set the CBulkFetching
697 * flag, then someone else has done something with this node,
698 * and we may not have the latest status information for this
699 * file. Leave the entry alone.
701 if (!(tvcp->states & CBulkFetching) || (tvcp->m.Length != statSeqNo)) {
703 ReleaseWriteLock(&tvcp->lock);
708 /* now copy ".." entry back out of volume structure, if necessary */
709 if (tvcp->mvstat == 2 && (dotdot.Fid.Volume != 0)) {
711 tvcp->mvid = (struct VenusFid *) osi_AllocSmallSpace(sizeof(struct VenusFid));
712 *tvcp->mvid = dotdot;
715 ObtainWriteLock(&afs_xvcache,132);
716 if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
717 refpanic ("Bulkstat VLRU inconsistent2");
719 if ((QNext(QPrev(&tvcp->vlruq)) != &tvcp->vlruq)
720 || (QPrev(QNext(&tvcp->vlruq)) != &tvcp->vlruq))
721 refpanic ("Bulkstat VLRU inconsistent4");
722 if ((QNext(QPrev(&lruvcp->vlruq)) != &lruvcp->vlruq)
723 || (QPrev(QNext(&lruvcp->vlruq)) != &lruvcp->vlruq))
724 refpanic ("Bulkstat VLRU inconsistent5");
726 if (tvcp != lruvcp) { /* if they are == don't move it, don't corrupt vlru */
727 QRemove(&tvcp->vlruq);
728 QAdd(&lruvcp->vlruq, &tvcp->vlruq);
731 if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
732 refpanic ("Bulkstat VLRU inconsistent3");
734 if ((QNext(QPrev(&tvcp->vlruq)) != &tvcp->vlruq)
735 || (QPrev(QNext(&tvcp->vlruq)) != &tvcp->vlruq))
736 refpanic ("Bulkstat VLRU inconsistent5");
737 if ((QNext(QPrev(&lruvcp->vlruq)) != &lruvcp->vlruq)
738 || (QPrev(QNext(&lruvcp->vlruq)) != &lruvcp->vlruq))
739 refpanic ("Bulkstat VLRU inconsistent6");
740 ReleaseWriteLock(&afs_xvcache);
742 /* We need to check the flags again. We may have missed
743 * something while we were waiting for a lock.
745 if (!(tvcp->states & CBulkFetching) || (tvcp->m.Length != statSeqNo)) {
747 ReleaseWriteLock(&tvcp->lock);
752 /* now merge in the resulting status back into the vnode.
753 * We only do this if the entry looks clear.
755 afs_ProcessFS(tvcp, &statsp[i], areqp);
756 #ifdef AFS_LINUX22_ENV
757 /* overwrite the ops if it's a directory or symlink. */
758 if (vType(tvcp) == VDIR)
759 tvcp->v.v_op = &afs_dir_iops;
760 else if (vType(tvcp) == VLNK)
761 tvcp->v.v_op = &afs_symlink_iops;
764 ObtainWriteLock(&afs_xcbhash, 494);
766 /* We need to check the flags once more. We may have missed
767 * something while we were waiting for a lock.
769 if (!(tvcp->states & CBulkFetching) || (tvcp->m.Length != statSeqNo)) {
771 ReleaseWriteLock(&afs_xcbhash);
772 ReleaseWriteLock(&tvcp->lock);
777 /* do some accounting for bulk stats: mark this entry as
778 * loaded, so we can tell if we use it before it gets
781 tvcp->states |= CBulkStat;
782 tvcp->states &= ~CBulkFetching;
786 /* merge in vol info */
787 if (volStates & VRO) tvcp->states |= CRO;
788 if (volStates & VBackup) tvcp->states |= CBackup;
789 if (volStates & VForeign) tvcp->states |= CForeign;
791 /* merge in the callback info */
792 tvcp->states |= CTruth;
794 /* get ptr to the callback we are interested in */
797 if (tcbp->ExpirationTime != 0) {
798 tvcp->cbExpires = tcbp->ExpirationTime+startTime;
799 tvcp->callback = hostp;
800 tvcp->states |= CStatd;
801 afs_QueueCallback(tvcp, CBHash(tcbp->ExpirationTime), volp);
803 else if (tvcp->states & CRO) {
804 /* ordinary callback on a read-only volume -- AFS 3.2 style */
805 tvcp->cbExpires = 3600+startTime;
806 tvcp->callback = hostp;
807 tvcp->states |= CStatd;
808 afs_QueueCallback(tvcp, CBHash(3600), volp);
812 tvcp->states &= ~(CStatd|CUnique);
813 afs_DequeueCallback(tvcp);
814 if ((tvcp->states & CForeign) || (vType(tvcp) == VDIR))
815 osi_dnlc_purgedp (tvcp); /* if it (could be) a directory */
817 ReleaseWriteLock(&afs_xcbhash);
819 ReleaseWriteLock(&tvcp->lock);
820 /* finally, we're done with the entry */
822 } /* for all files we got back */
824 /* finally return the pointer into the LRU queue */
825 afs_PutVCache(lruvcp);
828 /* Be sure to turn off the CBulkFetching flags */
829 for(i=flagIndex; i<fidIndex; i++) {
830 afid.Cell = adp->fid.Cell;
831 afid.Fid.Volume = adp->fid.Fid.Volume;
832 afid.Fid.Vnode = fidsp[i].Vnode;
833 afid.Fid.Unique = fidsp[i].Unique;
836 ObtainReadLock(&afs_xvcache);
837 tvcp = afs_FindVCache(&afid, 1, 0, &retry, 0/* !stats&!lru*/);
838 ReleaseReadLock(&afs_xvcache);
839 } while (tvcp && retry);
841 && (tvcp->states & CBulkFetching)
842 && (tvcp->m.Length == statSeqNo)) {
843 tvcp->states &= ~CBulkFetching;
850 afs_PutVolume(volp, READ_LOCK);
852 osi_FreeLargeSpace(statMemp);
853 osi_FreeLargeSpace(cbfMemp);
856 /* was: (AFS_DEC_ENV) || defined(AFS_OSF30_ENV) || defined(AFS_NCR_ENV) */
862 struct nameidata *ndp; {
863 char aname[MAXNAMLEN+1]; /* XXX */
864 struct vcache **avcp = (struct vcache **)&(ndp->ni_vp);
865 struct ucred *acred = ndp->ni_cred;
866 int wantparent = ndp->ni_nameiop & WANTPARENT;
867 int opflag = ndp->ni_nameiop & OPFLAG;
868 #else /* AFS_OSF_ENV */
869 #if defined(AFS_SUN5_ENV) || defined(AFS_SGI_ENV)
870 afs_lookup(OSI_VC_ARG(adp), aname, avcp, pnp, flags, rdir, acred)
871 struct pathname *pnp;
875 afs_lookup(adp, aname, avcp, acred)
878 struct vcache **avcp;
880 struct AFS_UCRED *acred; {
882 struct vrequest treq;
883 char *tname = (char *)0;
884 register struct vcache *tvc=0;
885 register afs_int32 code;
886 int pass = 0, hit = 0;
888 extern afs_int32 afs_mariner; /*Writing activity to log?*/
890 afs_hyper_t versionNo;
892 AFS_STATCNT(afs_lookup);
894 ndp->ni_dvp = (struct vnode *)adp;
895 bcopy(ndp->ni_ptr, aname, ndp->ni_namelen);
896 aname[ndp->ni_namelen] = '\0';
897 #endif /* AFS_OSF_ENV */
899 *avcp = (struct vcache *) 0; /* Since some callers don't initialize it */
901 if (code = afs_InitReq(&treq, acred)) {
905 /* lookup the name aname in the appropriate dir, and return a cache entry
906 on the resulting fid */
909 * check for, and handle "@sys" if it's there. We should be able
910 * to avoid the alloc and the strcpy with a little work, but it's
911 * not pressing. If there aren't any remote users (ie, via the
912 * NFS translator), we have a slightly easier job.
913 * the faster way to do this is to check for *aname == '@' and if
914 * it's there, check for @sys, otherwise, assume there's no @sys
915 * then, if the lookup fails, check for .*@sys...
917 if (!AFS_EQ_ATSYS(aname)) {
921 tname = (char *) osi_AllocLargeSpace(AFS_SMALLOCSIZ);
922 if (!afs_nfsexporter)
923 strcpy(tname, (afs_sysname ? afs_sysname : SYS_NAME ));
925 register struct unixuser *au;
926 register afs_int32 error;
927 au = afs_GetUser(treq.uid, adp->fid.Cell, 0); afs_PutUser(au, 0);
929 error = EXP_SYSNAME(au->exporter, (char *)0, tname);
931 strcpy(tname, "@sys");
933 strcpy(tname, (afs_sysname ? afs_sysname : SYS_NAME ));
938 /* come back to here if we encounter a non-existent object in a read-only
939 volume's directory */
942 *avcp = (struct vcache *) 0; /* Since some callers don't initialize it */
944 if (!(adp->states & CStatd)) {
945 if (code = afs_VerifyVCache2(adp, &treq))
950 /* watch for ".." in a volume root */
951 if (adp->mvstat == 2 && tname[0] == '.' && tname[1] == '.' && !tname[2]) {
952 /* looking up ".." in root via special hacks */
953 if (adp->mvid == (struct VenusFid *) 0 || adp->mvid->Fid.Volume == 0) {
955 extern struct vcache *afs_globalVp;
956 if (adp == afs_globalVp) {
957 struct vnode *rvp = (struct vnode *)adp;
959 ndp->ni_vp = rvp->v_vfsp->vfs_vnodecovered;
960 ndp->ni_dvp = ndp->ni_vp;
970 /* otherwise we have the fid here, so we use it */
971 tvc = afs_GetVCache(adp->mvid, &treq, (afs_int32 *)0,
972 (struct vcache*)0, 0);
973 afs_Trace3(afs_iclSetp, CM_TRACE_GETVCDOTDOT,
974 ICL_TYPE_FID, adp->mvid, ICL_TYPE_POINTER, tvc,
975 ICL_TYPE_INT32, code);
977 code = (tvc ? 0 : ENOENT);
979 if (tvc && !tvc->vrefCount) {
983 /*printf("LOOKUP GETVCDOTDOT -> %d\n", code);*/
988 /* now check the access */
989 if (treq.uid != adp->last_looker) {
990 if (!afs_AccessOK(adp, PRSFS_LOOKUP, &treq, CHECK_MODE_BITS)) {
991 *avcp = (struct vcache *)0;
995 else adp->last_looker = treq.uid;
999 /* special case lookup of ".". Can we check for it sooner in this code,
1000 * for instance, way up before "redo:" ??
1001 * I'm not fiddling with the LRUQ here, either, perhaps I should, or else
1002 * invent a lightweight version of GetVCache.
1004 if (tname[0] == '.' && !tname[1]) { /* special case */
1005 ObtainReadLock(&afs_xvcache);
1007 ReleaseReadLock(&afs_xvcache);
1011 if (adp && !adp->vrefCount) {
1017 tvc = osi_dnlc_lookup (adp, tname, WRITE_LOCK);
1018 *avcp = tvc; /* maybe wasn't initialized, but it is now */
1019 #ifdef AFS_LINUX22_ENV
1021 if (tvc->mvstat == 2) { /* we don't trust the dnlc for root vcaches */
1031 #else /* non - LINUX */
1037 #endif /* linux22 */
1040 register struct dcache *tdc;
1041 afs_int32 dirOffset, dirLen;
1043 struct VenusFid tfid;
1045 /* now we have to lookup the next fid */
1046 tdc = afs_GetDCache(adp, 0, &treq, &dirOffset, &dirLen, 1);
1048 *avcp = (struct vcache *)0; /* redundant, but harmless */
1053 /* now we will just call dir package with appropriate inode.
1054 Dirs are always fetched in their entirety for now */
1055 /* If the first lookup doesn't succeed, maybe it's got @sys in the name */
1056 ObtainReadLock(&adp->lock);
1059 * Make sure that the data in the cache is current. There are two
1060 * cases we need to worry about:
1061 * 1. The cache data is being fetched by another process.
1062 * 2. The cache data is no longer valid
1064 while ((adp->states & CStatd)
1065 && (tdc->flags & DFFetching)
1066 && hsame(adp->m.DataVersion, tdc->f.versionNo)) {
1067 tdc->flags |= DFWaiting;
1068 ReleaseReadLock(&adp->lock);
1069 afs_osi_Sleep(&tdc->validPos);
1070 ObtainReadLock(&adp->lock);
1072 if (!(adp->states & CStatd)
1073 || !hsame(adp->m.DataVersion, tdc->f.versionNo)) {
1074 ReleaseReadLock(&adp->lock);
1079 /* Save the version number for when we call osi_dnlc_enter */
1080 hset(versionNo, tdc->f.versionNo);
1082 theDir = tdc->f.inode;
1083 code = afs_dir_LookupOffset(&theDir, tname, &tfid.Fid, &dirCookie);
1084 if (code == ENOENT && tname == aname) {
1086 len = strlen(aname);
1087 if (len >= 4 && AFS_EQ_ATSYS(aname+len-4)) {
1088 tname = (char *) osi_AllocLargeSpace(AFS_LRALLOCSIZ);
1089 afs_HandleAtName(aname, tname, &treq, adp);
1090 code = afs_dir_LookupOffset(&theDir, tname, &tfid.Fid, &dirCookie);
1093 ReleaseReadLock(&adp->lock);
1096 /* new fid has same cell and volume */
1097 tfid.Cell = adp->fid.Cell;
1098 tfid.Fid.Volume = adp->fid.Fid.Volume;
1099 afs_Trace4(afs_iclSetp, CM_TRACE_LOOKUP, ICL_TYPE_POINTER, adp,
1100 ICL_TYPE_STRING, tname,
1101 ICL_TYPE_FID, &tfid, ICL_TYPE_INT32, code);
1104 if (code != ENOENT) {
1105 printf("LOOKUP dirLookupOff -> %d\n", code);
1110 /* prefetch some entries, if the dir is currently open. The variable
1111 * dirCookie tells us where to start prefetching from.
1113 if (AFSDOBULK && adp->opens > 0 && !(adp->states & CForeign)) {
1115 /* if the entry is not in the cache, or is in the cache,
1116 * but hasn't been statd, then do a bulk stat operation.
1120 ObtainReadLock(&afs_xvcache);
1121 tvc = afs_FindVCache(&tfid, 1, 0, &retry, 0/* !stats,!lru */);
1122 ReleaseReadLock(&afs_xvcache);
1123 } while (tvc && retry);
1125 if (!tvc || !(tvc->states & CStatd)) {
1126 afs_DoBulkStat(adp, dirCookie, &treq);
1129 /* if the vcache isn't usable, release it */
1130 if (tvc && !(tvc->states & CStatd)) {
1132 tvc = (struct vcache *) 0;
1135 else tvc = (struct vcache *) 0;
1137 /* now get the status info, if we don't already have it */
1138 /* This is kind of weird, but we might wind up accidentally calling
1139 * RXAFS_Lookup because we happened upon a file which legitimately
1140 * has a 0 uniquifier. That is the result of allowing unique to wrap
1141 * to 0. This was fixed in AFS 3.4. For CForeign, Unique == 0 means that
1142 * the file has not yet been looked up.
1145 afs_int32 cached = 0;
1146 if (!tfid.Fid.Unique && (adp->states & CForeign)) {
1147 tvc = afs_LookupVCache(&tfid, &treq, &cached, WRITE_LOCK,
1150 if (!tvc) { /* lookup failed or wasn't called */
1151 tvc = afs_GetVCache(&tfid, &treq, &cached, (struct vcache*)0,
1155 } /* sub-block just to reduce stack usage */
1158 if (adp->states & CForeign)
1159 tvc->states |= CForeign;
1160 tvc->parentVnode = adp->fid.Fid.Vnode;
1161 tvc->parentUnique = adp->fid.Fid.Unique;
1162 tvc->states &= ~CBulkStat;
1163 if (tvc->mvstat == 1) {
1164 /* a mt point, possibly unevaluated */
1165 struct volume *tvolp;
1167 ObtainWriteLock(&tvc->lock,133);
1168 code = EvalMountPoint(tvc, adp, &tvolp, &treq);
1169 ReleaseWriteLock(&tvc->lock);
1170 /* next, we want to continue using the target of the mt point */
1171 if (tvc->mvid && (tvc->states & CMValid)) {
1173 /* now lookup target, to set .. pointer */
1174 afs_Trace2(afs_iclSetp, CM_TRACE_LOOKUP1,
1175 ICL_TYPE_POINTER, tvc, ICL_TYPE_FID, &tvc->fid);
1176 uvc = tvc; /* remember for later */
1178 if (tvolp && (tvolp->states & VForeign)) {
1179 /* XXXX tvolp has ref cnt on but not locked! XXX */
1180 tvc = afs_GetRootVCache(tvc->mvid, &treq, (afs_int32 *)0, tvolp, WRITE_LOCK);
1182 tvc = afs_GetVCache(tvc->mvid, &treq, (afs_int32 *)0,
1183 (struct vcache*)0, WRITE_LOCK);
1185 afs_PutVCache(uvc, WRITE_LOCK); /* we're done with it */
1190 afs_PutVolume(tvolp, WRITE_LOCK);
1195 /* now, if we came via a new mt pt (say because of a new
1196 * release of a R/O volume), we must reevaluate the ..
1197 * ptr to point back to the appropriate place */
1199 ObtainWriteLock(&tvc->lock,134);
1200 if (tvc->mvid == (struct VenusFid *) 0) {
1201 tvc->mvid = (struct VenusFid *) osi_AllocSmallSpace(sizeof(struct VenusFid));
1203 /* setup backpointer */
1204 *tvc->mvid = tvolp->dotdot;
1205 ReleaseWriteLock(&tvc->lock);
1206 afs_PutVolume(tvolp, WRITE_LOCK);
1210 afs_PutVCache(tvc, WRITE_LOCK);
1212 if (tvolp) afs_PutVolume(tvolp, WRITE_LOCK);
1217 if (tvc && !tvc->vrefCount) {
1223 /* if we get here, we found something in a directory that couldn't
1224 be located (a Multics "connection failure"). If the volume is
1225 read-only, we try flushing this entry from the cache and trying
1229 tv = afs_GetVolume(&adp->fid, &treq, READ_LOCK);
1231 if (tv->states & VRO) {
1232 pass = 1; /* try this *once* */
1233 ObtainWriteLock(&afs_xcbhash, 495);
1234 afs_DequeueCallback(adp);
1235 /* re-stat to get later version */
1236 adp->states &= ~CStatd;
1237 ReleaseWriteLock(&afs_xcbhash);
1238 osi_dnlc_purgedp(adp);
1239 afs_PutVolume(tv, READ_LOCK);
1242 afs_PutVolume(tv, READ_LOCK);
1249 /* put the network buffer back, if need be */
1250 if (tname != aname && tname) osi_FreeLargeSpace(tname);
1253 /* Handle RENAME; only need to check rename "." */
1254 if (opflag == RENAME && wantparent && *ndp->ni_next == 0) {
1255 if (!FidCmp(&(tvc->fid), &(adp->fid))) {
1256 afs_PutVCache(*avcp, WRITE_LOCK);
1258 return afs_CheckCode(EISDIR, &treq, 18);
1261 #endif /* AFS_OSF_ENV */
1264 afs_AddMarinerName(aname, tvc);
1266 osi_dnlc_enter (adp, aname, tvc, &versionNo);
1269 #ifdef AFS_LINUX20_ENV
1270 /* So Linux inode cache is up to date. */
1271 code = afs_VerifyVCache(tvc, &treq);
1273 return 0; /* can't have been any errors if hit and !code */
1277 code = afs_CheckCode(code, &treq, 19);
1279 /* If there is an error, make sure *avcp is null.
1280 * Alphas panic otherwise - defect 10719.
1282 *avcp = (struct vcache *)0;