src/afs/VNOPS/afs_vnop_lookup.c

   1 /*
   2  * Copyright 2000, International Business Machines Corporation and others.
   3  * All Rights Reserved.
   4  *
   5  * This software has been released under the terms of the IBM Public
   6  * License.  For details, see the LICENSE file in the top-level source
   7  * directory or online at http://www.openafs.org/dl/license10.html
   8  */
   9
  10 /*
  11  * Implements:
  12  * afs_lookup
  13  * EvalMountPoint
  14  * afs_DoBulkStat
  15  */
  16
  17 #include <afsconfig.h>
  18 #include "afs/param.h"
  19
  20 #include "afs/sysincludes.h"    /* Standard vendor system headers */
  21 #include "afsincludes.h"        /* Afs-based standard headers */
  22 #include "afs/afs_stats.h"      /* statistics */
  23 #include "afs/afs_cbqueue.h"
  24 #include "afs/nfsclient.h"
  25 #include "afs/exporter.h"
  26 #include "afs/afs_osidnlc.h"
  27 #include "afs/afs_dynroot.h"
  28
   29 extern struct vcache *afs_globalVp;       /* defined in another file; not referenced in the visible part of this one */
   30
   31 afs_int32 afs_bkvolpref = 0;      /* non-zero: EvalMountData may pick the BK volume when crossing, within the same cell, a mount point that lives in a BK volume */
   32 afs_int32 afs_bulkStatsDone;      /* NOTE(review): presumably a count of completed bulk stats; no update is visible here - confirm */
   33 static int bulkStatCounter = 0; /* counter for bulk stat seq. numbers */
   34 int afs_fakestat_enable = 0;    /* 1: fakestat-all, 2: fakestat-crosscell */
  35
  36
  37 /* this would be faster if it did comparison as int32word, but would be
  38  * dependant on byte-order and alignment, and I haven't figured out
  39  * what "@sys" is in binary... */
  40 #define AFS_EQ_ATSYS(name) (((name)[0]=='@')&&((name)[1]=='s')&&((name)[2]=='y')&&((name)[3]=='s')&&(!(name)[4]))
  41
   42 /* EvalMountPoint: call under write lock; evaluates the mvid field from a mount point.
   43  * avc is the vnode of the mount point object; must be write-locked.
   44  * advc is the vnode of the containing directory (optional; if NULL and
   45  *   EvalMountPoint succeeds, caller must initialize (*avolpp)->dotdot)
   46  * avolpp is where we return a pointer to the volume named by the mount pt, on success
   47  * areq is the identity of the caller.
   48  *
   49  * NOTE: EvalMountPoint returns a held volume structure in *avolpp if it returns 0!
   50  */
  51 static int
  52 EvalMountData(char type, char *data, afs_uint32 states, afs_uint32 cellnum,
  53               struct volume **avolpp, register struct vrequest *areq,
  54               afs_uint32 *acellidxp, afs_uint32 *avolnump,
  55               afs_uint32 *avnoidp, afs_uint32 *auniqp)
  56 {
  57     struct volume *tvp = 0;
  58     struct VenusFid tfid;
  59     struct cell *tcell;
  60     char *cpos, *volnamep;
  61     char *buf, *endptr;
  62     afs_int32 prefetch;         /* 1=>None  2=>RO  3=>BK */
  63     afs_int32 mtptCell, assocCell = 0, hac = 0;
  64     afs_int32 samecell, roname, len;
  65     afs_uint32 volid = 0, cellidx, vnoid = 0, uniq = 0;
  66
  67     /* Start by figuring out and finding the cell */
  68     cpos = afs_strchr(data, ':');       /* if cell name present */
  69     if (cpos) {
  70         volnamep = cpos + 1;
  71         *cpos = 0;
  72         if ((afs_strtoi_r(data, &endptr, &cellnum) == 0) &&
  73             (endptr == cpos))
  74             tcell = afs_GetCell(cellnum, READ_LOCK);
  75         else {
  76             tcell = afs_GetCellByName(data, READ_LOCK);
  77             cellnum = 0;
  78         }
  79         *cpos = ':';
  80     } else if (cellnum) {
  81         volnamep = data;
  82         tcell = afs_GetCell(cellnum, READ_LOCK);
  83     } else {
  84         /* No cellname or cellnum; return ENODEV */
  85         return ENODEV;
  86     }
  87     if (!tcell) {
  88         /* no cell found; return ENODEV */
  89         return ENODEV;
  90     }
  91
  92     cellidx = tcell->cellIndex;
  93     mtptCell = tcell->cellNum;  /* The cell for the mountpoint */
  94     if (tcell->lcellp) {
  95         hac = 1;                /* has associated cell */
  96         assocCell = tcell->lcellp->cellNum;     /* The associated cell */
  97     }
  98     afs_PutCell(tcell, READ_LOCK);
  99
 100     /* If there's nothing to look up, we can't proceed */
 101     if (!*volnamep)
 102         return ENODEV;
 103
 104     /* cell found. figure out volume */
 105     cpos = afs_strchr(volnamep, ':');
 106     if (cpos)
 107         *cpos = 0;
 108
 109     /* Look for an all-numeric volume ID */
 110     if ((afs_strtoi_r(volnamep, &endptr, &volid) == 0) &&
 111         ((endptr == cpos) || (!*endptr)))
 112     {
 113         /* Ok. Is there a vnode and uniq? */
 114         if (cpos) {
 115             char *vnodep = (char *)(cpos + 1);
 116             char *uniqp = NULL;
 117             if ((!*vnodep) /* no vnode after colon */
 118                 || !(uniqp = afs_strchr(vnodep, ':')) /* no colon for uniq */
 119                 || (!*(++uniqp)) /* no uniq after colon */
 120                 || (afs_strtoi_r(vnodep, &endptr, &vnoid) != 0) /* bad vno */
 121                 || (*endptr != ':') /* bad vnode field */
 122                 || (afs_strtoi_r(uniqp, &endptr, &uniq) != 0) /* bad uniq */
 123                 || (*endptr)) /* anything after uniq */
 124             {
 125                 *cpos = ':';
 126                 /* sorry. vnode and uniq, or nothing */
 127                 return ENODEV;
 128             }
 129         }
 130     } else
 131             volid = 0;
 132
 133     /*
 134      * If the volume ID was all-numeric, and they didn't ask for a
 135      * pointer to the volume structure, then just return the number
 136      * as-is.  This is currently only used for handling name lookups
 137      * in the dynamic mount directory.
 138      */
 139     if (volid && !avolpp) {
 140         if (*cpos)
 141             *cpos = ':';
 142         goto done;
 143     }
 144
 145     /*
 146      * If the volume ID was all-numeric, and the type was '%', then
 147      * assume whoever made the mount point knew what they were doing,
 148      * and don't second-guess them by forcing use of a RW volume when
 149      * they gave the ID of something else.
 150      */
 151     if (volid && type == '%') {
 152         tfid.Fid.Volume = volid;        /* remember BK volume */
 153         tfid.Cell = mtptCell;
 154         tvp = afs_GetVolume(&tfid, areq, WRITE_LOCK);   /* get the new one */
 155         if (cpos) /* one way or another we're done */
 156             *cpos = ':';
 157         if (!tvp)
 158             return ENODEV; /* afs_GetVolume failed; return ENODEV */
 159         goto done;
 160     }
 161
 162     /* Is volume name a "<n>.backup" or "<n>.readonly" name */
 163     len = strlen(volnamep);
 164     roname = ((len > 9) && (strcmp(&volnamep[len - 9], ".readonly") == 0))
 165         || ((len > 7) && (strcmp(&volnamep[len - 7], ".backup") == 0));
 166
 167     /* When we cross mountpoint, do we stay in the same cell */
 168     samecell = (cellnum == mtptCell) || (hac && (cellnum == assocCell));
 169
 170     /* Decide whether to prefetch the BK, or RO.  Also means we want the BK or
 171      * RO.
 172      * If this is a regular mountpoint with a RW volume name
 173      * - If BK preference is enabled AND we remain within the same cell AND
 174      *   start from a BK volume, then we will want to prefetch the BK volume.
 175      * - If we cross a cell boundary OR start from a RO volume, then we will
 176      *   want to prefetch the RO volume.
 177      */
 178     if ((type == '#') && !roname) {
 179         if (afs_bkvolpref && samecell && (states & CBackup))
 180             prefetch = 3;       /* Prefetch the BK */
 181         else if (!samecell || (states & CRO))
 182             prefetch = 2;       /* Prefetch the RO */
 183         else
 184             prefetch = 1;       /* Do not prefetch */
 185     } else {
 186         prefetch = 1;           /* Do not prefetch */
 187     }
 188
 189     /* Get the volume struct. Unless this volume name has ".readonly" or
 190      * ".backup" in it, this will get the volume struct for the RW volume.
 191      * The RO volume will be prefetched if requested (but not returned).
 192      * Set up to use volname first.
 193      */
 194     tvp = afs_GetVolumeByName(volnamep, mtptCell, prefetch, areq, WRITE_LOCK);
 195
 196     /* If no volume was found in this cell, try the associated linked cell */
 197     if (!tvp && hac && areq->volumeError) {
 198         tvp =
 199             afs_GetVolumeByName(volnamep, assocCell, prefetch, areq,
 200                                 WRITE_LOCK);
 201     }
 202
 203     /* Still not found. If we are looking for the RO, then perhaps the RW
 204      * doesn't exist? Try adding ".readonly" to volname and look for that.
 205      * Don't know why we do this. Would have still found it in above call - jpm.
 206      */
 207     if (!tvp && (prefetch == 2) && len < AFS_SMALLOCSIZ - 10) {
 208         buf = (char *)osi_AllocSmallSpace(len + 10);
 209
 210         strcpy(buf, volnamep);
 211         afs_strcat(buf, ".readonly");
 212
 213         tvp = afs_GetVolumeByName(buf, mtptCell, 1, areq, WRITE_LOCK);
 214
 215         /* Try the associated linked cell if failed */
 216         if (!tvp && hac && areq->volumeError) {
 217             tvp = afs_GetVolumeByName(buf, assocCell, 1, areq, WRITE_LOCK);
 218         }
 219         osi_FreeSmallSpace(buf);
 220     }
 221     /* done with volname */
 222     if (cpos)
 223         *cpos = ':';
 224     if (!tvp)
 225         return ENODEV;          /* Couldn't find the volume */
 226     else
 227         volid = tvp->volume;
 228
 229     /* Don't cross mountpoint from a BK to a BK volume */
 230     if ((states & CBackup) && (tvp->states & VBackup)) {
 231         afs_PutVolume(tvp, WRITE_LOCK);
 232         return ENODEV;
 233     }
 234
 235     /* If we want (prefetched) the BK and it exists, then drop the RW volume
 236      * and get the BK.
 237      * Otherwise, if we want (prefetched0 the RO and it exists, then drop the
 238      * RW volume and get the RO.
 239      * Otherwise, go with the RW.
 240      */
 241     if ((prefetch == 3) && tvp->backVol) {
 242         tfid.Fid.Volume = tvp->backVol; /* remember BK volume */
 243         tfid.Cell = tvp->cell;
 244         afs_PutVolume(tvp, WRITE_LOCK); /* release old volume */
 245         tvp = afs_GetVolume(&tfid, areq, WRITE_LOCK);   /* get the new one */
 246         if (!tvp)
 247             return ENODEV;      /* oops, can't do it */
 248     } else if ((prefetch >= 2) && tvp->roVol) {
 249         tfid.Fid.Volume = tvp->roVol;   /* remember RO volume */
 250         tfid.Cell = tvp->cell;
 251         afs_PutVolume(tvp, WRITE_LOCK); /* release old volume */
 252         tvp = afs_GetVolume(&tfid, areq, WRITE_LOCK);   /* get the new one */
 253         if (!tvp)
 254             return ENODEV;      /* oops, can't do it */
 255     }
 256
 257 done:
 258     if (acellidxp)
 259         *acellidxp = cellidx;
 260     if (avolnump)
 261         *avolnump = volid;
 262     if (avnoidp)
 263         *avnoidp = vnoid;
 264     if (auniqp)
 265         *auniqp = uniq;
 266     if (avolpp)
 267         *avolpp = tvp;
 268     else if (tvp)
 269         afs_PutVolume(tvp, WRITE_LOCK);
 270     return 0;
 271 }
 272
 273 int
 274 EvalMountPoint(register struct vcache *avc, struct vcache *advc,
 275                struct volume **avolpp, register struct vrequest *areq)
 276 {
 277     afs_int32 code;
 278     afs_uint32 avnoid, auniq;
 279
 280     AFS_STATCNT(EvalMountPoint);
 281 #ifdef notdef
 282     if (avc->mvid && (avc->f.states & CMValid))
 283         return 0;               /* done while racing */
 284 #endif
 285     *avolpp = NULL;
 286     code = afs_HandleLink(avc, areq);
 287     if (code)
 288         return code;
 289
 290     /* Determine which cell and volume the mointpoint goes to */
 291     code = EvalMountData(avc->linkData[0], avc->linkData + 1,
 292                          avc->f.states, avc->f.fid.Cell, avolpp, areq, 0, 0,
 293                          &avnoid, &auniq);
 294     if (code) return code;
 295
 296     if (!avnoid)
 297         avnoid = 1;
 298
 299     if (!auniq)
 300         auniq = 1;
 301
 302     if (avc->mvid == 0)
 303         avc->mvid =
 304             (struct VenusFid *)osi_AllocSmallSpace(sizeof(struct VenusFid));
 305     avc->mvid->Cell = (*avolpp)->cell;
 306     avc->mvid->Fid.Volume = (*avolpp)->volume;
 307     avc->mvid->Fid.Vnode = avnoid;
 308     avc->mvid->Fid.Unique = auniq;
 309     avc->f.states |= CMValid;
 310
 311     /* Used to: if the mount point is stored within a backup volume,
 312      * then we should only update the parent pointer information if
 313      * there's none already set, so as to avoid updating a volume's ..
 314      * info with something in an OldFiles directory.
 315      *
 316      * Next two lines used to be under this if:
 317      *
 318      * if (!(avc->f.states & CBackup) || tvp->dotdot.Fid.Volume == 0)
 319      *
 320      * Now: update mount point back pointer on every call, so that we handle
 321      * multiple mount points better.  This way, when du tries to go back
 322      * via chddir(".."), it will end up exactly where it started, yet
 323      * cd'ing via a new path to a volume will reset the ".." pointer
 324      * to the new path.
 325      */
 326     (*avolpp)->mtpoint = avc->f.fid;    /* setup back pointer to mtpoint */
 327
 328     if (advc)
 329         (*avolpp)->dotdot = advc->f.fid;
 330
 331     return 0;
 332 }
 333
 334 /*
 335  * afs_InitFakeStat
 336  *
 337  * Must be called on an afs_fakestat_state object before calling
 338  * afs_EvalFakeStat or afs_PutFakeStat.  Calling afs_PutFakeStat
 339  * without calling afs_EvalFakeStat is legal, as long as this
 340  * function is called.
 341  */
 342 void
 343 afs_InitFakeStat(struct afs_fakestat_state *state)
 344 {
 345     if (!afs_fakestat_enable)
 346         return;
 347
 348     state->valid = 1;
 349     state->did_eval = 0;
 350     state->need_release = 0;
 351 }
 352
 353 /*
 354  * afs_EvalFakeStat_int
 355  *
 356  * The actual implementation of afs_EvalFakeStat and afs_TryEvalFakeStat,
 357  * which is called by those wrapper functions.
 358  *
 359  * Only issues RPCs if canblock is non-zero.
 360  */
 361 static int
 362 afs_EvalFakeStat_int(struct vcache **avcp, struct afs_fakestat_state *state,
 363                      struct vrequest *areq, int canblock)
 364 {
 365     struct vcache *tvc, *root_vp;
 366     struct volume *tvolp = NULL;
 367     int code = 0;
 368
 369     if (!afs_fakestat_enable)
 370         return 0;
 371
 372     osi_Assert(state->valid == 1);
 373     osi_Assert(state->did_eval == 0);
 374     state->did_eval = 1;
 375
 376     tvc = *avcp;
 377     if (tvc->mvstat != 1)
 378         return 0;
 379
 380     if (canblock) {
 381         /* Is the call to VerifyVCache really necessary? */
 382         code = afs_VerifyVCache(tvc, areq);
 383         if (code)
 384             goto done;
 385
 386         ObtainWriteLock(&tvc->lock, 599);
 387         code = EvalMountPoint(tvc, NULL, &tvolp, areq);
 388         ReleaseWriteLock(&tvc->lock);
 389         if (code)
 390             goto done;
 391         if (tvolp) {
 392             tvolp->dotdot = tvc->f.fid;
 393             tvolp->dotdot.Fid.Vnode = tvc->f.parent.vnode;
 394             tvolp->dotdot.Fid.Unique = tvc->f.parent.unique;
 395         }
 396     }
 397     if (tvc->mvid && (tvc->f.states & CMValid)) {
 398         if (!canblock) {
 399             afs_int32 retry;
 400
 401             do {
 402                 retry = 0;
 403                 ObtainWriteLock(&afs_xvcache, 597);
 404                 root_vp = afs_FindVCache(tvc->mvid, &retry, IS_WLOCK);
 405                 if (root_vp && retry) {
 406                     ReleaseWriteLock(&afs_xvcache);
 407                     afs_PutVCache(root_vp);
 408                 }
 409             } while (root_vp && retry);
 410             ReleaseWriteLock(&afs_xvcache);
 411         } else {
 412             root_vp = afs_GetVCache(tvc->mvid, areq, NULL, NULL);
 413         }
 414         if (!root_vp) {
 415             code = canblock ? ENOENT : 0;
 416             goto done;
 417         }
 418 #ifdef AFS_DARWIN80_ENV
 419         root_vp->f.m.Type = VDIR;
 420         AFS_GUNLOCK();
 421         code = afs_darwin_finalizevnode(root_vp, NULL, NULL, 0, 0);
 422         AFS_GLOCK();
 423         if (code) goto done;
 424         vnode_ref(AFSTOV(root_vp));
 425 #endif
 426         if (tvolp && !afs_InReadDir(root_vp)) {
 427             /* Is this always kosher?  Perhaps we should instead use
 428              * NBObtainWriteLock to avoid potential deadlock.
 429              */
 430             ObtainWriteLock(&root_vp->lock, 598);
 431             if (!root_vp->mvid)
 432                 root_vp->mvid = osi_AllocSmallSpace(sizeof(struct VenusFid));
 433             *root_vp->mvid = tvolp->dotdot;
 434             ReleaseWriteLock(&root_vp->lock);
 435         }
 436         state->need_release = 1;
 437         state->root_vp = root_vp;
 438         *avcp = root_vp;
 439         code = 0;
 440     } else {
 441         code = canblock ? ENOENT : 0;
 442     }
 443
 444   done:
 445     if (tvolp)
 446         afs_PutVolume(tvolp, WRITE_LOCK);
 447     return code;
 448 }
 449
 450 /*
 451  * afs_EvalFakeStat
 452  *
 453  * Automatically does the equivalent of EvalMountPoint for vcache entries
 454  * which are mount points.  Remembers enough state to properly release
 455  * the volume root vcache when afs_PutFakeStat() is called.
 456  *
 457  * State variable must be initialized by afs_InitFakeState() beforehand.
 458  *
 459  * Returns 0 when everything succeeds and *avcp points to the vcache entry
 460  * that should be used for the real vnode operation.  Returns non-zero if
 461  * something goes wrong and the error code should be returned to the user.
 462  */
 463 int
 464 afs_EvalFakeStat(struct vcache **avcp, struct afs_fakestat_state *state,
 465                  struct vrequest *areq)
 466 {
 467     return afs_EvalFakeStat_int(avcp, state, areq, 1);
 468 }
 469
 470 /*
 471  * afs_TryEvalFakeStat
 472  *
 473  * Same as afs_EvalFakeStat, but tries not to talk to remote servers
 474  * and only evaluate the mount point if all the data is already in
 475  * local caches.
 476  *
 477  * Returns 0 if everything succeeds and *avcp points to a valid
 478  * vcache entry (possibly evaluated).
 479  */
 480 int
 481 afs_TryEvalFakeStat(struct vcache **avcp, struct afs_fakestat_state *state,
 482                     struct vrequest *areq)
 483 {
 484     return afs_EvalFakeStat_int(avcp, state, areq, 0);
 485 }
 486
 487 /*
 488  * afs_PutFakeStat
 489  *
 490  * Perform any necessary cleanup at the end of a vnode op, given that
 491  * afs_InitFakeStat was previously called with this state.
 492  */
 493 void
 494 afs_PutFakeStat(struct afs_fakestat_state *state)
 495 {
 496     if (!afs_fakestat_enable)
 497         return;
 498
 499     osi_Assert(state->valid == 1);
 500     if (state->need_release)
 501         afs_PutVCache(state->root_vp);
 502     state->valid = 0;
 503 }
 504
 505 int
 506 afs_ENameOK(register char *aname)
 507 {
 508     register int tlen;
 509
 510     AFS_STATCNT(ENameOK);
 511     tlen = strlen(aname);
 512     if (tlen >= 4 && strcmp(aname + tlen - 4, "@sys") == 0)
 513         return 0;
 514     return 1;
 515 }
 516
 517 static int
 518 afs_getsysname(register struct vrequest *areq, register struct vcache *adp,
 519                register char *bufp, int *num, char **sysnamelist[])
 520 {
 521     register struct unixuser *au;
 522     register afs_int32 error;
 523
 524     AFS_STATCNT(getsysname);
 525
 526     *sysnamelist = afs_sysnamelist;
 527
 528     if (!afs_nfsexporter)
 529         strcpy(bufp, (*sysnamelist)[0]);
 530     else {
 531         au = afs_GetUser(areq->uid, adp->f.fid.Cell, 0);
 532         if (au->exporter) {
 533             error = EXP_SYSNAME(au->exporter, (char *)0, sysnamelist, num, 0);
 534             if (error) {
 535                 strcpy(bufp, "@sys");
 536                 afs_PutUser(au, 0);
 537                 return -1;
 538             } else {
 539                 strcpy(bufp, (*sysnamelist)[0]);
 540             }
 541         } else
 542             strcpy(bufp, afs_sysname);
 543         afs_PutUser(au, 0);
 544     }
 545     return 0;
 546 }
 547
 548 void
 549 Check_AtSys(register struct vcache *avc, const char *aname,
 550             struct sysname_info *state, struct vrequest *areq)
 551 {
 552     int num = 0;
 553     char **sysnamelist[MAXNUMSYSNAMES];
 554
 555     if (AFS_EQ_ATSYS(aname)) {
 556         state->offset = 0;
 557         state->name = (char *)osi_AllocLargeSpace(MAXSYSNAME);
 558         state->allocked = 1;
 559         state->index =
 560             afs_getsysname(areq, avc, state->name, &num, sysnamelist);
 561     } else {
 562         state->offset = -1;
 563         state->allocked = 0;
 564         state->index = 0;
 565         state->name = (char *)aname;
 566     }
 567 }
 568
 569 int
 570 Next_AtSys(register struct vcache *avc, struct vrequest *areq,
 571            struct sysname_info *state)
 572 {
 573     int num = afs_sysnamecount;
 574     char **sysnamelist[MAXNUMSYSNAMES];
 575
 576     if (state->index == -1)
 577         return 0;               /* No list */
 578
 579     /* Check for the initial state of aname != "@sys" in Check_AtSys */
 580     if (state->offset == -1 && state->allocked == 0) {
 581         register char *tname;
 582
 583         /* Check for .*@sys */
 584         for (tname = state->name; *tname; tname++)
 585             /*Move to the end of the string */ ;
 586
 587         if ((tname > state->name + 4) && (AFS_EQ_ATSYS(tname - 4))) {
 588             state->offset = (tname - 4) - state->name;
 589             tname = (char *)osi_AllocLargeSpace(AFS_LRALLOCSIZ);
 590             strncpy(tname, state->name, state->offset);
 591             state->name = tname;
 592             state->allocked = 1;
 593             num = 0;
 594             state->index =
 595                 afs_getsysname(areq, avc, state->name + state->offset, &num,
 596                                sysnamelist);
 597             return 1;
 598         } else
 599             return 0;           /* .*@sys doesn't match either */
 600     } else {
 601         register struct unixuser *au;
 602         register afs_int32 error;
 603
 604         *sysnamelist = afs_sysnamelist;
 605
 606         if (afs_nfsexporter) {
 607             au = afs_GetUser(areq->uid, avc->f.fid.Cell, 0);
 608             if (au->exporter) {
 609                 error =
 610                     EXP_SYSNAME(au->exporter, (char *)0, sysnamelist, &num, 0);
 611                 if (error) {
 612                     afs_PutUser(au, 0);
 613                     return 0;
 614                 }
 615             }
 616             afs_PutUser(au, 0);
 617         }
 618         if (++(state->index) >= num || !(*sysnamelist)[(unsigned int)state->index])
 619             return 0;           /* end of list */
 620     }
 621     strcpy(state->name + state->offset, (*sysnamelist)[(unsigned int)state->index]);
 622     return 1;
 623 }
 624
  625 extern int BlobScan(struct dcache * afile, afs_int32 ablob);      /* defined elsewhere; afs_DoBulkStat calls it with (dirCookie >> 5) to find the next allocated directory entry and stops scanning when it returns 0 */
 626
 627 /* called with an unlocked directory and directory cookie.  Areqp
 628  * describes who is making the call.
 629  * Scans the next N (about 30, typically) directory entries, and does
 630  * a bulk stat call to stat them all.
 631  *
 632  * Must be very careful when merging in RPC responses, since we dont
 633  * want to overwrite newer info that was added by a file system mutating
 634  * call that ran concurrently with our bulk stat call.
 635  *
 636  * We do that, as described below, by not merging in our info (always
 637  * safe to skip the merge) if the status info is valid in the vcache entry.
 638  *
 639  * If adapt ever implements the bulk stat RPC, then this code will need to
 640  * ensure that vcaches created for failed RPC's to older servers have the
 641  * CForeign bit set.
 642  */
  643 static struct vcache *BStvc = NULL;       /* NOTE(review): not referenced in the visible part of this file; purpose unconfirmed */
 644
 645 int
 646 afs_DoBulkStat(struct vcache *adp, long dirCookie, struct vrequest *areqp)
 647 {
 648     int nentries;               /* # of entries to prefetch */
 649     int nskip;                  /* # of slots in the LRU queue to skip */
 650     int novlru = 0;             /* Currently Darwin-only but can be used
 651                                    globally if needed */
 652 #ifdef AFS_DARWIN80_ENV
 653     int npasses = 0;
 654     struct vnode *lruvp;
 655 #endif
 656     struct vcache *lruvcp;      /* vcache ptr of our goal pos in LRU queue */
 657     struct dcache *dcp;         /* chunk containing the dir block */
 658     afs_size_t temp;            /* temp for holding chunk length, &c. */
 659     struct AFSFid *fidsp;       /* file IDs were collecting */
 660     struct AFSCallBack *cbsp;   /* call back pointers */
 661     struct AFSCallBack *tcbp;   /* temp callback ptr */
 662     struct AFSFetchStatus *statsp;      /* file status info */
 663     struct AFSVolSync volSync;  /* vol sync return info */
 664     struct vcache *tvcp;        /* temp vcp */
 665     struct afs_q *tq;           /* temp queue variable */
 666     AFSCBFids fidParm;          /* file ID parm for bulk stat */
 667     AFSBulkStats statParm;      /* stat info parm for bulk stat */
 668     int fidIndex = 0;           /* which file were stating */
 669     struct afs_conn *tcp = 0;   /* conn for call */
 670     AFSCBs cbParm;              /* callback parm for bulk stat */
 671     struct server *hostp = 0;   /* host we got callback from */
 672     long startTime;             /* time we started the call,
 673                                  * for callback expiration base
 674                                  */
 675     afs_size_t statSeqNo = 0;   /* Valued of file size to detect races */
 676     int code;                   /* error code */
 677     long newIndex;              /* new index in the dir */
 678     struct DirEntry *dirEntryp; /* dir entry we are examining */
 679     int i;
 680     struct VenusFid afid;       /* file ID we are using now */
 681     struct VenusFid tfid;       /* another temp. file ID */
 682     afs_int32 retry;            /* handle low-level SGI MP race conditions */
 683     long volStates;             /* flags from vol structure */
 684     struct volume *volp = 0;    /* volume ptr */
 685     struct VenusFid dotdot = {0, {0, 0, 0}};
 686     int flagIndex = 0;          /* First file with bulk fetch flag set */
 687     int inlinebulk = 0;         /* Did we use InlineBulk RPC or not? */
 688     XSTATS_DECLS;
 689     dotdot.Cell = 0;
 690     dotdot.Fid.Unique = 0;
 691     dotdot.Fid.Vnode = 0;
 692
 693     /* first compute some basic parameters.  We dont want to prefetch more
 694      * than a fraction of the cache in any given call, and we want to preserve
 695      * a portion of the LRU queue in any event, so as to avoid thrashing
 696      * the entire stat cache (we will at least leave some of it alone).
 697      * presently dont stat more than 1/8 the cache in any one call.      */
 698     nentries = afs_cacheStats / 8;
 699
 700     /* dont bother prefetching more than one calls worth of info */
 701     if (nentries > AFSCBMAX)
 702         nentries = AFSCBMAX;
 703
 704     /* heuristic to make sure that things fit in 4K.  This means that
 705      * we shouldnt make it any bigger than 47 entries.  I am typically
 706      * going to keep it a little lower, since we don't want to load
 707      * too much of the stat cache.
 708      */
 709     if (nentries > 30)
 710         nentries = 30;
 711
 712     /* now, to reduce the stack size, well allocate two 4K blocks,
 713      * one for fids and callbacks, and one for stat info.  Well set
 714      * up our pointers to the memory from there, too.
 715      */
 716     statsp = (AFSFetchStatus *)
 717             osi_Alloc(AFSCBMAX * sizeof(AFSFetchStatus));
 718     fidsp = (AFSFid *) osi_AllocLargeSpace(nentries * sizeof(AFSFid));
 719     cbsp = (AFSCallBack *)
 720             osi_Alloc(AFSCBMAX * sizeof(AFSCallBack));
 721
 722     /* next, we must iterate over the directory, starting from the specified
 723      * cookie offset (dirCookie), and counting out nentries file entries.
 724      * We skip files that already have stat cache entries, since we
 725      * dont want to bulk stat files that are already in the cache.
 726      */
 727   tagain:
 728     code = afs_VerifyVCache(adp, areqp);
 729     if (code)
 730         goto done2;
 731
 732     dcp = afs_GetDCache(adp, (afs_size_t) 0, areqp, &temp, &temp, 1);
 733     if (!dcp) {
 734         code = ENOENT;
 735         goto done2;
 736     }
 737
 738     /* lock the directory cache entry */
 739     ObtainReadLock(&adp->lock);
 740     ObtainReadLock(&dcp->lock);
 741
 742     /*
 743      * Make sure that the data in the cache is current. There are two
 744      * cases we need to worry about:
 745      * 1. The cache data is being fetched by another process.
 746      * 2. The cache data is no longer valid
 747      */
 748     while ((adp->f.states & CStatd)
 749            && (dcp->dflags & DFFetching)
 750            && hsame(adp->f.m.DataVersion, dcp->f.versionNo)) {
 751         afs_Trace4(afs_iclSetp, CM_TRACE_DCACHEWAIT, ICL_TYPE_STRING,
 752                    __FILE__, ICL_TYPE_INT32, __LINE__, ICL_TYPE_POINTER, dcp,
 753                    ICL_TYPE_INT32, dcp->dflags);
 754         ReleaseReadLock(&dcp->lock);
 755         ReleaseReadLock(&adp->lock);
 756         afs_osi_Sleep(&dcp->validPos);
 757         ObtainReadLock(&adp->lock);
 758         ObtainReadLock(&dcp->lock);
 759     }
 760     if (!(adp->f.states & CStatd)
 761         || !hsame(adp->f.m.DataVersion, dcp->f.versionNo)) {
 762         ReleaseReadLock(&dcp->lock);
 763         ReleaseReadLock(&adp->lock);
 764         afs_PutDCache(dcp);
 765         goto tagain;
 766     }
 767
 768     /* Generate a sequence number so we can tell whether we should
 769      * store the attributes when processing the response. This number is
 770      * stored in the file size when we set the CBulkFetching bit. If the
 771      * CBulkFetching is still set and this value hasn't changed, then
 772      * we know we were the last to set CBulkFetching bit for this file,
 773      * and it is safe to set the status information for this file.
 774      */
 775     statSeqNo = bulkStatCounter++;
 776     /* ensure against wrapping */
 777     if (statSeqNo == 0)
 778         statSeqNo = bulkStatCounter++;
 779
 780     /* now we have dir data in the cache, so scan the dir page */
 781     fidIndex = 0;
 782     flagIndex = 0;
 783     while (1) {                 /* Should probably have some constant bound */
 784         /* look for first safe entry to examine in the directory.  BlobScan
 785          * looks for a the 1st allocated dir after the dirCookie slot.
 786          */
 787         newIndex = BlobScan(dcp, (dirCookie >> 5));
 788         if (newIndex == 0)
 789             break;
 790
 791         /* remember the updated directory cookie */
 792         dirCookie = newIndex << 5;
 793
 794         /* get a ptr to the dir entry */
 795         dirEntryp =
 796             (struct DirEntry *)afs_dir_GetBlob(dcp, newIndex);
 797         if (!dirEntryp)
 798             break;
 799
 800         /* dont copy more than we have room for */
 801         if (fidIndex >= nentries) {
 802             DRelease(dirEntryp, 0);
 803             break;
 804         }
 805
 806         /* now, if the dir entry looks good, copy it out to our list.  Vnode
 807          * 0 means deleted, although it should also be free were it deleted.
 808          */
 809         if (dirEntryp->fid.vnode != 0) {
 810             /* dont copy entries we have in our cache.  This check will
 811              * also make us skip "." and probably "..", unless it has
 812              * disappeared from the cache since we did our namei call.
 813              */
 814             tfid.Cell = adp->f.fid.Cell;
 815             tfid.Fid.Volume = adp->f.fid.Fid.Volume;
 816             tfid.Fid.Vnode = ntohl(dirEntryp->fid.vnode);
 817             tfid.Fid.Unique = ntohl(dirEntryp->fid.vunique);
 818             do {
 819                 retry = 0;
 820                 ObtainWriteLock(&afs_xvcache, 130);
 821                 tvcp = afs_FindVCache(&tfid, &retry, IS_WLOCK /* no stats | LRU */ );
 822                 if (tvcp && retry) {
 823                     ReleaseWriteLock(&afs_xvcache);
 824                     afs_PutVCache(tvcp);
 825                 }
 826             } while (tvcp && retry);
 827             if (!tvcp) {        /* otherwise, create manually */
 828                 tvcp = afs_NewBulkVCache(&tfid, hostp, statSeqNo);
 829                 if (tvcp)
 830                 {
 831                         ObtainWriteLock(&tvcp->lock, 505);
 832                         ReleaseWriteLock(&afs_xvcache);
 833                         afs_RemoveVCB(&tfid);
 834                         ReleaseWriteLock(&tvcp->lock);
 835                 } else {
 836                         ReleaseWriteLock(&afs_xvcache);
 837                 }
 838             } else {
 839                 ReleaseWriteLock(&afs_xvcache);
 840             }
 841             if (!tvcp)
 842             {
 843                 DRelease(dirEntryp, 0);
 844                 ReleaseReadLock(&dcp->lock);
 845                 ReleaseReadLock(&adp->lock);
 846                 afs_PutDCache(dcp);
 847                 goto done;      /* can happen if afs_NewVCache fails */
 848             }
 849
 850             /* WARNING: afs_DoBulkStat uses the Length field to store a
 851              * sequence number for each bulk status request. Under no
 852              * circumstances should afs_DoBulkStat store a sequence number
 853              * if the new length will be ignored when afs_ProcessFS is
 854              * called with new stats. */
 855 #ifdef AFS_SGI_ENV
 856             if (!(tvcp->f.states & CStatd)
 857                 && (!((tvcp->f.states & CBulkFetching) &&
 858                       (tvcp->f.m.Length != statSeqNo)))
 859                 && (tvcp->execsOrWriters <= 0)
 860                 && !afs_DirtyPages(tvcp)
 861                 && !AFS_VN_MAPPED((vnode_t *) tvcp))
 862 #else
 863             if (!(tvcp->f.states & CStatd)
 864                 && (!((tvcp->f.states & CBulkFetching) &&
 865                       (tvcp->f.m.Length != statSeqNo)))
 866                 && (tvcp->execsOrWriters <= 0)
 867                 && !afs_DirtyPages(tvcp))
 868 #endif
 869
 870             {
 871                 /* this entry doesnt exist in the cache, and is not
 872                  * already being fetched by someone else, so add it to the
 873                  * list of file IDs to obtain.
 874                  *
 875                  * We detect a callback breaking race condition by checking the
 876                  * CBulkFetching state bit and the value in the file size.
 877                  * It is safe to set the status only if the CBulkFetching
 878                  * flag is still set and the value in the file size does
 879                  * not change. NewBulkVCache sets us up.
 880                  *
 881                  * Don't fetch status for dirty files. We need to
 882                  * preserve the value of the file size. We could
 883                  * flush the pages, but it wouldn't be worthwhile.
 884                  */
 885                 memcpy((char *)(fidsp + fidIndex), (char *)&tfid.Fid,
 886                        sizeof(*fidsp));
 887                 fidIndex++;
 888             }
 889             afs_PutVCache(tvcp);
 890         }
 891
 892         /* if dir vnode has non-zero entry */
 893         /* move to the next dir entry by adding in the # of entries
 894          * used by this dir entry.
 895          */
 896         temp = afs_dir_NameBlobs(dirEntryp->name) << 5;
 897         DRelease(dirEntryp, 0);
 898         if (temp <= 0)
 899             break;
 900         dirCookie += temp;
 901     }                           /* while loop over all dir entries */
 902
 903     /* now release the dir lock and prepare to make the bulk RPC */
 904     ReleaseReadLock(&dcp->lock);
 905     ReleaseReadLock(&adp->lock);
 906
 907     /* release the chunk */
 908     afs_PutDCache(dcp);
 909
 910     /* dont make a null call */
 911     if (fidIndex == 0)
 912         goto done;
 913
 914     do {
 915         /* setup the RPC parm structures */
 916         fidParm.AFSCBFids_len = fidIndex;
 917         fidParm.AFSCBFids_val = fidsp;
 918         statParm.AFSBulkStats_len = fidIndex;
 919         statParm.AFSBulkStats_val = statsp;
 920         cbParm.AFSCBs_len = fidIndex;
 921         cbParm.AFSCBs_val = cbsp;
 922
 923         /* start the timer; callback expirations are relative to this */
 924         startTime = osi_Time();
 925
 926         tcp = afs_Conn(&adp->f.fid, areqp, SHARED_LOCK);
 927         if (tcp) {
 928             hostp = tcp->srvr->server;
 929             XSTATS_START_TIME(AFS_STATS_FS_RPCIDX_BULKSTATUS);
 930             RX_AFS_GUNLOCK();
 931
 932             if (!(tcp->srvr->server->flags & SNO_INLINEBULK)) {
 933                 code =
 934                     RXAFS_InlineBulkStatus(tcp->id, &fidParm, &statParm,
 935                                            &cbParm, &volSync);
 936                 if (code == RXGEN_OPCODE) {
 937                     tcp->srvr->server->flags |= SNO_INLINEBULK;
 938                     inlinebulk = 0;
 939                     code =
 940                         RXAFS_BulkStatus(tcp->id, &fidParm, &statParm,
 941                                          &cbParm, &volSync);
 942                 } else
 943                     inlinebulk = 1;
 944             } else {
 945                 inlinebulk = 0;
 946                 code =
 947                     RXAFS_BulkStatus(tcp->id, &fidParm, &statParm, &cbParm,
 948                                      &volSync);
 949             }
 950             RX_AFS_GLOCK();
 951             XSTATS_END_TIME;
 952         } else
 953             code = -1;
 954     } while (afs_Analyze
 955              (tcp, code, &adp->f.fid, areqp, AFS_STATS_FS_RPCIDX_BULKSTATUS,
 956               SHARED_LOCK, NULL));
 957
 958     /* now, if we didnt get the info, bail out. */
 959     if (code)
 960         goto done;
 961
 962     /* we need vol flags to create the entries properly */
 963     dotdot.Fid.Volume = 0;
 964     volp = afs_GetVolume(&adp->f.fid, areqp, READ_LOCK);
 965     if (volp) {
 966         volStates = volp->states;
 967         if (volp->dotdot.Fid.Volume != 0)
 968             dotdot = volp->dotdot;
 969     } else
 970         volStates = 0;
 971
 972     /* find the place to merge the info into.  We do this by skipping
 973      * nskip entries in the LRU queue.  The more we skip, the more
 974      * we preserve, since the head of the VLRU queue is the most recently
 975      * referenced file.
 976      */
 977   reskip:
 978     nskip = afs_cacheStats / 2; /* preserved fraction of the cache */
 979     ObtainReadLock(&afs_xvcache);
 980  reskip2:
 981     if (QEmpty(&VLRU)) {
 982         /* actually a serious error, probably should panic. Probably will
 983          * panic soon, oh well. */
 984         ReleaseReadLock(&afs_xvcache);
 985         afs_warnuser("afs_DoBulkStat: VLRU empty!");
 986         goto done;
 987     }
 988     if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
 989         refpanic("Bulkstat VLRU inconsistent");
 990     }
 991     for (tq = VLRU.next; tq != &VLRU; tq = QNext(tq)) {
 992         if (--nskip <= 0) {
 993 #ifdef AFS_DARWIN80_ENV
 994             if (!(QTOV(tq)->f.states & CDeadVnode))
 995 #endif
 996                 break;
 997         }
 998         if (QNext(QPrev(tq)) != tq) {
 999             BStvc = QTOV(tq);
1000             refpanic("BulkStat VLRU inconsistent");
1001         }
1002     }
1003     if (tq != &VLRU)
1004         lruvcp = QTOV(tq);
1005     else
1006         lruvcp = QTOV(VLRU.next);
1007
1008     /* now we have to hold this entry, so that it does not get moved
1009      * into the free list while we're running.  It could still get
1010      * moved within the lru queue, but hopefully that will be rare; it
1011      * doesn't hurt nearly as much.
1012      */
1013     retry = 0;
1014 #ifdef AFS_DARWIN80_ENV
1015     if ((lruvcp->f.states & CDeadVnode)) {
1016         if (npasses == 0) {
1017             nskip = 1;
1018             npasses++;
1019             goto reskip2;
1020         } else {
1021             afs_warn("Can't find non-dead vnode in VLRU\n");
1022             novlru = 1;
1023         }
1024     }
1025     if (!novlru) {
1026         lruvp = AFSTOV(lruvcp);
1027         if (vnode_get(lruvp))       /* this bumps ref count */
1028             retry = 1;
1029         else if (vnode_ref(lruvp)) {
1030             AFS_GUNLOCK();
1031             /* AFSTOV(lruvcp) may be NULL */
1032             vnode_put(lruvp);
1033             AFS_GLOCK();
1034             retry = 1;
1035         }
1036     }
1037 #else
1038     if (novlru)
1039         osi_vnhold(lruvcp, &retry);
1040 #endif
1041     ReleaseReadLock(&afs_xvcache);      /* could be read lock */
1042     if (retry)
1043         goto reskip;
1044
1045     /* otherwise, merge in the info.  We have to be quite careful here,
1046      * since we need to ensure that we don't merge old info over newer
1047      * stuff in a stat cache entry.  We're very conservative here: we don't
1048      * do the merge at all unless we ourselves create the stat cache
1049      * entry.  That's pretty safe, and should work pretty well, since we
1050      * typically expect to do the stat cache creation ourselves.
1051      *
1052      * We also have to take into account racing token revocations.
1053      */
1054     for (i = 0; i < fidIndex; i++) {
1055         if ((&statsp[i])->errorCode)
1056             continue;
1057         afid.Cell = adp->f.fid.Cell;
1058         afid.Fid.Volume = adp->f.fid.Fid.Volume;
1059         afid.Fid.Vnode = fidsp[i].Vnode;
1060         afid.Fid.Unique = fidsp[i].Unique;
1061         do {
1062             retry = 0;
1063             ObtainReadLock(&afs_xvcache);
1064             tvcp = afs_FindVCache(&afid, &retry, 0 /* !stats&!lru */ );
1065             ReleaseReadLock(&afs_xvcache);
1066         } while (tvcp && retry);
1067
1068         /* The entry may no longer exist */
1069         if (tvcp == NULL) {
1070             continue;
1071         }
1072
1073         /* now we have the entry held, but we need to fill it in */
1074         ObtainWriteLock(&tvcp->lock, 131);
1075
1076         /* if CBulkFetching is not set, or if the file size no longer
1077          * matches the value we placed there when we set the CBulkFetching
1078          * flag, then someone else has done something with this node,
1079          * and we may not have the latest status information for this
1080          * file.  Leave the entry alone.
1081          */
1082         if (!(tvcp->f.states & CBulkFetching) || (tvcp->f.m.Length != statSeqNo)) {
1083 #ifdef AFS_DARWIN80_ENV
1084             int isdead = (tvcp->f.states & CDeadVnode);
1085 #endif
1086             flagIndex++;
1087             ReleaseWriteLock(&tvcp->lock);
1088 #ifdef AFS_DARWIN80_ENV
1089             if (!isdead)
1090                 /* re-acquire the usecount that the other finalizevnode disposed of */
1091                 vnode_ref(AFSTOV(tvcp));
1092 #endif
1093             afs_PutVCache(tvcp);
1094             continue;
1095         }
1096
1097         /* now copy ".." entry back out of volume structure, if necessary */
1098         if (tvcp->mvstat == 2 && (dotdot.Fid.Volume != 0)) {
1099             if (!tvcp->mvid)
1100                 tvcp->mvid = (struct VenusFid *)
1101                     osi_AllocSmallSpace(sizeof(struct VenusFid));
1102             *tvcp->mvid = dotdot;
1103         }
1104
1105         if (!novlru) {
1106             ObtainWriteLock(&afs_xvcache, 132);
1107             if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
1108                 refpanic("Bulkstat VLRU inconsistent2");
1109             }
1110             if ((QNext(QPrev(&tvcp->vlruq)) != &tvcp->vlruq)
1111                 || (QPrev(QNext(&tvcp->vlruq)) != &tvcp->vlruq)) {
1112                 refpanic("Bulkstat VLRU inconsistent4");
1113             }
1114             if ((QNext(QPrev(&lruvcp->vlruq)) != &lruvcp->vlruq)
1115                 || (QPrev(QNext(&lruvcp->vlruq)) != &lruvcp->vlruq)) {
1116                 refpanic("Bulkstat VLRU inconsistent5");
1117             }
1118
1119             if (tvcp != lruvcp) {       /* if they are == don't move it, don't corrupt vlru */
1120                 QRemove(&tvcp->vlruq);
1121                 QAdd(&lruvcp->vlruq, &tvcp->vlruq);
1122             }
1123
1124             if ((VLRU.next->prev != &VLRU) || (VLRU.prev->next != &VLRU)) {
1125                 refpanic("Bulkstat VLRU inconsistent3");
1126             }
1127             if ((QNext(QPrev(&tvcp->vlruq)) != &tvcp->vlruq)
1128                 || (QPrev(QNext(&tvcp->vlruq)) != &tvcp->vlruq)) {
1129                 refpanic("Bulkstat VLRU inconsistent5");
1130             }
1131             if ((QNext(QPrev(&lruvcp->vlruq)) != &lruvcp->vlruq)
1132                 || (QPrev(QNext(&lruvcp->vlruq)) != &lruvcp->vlruq)) {
1133                 refpanic("Bulkstat VLRU inconsistent6");
1134             }
1135             ReleaseWriteLock(&afs_xvcache);
1136         }
1137
1138         ObtainWriteLock(&afs_xcbhash, 494);
1139
1140         /* We need to check the flags again. We may have missed
1141          * something while we were waiting for a lock.
1142          */
1143         if (!(tvcp->f.states & CBulkFetching) || (tvcp->f.m.Length != statSeqNo)) {
1144             flagIndex++;
1145 #ifdef AFS_DARWIN80_ENV
1146             if ((tvcp->f.states & CDeadVnode) == 0)
1147                 /* re-acquire the usecount that the other finalizevnode disposed of */
1148                 vnode_ref(AFSTOV(tvcp));
1149 #endif
1150             ReleaseWriteLock(&tvcp->lock);
1151             ReleaseWriteLock(&afs_xcbhash);
1152             afs_PutVCache(tvcp);
1153             continue;
1154         }
1155
1156         /* now merge in the resulting status back into the vnode.
1157          * We only do this if the entry looks clear.
1158          */
1159         afs_ProcessFS(tvcp, &statsp[i], areqp);
1160 #if defined(AFS_LINUX22_ENV)
1161         afs_fill_inode(AFSTOV(tvcp), NULL);     /* reset inode operations */
1162 #endif
1163
1164         /* do some accounting for bulk stats: mark this entry as
1165          * loaded, so we can tell if we use it before it gets
1166          * recycled.
1167          */
1168         tvcp->f.states |= CBulkStat;
1169         tvcp->f.states &= ~CBulkFetching;
1170         flagIndex++;
1171         afs_bulkStatsDone++;
1172
1173         /* merge in vol info */
1174         if (volStates & VRO)
1175             tvcp->f.states |= CRO;
1176         if (volStates & VBackup)
1177             tvcp->f.states |= CBackup;
1178         if (volStates & VForeign)
1179             tvcp->f.states |= CForeign;
1180
1181         /* merge in the callback info */
1182         tvcp->f.states |= CTruth;
1183
1184         /* get ptr to the callback we are interested in */
1185         tcbp = cbsp + i;
1186
1187         if (tcbp->ExpirationTime != 0) {
1188             tvcp->cbExpires = tcbp->ExpirationTime + startTime;
1189             tvcp->callback = hostp;
1190             tvcp->f.states |= CStatd;
1191             afs_QueueCallback(tvcp, CBHash(tcbp->ExpirationTime), volp);
1192         } else if (tvcp->f.states & CRO) {
1193             /* ordinary callback on a read-only volume -- AFS 3.2 style */
1194             tvcp->cbExpires = 3600 + startTime;
1195             tvcp->callback = hostp;
1196             tvcp->f.states |= CStatd;
1197             afs_QueueCallback(tvcp, CBHash(3600), volp);
1198         } else {
1199             tvcp->callback = 0;
1200             tvcp->f.states &= ~(CStatd | CUnique);
1201             afs_DequeueCallback(tvcp);
1202             if ((tvcp->f.states & CForeign) || (vType(tvcp) == VDIR))
1203                 osi_dnlc_purgedp(tvcp); /* if it (could be) a directory */
1204         }
1205         ReleaseWriteLock(&afs_xcbhash);
1206 #ifdef AFS_DARWIN80_ENV
1207         /* reclaim->FlushVCache will need xcbhash */
1208         if (tvcp->f.states & CDeadVnode) {
1209             /* passing in a parent hangs getting the vnode lock */
1210             code = afs_darwin_finalizevnode(tvcp, NULL, NULL, 0, 1);
1211             if (code) {
1212                 /* It's gonna get recycled - shouldn't happen */
1213                 tvcp->callback = 0;
1214                 tvcp->f.states &= ~(CStatd | CUnique);
1215                 afs_DequeueCallback(tvcp);
1216                 if ((tvcp->f.states & CForeign) || (vType(tvcp) == VDIR))
1217                     osi_dnlc_purgedp(tvcp); /* if it (could be) a directory */
1218             } else
1219                 /* re-acquire the usecount that finalizevnode disposed of */
1220                 vnode_ref(AFSTOV(tvcp));
1221         }
1222 #endif
1223
1224         ReleaseWriteLock(&tvcp->lock);
1225         /* finally, we're done with the entry */
1226         afs_PutVCache(tvcp);
1227     }                           /* for all files we got back */
1228
1229     /* finally return the pointer into the LRU queue */
1230     if (!novlru) {
1231 #ifdef AFS_DARWIN80_ENV
1232         AFS_GUNLOCK();
1233         vnode_put(lruvp);
1234         vnode_rele(lruvp);
1235         AFS_GLOCK();
1236 #else
1237         afs_PutVCache(lruvcp);
1238 #endif
1239     }
1240
1241   done:
1242     /* Be sure to turn off the CBulkFetching flags */
1243     for (i = flagIndex; i < fidIndex; i++) {
1244         afid.Cell = adp->f.fid.Cell;
1245         afid.Fid.Volume = adp->f.fid.Fid.Volume;
1246         afid.Fid.Vnode = fidsp[i].Vnode;
1247         afid.Fid.Unique = fidsp[i].Unique;
1248         do {
1249             retry = 0;
1250             ObtainReadLock(&afs_xvcache);
1251             tvcp = afs_FindVCache(&afid, &retry, 0 /* !stats&!lru */ );
1252             ReleaseReadLock(&afs_xvcache);
1253         } while (tvcp && retry);
1254         if (tvcp != NULL && (tvcp->f.states & CBulkFetching)
1255             && (tvcp->f.m.Length == statSeqNo)) {
1256             tvcp->f.states &= ~CBulkFetching;
1257         }
1258         if (tvcp != NULL) {
1259 #ifdef AFS_DARWIN80_ENV
1260             if ((tvcp->f.states & CDeadVnode) == 0)
1261                 /* re-acquire the usecount that the other finalizevnode disposed of */
1262                 vnode_ref(AFSTOV(tvcp));
1263 #endif
1264             afs_PutVCache(tvcp);
1265         }
1266     }
1267     if (volp)
1268         afs_PutVolume(volp, READ_LOCK);
1269
1270     /* If we did the InlineBulk RPC pull out the return code */
1271     if (inlinebulk && code == 0) {
1272         if ((&statsp[0])->errorCode) {
1273             afs_Analyze(tcp, (&statsp[0])->errorCode, &adp->f.fid, areqp,
1274                         AFS_STATS_FS_RPCIDX_BULKSTATUS, SHARED_LOCK, NULL);
1275             code = (&statsp[0])->errorCode;
1276         }
1277     } else {
1278         code = 0;
1279     }
1280   done2:
1281     osi_FreeLargeSpace((char *)fidsp);
1282     osi_Free((char *)statsp, AFSCBMAX * sizeof(AFSFetchStatus));
1283     osi_Free((char *)cbsp, AFSCBMAX * sizeof(AFSCallBack));
1284     return code;
1285 }
1286
 1287 /* File-scope (static) integer switch, unconditionally initialized to 1.
       * The historical note "was: (AFS_DEC_ENV) || defined(AFS_OSF30_ENV) ||
       * defined(AFS_NCR_ENV)" records an older preprocessor condition that
       * apparently used to govern this setting.
       * NOTE(review): presumably consulted by afs_lookup to decide whether to
       * attempt a bulk stat; the use is not visible in this part of the file
       * -- confirm before relying on it. */
 1288 static int AFSDOBULK = 1;
1289
1290 int
1291 #if defined(AFS_SUN5_ENV) || defined(AFS_SGI_ENV)
1292 afs_lookup(OSI_VC_DECL(adp), char *aname, struct vcache **avcp, struct pathname *pnp, int flags, struct vnode *rdir, afs_ucred_t *acred)
1293 #elif defined(UKERNEL)
1294 afs_lookup(OSI_VC_DECL(adp), char *aname, struct vcache **avcp, afs_ucred_t *acred, int flags)
1295 #else
1296 afs_lookup(OSI_VC_DECL(adp), char *aname, struct vcache **avcp, afs_ucred_t *acred)
1297 #endif
1298 {
1299     struct vrequest treq;
1300     char *tname = NULL;
1301     register struct vcache *tvc = 0;
1302     register afs_int32 code;
1303     register afs_int32 bulkcode = 0;
1304     int pass = 0, hit = 0;
1305     int force_eval = afs_fakestat_enable ? 0 : 1;
1306     long dirCookie;
1307     extern afs_int32 afs_mariner;       /*Writing activity to log? */
1308     afs_hyper_t versionNo;
1309     int no_read_access = 0;
1310     struct sysname_info sysState;       /* used only for @sys checking */
1311     int dynrootRetry = 1;
1312     struct afs_fakestat_state fakestate;
1313     int tryEvalOnly = 0;
1314     OSI_VC_CONVERT(adp);
1315
1316     AFS_STATCNT(afs_lookup);
1317     afs_InitFakeStat(&fakestate);
1318
1319     AFS_DISCON_LOCK();
1320
1321     if ((code = afs_InitReq(&treq, acred)))
1322         goto done;
1323
1324     if (afs_fakestat_enable && adp->mvstat == 1) {
1325        if (strcmp(aname, ".directory") == 0)
1326            tryEvalOnly = 1;
1327     }
1328
1329 #if defined(AFS_DARWIN_ENV)
1330     /* Workaround for MacOSX Finder, which tries to look for
1331      * .DS_Store and Contents under every directory.
1332      */
1333     if (afs_fakestat_enable && adp->mvstat == 1) {
1334         if (strcmp(aname, ".DS_Store") == 0)
1335             tryEvalOnly = 1;
1336         if (strcmp(aname, "Contents") == 0)
1337             tryEvalOnly = 1;
1338     }
1339     if (afs_fakestat_enable && adp->mvstat == 2) {
1340         if (strncmp(aname, "._", 2) == 0)
1341             tryEvalOnly = 1;
1342     }
1343 #endif
1344
1345     if (tryEvalOnly)
1346         code = afs_TryEvalFakeStat(&adp, &fakestate, &treq);
1347     else
1348         code = afs_EvalFakeStat(&adp, &fakestate, &treq);
1349
1350     /*printf("Code is %d\n", code);*/
1351
1352     if (tryEvalOnly && adp->mvstat == 1)
1353         code = ENOENT;
1354     if (code)
1355         goto done;
1356
1357     *avcp = NULL;               /* Since some callers don't initialize it */
1358
1359     /* come back to here if we encounter a non-existent object in a read-only
1360      * volume's directory */
1361
1362   redo:
1363     *avcp = NULL;               /* Since some callers don't initialize it */
1364     bulkcode = 0;
1365
1366     if (!(adp->f.states & CStatd) && !afs_InReadDir(adp)) {
1367         if ((code = afs_VerifyVCache2(adp, &treq))) {
1368             goto done;
1369         }
1370     } else
1371         code = 0;
1372
1373     /* watch for ".." in a volume root */
1374     if (adp->mvstat == 2 && aname[0] == '.' && aname[1] == '.' && !aname[2]) {
1375         /* looking up ".." in root via special hacks */
1376         if (adp->mvid == (struct VenusFid *)0 || adp->mvid->Fid.Volume == 0) {
1377             code = ENODEV;
1378             goto done;
1379         }
1380         /* otherwise we have the fid here, so we use it */
1381         /*printf("Getting vcache\n");*/
1382         tvc = afs_GetVCache(adp->mvid, &treq, NULL, NULL);
1383         afs_Trace3(afs_iclSetp, CM_TRACE_GETVCDOTDOT, ICL_TYPE_FID, adp->mvid,
1384                    ICL_TYPE_POINTER, tvc, ICL_TYPE_INT32, code);
1385         *avcp = tvc;
1386         code = (tvc ? 0 : ENOENT);
1387         hit = 1;
1388         if (tvc && !VREFCOUNT_GT(tvc, 0)) {
1389             osi_Panic("TT1");
1390         }
1391         if (code) {
1392             /*printf("LOOKUP GETVCDOTDOT -> %d\n", code); */
1393         }
1394         goto done;
1395     }
1396
1397     /* now check the access */
1398     if (treq.uid != adp->last_looker) {
1399         if (!afs_AccessOK(adp, PRSFS_LOOKUP, &treq, CHECK_MODE_BITS)) {
1400             *avcp = NULL;
1401             code = EACCES;
1402             goto done;
1403         } else
1404             adp->last_looker = treq.uid;
1405     }
1406
1407     /* Check for read access as well.  We need read access in order to
1408      * stat files, but not to stat subdirectories. */
1409     if (!afs_AccessOK(adp, PRSFS_READ, &treq, CHECK_MODE_BITS))
1410         no_read_access = 1;
1411
1412     /* special case lookup of ".".  Can we check for it sooner in this code,
1413      * for instance, way up before "redo:" ??
1414      * I'm not fiddling with the LRUQ here, either, perhaps I should, or else
1415      * invent a lightweight version of GetVCache.
1416      */
1417     if (aname[0] == '.' && !aname[1]) { /* special case */
1418         ObtainReadLock(&afs_xvcache);
1419         osi_vnhold(adp, 0);
1420         ReleaseReadLock(&afs_xvcache);
1421 #ifdef AFS_DARWIN80_ENV
1422         vnode_get(AFSTOV(adp));
1423 #endif
1424         code = 0;
1425         *avcp = tvc = adp;
1426         hit = 1;
1427         if (adp && !VREFCOUNT_GT(adp, 0)) {
1428             osi_Panic("TT2");
1429         }
1430         goto done;
1431     }
1432
1433     /*
1434      * Special case lookup of ".." in the dynamic mount directory.
1435      * The parent of this directory is _always_ the AFS root volume.
1436      */
1437     if (afs_IsDynrootMount(adp) &&
1438         aname[0] == '.' && aname[1] == '.' && !aname[2]) {
1439
1440         ObtainReadLock(&afs_xvcache);
1441         osi_vnhold(afs_globalVp, 0);
1442         ReleaseReadLock(&afs_xvcache);
1443 #ifdef AFS_DARWIN80_ENV
1444         vnode_get(AFSTOV(afs_globalVp));
1445 #endif
1446         code = 0;
1447         *avcp = tvc = afs_globalVp;
1448         hit = 1;
1449         goto done;
1450     }
1451
1452     /*
1453      * Special case lookups in the dynamic mount directory.
1454      * The names here take the form cell:volume, similar to a mount point.
1455      * EvalMountData parses that and returns a cell and volume ID, which
1456      * we use to construct the appropriate dynroot Fid.
1457      */
1458     if (afs_IsDynrootMount(adp)) {
1459         struct VenusFid tfid;
1460         afs_uint32 cellidx, volid, vnoid, uniq;
1461
1462         code = EvalMountData('%', aname, 0, 0, NULL, &treq, &cellidx, &volid, &vnoid, &uniq);
1463         if (code)
1464             goto done;
1465         /* If a vnode was returned, it's not a real mount point */
1466         if (vnoid > 1) {
1467             struct cell *tcell = afs_GetCellByIndex(cellidx, READ_LOCK);
1468             tfid.Cell = tcell->cellNum;
1469             afs_PutCell(tcell, READ_LOCK);
1470             tfid.Fid.Vnode = vnoid;
1471             tfid.Fid.Volume = volid;
1472             tfid.Fid.Unique = uniq;
1473         } else {
1474             afs_GetDynrootMountFid(&tfid);
1475             tfid.Fid.Vnode = VNUM_FROM_TYPEID(VN_TYPE_MOUNT, cellidx << 2);
1476             tfid.Fid.Unique = volid;
1477         }
1478         *avcp = tvc = afs_GetVCache(&tfid, &treq, NULL, NULL);
1479         code = (tvc ? 0 : ENOENT);
1480         hit = 1;
1481         goto done;
1482     }
1483
1484 #ifdef AFS_LINUX26_ENV
1485     /*
1486      * Special case of the dynamic mount volume in a static root.
1487      * This is really unfortunate, but we need this for the translator.
1488      */
1489     if (adp == afs_globalVp && !afs_GetDynrootEnable() &&
1490         !strcmp(aname, AFS_DYNROOT_MOUNTNAME)) {
1491         struct VenusFid tfid;
1492
1493         afs_GetDynrootMountFid(&tfid);
1494         *avcp = tvc = afs_GetVCache(&tfid, &treq, NULL, NULL);
1495         code = 0;
1496         hit = 1;
1497         goto done;
1498     }
1499 #endif
1500
1501     Check_AtSys(adp, aname, &sysState, &treq);
1502     tname = sysState.name;
1503
1504     /* 1st Check_AtSys and lookup by tname is required here, for now,
1505      * because the dnlc is *not* told to remove entries for the parent
1506      * dir of file/dir op that afs_LocalHero likes, but dnlc is informed
1507      * if the cached entry for the parent dir is invalidated for a
1508      * non-local change.
1509      * Otherwise, we'd be able to do a dnlc lookup on an entry ending
1510      * w/@sys and know the dnlc was consistent with reality. */
1511     tvc = osi_dnlc_lookup(adp, tname, WRITE_LOCK);
1512     *avcp = tvc;                /* maybe wasn't initialized, but it is now */
1513     if (tvc) {
1514         if (no_read_access && vType(tvc) != VDIR && vType(tvc) != VLNK) {
1515             /* need read access on dir to stat non-directory / non-link */
1516 #ifndef AFS_FBSD80_ENV
1517             afs_PutVCache(tvc);
1518 #endif
1519             *avcp = NULL;
1520             code = EACCES;
1521             goto done;
1522         }
1523 #ifdef AFS_LINUX22_ENV
1524         if (tvc->mvstat == 2) { /* we don't trust the dnlc for root vcaches */
1525             AFS_RELE(AFSTOV(tvc));
1526             *avcp = 0;
1527         } else {
1528             code = 0;
1529             hit = 1;
1530             goto done;
1531         }
1532 #else /* non - LINUX */
1533         code = 0;
1534         hit = 1;
1535         goto done;
1536 #endif /* linux22 */
1537     }
1538
1539     {                           /* sub-block just to reduce stack usage */
1540         register struct dcache *tdc;
1541         afs_size_t dirOffset, dirLen;
1542         struct VenusFid tfid;
1543
1544         /* now we have to lookup the next fid */
1545         if (afs_InReadDir(adp))
1546             tdc = adp->dcreaddir;
1547         else
1548             tdc = afs_GetDCache(adp, (afs_size_t) 0, &treq,
1549                                 &dirOffset, &dirLen, 1);
1550         if (!tdc) {
1551             *avcp = NULL;       /* redundant, but harmless */
1552             code = EIO;
1553             goto done;
1554         }
1555
1556         /* now we will just call dir package with appropriate inode.
1557          * Dirs are always fetched in their entirety for now */
1558         ObtainReadLock(&adp->lock);
1559         ObtainReadLock(&tdc->lock);
1560
1561         /*
1562          * Make sure that the data in the cache is current. There are two
1563          * cases we need to worry about:
1564          * 1. The cache data is being fetched by another process.
1565          * 2. The cache data is no longer valid
1566          *
1567          * If a readdir is in progress _in this thread_, it has a shared
1568          * lock on the vcache and has obtained current data, so we just
1569          * use that.  This eliminates several possible deadlocks.
1570          */
1571         if (!afs_InReadDir(adp)) {
1572             while ((adp->f.states & CStatd)
1573                    && (tdc->dflags & DFFetching)
1574                    && hsame(adp->f.m.DataVersion, tdc->f.versionNo)) {
1575                 ReleaseReadLock(&tdc->lock);
1576                 ReleaseReadLock(&adp->lock);
1577                 afs_osi_Sleep(&tdc->validPos);
1578                 ObtainReadLock(&adp->lock);
1579                 ObtainReadLock(&tdc->lock);
1580             }
1581             if (!(adp->f.states & CStatd)
1582                 || !hsame(adp->f.m.DataVersion, tdc->f.versionNo)) {
1583                 ReleaseReadLock(&tdc->lock);
1584                 ReleaseReadLock(&adp->lock);
1585                 afs_PutDCache(tdc);
1586                 if (tname && tname != aname)
1587                     osi_FreeLargeSpace(tname);
1588                 goto redo;
1589             }
1590         }
1591
1592         /* Save the version number for when we call osi_dnlc_enter */
1593         hset(versionNo, tdc->f.versionNo);
1594
1595         /*
1596          * check for, and handle "@sys" if it's there.  We should be able
1597          * to avoid the alloc and the strcpy with a little work, but it's
1598          * not pressing.  If there aren't any remote users (ie, via the
1599          * NFS translator), we have a slightly easier job.
1600          * the faster way to do this is to check for *aname == '@' and if
1601          * it's there, check for @sys, otherwise, assume there's no @sys
1602          * then, if the lookup fails, check for .*@sys...
1603          */
1604         /* above now implemented by Check_AtSys and Next_AtSys */
1605
1606         /* lookup the name in the appropriate dir, and return a cache entry
1607          * on the resulting fid */
1608         code =
1609             afs_dir_LookupOffset(tdc, sysState.name, &tfid.Fid,
1610                                  &dirCookie);
1611
1612         /* If the first lookup doesn't succeed, maybe it's got @sys in the name */
1613         while (code == ENOENT && Next_AtSys(adp, &treq, &sysState))
1614             code =
1615                 afs_dir_LookupOffset(tdc, sysState.name, &tfid.Fid,
1616                                      &dirCookie);
1617         tname = sysState.name;
1618
1619         ReleaseReadLock(&tdc->lock);
1620         if (!afs_InReadDir(adp))
1621             afs_PutDCache(tdc);
1622         if (code == ENOENT && afs_IsDynroot(adp) && dynrootRetry && !tryEvalOnly) {
1623             ReleaseReadLock(&adp->lock);
1624             dynrootRetry = 0;
1625             if (tname[0] == '.')
1626                 afs_LookupAFSDB(tname + 1);
1627             else
1628                 afs_LookupAFSDB(tname);
1629             if (tname && tname != aname)
1630                 osi_FreeLargeSpace(tname);
1631             goto redo;
1632         } else {
1633             ReleaseReadLock(&adp->lock);
1634         }
1635
1636         /* new fid has same cell and volume */
1637         tfid.Cell = adp->f.fid.Cell;
1638         tfid.Fid.Volume = adp->f.fid.Fid.Volume;
1639         afs_Trace4(afs_iclSetp, CM_TRACE_LOOKUP, ICL_TYPE_POINTER, adp,
1640                    ICL_TYPE_STRING, tname, ICL_TYPE_FID, &tfid,
1641                    ICL_TYPE_INT32, code);
1642
1643         if (code) {
1644             if (code != ENOENT) {
1645                 /*printf("LOOKUP dirLookupOff -> %d\n", code);*/
1646             }
1647             goto done;
1648         }
1649
1650         /* prefetch some entries, if the dir is currently open.  The variable
1651          * dirCookie tells us where to start prefetching from.
1652          */
1653         if (!AFS_IS_DISCONNECTED &&
1654             AFSDOBULK && adp->opens > 0 && !(adp->f.states & CForeign)
1655             && !afs_IsDynroot(adp) && !afs_InReadDir(adp)) {
1656             afs_int32 retry;
1657             /* if the entry is not in the cache, or is in the cache,
1658              * but hasn't been statd, then do a bulk stat operation.
1659              */
1660             do {
1661                 retry = 0;
1662                 ObtainReadLock(&afs_xvcache);
1663                 tvc = afs_FindVCache(&tfid, &retry, 0 /* !stats,!lru */ );
1664                 ReleaseReadLock(&afs_xvcache);
1665             } while (tvc && retry);
1666
1667             if (!tvc || !(tvc->f.states & CStatd))
1668                 bulkcode = afs_DoBulkStat(adp, dirCookie, &treq);
1669             else
1670                 bulkcode = 0;
1671
1672             /* if the vcache isn't usable, release it */
1673             if (tvc && !(tvc->f.states & CStatd)) {
1674 #ifndef  AFS_FBSD80_ENV
1675                 afs_PutVCache(tvc);
1676 #endif
1677                 tvc = NULL;
1678             }
1679         } else {
1680             tvc = NULL;
1681             bulkcode = 0;
1682         }
1683
1684         /* now get the status info, if we don't already have it */
1685         /* This is kind of weird, but we might wind up accidentally calling
1686          * RXAFS_Lookup because we happened upon a file which legitimately
1687          * has a 0 uniquifier. That is the result of allowing unique to wrap
1688          * to 0. This was fixed in AFS 3.4. For CForeign, Unique == 0 means that
1689          * the file has not yet been looked up.
1690          */
1691         if (!tvc) {
1692             afs_int32 cached = 0;
1693             if (!tfid.Fid.Unique && (adp->f.states & CForeign)) {
1694                 tvc = afs_LookupVCache(&tfid, &treq, &cached, adp, tname);
1695             }
1696             if (!tvc && !bulkcode) {    /* lookup failed or wasn't called */
1697                 tvc = afs_GetVCache(&tfid, &treq, &cached, NULL);
1698             }
1699         }                       /* if !tvc */
1700     }                           /* sub-block just to reduce stack usage */
1701
1702     if (tvc) {
1703         if (adp->f.states & CForeign)
1704             tvc->f.states |= CForeign;
1705         tvc->f.parent.vnode = adp->f.fid.Fid.Vnode;
1706         tvc->f.parent.unique = adp->f.fid.Fid.Unique;
1707         tvc->f.states &= ~CBulkStat;
1708
1709         if (afs_fakestat_enable == 2 && tvc->mvstat == 1) {
1710             ObtainSharedLock(&tvc->lock, 680);
1711             if (!tvc->linkData) {
1712                 UpgradeSToWLock(&tvc->lock, 681);
1713                 code = afs_HandleLink(tvc, &treq);
1714                 ConvertWToRLock(&tvc->lock);
1715             } else {
1716                 ConvertSToRLock(&tvc->lock);
1717                 code = 0;
1718             }
1719             if (!code && !afs_strchr(tvc->linkData, ':'))
1720                 force_eval = 1;
1721             ReleaseReadLock(&tvc->lock);
1722         }
1723         if (tvc->mvstat == 1 && (tvc->f.states & CMValid) && tvc->mvid != NULL)
1724           force_eval = 1; /* This is now almost for free, get it correct */
1725
1726 #if defined(UKERNEL) && defined(AFS_WEB_ENHANCEMENTS)
1727         if (!(flags & AFS_LOOKUP_NOEVAL))
1728             /* don't eval mount points */
1729 #endif /* UKERNEL && AFS_WEB_ENHANCEMENTS */
1730             if (tvc->mvstat == 1 && force_eval) {
1731                 /* a mt point, possibly unevaluated */
1732                 struct volume *tvolp;
1733
1734                 ObtainWriteLock(&tvc->lock, 133);
1735                 code = EvalMountPoint(tvc, adp, &tvolp, &treq);
1736                 ReleaseWriteLock(&tvc->lock);
1737
1738                 if (code) {
1739 #ifndef AFS_FBSD80_ENV
1740                     afs_PutVCache(tvc);
1741 #endif
1742                     if (tvolp)
1743                         afs_PutVolume(tvolp, WRITE_LOCK);
1744                     goto done;
1745                 }
1746
1747                 /* next, we want to continue using the target of the mt point */
1748                 if (tvc->mvid && (tvc->f.states & CMValid)) {
1749                     struct vcache *uvc;
1750                     /* now lookup target, to set .. pointer */
1751                     afs_Trace2(afs_iclSetp, CM_TRACE_LOOKUP1,
1752                                ICL_TYPE_POINTER, tvc, ICL_TYPE_FID,
1753                                &tvc->f.fid);
1754                     uvc = tvc;  /* remember for later */
1755
1756                     if (tvolp && (tvolp->states & VForeign)) {
1757                         /* XXXX tvolp has ref cnt on but not locked! XXX */
1758                         tvc =
1759                             afs_GetRootVCache(tvc->mvid, &treq, NULL, tvolp);
1760                     } else {
1761                         tvc = afs_GetVCache(tvc->mvid, &treq, NULL, NULL);
1762                     }
1763 #ifndef AFS_FBSD80_ENV
1764                     afs_PutVCache(uvc); /* we're done with it */
1765 #endif
1766
1767                     if (!tvc) {
1768                         code = ENOENT;
1769                         if (tvolp) {
1770                             afs_PutVolume(tvolp, WRITE_LOCK);
1771                         }
1772                         goto done;
1773                     }
1774
1775                     /* now, if we came via a new mt pt (say because of a new
1776                      * release of a R/O volume), we must reevaluate the ..
1777                      * ptr to point back to the appropriate place */
1778                     if (tvolp) {
1779                         ObtainWriteLock(&tvc->lock, 134);
1780                         if (tvc->mvid == NULL) {
1781                             tvc->mvid = (struct VenusFid *)
1782                                 osi_AllocSmallSpace(sizeof(struct VenusFid));
1783                         }
1784                         /* setup backpointer */
1785                         *tvc->mvid = tvolp->dotdot;
1786                         ReleaseWriteLock(&tvc->lock);
1787                         afs_PutVolume(tvolp, WRITE_LOCK);
1788                     }
1789                 } else {
1790 #ifndef AFS_FBSD80_ENV
1791                     afs_PutVCache(tvc);
1792 #endif
1793                     code = ENOENT;
1794                     if (tvolp)
1795                         afs_PutVolume(tvolp, WRITE_LOCK);
1796                     goto done;
1797                 }
1798             }
1799         *avcp = tvc;
1800         if (tvc && !VREFCOUNT_GT(tvc, 0)) {
1801             osi_Panic("TT3");
1802         }
1803         code = 0;
1804     } else {
1805         /* if we get here, we found something in a directory that couldn't
1806          * be located (a Multics "connection failure").  If the volume is
1807          * read-only, we try flushing this entry from the cache and trying
1808          * again. */
1809         if (!AFS_IS_DISCONNECTED) {
1810             if (pass == 0) {
1811                 struct volume *tv;
1812                 tv = afs_GetVolume(&adp->f.fid, &treq, READ_LOCK);
1813                 if (tv) {
1814                     if (tv->states & VRO) {
1815                         pass = 1;       /* try this *once* */
1816                         ObtainWriteLock(&afs_xcbhash, 495);
1817                         afs_DequeueCallback(adp);
1818                         /* re-stat to get later version */
1819                         adp->f.states &= ~CStatd;
1820                         ReleaseWriteLock(&afs_xcbhash);
1821                         osi_dnlc_purgedp(adp);
1822                         afs_PutVolume(tv, READ_LOCK);
1823                         goto redo;
1824                     }
1825                     afs_PutVolume(tv, READ_LOCK);
1826                 }
1827             }
1828             code = ENOENT;
1829         } else {
1830             code = ENETDOWN;
1831         }
1832     }
1833
1834   done:
1835     /* put the network buffer back, if need be */
1836     if (tname != aname && tname)
1837         osi_FreeLargeSpace(tname);
1838     if (code == 0) {
1839
1840         if (afs_mariner)
1841             afs_AddMarinerName(aname, tvc);
1842
1843 #if defined(UKERNEL) && defined(AFS_WEB_ENHANCEMENTS)
1844         if (!(flags & AFS_LOOKUP_NOEVAL)) {
1845             /* Here we don't enter the name into the DNLC because we want the
1846              * evaluated mount dir to be there (the vcache for the mounted
1847              * volume) rather than the vc of the mount point itself.  We can
1848              * still find the mount point's vc in the vcache by its fid. */
1849 #endif /* UKERNEL && AFS_WEB_ENHANCEMENTS */
1850             if (!hit && force_eval) {
1851                 osi_dnlc_enter(adp, aname, tvc, &versionNo);
1852             } else {
1853 #ifdef AFS_LINUX20_ENV
1854                 /* So Linux inode cache is up to date. */
1855                 code = afs_VerifyVCache(tvc, &treq);
1856 #else
1857                 afs_PutFakeStat(&fakestate);
1858                 AFS_DISCON_UNLOCK();
1859                 return 0;       /* can't have been any errors if hit and !code */
1860 #endif
1861             }
1862 #if defined(UKERNEL) && defined(AFS_WEB_ENHANCEMENTS)
1863         }
1864 #endif
1865     }
1866     if (bulkcode)
1867         code = bulkcode;
1868
1869     code = afs_CheckCode(code, &treq, 19);
1870     if (code) {
1871         /* If there is an error, make sure *avcp is null.
1872          * Alphas panic otherwise - defect 10719.
1873          */
1874         *avcp = NULL;
1875     }
1876
1877     afs_PutFakeStat(&fakestate);
1878     AFS_DISCON_UNLOCK();
1879     return code;
1880 }