osi_rwlock_t cm_connLock;
-long RDRtimeout = CM_CONN_DEFAULTRDRTIMEOUT;
+DWORD RDRtimeout = CM_CONN_DEFAULTRDRTIMEOUT; /* logged with %u as the lanmanworkstation SessTimeout; ConnDeadtimeout falls back to half of this value when it is 0 */
unsigned short ConnDeadtimeout = CM_CONN_CONNDEADTIME;
unsigned short HardDeadtimeout = CM_CONN_HARDDEADTIME;
void cm_PutConn(cm_conn_t *connp)
{
lock_ObtainWrite(&cm_connLock);
- osi_assert(connp->refCount-- > 0);
+ osi_assertx(connp->refCount-- > 0, "cm_conn_t refcount 0");
lock_ReleaseWrite(&cm_connLock);
}
RegCloseKey(parmKey);
}
- afsi_log("lanmanworkstation : SessTimeout %d", RDRtimeout);
+ afsi_log("lanmanworkstation : SessTimeout %u", RDRtimeout);
if (ConnDeadtimeout == 0)
ConnDeadtimeout = (unsigned short) (RDRtimeout / 2);
afsi_log("ConnDeadTimeout is %d", ConnDeadtimeout);
if (!fidp) {
*serversppp = NULL;
- return 0;
+ return CM_ERROR_INVAL;
}
- cellp = cm_FindCellByID(fidp->cell);
- if (!cellp) return CM_ERROR_NOSUCHCELL;
+ cellp = cm_FindCellByID(fidp->cell, 0);
+ if (!cellp)
+ return CM_ERROR_NOSUCHCELL;
- code = cm_GetVolumeByID(cellp, fidp->volume, userp, reqp, &volp);
- if (code) return code;
+ code = cm_GetVolumeByID(cellp, fidp->volume, userp, reqp, CM_GETVOL_FLAG_CREATE, &volp);
+ if (code)
+ return code;
*serversppp = cm_GetVolServers(volp, fidp->volume);
* and if we're going to retry, determine whether failover is appropriate,
* and whether timed backoff is appropriate.
*
- * If the error code is from cm_Conn() or friends, it will be a CM_ERROR code.
+ * If the error code is from cm_ConnFromFID() or friends, it will be a CM_ERROR code.
* Otherwise it will be an RPC code. This may be a UNIX code (e.g. EDQUOT), or
* it may be an RX code, or it may be a special code (e.g. VNOVOL), or it may
* be a security code (e.g. RXKADEXPIRED).
*
- * If the error code is from cm_Conn() or friends, connp will be NULL.
+ * If the error code is from cm_ConnFromFID() or friends, connp will be NULL.
*
* For VLDB calls, fidp will be NULL.
*
cm_serverRef_t *tsrp;
cm_cell_t *cellp = NULL;
cm_ucell_t *ucellp;
+ cm_volume_t * volp = NULL;
+ cm_vol_state_t *statep = NULL;
int retry = 0;
int free_svr_list = 0;
int dead_session;
long timeUsed, timeLeft;
long code;
char addr[16];
+ int forcing_new = 0;
osi_Log2(afsd_logp, "cm_Analyze connp 0x%p, code 0x%x",
connp, errorCode);
lock_ReleaseWrite(&cm_callbackLock);
}
- /* If not allowed to retry, don't */
- if (reqp->flags & CM_REQ_NORETRY)
- goto out;
-
/* if timeout - check that it did not exceed the HardDead timeout
* and retry */
/* leave 5 seconds margin for sleep */
timeLeft = HardDeadtimeout - timeUsed;
+ /* get a pointer to the cell */
+ if (errorCode) {
+ if (cellp == NULL && serverp)
+ cellp = serverp->cellp;
+ if (cellp == NULL && serversp) {
+ struct cm_serverRef * refp;
+ for ( refp=serversp ; cellp == NULL && refp != NULL; refp=refp->next) {
+ if ( refp->server )
+ cellp = refp->server->cellp;
+ }
+ }
+ if (cellp == NULL && fidp) {
+ cellp = cm_FindCellByID(fidp->cell, 0);
+ }
+ }
+
if (errorCode == CM_ERROR_TIMEDOUT) {
if (timeLeft > 5 ) {
thrd_Sleep(3000);
- if (cellp == NULL && serverp)
- cellp = serverp->cellp;
- if (cellp == NULL && serversp) {
- struct cm_serverRef * refp;
- for ( refp=serversp ; cellp == NULL && refp != NULL; refp=refp->next) {
- if ( refp->server )
- cellp = refp->server->cellp;
- }
- }
cm_CheckServers(CM_FLAG_CHECKDOWNSERVERS, cellp);
retry = 1;
}
- }
+ }
+
+ else if (errorCode == UAEWOULDBLOCK || errorCode == EWOULDBLOCK ||
+ errorCode == UAEAGAIN || errorCode == EAGAIN) {
+ osi_Log0(afsd_logp, "cm_Analyze passed EWOULDBLOCK or EAGAIN.");
+ if (timeLeft > 5 ) {
+ thrd_Sleep(1000);
+ retry = 1;
+ }
+ }
/* if there is nosuchvolume, then we have a situation in which a
* previously known volume no longer has a set of servers
}
else if (errorCode == CM_ERROR_ALLOFFLINE) {
- if (timeLeft > 7) {
- osi_Log0(afsd_logp, "cm_Analyze passed CM_ERROR_ALLOFFLINE.");
+ osi_Log0(afsd_logp, "cm_Analyze passed CM_ERROR_ALLOFFLINE.");
+ /* Volume instances marked offline will be restored by the
+ * background daemon thread as they become available
+ */
+ if (timeLeft > 7 && fidp) {
thrd_Sleep(5000);
-
- if (fidp) { /* Not a VLDB call */
- if (!serversp) {
- code = cm_GetServerList(fidp, userp, reqp, &serverspp);
- if (code == 0) {
- serversp = *serverspp;
- free_svr_list = 1;
- }
- }
- if (serversp) {
- lock_ObtainWrite(&cm_serverLock);
- for (tsrp = serversp; tsrp; tsrp=tsrp->next)
- tsrp->status = not_busy;
- lock_ReleaseWrite(&cm_serverLock);
- if (free_svr_list) {
- cm_FreeServerList(&serversp);
- *serverspp = serversp;
- }
- retry = 1;
- }
- cm_ForceUpdateVolume(fidp, userp, reqp);
- } else { /* VLDB call */
- if (serversp) {
- lock_ObtainWrite(&cm_serverLock);
- for (tsrp = serversp; tsrp; tsrp=tsrp->next)
- tsrp->status = not_busy;
- lock_ReleaseWrite(&cm_serverLock);
- if (free_svr_list) {
- cm_FreeServerList(&serversp);
- *serverspp = serversp;
- }
- }
- }
+ code = cm_GetVolumeByID(cellp, fidp->volume, userp, reqp,
+ CM_GETVOL_FLAG_NO_LRU_UPDATE,
+ &volp);
+ if (code == 0) {
+ if (fidp->volume == volp->rw.ID)
+ statep = &volp->rw;
+ else if (fidp->volume == volp->ro.ID)
+ statep = &volp->ro;
+ else if (fidp->volume == volp->bk.ID)
+ statep = &volp->bk;
+
+ if (statep->state != vl_offline) {
+ retry = 1;
+ } else {
+ if (cm_CheckOfflineVolume(volp, statep->ID))
+ retry = 1;
+ }
+
+ cm_PutVolume(volp);
+ }
}
}
-
- /* if all servers are busy, mark them non-busy and start over */
else if (errorCode == CM_ERROR_ALLBUSY) {
+ /* Volumes that are busy cannot be determined to be non-busy
+ * without actually attempting to access them.
+ */
osi_Log0(afsd_logp, "cm_Analyze passed CM_ERROR_ALLBUSY.");
if (timeLeft > 7) {
+
thrd_Sleep(5000);
- if (!serversp) {
- code = cm_GetServerList(fidp, userp, reqp, &serverspp);
+
+ if (fidp) { /* File Server query */
+ code = cm_GetVolumeByID(cellp, fidp->volume, userp, reqp,
+ CM_GETVOL_FLAG_NO_LRU_UPDATE,
+ &volp);
if (code == 0) {
- serversp = *serverspp;
- free_svr_list = 1;
+ if (fidp->volume == volp->rw.ID)
+ statep = &volp->rw;
+ else if (fidp->volume == volp->ro.ID)
+ statep = &volp->ro;
+ else if (fidp->volume == volp->bk.ID)
+ statep = &volp->bk;
+
+ if (statep->state != vl_offline && statep->state != vl_busy) {
+ retry = 1;
+ } else {
+ if (!serversp) {
+ code = cm_GetServerList(fidp, userp, reqp, &serverspp);
+ if (code == 0) {
+ serversp = *serverspp;
+ free_svr_list = 1;
+ }
+ }
+ lock_ObtainWrite(&cm_serverLock);
+ for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
+ if (tsrp->status == srv_busy) {
+ tsrp->status = srv_not_busy;
+ }
+ }
+ lock_ReleaseWrite(&cm_serverLock);
+ if (free_svr_list) {
+ cm_FreeServerList(&serversp, 0);
+ *serverspp = serversp;
+ }
+
+ cm_UpdateVolumeStatus(volp, statep->ID);
+ retry = 1;
+ }
+
+ cm_PutVolume(volp);
+ }
+ } else { /* VL Server query */
+ if (serversp) {
+ lock_ObtainWrite(&cm_serverLock);
+ for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
+ if (tsrp->status == srv_busy) {
+ tsrp->status = srv_not_busy;
+ }
+ }
+ lock_ReleaseWrite(&cm_serverLock);
+ retry = 1;
}
}
- lock_ObtainWrite(&cm_serverLock);
- for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
- if (tsrp->status == busy)
- tsrp->status = not_busy;
- }
- lock_ReleaseWrite(&cm_serverLock);
- if (free_svr_list) {
- cm_FreeServerList(&serversp);
- *serverspp = serversp;
- }
- retry = 1;
}
}
/* special codes: VBUSY and VRESTARTING */
else if (errorCode == VBUSY || errorCode == VRESTARTING) {
- if (!serversp) {
+ if (!serversp && fidp) {
code = cm_GetServerList(fidp, userp, reqp, &serverspp);
if (code == 0) {
serversp = *serverspp;
}
lock_ObtainWrite(&cm_serverLock);
for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
- if (tsrp->server == serverp
- && tsrp->status == not_busy) {
- tsrp->status = busy;
+ if (tsrp->server == serverp && tsrp->status == srv_not_busy) {
+ tsrp->status = srv_busy;
+ if (fidp) { /* File Server query */
+ code = cm_GetVolumeByID(cellp, fidp->volume, userp, reqp,
+ CM_GETVOL_FLAG_NO_LRU_UPDATE,
+ &volp);
+ if (code == 0) {
+ if (fidp->volume == volp->rw.ID)
+ statep = &volp->rw;
+ else if (fidp->volume == volp->ro.ID)
+ statep = &volp->ro;
+ else if (fidp->volume == volp->bk.ID)
+ statep = &volp->bk;
+ }
+ }
break;
}
}
lock_ReleaseWrite(&cm_serverLock);
+
+ if (statep) {
+ cm_UpdateVolumeStatus(volp, statep->ID);
+ cm_PutVolume(volp);
+ }
+
if (free_svr_list) {
- cm_FreeServerList(&serversp);
+ cm_FreeServerList(&serversp, 0);
*serverspp = serversp;
}
retry = 1;
LogEvent(EVENTLOG_WARNING_TYPE, msgID, addr, fidp->volume);
/* Mark server offline for this volume */
- if (!serversp) {
+ if (!serversp && fidp) {
code = cm_GetServerList(fidp, userp, reqp, &serverspp);
if (code == 0) {
serversp = *serverspp;
free_svr_list = 1;
}
}
+ lock_ObtainWrite(&cm_serverLock);
for (tsrp = serversp; tsrp; tsrp=tsrp->next) {
- if (tsrp->server == serverp)
- tsrp->status = offline;
+ if (tsrp->server == serverp) {
+ /* REDIRECT */
+ if (errorCode == VMOVED) {
+ tsrp->status = srv_deleted;
+ } else {
+ tsrp->status = srv_offline;
+ }
+
+ if (fidp) { /* File Server query */
+ code = cm_GetVolumeByID(cellp, fidp->volume, userp, reqp,
+ CM_GETVOL_FLAG_NO_LRU_UPDATE,
+ &volp);
+ if (code == 0) {
+ if (fidp->volume == volp->rw.ID)
+ statep = &volp->rw;
+ else if (fidp->volume == volp->ro.ID)
+ statep = &volp->ro;
+ else if (fidp->volume == volp->bk.ID)
+ statep = &volp->bk;
+ }
+ }
+ }
}
+ lock_ReleaseWrite(&cm_serverLock);
+
+ if (fidp && errorCode == VMOVED)
+ cm_ForceUpdateVolume(fidp, userp, reqp);
+
+ if (statep) {
+ cm_UpdateVolumeStatus(volp, statep->ID);
+ cm_PutVolume(volp);
+ }
+
if (free_svr_list) {
- cm_FreeServerList(&serversp);
+ cm_FreeServerList(&serversp, 0);
*serverspp = serversp;
}
if ( timeLeft > 2 )
else if (errorCode >= -64 && errorCode < 0) {
/* mark server as down */
lock_ObtainMutex(&serverp->mx);
- serverp->flags |= CM_SERVERFLAG_DOWN;
+ if (reqp->flags & CM_REQ_NEW_CONN_FORCED) {
+ if (!(serverp->flags & CM_SERVERFLAG_DOWN)) {
+ serverp->flags |= CM_SERVERFLAG_DOWN;
+ serverp->downTime = time(NULL);
+ }
+ } else {
+ reqp->flags |= CM_REQ_NEW_CONN_FORCED;
+ forcing_new = 1;
+ }
lock_ReleaseMutex(&serverp->mx);
cm_ForceNewConnections(serverp);
if ( timeLeft > 2 )
case UAENOENT : s = "UAENOENT"; break;
case VICECONNBAD : s = "VICECONNBAD"; break;
case VICETOKENDEAD : s = "VICETOKENDEAD"; break;
+ case WSAEWOULDBLOCK : s = "WSAEWOULDBLOCK"; break;
+ case UAEWOULDBLOCK : s = "UAEWOULDBLOCK"; break;
case CM_ERROR_NOSUCHCELL : s = "CM_ERROR_NOSUCHCELL"; break;
case CM_ERROR_NOSUCHVOLUME : s = "CM_ERROR_NOSUCHVOLUME"; break;
case CM_ERROR_TIMEDOUT : s = "CM_ERROR_TIMEDOUT"; break;
}
}
- if (retry && dead_session)
+ /* If not allowed to retry, don't */
+ if (!forcing_new && (reqp->flags & CM_REQ_NORETRY))
+ retry = 0;
+ else if (retry && dead_session)
retry = 0;
out:
int someBusy = 0, someOffline = 0, allOffline = 1, allBusy = 1, allDown = 1;
long timeUsed, timeLeft, hardTimeLeft;
+ *connpp = NULL;
+
if (serversp == NULL) {
- osi_Log1(afsd_logp, "cm_ConnByMServers returning 0x%x", CM_ERROR_NOSUCHVOLUME);
- return CM_ERROR_NOSUCHVOLUME;
+ osi_Log1(afsd_logp, "cm_ConnByMServers returning 0x%x", CM_ERROR_ALLDOWN);
+ return CM_ERROR_ALLDOWN;
}
- *connpp = NULL;
-
timeUsed = (GetTickCount() - reqp->startTime) / 1000;
/* leave 5 seconds margin of safety */
lock_ReleaseWrite(&cm_serverLock);
if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
allDown = 0;
- if (tsrp->status == busy) {
+ if (tsrp->status == srv_deleted) {
+ /* skip this entry. no longer valid. */;
+ } else if (tsrp->status == srv_busy) {
allOffline = 0;
someBusy = 1;
- } else if (tsrp->status == offline) {
+ } else if (tsrp->status == srv_offline) {
allBusy = 0;
someOffline = 1;
} else {
serviceID = 52;
}
else {
- osi_assert(serverp->type == CM_SERVER_FILE);
+ osi_assertx(serverp->type == CM_SERVER_FILE, "incorrect server type");
port = htons(7000);
serviceID = 1;
}
tcp->cryptlevel = rxkad_clear;
secObjp = rxnull_NewClientSecurityObject();
}
- osi_assert(secObjp != NULL);
+ osi_assertx(secObjp != NULL, "null rx_securityClass");
tcp->callp = rx_NewConnection(serverp->addr.sin_addr.s_addr,
port,
serviceID,
cm_conn_t *tcp;
cm_ucell_t *ucellp;
+ *connpp = NULL;
+
lock_ObtainMutex(&userp->mx);
lock_ObtainWrite(&cm_connLock);
for (tcp = serverp->connsp; tcp; tcp=tcp->nextp) {
return 0;
}
-long cm_Conn(struct cm_fid *fidp, struct cm_user *userp, cm_req_t *reqp,
- cm_conn_t **connpp)
+/*
+ * Report whether the server list obtained for fidp currently offers a
+ * usable server.
+ *
+ * A private cm_req_t is initialised with cm_InitReq() and passed to
+ * cm_GetServerList().  The references are then examined while
+ * cm_serverLock is held for writing, and the list is handed back with
+ * cm_FreeServerList().
+ *
+ * References whose status is srv_deleted are ignored, in the same way
+ * cm_ConnByMServers() skips them as no longer valid; otherwise a stale
+ * reference would be counted as a healthy server.
+ *
+ * Returns 0 when the server list cannot be obtained, when every server
+ * has CM_SERVERFLAG_DOWN set, when every reference on a live server is
+ * busy, when every such reference is offline, or when both busy and
+ * offline references were seen.  Returns 1 otherwise.
+ * NOTE(review): the "both busy and offline" rule yields 0 even if a
+ * further healthy reference exists - confirm that this is intended.
+ */
+long cm_ServerAvailable(struct cm_fid *fidp, struct cm_user *userp)
{
long code;
+    cm_req_t req;
+    cm_serverRef_t **serverspp;
+    cm_serverRef_t *tsrp;
+    cm_server_t *tsp;
+    int someBusy = 0, someOffline = 0, allOffline = 1, allBusy = 1, allDown = 1;
+
+    cm_InitReq(&req);
+
+    code = cm_GetServerList(fidp, userp, &req, &serverspp);
+    if (code)
+        return 0;
+
+    lock_ObtainWrite(&cm_serverLock);
+    for (tsrp = *serverspp; tsrp; tsrp = tsrp->next) {
+        /* skip this entry. no longer valid. */
+        if (tsrp->status == srv_deleted)
+            continue;
+
+        tsp = tsrp->server;
+        cm_GetServerNoLock(tsp);
+        if (!(tsp->flags & CM_SERVERFLAG_DOWN)) {
+            allDown = 0;
+            if (tsrp->status == srv_busy) {
+                allOffline = 0;
+                someBusy = 1;
+            } else if (tsrp->status == srv_offline) {
+                allBusy = 0;
+                someOffline = 1;
+            } else {
+                allOffline = 0;
+                allBusy = 0;
+            }
+        }
+        cm_PutServerNoLock(tsp);
+    }
+    lock_ReleaseWrite(&cm_serverLock);
+    cm_FreeServerList(serverspp, 0);
+
+    if (allDown || allBusy)
+        return 0;
+    if (allOffline || (someBusy && someOffline))
+        return 0;
+    return 1;
+}
+/*
+ * Obtain a connection for the file identified by fidp.
+ *
+ * *connpp is cleared before anything else, so it is NULL when
+ * cm_GetServerList() fails and its code is returned.  Otherwise the
+ * server list is passed to cm_ConnByMServers(), the list is handed back
+ * with cm_FreeServerList(), and the code from cm_ConnByMServers() is
+ * returned.
+ *
+ * The returned cm_conn_t ** object is released in the subsequent call
+ * to cm_Analyze().
+ */
+long cm_ConnFromFID(struct cm_fid *fidp, struct cm_user *userp, cm_req_t *reqp,
+ cm_conn_t **connpp)
+{
+ long code;
cm_serverRef_t **serverspp;
+ *connpp = NULL;
+
code = cm_GetServerList(fidp, userp, reqp, &serverspp);
if (code) {
- *connpp = NULL;
return code;
}
code = cm_ConnByMServers(*serverspp, userp, reqp, connpp);
- cm_FreeServerList(serverspp);
+ cm_FreeServerList(serverspp, 0);
return code;
}
-extern struct rx_connection *
+
+/*
+ * Obtain a connection using the server list that cm_GetVolServers()
+ * yields for volid within volp.
+ *
+ * *connpp is cleared up front.  The list is passed to
+ * cm_ConnByMServers(), handed back with cm_FreeServerList(), and the
+ * code from cm_ConnByMServers() is returned to the caller.
+ */
+long cm_ConnFromVolume(struct cm_volume *volp, unsigned long volid, struct cm_user *userp, cm_req_t *reqp,
+ cm_conn_t **connpp)
+{
+    cm_serverRef_t **volServerspp;
+    long rc;
+
+    *connpp = NULL;
+
+    volServerspp = cm_GetVolServers(volp, volid);
+    rc = cm_ConnByMServers(*volServerspp, userp, reqp, connpp);
+
+    /* The list is handed back whether or not a connection was found. */
+    cm_FreeServerList(volServerspp, 0);
+
+    return rc;
+}
+
+
+extern struct rx_connection *
cm_GetRxConn(cm_conn_t *connp)
{
struct rx_connection * rxconn;