pnfs: Proper delay for NFS4ERR_RECALLCONFLICT in layout_get_done

author Boaz Harrosh <bharrosh@panasas.com>

Wed, 22 Jan 2014 18:34:54 +0000 (20:34 +0200)

committer Trond Myklebust <trond.myklebust@primarydata.com>

Thu, 23 Jan 2014 01:10:49 +0000 (18:10 -0700)
author Boaz Harrosh <bharrosh@panasas.com>
Wed, 22 Jan 2014 18:34:54 +0000 (20:34 +0200)
committer Trond Myklebust <trond.myklebust@primarydata.com>
Thu, 23 Jan 2014 01:10:49 +0000 (18:10 -0700)
diff --git a/fs/nfs/nfs4proc.c b/fs/nfs/nfs4proc.c

index a9eaaaa436cb37d7c32784bb7747fa9f1873e4c6..a1965329a12c078781431c289bdb1c8b10954782 100644 (file)
--- a/fs/nfs/nfs4proc.c
+++ b/fs/nfs/nfs4proc.c
@@ -7409,9 +7409,9 @@ static void nfs4_layoutget_done(struct rpc_task *task, void *calldata)
         struct nfs_server *server = NFS_SERVER(inode);
         struct pnfs_layout_hdr *lo;
         struct nfs4_state *state = NULL;
-       unsigned long timeo, giveup;
+       unsigned long timeo, now, giveup;
  
-       dprintk("--> %s\n", __func__);
+       dprintk("--> %s tk_status => %d\n", __func__, -task->tk_status);
  
         if (!nfs41_sequence_done(task, &lgp->res.seq_res))
                 goto out;
@@ -7419,12 +7419,38 @@ static void nfs4_layoutget_done(struct rpc_task *task, void *calldata)
         switch (task->tk_status) {
         case 0:
                 goto out;
+       /*
+        * NFS4ERR_LAYOUTTRYLATER is a conflict with another client
+        * (or clients) writing to the same RAID stripe
+        */
         case -NFS4ERR_LAYOUTTRYLATER:
+       /*
+        * NFS4ERR_RECALLCONFLICT is when conflict with self (must recall
+        * existing layout before getting a new one).
+        */
         case -NFS4ERR_RECALLCONFLICT:
                 timeo = rpc_get_timeout(task->tk_client);
                 giveup = lgp->args.timestamp + timeo;
-               if (time_after(giveup, jiffies))
-                       task->tk_status = -NFS4ERR_DELAY;
+               now = jiffies;
+               if (time_after(giveup, now)) {
+                       unsigned long delay;
+
+                       /* Delay for:
+                        * - Not less then NFS4_POLL_RETRY_MIN.
+                        * - One last time a jiffie before we give up
+                        * - exponential backoff (time_now minus start_attempt)
+                        */
+                       delay = max_t(unsigned long, NFS4_POLL_RETRY_MIN,
+                                   min((giveup - now - 1),
+                                       now - lgp->args.timestamp));
+
+                       dprintk("%s: NFS4ERR_RECALLCONFLICT waiting %lu\n",
+                               __func__, delay);
+                       rpc_delay(task, delay);
+                       task->tk_status = 0;
+                       rpc_restart_call_prepare(task);
+                       goto out; /* Do not call nfs4_async_handle_error() */
+               }
                 break;
         case -NFS4ERR_EXPIRED:
         case -NFS4ERR_BAD_STATEID:
author	Boaz Harrosh <bharrosh@panasas.com>
	Wed, 22 Jan 2014 18:34:54 +0000 (20:34 +0200)
committer	Trond Myklebust <trond.myklebust@primarydata.com>
	Thu, 23 Jan 2014 01:10:49 +0000 (18:10 -0700)