NFSv4 fix CLOSE not waiting for direct IO completion
authorOlga Kornievskaia <olga.kornievskaia@gmail.com>
Wed, 24 Jun 2020 17:54:08 +0000 (13:54 -0400)
committerSasha Levin <sashal@kernel.org>
Tue, 30 Jun 2020 00:08:04 +0000 (20:08 -0400)
commit d03727b248d0dae6199569a8d7b629a681154633 upstream.

Neil Brown figured out the root cause of the REMOVE/CLOSE race and
suggested the solution.

Currently, direct IO calls hold a reference on the open context,
which is dropped by an asynchronous task in nfs_direct_complete().
Before that reference is dropped, control is returned to the
application, which is free to close the file. When the close is
processed, it drops its own reference on the open context, but since
direct IO still holds one, it doesn't send a CLOSE on the wire. It
returns control to the application, which is free to do other
operations. For instance, it can delete the file. Direct IO then
finally releases its reference, triggering an asynchronous CLOSE,
which races with the REMOVE. On the server, the REMOVE can be
processed before the CLOSE, failing the REMOVE with EACCES as the
file is still open.

Fix this by making nfs_file_release() wait for outstanding direct IO
with inode_dio_wait() before clearing the open context, and by
calling inode_dio_end() only after the direct IO request has been
released (holding an inode reference across the release).

Signed-off-by: Olga Kornievskaia <kolga@netapp.com>
Suggested-by: Neil Brown <neilb@suse.com>
CC: stable@vger.kernel.org
Signed-off-by: Anna Schumaker <Anna.Schumaker@Netapp.com>
Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
fs/nfs/direct.c
fs/nfs/file.c

index 7789f0b9b999ecd11d9d0286ff3e391f5bde43f2..4d76e9a97538d06ae1bce05dcba67010bb28d9e8 100644 (file)
@@ -385,8 +385,6 @@ static void nfs_direct_complete(struct nfs_direct_req *dreq, bool write)
        if (write)
                nfs_zap_mapping(inode, inode->i_mapping);
 
-       inode_dio_end(inode);
-
        if (dreq->iocb) {
                long res = (long) dreq->error;
                if (!res)
@@ -396,7 +394,10 @@ static void nfs_direct_complete(struct nfs_direct_req *dreq, bool write)
 
        complete_all(&dreq->completion);
 
+       igrab(inode);
        nfs_direct_req_release(dreq);
+       inode_dio_end(inode);
+       iput(inode);
 }
 
 static void nfs_direct_readpage_release(struct nfs_page *req)
@@ -537,8 +538,10 @@ static ssize_t nfs_direct_read_schedule_iovec(struct nfs_direct_req *dreq,
         * generic layer handle the completion.
         */
        if (requested_bytes == 0) {
-               inode_dio_end(inode);
+               igrab(inode);
                nfs_direct_req_release(dreq);
+               inode_dio_end(inode);
+               iput(inode);
                return result < 0 ? result : -EIO;
        }
 
@@ -939,8 +942,10 @@ static ssize_t nfs_direct_write_schedule_iovec(struct nfs_direct_req *dreq,
         * generic layer handle the completion.
         */
        if (requested_bytes == 0) {
-               inode_dio_end(inode);
+               igrab(inode);
                nfs_direct_req_release(dreq);
+               inode_dio_end(inode);
+               iput(inode);
                return result < 0 ? result : -EIO;
        }
 
index dc875cd0e11d52386c893ee83c1c71ff40f855ef..eaa6697d256ea587f5d6bc38969781b67d196edc 100644 (file)
@@ -82,6 +82,7 @@ nfs_file_release(struct inode *inode, struct file *filp)
        dprintk("NFS: release(%pD2)\n", filp);
 
        nfs_inc_stats(inode, NFSIOS_VFSRELEASE);
+       inode_dio_wait(inode);
        nfs_file_clear_open_context(filp);
        return 0;
 }