ceph: when seeing write errors on an inode, switch to sync writes

Currently, we don't have a real feedback mechanism in place for when we start seeing buffered writeback errors. If writeback is failing, there is nothing that prevents an application from continuing to dirty pages that aren't being cleaned.

In the event that we're seeing write errors of any sort occur on an inode, have the callback set a flag to force further writes to be synchronous. When the next write succeeds, clear the flag to allow buffered writeback to continue.

Since this is just a hint to the write submission mechanism, we only take the i_ceph_lock when a lockless check shows that the flag needs to be changed.

Signed-off-by: Jeff Layton <jlayton@redhat.com>
Reviewed-by: "Yan, Zheng" <zyan@redhat.com>
Signed-off-by: Ilya Dryomov <idryomov@gmail.com>
author: Jeff Layton <jlayton@redhat.com> 2017-04-04 08:39:46 -0400
committer: Ilya Dryomov <idryomov@gmail.com> 2017-05-04 09:19:22 +0200
commit: 26544c623e741ac6445f8b1ae369ee32ae1794ad (patch)
tree: 72810f59f5735dad3b29c5a127ae2a823fc1ff1d /fs/ceph/super.h
parent: 6fc1fe5e4cfc8939ee59a570b087946042a30140 (diff)
download: op-kernel-dev-26544c623e741ac6445f8b1ae369ee32ae1794ad.zip
op-kernel-dev-26544c623e741ac6445f8b1ae369ee32ae1794ad.tar.gz
1 files changed, 26 insertions, 0 deletions
diff --git a/fs/ceph/super.h b/fs/ceph/super.h
index c68e6a0..7334ee8 100644
--- a/fs/ceph/super.h
+++ b/fs/ceph/super.h
@@ -474,6 +474,32 @@ static inline struct inode *ceph_find_inode(struct super_block *sb,
 #define CEPH_I_CAP_DROPPED	(1 << 8)  /* caps were forcibly dropped */
 #define CEPH_I_KICK_FLUSH	(1 << 9)  /* kick flushing caps */
 #define CEPH_I_FLUSH_SNAPS	(1 << 10) /* need flush snapss */
+#define CEPH_I_ERROR_WRITE	(1 << 11) /* have seen write errors */
+
+/*
+ * We set the ERROR_WRITE bit when we start seeing write errors on an inode
+ * and then clear it when they start succeeding. Note that we do a lockless
+ * check first, and only take the lock if it looks like it needs to be changed.
+ * The write submission code just takes this as a hint, so we're not too
+ * worried if a few slip through in either direction.
+ */
+static inline void ceph_set_error_write(struct ceph_inode_info *ci)
+{
+	if (!(READ_ONCE(ci->i_ceph_flags) & CEPH_I_ERROR_WRITE)) {
+		spin_lock(&ci->i_ceph_lock);
+		ci->i_ceph_flags |= CEPH_I_ERROR_WRITE;
+		spin_unlock(&ci->i_ceph_lock);
+	}
+}
+
+static inline void ceph_clear_error_write(struct ceph_inode_info *ci)
+{
+	if (READ_ONCE(ci->i_ceph_flags) & CEPH_I_ERROR_WRITE) {
+		spin_lock(&ci->i_ceph_lock);
+		ci->i_ceph_flags &= ~CEPH_I_ERROR_WRITE;
+		spin_unlock(&ci->i_ceph_lock);
+	}
+}
 
 static inline void __ceph_dir_set_complete(struct ceph_inode_info *ci,
 					   long long release_count,
author	Jeff Layton <jlayton@redhat.com>	2017-04-04 08:39:46 -0400
committer	Ilya Dryomov <idryomov@gmail.com>	2017-05-04 09:19:22 +0200
commit	26544c623e741ac6445f8b1ae369ee32ae1794ad (patch)
tree	72810f59f5735dad3b29c5a127ae2a823fc1ff1d /fs/ceph/super.h
parent	6fc1fe5e4cfc8939ee59a570b087946042a30140 (diff)
download	op-kernel-dev-26544c623e741ac6445f8b1ae369ee32ae1794ad.zip op-kernel-dev-26544c623e741ac6445f8b1ae369ee32ae1794ad.tar.gz