Btrfs: cleanup the read failure record after write or when the inode is freeing After the data is written successfully, we should clean up the read failure record in that range because - If data COW is set for the file, the range that the failure record pointed to is mapped to a new place, so the record is invalid. - If data COW is not set for the file, and there is no error during writing, the corrupted data is corrected, so the failure record can be removed. And if some errors happen on the mirrors, we needn't worry about it either, because the failure record will be recreated if we read the same place again. Sometimes we may fail to correct the data, so the failure records will be left in the tree; we need to free them when we free the inode, or a memory leak happens. Signed-off-by: Miao Xie <miaox@cn.fujitsu.com> Signed-off-by: Chris Mason <clm@fb.com>

commit: f612496bca664bff6a09a99a9a7506410b6e876e [log] [tgz]
author: Miao Xie <miaox@cn.fujitsu.com> Fri Sep 12 18:44:04 2014 +0800
committer: Chris Mason <clm@fb.com> Wed Sep 17 13:39:02 2014 -0700
tree: d74da9c3d7c60a4ceb29c70be9a5d114eb7c8cc2
parent: 8b110e393c5a6e72d50fcdf9fa7ed8b647cfdfc9 [diff] [blame]
diff --git a/fs/btrfs/extent_io.c b/fs/btrfs/extent_io.c
index 9e2ef27..7822900 100644
--- a/fs/btrfs/extent_io.c
+++ b/fs/btrfs/extent_io.c

@@ -2138,6 +2138,40 @@
 	return 0;
 }
 
+/*
+ * Free every io failure record found in the inode's io_failure_tree from
+ * @start up to @end (inclusive), walking the EXTENT_DIRTY states under
+ * failure_tree->lock.  Can be called while holding the extent lock, under
+ * an ordered extent, or while the inode is being freed.
+ */
+void btrfs_free_io_failure_record(struct inode *inode, u64 start, u64 end)
+{
+	struct extent_io_tree *failure_tree = &BTRFS_I(inode)->io_failure_tree;
+	struct io_failure_record *failrec;
+	struct extent_state *state, *next;
+
+	if (RB_EMPTY_ROOT(&failure_tree->state))
+		return;
+
+	spin_lock(&failure_tree->lock);
+	state = find_first_extent_bit_state(failure_tree, start, EXTENT_DIRTY);
+	while (state) {
+		if (state->start > end)
+			break;
+
+		ASSERT(state->end <= end);	/* must not straddle @end */
+
+		next = next_state(state);	/* read before freeing state */
+
+		failrec = (struct io_failure_record *)state->private;
+		free_extent_state(state);
+		kfree(failrec);
+
+		state = next;
+	}
+	spin_unlock(&failure_tree->lock);
+}
+
 int btrfs_get_io_failure_record(struct inode *inode, u64 start, u64 end,
 				struct io_failure_record **failrec_ret)
 {
commit	f612496bca664bff6a09a99a9a7506410b6e876e	[log] [tgz]
author	Miao Xie <miaox@cn.fujitsu.com>	Fri Sep 12 18:44:04 2014 +0800
committer	Chris Mason <clm@fb.com>	Wed Sep 17 13:39:02 2014 -0700
tree	d74da9c3d7c60a4ceb29c70be9a5d114eb7c8cc2
parent	8b110e393c5a6e72d50fcdf9fa7ed8b647cfdfc9 [diff] [blame]