4.14-stable patches

author Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Sun, 11 Nov 2018 20:56:29 +0000 (12:56 -0800)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Sun, 11 Nov 2018 20:56:29 +0000 (12:56 -0800)
author Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Sun, 11 Nov 2018 20:56:29 +0000 (12:56 -0800)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Sun, 11 Nov 2018 20:56:29 +0000 (12:56 -0800)
diff --git a/queue-4.14/bpf-wait-for-running-bpf-programs-when-updating-map-in-map.patch b/queue-4.14/bpf-wait-for-running-bpf-programs-when-updating-map-in-map.patch

new file mode 100644 (file)

index 0000000..2e8a369
--- /dev/null
+++ b/queue-4.14/bpf-wait-for-running-bpf-programs-when-updating-map-in-map.patch
@@ -0,0 +1,66 @@
+From 1ae80cf31938c8f77c37a29bbe29e7f1cd492be8 Mon Sep 17 00:00:00 2001
+From: Daniel Colascione <dancol@google.com>
+Date: Fri, 12 Oct 2018 03:54:27 -0700
+Subject: bpf: wait for running BPF programs when updating map-in-map
+
+From: Daniel Colascione <dancol@google.com>
+
+commit 1ae80cf31938c8f77c37a29bbe29e7f1cd492be8 upstream.
+
+The map-in-map frequently serves as a mechanism for atomic
+snapshotting of state that a BPF program might record.  The current
+implementation is dangerous to use in this way, however, since
+userspace has no way of knowing when all programs that might have
+retrieved the "old" value of the map may have completed.
+
+This change ensures that map update operations on map-in-map map types
+always wait for all references to the old map to drop before returning
+to userspace.
+
+Signed-off-by: Daniel Colascione <dancol@google.com>
+Reviewed-by: Joel Fernandes (Google) <joel@joelfernandes.org>
+Signed-off-by: Alexei Starovoitov <ast@kernel.org>
+[fengc@google.com: 4.14 backport: adjust context]
+Signed-off-by: Chenbo Feng <fengc@google.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ kernel/bpf/syscall.c |   13 +++++++++++++
+ 1 file changed, 13 insertions(+)
+
+--- a/kernel/bpf/syscall.c
++++ b/kernel/bpf/syscall.c
+@@ -519,6 +519,17 @@ err_put:
+       return err;
+ }
+ 
++static void maybe_wait_bpf_programs(struct bpf_map *map)
++{
++      /* Wait for any running BPF programs to complete so that
++       * userspace, when we return to it, knows that all programs
++       * that could be running use the new map value.
++       */
++      if (map->map_type == BPF_MAP_TYPE_HASH_OF_MAPS ||
++          map->map_type == BPF_MAP_TYPE_ARRAY_OF_MAPS)
++              synchronize_rcu();
++}
++
+ #define BPF_MAP_UPDATE_ELEM_LAST_FIELD flags
+ 
+ static int map_update_elem(union bpf_attr *attr)
+@@ -592,6 +603,7 @@ static int map_update_elem(union bpf_att
+       }
+       __this_cpu_dec(bpf_prog_active);
+       preempt_enable();
++      maybe_wait_bpf_programs(map);
+ 
+       if (!err)
+               trace_bpf_map_update_elem(map, ufd, key, value);
+@@ -636,6 +648,7 @@ static int map_delete_elem(union bpf_att
+       rcu_read_unlock();
+       __this_cpu_dec(bpf_prog_active);
+       preempt_enable();
++      maybe_wait_bpf_programs(map);
+ 
+       if (!err)
+               trace_bpf_map_delete_elem(map, ufd, key);
diff --git a/queue-4.14/btrfs-don-t-run-delayed_iputs-in-commit.patch b/queue-4.14/btrfs-don-t-run-delayed_iputs-in-commit.patch

new file mode 100644 (file)

index 0000000..ac92b27
--- /dev/null
+++ b/queue-4.14/btrfs-don-t-run-delayed_iputs-in-commit.patch
@@ -0,0 +1,52 @@
+From 30928e9baac238a7330085a1c5747f0b5df444b4 Mon Sep 17 00:00:00 2001
+From: Josef Bacik <josef@toxicpanda.com>
+Date: Thu, 11 Oct 2018 15:54:31 -0400
+Subject: btrfs: don't run delayed_iputs in commit
+
+From: Josef Bacik <josef@toxicpanda.com>
+
+commit 30928e9baac238a7330085a1c5747f0b5df444b4 upstream.
+
+This could result in a really bad case where we do something like
+
+evict
+  evict_refill_and_join
+    btrfs_commit_transaction
+      btrfs_run_delayed_iputs
+        evict
+          evict_refill_and_join
+            btrfs_commit_transaction
+... forever
+
+We have plenty of other places where we run delayed iputs that are much
+safer, let those do the work.
+
+CC: stable@vger.kernel.org # 4.4+
+Reviewed-by: Filipe Manana <fdmanana@suse.com>
+Signed-off-by: Josef Bacik <josef@toxicpanda.com>
+Reviewed-by: David Sterba <dsterba@suse.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/transaction.c |    9 ---------
+ 1 file changed, 9 deletions(-)
+
+--- a/fs/btrfs/transaction.c
++++ b/fs/btrfs/transaction.c
+@@ -2307,15 +2307,6 @@ int btrfs_commit_transaction(struct btrf
+ 
+       kmem_cache_free(btrfs_trans_handle_cachep, trans);
+ 
+-      /*
+-       * If fs has been frozen, we can not handle delayed iputs, otherwise
+-       * it'll result in deadlock about SB_FREEZE_FS.
+-       */
+-      if (current != fs_info->transaction_kthread &&
+-          current != fs_info->cleaner_kthread &&
+-          !test_bit(BTRFS_FS_FROZEN, &fs_info->flags))
+-              btrfs_run_delayed_iputs(fs_info);
+-
+       return ret;
+ 
+ scrub_continue:
diff --git a/queue-4.14/btrfs-don-t-use-ctl-free_space-for-max_extent_size.patch b/queue-4.14/btrfs-don-t-use-ctl-free_space-for-max_extent_size.patch

new file mode 100644 (file)

index 0000000..11b66cb
--- /dev/null
+++ b/queue-4.14/btrfs-don-t-use-ctl-free_space-for-max_extent_size.patch
@@ -0,0 +1,56 @@
+From fb5c39d7a887108087de6ff93d3f326b01b4ef41 Mon Sep 17 00:00:00 2001
+From: Josef Bacik <jbacik@fb.com>
+Date: Thu, 11 Oct 2018 15:54:09 -0400
+Subject: btrfs: don't use ctl->free_space for max_extent_size
+
+From: Josef Bacik <jbacik@fb.com>
+
+commit fb5c39d7a887108087de6ff93d3f326b01b4ef41 upstream.
+
+max_extent_size is supposed to be the largest contiguous range for the
+space info, and ctl->free_space is the total free space in the block
+group.  We need to keep track of these separately and _only_ use the
+max_free_space if we don't have a max_extent_size, as that means our
+original request was too large to search any of the block groups for and
+therefore wouldn't have a max_extent_size set.
+
+CC: stable@vger.kernel.org # 4.14+
+Reviewed-by: Filipe Manana <fdmanana@suse.com>
+Signed-off-by: Josef Bacik <jbacik@fb.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/extent-tree.c |    7 +++++--
+ 1 file changed, 5 insertions(+), 2 deletions(-)
+
+--- a/fs/btrfs/extent-tree.c
++++ b/fs/btrfs/extent-tree.c
+@@ -7573,6 +7573,7 @@ static noinline int find_free_extent(str
+       struct btrfs_block_group_cache *block_group = NULL;
+       u64 search_start = 0;
+       u64 max_extent_size = 0;
++      u64 max_free_space = 0;
+       u64 empty_cluster = 0;
+       struct btrfs_space_info *space_info;
+       int loop = 0;
+@@ -7867,8 +7868,8 @@ unclustered_alloc:
+                       spin_lock(&ctl->tree_lock);
+                       if (ctl->free_space <
+                           num_bytes + empty_cluster + empty_size) {
+-                              if (ctl->free_space > max_extent_size)
+-                                      max_extent_size = ctl->free_space;
++                              max_free_space = max(max_free_space,
++                                                   ctl->free_space);
+                               spin_unlock(&ctl->tree_lock);
+                               goto loop;
+                       }
+@@ -8037,6 +8038,8 @@ loop:
+       }
+ out:
+       if (ret == -ENOSPC) {
++              if (!max_extent_size)
++                      max_extent_size = max_free_space;
+               spin_lock(&space_info->lock);
+               space_info->max_extent_size = max_extent_size;
+               spin_unlock(&space_info->lock);
diff --git a/queue-4.14/btrfs-fix-assertion-on-fsync-of-regular-file-when-using-no-holes-feature.patch b/queue-4.14/btrfs-fix-assertion-on-fsync-of-regular-file-when-using-no-holes-feature.patch

new file mode 100644 (file)

index 0000000..5dfcef2
--- /dev/null
+++ b/queue-4.14/btrfs-fix-assertion-on-fsync-of-regular-file-when-using-no-holes-feature.patch
@@ -0,0 +1,59 @@
+From 7ed586d0a8241e81d58c656c5b315f781fa6fc97 Mon Sep 17 00:00:00 2001
+From: Filipe Manana <fdmanana@suse.com>
+Date: Mon, 15 Oct 2018 09:51:00 +0100
+Subject: Btrfs: fix assertion on fsync of regular file when using no-holes feature
+
+From: Filipe Manana <fdmanana@suse.com>
+
+commit 7ed586d0a8241e81d58c656c5b315f781fa6fc97 upstream.
+
+When using the NO_HOLES feature and logging a regular file, we were
+expecting that if we find an inline extent, that either its size in RAM
+(uncompressed and unencoded) matches the size of the file or if it does
+not, that it matches the sector size and it represents compressed data.
+This assertion does not cover a case where the length of the inline extent
+is smaller than the sector size and also smaller than the file's size, such
+case is possible through fallocate. Example:
+
+  $ mkfs.btrfs -f -O no-holes /dev/sdb
+  $ mount /dev/sdb /mnt
+
+  $ xfs_io -f -c "pwrite -S 0xb60 0 21" /mnt/foobar
+  $ xfs_io -c "falloc 40 40" /mnt/foobar
+  $ xfs_io -c "fsync" /mnt/foobar
+
+In the above example we trigger the assertion because the inline extent's
+length is 21 bytes while the file size is 80 bytes. The fallocate() call
+merely updated the file's size and did not touch the existing inline
+extent, as expected.
+
+So fix this by adjusting the assertion so that an inline extent length
+smaller than the file size is valid if the file size is smaller than the
+filesystem's sector size.
+
+A test case for fstests follows soon.
+
+Reported-by: Anatoly Trosinenko <anatoly.trosinenko@gmail.com>
+Fixes: a89ca6f24ffe ("Btrfs: fix fsync after truncate when no_holes feature is enabled")
+CC: stable@vger.kernel.org # 4.14+
+Link: https://lore.kernel.org/linux-btrfs/CAE5jQCfRSBC7n4pUTFJcmHh109=gwyT9mFkCOL+NKfzswmR=_Q@mail.gmail.com/
+Signed-off-by: Filipe Manana <fdmanana@suse.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/tree-log.c |    3 ++-
+ 1 file changed, 2 insertions(+), 1 deletion(-)
+
+--- a/fs/btrfs/tree-log.c
++++ b/fs/btrfs/tree-log.c
+@@ -4641,7 +4641,8 @@ static int btrfs_log_trailing_hole(struc
+                       ASSERT(len == i_size ||
+                              (len == fs_info->sectorsize &&
+                               btrfs_file_extent_compression(leaf, extent) !=
+-                              BTRFS_COMPRESS_NONE));
++                              BTRFS_COMPRESS_NONE) ||
++                             (len < i_size && i_size < fs_info->sectorsize));
+                       return 0;
+               }
+ 
diff --git a/queue-4.14/btrfs-fix-fsync-after-hole-punching-when-using-no-holes-feature.patch b/queue-4.14/btrfs-fix-fsync-after-hole-punching-when-using-no-holes-feature.patch

new file mode 100644 (file)

index 0000000..1f210d8
--- /dev/null
+++ b/queue-4.14/btrfs-fix-fsync-after-hole-punching-when-using-no-holes-feature.patch
@@ -0,0 +1,97 @@
+From 4ee3fad34a9cc2cf33303dfbd0cf554248651c86 Mon Sep 17 00:00:00 2001
+From: Filipe Manana <fdmanana@suse.com>
+Date: Mon, 26 Mar 2018 23:59:00 +0100
+Subject: Btrfs: fix fsync after hole punching when using no-holes feature
+
+From: Filipe Manana <fdmanana@suse.com>
+
+commit 4ee3fad34a9cc2cf33303dfbd0cf554248651c86 upstream.
+
+When we have the no-holes mode enabled and fsync a file after punching a
+hole in it, we can end up not logging the whole hole range in the log tree.
+This happens if the file has extent items that span more than one leaf and
+we punch a hole that covers a range that starts in a leaf but does not go
+beyond the offset of the first extent in the next leaf.
+
+Example:
+
+  $ mkfs.btrfs -f -O no-holes -n 65536 /dev/sdb
+  $ mount /dev/sdb /mnt
+  $ for ((i = 0; i <= 831; i++)); do
+       offset=$((i * 2 * 256 * 1024))
+       xfs_io -f -c "pwrite -S 0xab -b 256K $offset 256K" \
+               /mnt/foobar >/dev/null
+    done
+  $ sync
+
+  # We now have 2 leafs in our filesystem fs tree, the first leaf has an
+  # item corresponding to the extent at file offset 216530944 and the second
+  # leaf has a first item corresponding to the extent at offset 217055232.
+  # Now we punch a hole that partially covers the range of the extent at
+  # offset 216530944 but does not go beyond the offset 217055232.
+
+  $ xfs_io -c "fpunch $((216530944 + 128 * 1024 - 4000)) 256K" /mnt/foobar
+  $ xfs_io -c "fsync" /mnt/foobar
+
+  <power fail>
+
+  # mount to replay the log
+  $ mount /dev/sdb /mnt
+
+  # Before this patch, only the subrange [216658016, 216662016[ (length of
+  # 4000 bytes) was logged, leaving an incorrect file layout after log
+  # replay.
+
+Fix this by checking if there is a hole between the last extent item that
+we processed and the first extent item in the next leaf, and if there is
+one, log an explicit hole extent item.
+
+Fixes: 16e7549f045d ("Btrfs: incompatible format change to remove hole extents")
+Signed-off-by: Filipe Manana <fdmanana@suse.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Sudip Mukherjee <sudipm.mukherjee@gmail.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/tree-log.c |   30 ++++++++++++++++++++++++++++++
+ 1 file changed, 30 insertions(+)
+
+--- a/fs/btrfs/tree-log.c
++++ b/fs/btrfs/tree-log.c
+@@ -3978,6 +3978,36 @@ fill_holes:
+                       break;
+               *last_extent = extent_end;
+       }
++
++      /*
++       * Check if there is a hole between the last extent found in our leaf
++       * and the first extent in the next leaf. If there is one, we need to
++       * log an explicit hole so that at replay time we can punch the hole.
++       */
++      if (ret == 0 &&
++          key.objectid == btrfs_ino(inode) &&
++          key.type == BTRFS_EXTENT_DATA_KEY &&
++          i == btrfs_header_nritems(src_path->nodes[0])) {
++              ret = btrfs_next_leaf(inode->root, src_path);
++              need_find_last_extent = true;
++              if (ret > 0) {
++                      ret = 0;
++              } else if (ret == 0) {
++                      btrfs_item_key_to_cpu(src_path->nodes[0], &key,
++                                            src_path->slots[0]);
++                      if (key.objectid == btrfs_ino(inode) &&
++                          key.type == BTRFS_EXTENT_DATA_KEY &&
++                          *last_extent < key.offset) {
++                              const u64 len = key.offset - *last_extent;
++
++                              ret = btrfs_insert_file_extent(trans, log,
++                                                             btrfs_ino(inode),
++                                                             *last_extent, 0,
++                                                             0, len, 0, len,
++                                                             0, 0, 0);
++                      }
++              }
++      }
+       /*
+        * Need to let the callers know we dropped the path so they should
+        * re-search.
diff --git a/queue-4.14/btrfs-fix-null-pointer-dereference-on-compressed-write-path-error.patch b/queue-4.14/btrfs-fix-null-pointer-dereference-on-compressed-write-path-error.patch

new file mode 100644 (file)

index 0000000..634529b
--- /dev/null
+++ b/queue-4.14/btrfs-fix-null-pointer-dereference-on-compressed-write-path-error.patch
@@ -0,0 +1,46 @@
+From 3527a018c00e5dbada2f9d7ed5576437b6dd5cfb Mon Sep 17 00:00:00 2001
+From: Filipe Manana <fdmanana@suse.com>
+Date: Sat, 13 Oct 2018 00:37:25 +0100
+Subject: Btrfs: fix null pointer dereference on compressed write path error
+
+From: Filipe Manana <fdmanana@suse.com>
+
+commit 3527a018c00e5dbada2f9d7ed5576437b6dd5cfb upstream.
+
+At inode.c:compress_file_range(), under the "free_pages_out" label, we can
+end up dereferencing the "pages" pointer when it has a NULL value. This
+case happens when "start" has a value of 0 and we fail to allocate memory
+for the "pages" pointer. When that happens we jump to the "cont" label and
+then enter the "if (start == 0)" branch where we immediately call the
+cow_file_range_inline() function. If that function returns 0 (success
+creating an inline extent) or an error (like -ENOMEM for example) we jump
+to the "free_pages_out" label and then access "pages[i]" leading to a NULL
+pointer dereference, since "nr_pages" has a value greater than zero at
+that point.
+
+Fix this by setting "nr_pages" to 0 when we fail to allocate memory for
+the "pages" pointer.
+
+Bugzilla: https://bugzilla.kernel.org/show_bug.cgi?id=201119
+Fixes: 771ed689d2cd ("Btrfs: Optimize compressed writeback and reads")
+CC: stable@vger.kernel.org # 4.4+
+Reviewed-by: Liu Bo <bo.liu@linux.alibaba.com>
+Signed-off-by: Filipe Manana <fdmanana@suse.com>
+Reviewed-by: David Sterba <dsterba@suse.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/inode.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/fs/btrfs/inode.c
++++ b/fs/btrfs/inode.c
+@@ -524,6 +524,7 @@ again:
+               pages = kcalloc(nr_pages, sizeof(struct page *), GFP_NOFS);
+               if (!pages) {
+                       /* just bail out to the uncompressed code */
++                      nr_pages = 0;
+                       goto cont;
+               }
+ 
diff --git a/queue-4.14/btrfs-fix-use-after-free-during-inode-eviction.patch b/queue-4.14/btrfs-fix-use-after-free-during-inode-eviction.patch

new file mode 100644 (file)

index 0000000..ef5e7ae
--- /dev/null
+++ b/queue-4.14/btrfs-fix-use-after-free-during-inode-eviction.patch
@@ -0,0 +1,61 @@
+From 421f0922a2cfb0c75acd9746454aaa576c711a65 Mon Sep 17 00:00:00 2001
+From: Filipe Manana <fdmanana@suse.com>
+Date: Fri, 12 Oct 2018 13:02:48 +0100
+Subject: Btrfs: fix use-after-free during inode eviction
+
+From: Filipe Manana <fdmanana@suse.com>
+
+commit 421f0922a2cfb0c75acd9746454aaa576c711a65 upstream.
+
+At inode.c:evict_inode_truncate_pages(), when we iterate over the
+inode's extent states, we access an extent state record's "state" field
+after we unlocked the inode's io tree lock. This can lead to a
+use-after-free issue because after we unlock the io tree that extent
+state record might have been freed due to being merged into another
+adjacent extent state record (a previous inflight bio for a read
+operation finished in the meanwhile which unlocked a range in the io
+tree and caused a merge of extent state records, as explained in the
+comment before the while loop added in commit 6ca0709756710 ("Btrfs: fix
+hang during inode eviction due to concurrent readahead")).
+
+Fix this by keeping a copy of the extent state's flags in a local
+variable and using it after unlocking the io tree.
+
+Bugzilla: https://bugzilla.kernel.org/show_bug.cgi?id=201189
+Fixes: b9d0b38928e2 ("btrfs: Add handler for invalidate page")
+CC: stable@vger.kernel.org # 4.4+
+Reviewed-by: Qu Wenruo <wqu@suse.com>
+Signed-off-by: Filipe Manana <fdmanana@suse.com>
+Reviewed-by: David Sterba <dsterba@suse.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/inode.c |    4 +++-
+ 1 file changed, 3 insertions(+), 1 deletion(-)
+
+--- a/fs/btrfs/inode.c
++++ b/fs/btrfs/inode.c
+@@ -5335,11 +5335,13 @@ static void evict_inode_truncate_pages(s
+               struct extent_state *cached_state = NULL;
+               u64 start;
+               u64 end;
++              unsigned state_flags;
+ 
+               node = rb_first(&io_tree->state);
+               state = rb_entry(node, struct extent_state, rb_node);
+               start = state->start;
+               end = state->end;
++              state_flags = state->state;
+               spin_unlock(&io_tree->lock);
+ 
+               lock_extent_bits(io_tree, start, end, &cached_state);
+@@ -5352,7 +5354,7 @@ static void evict_inode_truncate_pages(s
+                *
+                * Note, end is the bytenr of last byte, so we need + 1 here.
+                */
+-              if (state->state & EXTENT_DELALLOC)
++              if (state_flags & EXTENT_DELALLOC)
+                       btrfs_qgroup_free_data(inode, NULL, start, end - start + 1);
+ 
+               clear_extent_bit(io_tree, start, end,
diff --git a/queue-4.14/btrfs-fix-use-after-free-when-dumping-free-space.patch b/queue-4.14/btrfs-fix-use-after-free-when-dumping-free-space.patch

new file mode 100644 (file)

index 0000000..4b15e79
--- /dev/null
+++ b/queue-4.14/btrfs-fix-use-after-free-when-dumping-free-space.patch
@@ -0,0 +1,221 @@
+From 9084cb6a24bf5838a665af92ded1af8363f9e563 Mon Sep 17 00:00:00 2001
+From: Filipe Manana <fdmanana@suse.com>
+Date: Mon, 22 Oct 2018 10:43:06 +0100
+Subject: Btrfs: fix use-after-free when dumping free space
+
+From: Filipe Manana <fdmanana@suse.com>
+
+commit 9084cb6a24bf5838a665af92ded1af8363f9e563 upstream.
+
+We were iterating a block group's free space cache rbtree without locking
+first the lock that protects it (the free_space_ctl->free_space_offset
+rbtree is protected by the free_space_ctl->tree_lock spinlock).
+
+KASAN reported a use-after-free problem when iterating such a rbtree due
+to a concurrent rbtree delete:
+
+[ 9520.359168] ==================================================================
+[ 9520.359656] BUG: KASAN: use-after-free in rb_next+0x13/0x90
+[ 9520.359949] Read of size 8 at addr ffff8800b7ada500 by task btrfs-transacti/1721
+[ 9520.360357]
+[ 9520.360530] CPU: 4 PID: 1721 Comm: btrfs-transacti Tainted: G             L    4.19.0-rc8-nbor #555
+[ 9520.360990] Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS 1.10.2-1ubuntu1 04/01/2014
+[ 9520.362682] Call Trace:
+[ 9520.362887]  dump_stack+0xa4/0xf5
+[ 9520.363146]  print_address_description+0x78/0x280
+[ 9520.363412]  kasan_report+0x263/0x390
+[ 9520.363650]  ? rb_next+0x13/0x90
+[ 9520.363873]  __asan_load8+0x54/0x90
+[ 9520.364102]  rb_next+0x13/0x90
+[ 9520.364380]  btrfs_dump_free_space+0x146/0x160 [btrfs]
+[ 9520.364697]  dump_space_info+0x2cd/0x310 [btrfs]
+[ 9520.364997]  btrfs_reserve_extent+0x1ee/0x1f0 [btrfs]
+[ 9520.365310]  __btrfs_prealloc_file_range+0x1cc/0x620 [btrfs]
+[ 9520.365646]  ? btrfs_update_time+0x180/0x180 [btrfs]
+[ 9520.365923]  ? _raw_spin_unlock+0x27/0x40
+[ 9520.366204]  ? btrfs_alloc_data_chunk_ondemand+0x2c0/0x5c0 [btrfs]
+[ 9520.366549]  btrfs_prealloc_file_range_trans+0x23/0x30 [btrfs]
+[ 9520.366880]  cache_save_setup+0x42e/0x580 [btrfs]
+[ 9520.367220]  ? btrfs_check_data_free_space+0xd0/0xd0 [btrfs]
+[ 9520.367518]  ? lock_downgrade+0x2f0/0x2f0
+[ 9520.367799]  ? btrfs_write_dirty_block_groups+0x11f/0x6e0 [btrfs]
+[ 9520.368104]  ? kasan_check_read+0x11/0x20
+[ 9520.368349]  ? do_raw_spin_unlock+0xa8/0x140
+[ 9520.368638]  btrfs_write_dirty_block_groups+0x2af/0x6e0 [btrfs]
+[ 9520.368978]  ? btrfs_start_dirty_block_groups+0x870/0x870 [btrfs]
+[ 9520.369282]  ? do_raw_spin_unlock+0xa8/0x140
+[ 9520.369534]  ? _raw_spin_unlock+0x27/0x40
+[ 9520.369811]  ? btrfs_run_delayed_refs+0x1b8/0x230 [btrfs]
+[ 9520.370137]  commit_cowonly_roots+0x4b9/0x610 [btrfs]
+[ 9520.370560]  ? commit_fs_roots+0x350/0x350 [btrfs]
+[ 9520.370926]  ? btrfs_run_delayed_refs+0x1b8/0x230 [btrfs]
+[ 9520.371285]  btrfs_commit_transaction+0x5e5/0x10e0 [btrfs]
+[ 9520.371612]  ? btrfs_apply_pending_changes+0x90/0x90 [btrfs]
+[ 9520.371943]  ? start_transaction+0x168/0x6c0 [btrfs]
+[ 9520.372257]  transaction_kthread+0x21c/0x240 [btrfs]
+[ 9520.372537]  kthread+0x1d2/0x1f0
+[ 9520.372793]  ? btrfs_cleanup_transaction+0xb50/0xb50 [btrfs]
+[ 9520.373090]  ? kthread_park+0xb0/0xb0
+[ 9520.373329]  ret_from_fork+0x3a/0x50
+[ 9520.373567]
+[ 9520.373738] Allocated by task 1804:
+[ 9520.373974]  kasan_kmalloc+0xff/0x180
+[ 9520.374208]  kasan_slab_alloc+0x11/0x20
+[ 9520.374447]  kmem_cache_alloc+0xfc/0x2d0
+[ 9520.374731]  __btrfs_add_free_space+0x40/0x580 [btrfs]
+[ 9520.375044]  unpin_extent_range+0x4f7/0x7a0 [btrfs]
+[ 9520.375383]  btrfs_finish_extent_commit+0x15f/0x4d0 [btrfs]
+[ 9520.375707]  btrfs_commit_transaction+0xb06/0x10e0 [btrfs]
+[ 9520.376027]  btrfs_alloc_data_chunk_ondemand+0x237/0x5c0 [btrfs]
+[ 9520.376365]  btrfs_check_data_free_space+0x81/0xd0 [btrfs]
+[ 9520.376689]  btrfs_delalloc_reserve_space+0x25/0x80 [btrfs]
+[ 9520.377018]  btrfs_direct_IO+0x42e/0x6d0 [btrfs]
+[ 9520.377284]  generic_file_direct_write+0x11e/0x220
+[ 9520.377587]  btrfs_file_write_iter+0x472/0xac0 [btrfs]
+[ 9520.377875]  aio_write+0x25c/0x360
+[ 9520.378106]  io_submit_one+0xaa0/0xdc0
+[ 9520.378343]  __se_sys_io_submit+0xfa/0x2f0
+[ 9520.378589]  __x64_sys_io_submit+0x43/0x50
+[ 9520.378840]  do_syscall_64+0x7d/0x240
+[ 9520.379081]  entry_SYSCALL_64_after_hwframe+0x49/0xbe
+[ 9520.379387]
+[ 9520.379557] Freed by task 1802:
+[ 9520.379782]  __kasan_slab_free+0x173/0x260
+[ 9520.380028]  kasan_slab_free+0xe/0x10
+[ 9520.380262]  kmem_cache_free+0xc1/0x2c0
+[ 9520.380544]  btrfs_find_space_for_alloc+0x4cd/0x4e0 [btrfs]
+[ 9520.380866]  find_free_extent+0xa99/0x17e0 [btrfs]
+[ 9520.381166]  btrfs_reserve_extent+0xd5/0x1f0 [btrfs]
+[ 9520.381474]  btrfs_get_blocks_direct+0x60b/0xbd0 [btrfs]
+[ 9520.381761]  __blockdev_direct_IO+0x10ee/0x58a1
+[ 9520.382059]  btrfs_direct_IO+0x25a/0x6d0 [btrfs]
+[ 9520.382321]  generic_file_direct_write+0x11e/0x220
+[ 9520.382623]  btrfs_file_write_iter+0x472/0xac0 [btrfs]
+[ 9520.382904]  aio_write+0x25c/0x360
+[ 9520.383172]  io_submit_one+0xaa0/0xdc0
+[ 9520.383416]  __se_sys_io_submit+0xfa/0x2f0
+[ 9520.383678]  __x64_sys_io_submit+0x43/0x50
+[ 9520.383927]  do_syscall_64+0x7d/0x240
+[ 9520.384165]  entry_SYSCALL_64_after_hwframe+0x49/0xbe
+[ 9520.384439]
+[ 9520.384610] The buggy address belongs to the object at ffff8800b7ada500
+                which belongs to the cache btrfs_free_space of size 72
+[ 9520.385175] The buggy address is located 0 bytes inside of
+                72-byte region [ffff8800b7ada500, ffff8800b7ada548)
+[ 9520.385691] The buggy address belongs to the page:
+[ 9520.385957] page:ffffea0002deb680 count:1 mapcount:0 mapping:ffff880108a1d700 index:0x0 compound_mapcount: 0
+[ 9520.388030] flags: 0x8100(slab|head)
+[ 9520.388281] raw: 0000000000008100 ffffea0002deb608 ffffea0002728808 ffff880108a1d700
+[ 9520.388722] raw: 0000000000000000 0000000000130013 00000001ffffffff 0000000000000000
+[ 9520.389169] page dumped because: kasan: bad access detected
+[ 9520.389473]
+[ 9520.389658] Memory state around the buggy address:
+[ 9520.389943]  ffff8800b7ada400: fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc
+[ 9520.390368]  ffff8800b7ada480: fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc
+[ 9520.390796] >ffff8800b7ada500: fb fb fb fb fb fb fb fb fb fc fc fc fc fc fc fc
+[ 9520.391223]                    ^
+[ 9520.391461]  ffff8800b7ada580: fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc
+[ 9520.391885]  ffff8800b7ada600: fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc
+[ 9520.392313] ==================================================================
+[ 9520.392772] BTRFS critical (device vdc): entry offset 2258497536, bytes 131072, bitmap no
+[ 9520.393247] BUG: unable to handle kernel NULL pointer dereference at 0000000000000011
+[ 9520.393705] PGD 800000010dbab067 P4D 800000010dbab067 PUD 107551067 PMD 0
+[ 9520.394059] Oops: 0000 [#1] SMP DEBUG_PAGEALLOC KASAN PTI
+[ 9520.394378] CPU: 4 PID: 1721 Comm: btrfs-transacti Tainted: G    B        L    4.19.0-rc8-nbor #555
+[ 9520.394858] Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS 1.10.2-1ubuntu1 04/01/2014
+[ 9520.395350] RIP: 0010:rb_next+0x3c/0x90
+[ 9520.396461] RSP: 0018:ffff8801074ff780 EFLAGS: 00010292
+[ 9520.396762] RAX: 0000000000000000 RBX: 0000000000000001 RCX: ffffffff81b5ac4c
+[ 9520.397115] RDX: 0000000000000000 RSI: 0000000000000008 RDI: 0000000000000011
+[ 9520.397468] RBP: ffff8801074ff7a0 R08: ffffed0021d64ccc R09: ffffed0021d64ccc
+[ 9520.397821] R10: 0000000000000001 R11: ffffed0021d64ccb R12: ffff8800b91e0000
+[ 9520.398188] R13: ffff8800a3ceba48 R14: ffff8800b627bf80 R15: 0000000000020000
+[ 9520.398555] FS:  0000000000000000(0000) GS:ffff88010eb00000(0000) knlGS:0000000000000000
+[ 9520.399007] CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
+[ 9520.399335] CR2: 0000000000000011 CR3: 0000000106b52000 CR4: 00000000000006a0
+[ 9520.399679] DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
+[ 9520.400023] DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400
+[ 9520.400400] Call Trace:
+[ 9520.400648]  btrfs_dump_free_space+0x146/0x160 [btrfs]
+[ 9520.400974]  dump_space_info+0x2cd/0x310 [btrfs]
+[ 9520.401287]  btrfs_reserve_extent+0x1ee/0x1f0 [btrfs]
+[ 9520.401609]  __btrfs_prealloc_file_range+0x1cc/0x620 [btrfs]
+[ 9520.401952]  ? btrfs_update_time+0x180/0x180 [btrfs]
+[ 9520.402232]  ? _raw_spin_unlock+0x27/0x40
+[ 9520.402522]  ? btrfs_alloc_data_chunk_ondemand+0x2c0/0x5c0 [btrfs]
+[ 9520.402882]  btrfs_prealloc_file_range_trans+0x23/0x30 [btrfs]
+[ 9520.403261]  cache_save_setup+0x42e/0x580 [btrfs]
+[ 9520.403570]  ? btrfs_check_data_free_space+0xd0/0xd0 [btrfs]
+[ 9520.403871]  ? lock_downgrade+0x2f0/0x2f0
+[ 9520.404161]  ? btrfs_write_dirty_block_groups+0x11f/0x6e0 [btrfs]
+[ 9520.404481]  ? kasan_check_read+0x11/0x20
+[ 9520.404732]  ? do_raw_spin_unlock+0xa8/0x140
+[ 9520.405026]  btrfs_write_dirty_block_groups+0x2af/0x6e0 [btrfs]
+[ 9520.405375]  ? btrfs_start_dirty_block_groups+0x870/0x870 [btrfs]
+[ 9520.405694]  ? do_raw_spin_unlock+0xa8/0x140
+[ 9520.405958]  ? _raw_spin_unlock+0x27/0x40
+[ 9520.406243]  ? btrfs_run_delayed_refs+0x1b8/0x230 [btrfs]
+[ 9520.406574]  commit_cowonly_roots+0x4b9/0x610 [btrfs]
+[ 9520.406899]  ? commit_fs_roots+0x350/0x350 [btrfs]
+[ 9520.407253]  ? btrfs_run_delayed_refs+0x1b8/0x230 [btrfs]
+[ 9520.407589]  btrfs_commit_transaction+0x5e5/0x10e0 [btrfs]
+[ 9520.407925]  ? btrfs_apply_pending_changes+0x90/0x90 [btrfs]
+[ 9520.408262]  ? start_transaction+0x168/0x6c0 [btrfs]
+[ 9520.408582]  transaction_kthread+0x21c/0x240 [btrfs]
+[ 9520.408870]  kthread+0x1d2/0x1f0
+[ 9520.409138]  ? btrfs_cleanup_transaction+0xb50/0xb50 [btrfs]
+[ 9520.409440]  ? kthread_park+0xb0/0xb0
+[ 9520.409682]  ret_from_fork+0x3a/0x50
+[ 9520.410508] Dumping ftrace buffer:
+[ 9520.410764]    (ftrace buffer empty)
+[ 9520.411007] CR2: 0000000000000011
+[ 9520.411297] ---[ end trace 01a0863445cf360a ]---
+[ 9520.411568] RIP: 0010:rb_next+0x3c/0x90
+[ 9520.412644] RSP: 0018:ffff8801074ff780 EFLAGS: 00010292
+[ 9520.412932] RAX: 0000000000000000 RBX: 0000000000000001 RCX: ffffffff81b5ac4c
+[ 9520.413274] RDX: 0000000000000000 RSI: 0000000000000008 RDI: 0000000000000011
+[ 9520.413616] RBP: ffff8801074ff7a0 R08: ffffed0021d64ccc R09: ffffed0021d64ccc
+[ 9520.414007] R10: 0000000000000001 R11: ffffed0021d64ccb R12: ffff8800b91e0000
+[ 9520.414349] R13: ffff8800a3ceba48 R14: ffff8800b627bf80 R15: 0000000000020000
+[ 9520.416074] FS:  0000000000000000(0000) GS:ffff88010eb00000(0000) knlGS:0000000000000000
+[ 9520.416536] CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
+[ 9520.416848] CR2: 0000000000000011 CR3: 0000000106b52000 CR4: 00000000000006a0
+[ 9520.418477] DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
+[ 9520.418846] DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400
+[ 9520.419204] Kernel panic - not syncing: Fatal exception
+[ 9520.419666] Dumping ftrace buffer:
+[ 9520.419930]    (ftrace buffer empty)
+[ 9520.420168] Kernel Offset: disabled
+[ 9520.420406] ---[ end Kernel panic - not syncing: Fatal exception ]---
+
+Fix this by acquiring the respective lock before iterating the rbtree.
+
+Reported-by: Nikolay Borisov <nborisov@suse.com>
+CC: stable@vger.kernel.org # 4.4+
+Reviewed-by: Josef Bacik <josef@toxicpanda.com>
+Signed-off-by: Filipe Manana <fdmanana@suse.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/free-space-cache.c |    2 ++
+ 1 file changed, 2 insertions(+)
+
+--- a/fs/btrfs/free-space-cache.c
++++ b/fs/btrfs/free-space-cache.c
+@@ -2482,6 +2482,7 @@ void btrfs_dump_free_space(struct btrfs_
+       struct rb_node *n;
+       int count = 0;
+ 
++      spin_lock(&ctl->tree_lock);
+       for (n = rb_first(&ctl->free_space_offset); n; n = rb_next(n)) {
+               info = rb_entry(n, struct btrfs_free_space, offset_index);
+               if (info->bytes >= bytes && !block_group->ro)
+@@ -2490,6 +2491,7 @@ void btrfs_dump_free_space(struct btrfs_
+                          info->offset, info->bytes,
+                      (info->bitmap) ? "yes" : "no");
+       }
++      spin_unlock(&ctl->tree_lock);
+       btrfs_info(fs_info, "block group has cluster?: %s",
+              list_empty(&block_group->cluster_list) ? "no" : "yes");
+       btrfs_info(fs_info,
diff --git a/queue-4.14/btrfs-move-the-dio_sem-higher-up-the-callchain.patch b/queue-4.14/btrfs-move-the-dio_sem-higher-up-the-callchain.patch

new file mode 100644 (file)

index 0000000..08c8be3
--- /dev/null
+++ b/queue-4.14/btrfs-move-the-dio_sem-higher-up-the-callchain.patch
@@ -0,0 +1,239 @@
+From c495144bc6962186feae31d687596d2472000e45 Mon Sep 17 00:00:00 2001
+From: Josef Bacik <josef@toxicpanda.com>
+Date: Fri, 12 Oct 2018 15:32:32 -0400
+Subject: btrfs: move the dio_sem higher up the callchain
+
+From: Josef Bacik <josef@toxicpanda.com>
+
+commit c495144bc6962186feae31d687596d2472000e45 upstream.
+
+We're getting a lockdep splat because we take the dio_sem under the
+log_mutex.  What we really need is to protect fsync() from logging an
+extent map for an extent we never waited on higher up, so just guard the
+whole thing with dio_sem.
+
+======================================================
+WARNING: possible circular locking dependency detected
+4.18.0-rc4-xfstests-00025-g5de5edbaf1d4 #411 Not tainted
+------------------------------------------------------
+aio-dio-invalid/30928 is trying to acquire lock:
+0000000092621cfd (&mm->mmap_sem){++++}, at: get_user_pages_unlocked+0x5a/0x1e0
+
+but task is already holding lock:
+00000000cefe6b35 (&ei->dio_sem){++++}, at: btrfs_direct_IO+0x3be/0x400
+
+which lock already depends on the new lock.
+
+the existing dependency chain (in reverse order) is:
+
+-> #5 (&ei->dio_sem){++++}:
+       lock_acquire+0xbd/0x220
+       down_write+0x51/0xb0
+       btrfs_log_changed_extents+0x80/0xa40
+       btrfs_log_inode+0xbaf/0x1000
+       btrfs_log_inode_parent+0x26f/0xa80
+       btrfs_log_dentry_safe+0x50/0x70
+       btrfs_sync_file+0x357/0x540
+       do_fsync+0x38/0x60
+       __ia32_sys_fdatasync+0x12/0x20
+       do_fast_syscall_32+0x9a/0x2f0
+       entry_SYSENTER_compat+0x84/0x96
+
+-> #4 (&ei->log_mutex){+.+.}:
+       lock_acquire+0xbd/0x220
+       __mutex_lock+0x86/0xa10
+       btrfs_record_unlink_dir+0x2a/0xa0
+       btrfs_unlink+0x5a/0xc0
+       vfs_unlink+0xb1/0x1a0
+       do_unlinkat+0x264/0x2b0
+       do_fast_syscall_32+0x9a/0x2f0
+       entry_SYSENTER_compat+0x84/0x96
+
+-> #3 (sb_internal#2){.+.+}:
+       lock_acquire+0xbd/0x220
+       __sb_start_write+0x14d/0x230
+       start_transaction+0x3e6/0x590
+       btrfs_evict_inode+0x475/0x640
+       evict+0xbf/0x1b0
+       btrfs_run_delayed_iputs+0x6c/0x90
+       cleaner_kthread+0x124/0x1a0
+       kthread+0x106/0x140
+       ret_from_fork+0x3a/0x50
+
+-> #2 (&fs_info->cleaner_delayed_iput_mutex){+.+.}:
+       lock_acquire+0xbd/0x220
+       __mutex_lock+0x86/0xa10
+       btrfs_alloc_data_chunk_ondemand+0x197/0x530
+       btrfs_check_data_free_space+0x4c/0x90
+       btrfs_delalloc_reserve_space+0x20/0x60
+       btrfs_page_mkwrite+0x87/0x520
+       do_page_mkwrite+0x31/0xa0
+       __handle_mm_fault+0x799/0xb00
+       handle_mm_fault+0x7c/0xe0
+       __do_page_fault+0x1d3/0x4a0
+       async_page_fault+0x1e/0x30
+
+-> #1 (sb_pagefaults){.+.+}:
+       lock_acquire+0xbd/0x220
+       __sb_start_write+0x14d/0x230
+       btrfs_page_mkwrite+0x6a/0x520
+       do_page_mkwrite+0x31/0xa0
+       __handle_mm_fault+0x799/0xb00
+       handle_mm_fault+0x7c/0xe0
+       __do_page_fault+0x1d3/0x4a0
+       async_page_fault+0x1e/0x30
+
+-> #0 (&mm->mmap_sem){++++}:
+       __lock_acquire+0x42e/0x7a0
+       lock_acquire+0xbd/0x220
+       down_read+0x48/0xb0
+       get_user_pages_unlocked+0x5a/0x1e0
+       get_user_pages_fast+0xa4/0x150
+       iov_iter_get_pages+0xc3/0x340
+       do_direct_IO+0xf93/0x1d70
+       __blockdev_direct_IO+0x32d/0x1c20
+       btrfs_direct_IO+0x227/0x400
+       generic_file_direct_write+0xcf/0x180
+       btrfs_file_write_iter+0x308/0x58c
+       aio_write+0xf8/0x1d0
+       io_submit_one+0x3a9/0x620
+       __ia32_compat_sys_io_submit+0xb2/0x270
+       do_int80_syscall_32+0x5b/0x1a0
+       entry_INT80_compat+0x88/0xa0
+
+other info that might help us debug this:
+
+Chain exists of:
+  &mm->mmap_sem --> &ei->log_mutex --> &ei->dio_sem
+
+ Possible unsafe locking scenario:
+
+       CPU0                    CPU1
+       ----                    ----
+  lock(&ei->dio_sem);
+                               lock(&ei->log_mutex);
+                               lock(&ei->dio_sem);
+  lock(&mm->mmap_sem);
+
+ *** DEADLOCK ***
+
+1 lock held by aio-dio-invalid/30928:
+ #0: 00000000cefe6b35 (&ei->dio_sem){++++}, at: btrfs_direct_IO+0x3be/0x400
+
+stack backtrace:
+CPU: 0 PID: 30928 Comm: aio-dio-invalid Not tainted 4.18.0-rc4-xfstests-00025-g5de5edbaf1d4 #411
+Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS 1.11.0-2.el7 04/01/2014
+Call Trace:
+ dump_stack+0x7c/0xbb
+ print_circular_bug.isra.37+0x297/0x2a4
+ check_prev_add.constprop.45+0x781/0x7a0
+ ? __lock_acquire+0x42e/0x7a0
+ validate_chain.isra.41+0x7f0/0xb00
+ __lock_acquire+0x42e/0x7a0
+ lock_acquire+0xbd/0x220
+ ? get_user_pages_unlocked+0x5a/0x1e0
+ down_read+0x48/0xb0
+ ? get_user_pages_unlocked+0x5a/0x1e0
+ get_user_pages_unlocked+0x5a/0x1e0
+ get_user_pages_fast+0xa4/0x150
+ iov_iter_get_pages+0xc3/0x340
+ do_direct_IO+0xf93/0x1d70
+ ? __alloc_workqueue_key+0x358/0x490
+ ? __blockdev_direct_IO+0x14b/0x1c20
+ __blockdev_direct_IO+0x32d/0x1c20
+ ? btrfs_run_delalloc_work+0x40/0x40
+ ? can_nocow_extent+0x490/0x490
+ ? kvm_clock_read+0x1f/0x30
+ ? can_nocow_extent+0x490/0x490
+ ? btrfs_run_delalloc_work+0x40/0x40
+ btrfs_direct_IO+0x227/0x400
+ ? btrfs_run_delalloc_work+0x40/0x40
+ generic_file_direct_write+0xcf/0x180
+ btrfs_file_write_iter+0x308/0x58c
+ aio_write+0xf8/0x1d0
+ ? kvm_clock_read+0x1f/0x30
+ ? __might_fault+0x3e/0x90
+ io_submit_one+0x3a9/0x620
+ ? io_submit_one+0xe5/0x620
+ __ia32_compat_sys_io_submit+0xb2/0x270
+ do_int80_syscall_32+0x5b/0x1a0
+ entry_INT80_compat+0x88/0xa0
+
+CC: stable@vger.kernel.org # 4.14+
+Reviewed-by: Filipe Manana <fdmanana@suse.com>
+Signed-off-by: Josef Bacik <josef@toxicpanda.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/file.c     |   12 ++++++++++++
+ fs/btrfs/tree-log.c |    2 --
+ 2 files changed, 12 insertions(+), 2 deletions(-)
+
+--- a/fs/btrfs/file.c
++++ b/fs/btrfs/file.c
+@@ -2078,6 +2078,14 @@ int btrfs_sync_file(struct file *file, l
+               goto out;
+ 
+       inode_lock(inode);
++
++      /*
++       * We take the dio_sem here because the tree log stuff can race with
++       * lockless dio writes and get an extent map logged for an extent we
++       * never waited on.  We need it this high up for lockdep reasons.
++       */
++      down_write(&BTRFS_I(inode)->dio_sem);
++
+       atomic_inc(&root->log_batch);
+       full_sync = test_bit(BTRFS_INODE_NEEDS_FULL_SYNC,
+                            &BTRFS_I(inode)->runtime_flags);
+@@ -2129,6 +2137,7 @@ int btrfs_sync_file(struct file *file, l
+               ret = start_ordered_ops(inode, start, end);
+       }
+       if (ret) {
++              up_write(&BTRFS_I(inode)->dio_sem);
+               inode_unlock(inode);
+               goto out;
+       }
+@@ -2184,6 +2193,7 @@ int btrfs_sync_file(struct file *file, l
+                * checked called fsync.
+                */
+               ret = filemap_check_wb_err(inode->i_mapping, file->f_wb_err);
++              up_write(&BTRFS_I(inode)->dio_sem);
+               inode_unlock(inode);
+               goto out;
+       }
+@@ -2208,6 +2218,7 @@ int btrfs_sync_file(struct file *file, l
+       trans = btrfs_start_transaction(root, 0);
+       if (IS_ERR(trans)) {
+               ret = PTR_ERR(trans);
++              up_write(&BTRFS_I(inode)->dio_sem);
+               inode_unlock(inode);
+               goto out;
+       }
+@@ -2229,6 +2240,7 @@ int btrfs_sync_file(struct file *file, l
+        * file again, but that will end up using the synchronization
+        * inside btrfs_sync_log to keep things safe.
+        */
++      up_write(&BTRFS_I(inode)->dio_sem);
+       inode_unlock(inode);
+ 
+       /*
+--- a/fs/btrfs/tree-log.c
++++ b/fs/btrfs/tree-log.c
+@@ -4362,7 +4362,6 @@ static int btrfs_log_changed_extents(str
+ 
+       INIT_LIST_HEAD(&extents);
+ 
+-      down_write(&inode->dio_sem);
+       write_lock(&tree->lock);
+       test_gen = root->fs_info->last_trans_committed;
+       logged_start = start;
+@@ -4443,7 +4442,6 @@ process:
+       }
+       WARN_ON(!list_empty(&extents));
+       write_unlock(&tree->lock);
+-      up_write(&inode->dio_sem);
+ 
+       btrfs_release_path(path);
+       if (!ret)
diff --git a/queue-4.14/btrfs-only-free-reserved-extent-if-we-didn-t-insert-it.patch b/queue-4.14/btrfs-only-free-reserved-extent-if-we-didn-t-insert-it.patch

new file mode 100644 (file)

index 0000000..af6ae16
--- /dev/null
+++ b/queue-4.14/btrfs-only-free-reserved-extent-if-we-didn-t-insert-it.patch
@@ -0,0 +1,66 @@
+From 49940bdd57779c78462da7aa5a8650b2fea8c2ff Mon Sep 17 00:00:00 2001
+From: Josef Bacik <josef@toxicpanda.com>
+Date: Thu, 11 Oct 2018 15:54:21 -0400
+Subject: btrfs: only free reserved extent if we didn't insert it
+
+From: Josef Bacik <josef@toxicpanda.com>
+
+commit 49940bdd57779c78462da7aa5a8650b2fea8c2ff upstream.
+
+When we insert the file extent once the ordered extent completes we free
+the reserved extent reservation as it'll have been migrated to the
+bytes_used counter.  However, if we error out after this step, we'll still
+clear the reserved extent reservation, resulting in a negative
+accounting of the reserved bytes for the block group and space info.
+Fix this by only doing the free if we didn't successfully insert a file
+extent for this extent.
+
+CC: stable@vger.kernel.org # 4.14+
+Reviewed-by: Omar Sandoval <osandov@fb.com>
+Reviewed-by: Filipe Manana <fdmanana@suse.com>
+Signed-off-by: Josef Bacik <josef@toxicpanda.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/inode.c |   10 +++++++++-
+ 1 file changed, 9 insertions(+), 1 deletion(-)
+
+--- a/fs/btrfs/inode.c
++++ b/fs/btrfs/inode.c
+@@ -2966,6 +2966,7 @@ static int btrfs_finish_ordered_io(struc
+       bool truncated = false;
+       bool range_locked = false;
+       bool clear_new_delalloc_bytes = false;
++      bool clear_reserved_extent = true;
+ 
+       if (!test_bit(BTRFS_ORDERED_NOCOW, &ordered_extent->flags) &&
+           !test_bit(BTRFS_ORDERED_PREALLOC, &ordered_extent->flags) &&
+@@ -3069,10 +3070,12 @@ static int btrfs_finish_ordered_io(struc
+                                               logical_len, logical_len,
+                                               compress_type, 0, 0,
+                                               BTRFS_FILE_EXTENT_REG);
+-              if (!ret)
++              if (!ret) {
++                      clear_reserved_extent = false;
+                       btrfs_release_delalloc_bytes(fs_info,
+                                                    ordered_extent->start,
+                                                    ordered_extent->disk_len);
++              }
+       }
+       unpin_extent_cache(&BTRFS_I(inode)->extent_tree,
+                          ordered_extent->file_offset, ordered_extent->len,
+@@ -3132,8 +3135,13 @@ out:
+                * wrong we need to return the space for this ordered extent
+                * back to the allocator.  We only free the extent in the
+                * truncated case if we didn't write out the extent at all.
++               *
++               * If we made it past insert_reserved_file_extent before we
++               * errored out then we don't need to do this as the accounting
++               * has already been done.
+                */
+               if ((ret || !logical_len) &&
++                  clear_reserved_extent &&
+                   !test_bit(BTRFS_ORDERED_NOCOW, &ordered_extent->flags) &&
+                   !test_bit(BTRFS_ORDERED_PREALLOC, &ordered_extent->flags))
+                       btrfs_free_reserved_extent(fs_info,
diff --git a/queue-4.14/btrfs-set-max_extent_size-properly.patch b/queue-4.14/btrfs-set-max_extent_size-properly.patch

new file mode 100644 (file)

index 0000000..4047bf6
--- /dev/null
+++ b/queue-4.14/btrfs-set-max_extent_size-properly.patch
@@ -0,0 +1,97 @@
+From ad22cf6ea47fa20fbe11ac324a0a15c0a9a4a2a9 Mon Sep 17 00:00:00 2001
+From: Josef Bacik <jbacik@fb.com>
+Date: Fri, 12 Oct 2018 15:32:33 -0400
+Subject: btrfs: set max_extent_size properly
+
+From: Josef Bacik <jbacik@fb.com>
+
+commit ad22cf6ea47fa20fbe11ac324a0a15c0a9a4a2a9 upstream.
+
+We can't use entry->bytes if our entry is a bitmap entry; we need to use
+entry->max_extent_size in that case.  Fix up all the logic to make this
+consistent.
+
+CC: stable@vger.kernel.org # 4.4+
+Signed-off-by: Josef Bacik <jbacik@fb.com>
+Reviewed-by: David Sterba <dsterba@suse.com>
+Signed-off-by: David Sterba <dsterba@suse.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/btrfs/free-space-cache.c |   30 ++++++++++++++++++++----------
+ 1 file changed, 20 insertions(+), 10 deletions(-)
+
+--- a/fs/btrfs/free-space-cache.c
++++ b/fs/btrfs/free-space-cache.c
+@@ -1795,6 +1795,13 @@ static int search_bitmap(struct btrfs_fr
+       return -1;
+ }
+ 
++static inline u64 get_max_extent_size(struct btrfs_free_space *entry)
++{
++      if (entry->bitmap)
++              return entry->max_extent_size;
++      return entry->bytes;
++}
++
+ /* Cache the size of the max extent in bytes */
+ static struct btrfs_free_space *
+ find_free_space(struct btrfs_free_space_ctl *ctl, u64 *offset, u64 *bytes,
+@@ -1816,8 +1823,8 @@ find_free_space(struct btrfs_free_space_
+       for (node = &entry->offset_index; node; node = rb_next(node)) {
+               entry = rb_entry(node, struct btrfs_free_space, offset_index);
+               if (entry->bytes < *bytes) {
+-                      if (entry->bytes > *max_extent_size)
+-                              *max_extent_size = entry->bytes;
++                      *max_extent_size = max(get_max_extent_size(entry),
++                                             *max_extent_size);
+                       continue;
+               }
+ 
+@@ -1835,8 +1842,8 @@ find_free_space(struct btrfs_free_space_
+               }
+ 
+               if (entry->bytes < *bytes + align_off) {
+-                      if (entry->bytes > *max_extent_size)
+-                              *max_extent_size = entry->bytes;
++                      *max_extent_size = max(get_max_extent_size(entry),
++                                             *max_extent_size);
+                       continue;
+               }
+ 
+@@ -1848,8 +1855,10 @@ find_free_space(struct btrfs_free_space_
+                               *offset = tmp;
+                               *bytes = size;
+                               return entry;
+-                      } else if (size > *max_extent_size) {
+-                              *max_extent_size = size;
++                      } else {
++                              *max_extent_size =
++                                      max(get_max_extent_size(entry),
++                                          *max_extent_size);
+                       }
+                       continue;
+               }
+@@ -2709,8 +2718,8 @@ static u64 btrfs_alloc_from_bitmap(struc
+ 
+       err = search_bitmap(ctl, entry, &search_start, &search_bytes, true);
+       if (err) {
+-              if (search_bytes > *max_extent_size)
+-                      *max_extent_size = search_bytes;
++              *max_extent_size = max(get_max_extent_size(entry),
++                                     *max_extent_size);
+               return 0;
+       }
+ 
+@@ -2747,8 +2756,9 @@ u64 btrfs_alloc_from_cluster(struct btrf
+ 
+       entry = rb_entry(node, struct btrfs_free_space, offset_index);
+       while (1) {
+-              if (entry->bytes < bytes && entry->bytes > *max_extent_size)
+-                      *max_extent_size = entry->bytes;
++              if (entry->bytes < bytes)
++                      *max_extent_size = max(get_max_extent_size(entry),
++                                             *max_extent_size);
+ 
+               if (entry->bytes < bytes ||
+                   (!entry->bitmap && entry->offset < min_start)) {
diff --git a/queue-4.14/net-sched-remove-tca_options-from-policy.patch b/queue-4.14/net-sched-remove-tca_options-from-policy.patch

new file mode 100644 (file)

index 0000000..d0fc0b5
--- /dev/null
+++ b/queue-4.14/net-sched-remove-tca_options-from-policy.patch
@@ -0,0 +1,36 @@
+From e72bde6b66299602087c8c2350d36a525e75d06e Mon Sep 17 00:00:00 2001
+From: David Ahern <dsahern@gmail.com>
+Date: Wed, 24 Oct 2018 08:32:49 -0700
+Subject: net: sched: Remove TCA_OPTIONS from policy
+
+From: David Ahern <dsahern@gmail.com>
+
+commit e72bde6b66299602087c8c2350d36a525e75d06e upstream.
+
+Marco reported an error with hfsc:
+root@Calimero:~# tc qdisc add dev eth0 root handle 1:0 hfsc default 1
+Error: Attribute failed policy validation.
+
+Apparently a few implementations pass TCA_OPTIONS as a binary instead
+of a nested attribute, so drop TCA_OPTIONS from the policy.
+
+Fixes: 8b4c3cdd9dd8 ("net: sched: Add policy validation for tc attributes")
+Reported-by: Marco Berizzi <pupilla@libero.it>
+Signed-off-by: David Ahern <dsahern@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ net/sched/sch_api.c |    1 -
+ 1 file changed, 1 deletion(-)
+
+--- a/net/sched/sch_api.c
++++ b/net/sched/sch_api.c
+@@ -1218,7 +1218,6 @@ check_loop_fn(struct Qdisc *q, unsigned
+ 
+ const struct nla_policy rtm_tca_policy[TCA_MAX + 1] = {
+       [TCA_KIND]              = { .type = NLA_STRING },
+-      [TCA_OPTIONS]           = { .type = NLA_NESTED },
+       [TCA_RATE]              = { .type = NLA_BINARY,
+                                   .len = sizeof(struct tc_estimator) },
+       [TCA_STAB]              = { .type = NLA_NESTED },
diff --git a/queue-4.14/series b/queue-4.14/series

index 87f41cb5b5b3411d95c0d014dd058857d2388175..199922c7c76365460c220ca04249296fcb86f891 100644 (file)
--- a/queue-4.14/series
+++ b/queue-4.14/series
@@ -208,3 +208,15 @@ btrfs-make-sure-we-create-all-new-block-groups.patch
  btrfs-fix-warning-when-replaying-log-after-fsync-of-a-tmpfile.patch
  btrfs-fix-wrong-dentries-after-fsync-of-file-that-got-its-parent-replaced.patch
  btrfs-qgroup-dirty-all-qgroups-before-rescan.patch
+btrfs-fix-null-pointer-dereference-on-compressed-write-path-error.patch
+btrfs-fix-assertion-on-fsync-of-regular-file-when-using-no-holes-feature.patch
+btrfs-set-max_extent_size-properly.patch
+btrfs-don-t-use-ctl-free_space-for-max_extent_size.patch
+btrfs-only-free-reserved-extent-if-we-didn-t-insert-it.patch
+btrfs-don-t-run-delayed_iputs-in-commit.patch
+btrfs-move-the-dio_sem-higher-up-the-callchain.patch
+btrfs-fix-use-after-free-during-inode-eviction.patch
+btrfs-fix-use-after-free-when-dumping-free-space.patch
+btrfs-fix-fsync-after-hole-punching-when-using-no-holes-feature.patch
+net-sched-remove-tca_options-from-policy.patch
+bpf-wait-for-running-bpf-programs-when-updating-map-in-map.patch
author	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Sun, 11 Nov 2018 20:56:29 +0000 (12:56 -0800)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Sun, 11 Nov 2018 20:56:29 +0000 (12:56 -0800)
queue-4.14/bpf-wait-for-running-bpf-programs-when-updating-map-in-map.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-don-t-run-delayed_iputs-in-commit.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-don-t-use-ctl-free_space-for-max_extent_size.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-fix-assertion-on-fsync-of-regular-file-when-using-no-holes-feature.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-fix-fsync-after-hole-punching-when-using-no-holes-feature.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-fix-null-pointer-dereference-on-compressed-write-path-error.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-fix-use-after-free-during-inode-eviction.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-fix-use-after-free-when-dumping-free-space.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-move-the-dio_sem-higher-up-the-callchain.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-only-free-reserved-extent-if-we-didn-t-insert-it.patch	[new file with mode: 0644]	patch | blob
queue-4.14/btrfs-set-max_extent_size-properly.patch	[new file with mode: 0644]	patch | blob
queue-4.14/net-sched-remove-tca_options-from-policy.patch	[new file with mode: 0644]	patch | blob
queue-4.14/series		patch | blob | blame | history