git.ipfire.org Git - thirdparty/kernel/stable-queue.git/commitdiff
4.14-stable patches
author Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Mon, 4 Feb 2019 08:58:40 +0000 (09:58 +0100)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Mon, 4 Feb 2019 08:58:40 +0000 (09:58 +0100)
added patches:
cifs-always-resolve-hostname-before-reconnecting.patch
drivers-core-remove-glue-dirs-from-sysfs-earlier.patch
md-raid5-fix-out-of-memory-during-raid-cache-recovery.patch

queue-4.14/cifs-always-resolve-hostname-before-reconnecting.patch [new file with mode: 0644]
queue-4.14/drivers-core-remove-glue-dirs-from-sysfs-earlier.patch [new file with mode: 0644]
queue-4.14/md-raid5-fix-out-of-memory-during-raid-cache-recovery.patch [new file with mode: 0644]
queue-4.14/series

diff --git a/queue-4.14/cifs-always-resolve-hostname-before-reconnecting.patch b/queue-4.14/cifs-always-resolve-hostname-before-reconnecting.patch
new file mode 100644 (file)
index 0000000..6d79b52
--- /dev/null
@@ -0,0 +1,99 @@
+From 28eb24ff75c5ac130eb326b3b4d0dcecfc0f427d Mon Sep 17 00:00:00 2001
+From: Paulo Alcantara <paulo@paulo.ac>
+Date: Tue, 20 Nov 2018 15:16:36 -0200
+Subject: cifs: Always resolve hostname before reconnecting
+
+From: Paulo Alcantara <paulo@paulo.ac>
+
+commit 28eb24ff75c5ac130eb326b3b4d0dcecfc0f427d upstream.
+
+In case a hostname resolves to a different IP address (e.g. long
+running mounts), make sure to resolve it every time prior to calling
+generic_ip_connect() in reconnect.
+
+Suggested-by: Steve French <stfrench@microsoft.com>
+Signed-off-by: Paulo Alcantara <palcantara@suse.de>
+Signed-off-by: Steve French <stfrench@microsoft.com>
+Signed-off-by: Pavel Shilovsky <pshilov@microsoft.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ fs/cifs/connect.c |   53 +++++++++++++++++++++++++++++++++++++++++++++++++++++
+ 1 file changed, 53 insertions(+)
+
+--- a/fs/cifs/connect.c
++++ b/fs/cifs/connect.c
+@@ -51,6 +51,7 @@
+ #include "cifs_unicode.h"
+ #include "cifs_debug.h"
+ #include "cifs_fs_sb.h"
++#include "dns_resolve.h"
+ #include "ntlmssp.h"
+ #include "nterr.h"
+ #include "rfc1002pdu.h"
+@@ -314,6 +315,53 @@ static int cifs_setup_volume_info(struct
+                                       const char *devname);
+ /*
++ * Resolve hostname and set ip addr in tcp ses. Useful for hostnames that may
++ * get their ip addresses changed at some point.
++ *
++ * This should be called with server->srv_mutex held.
++ */
++#ifdef CONFIG_CIFS_DFS_UPCALL
++static int reconn_set_ipaddr(struct TCP_Server_Info *server)
++{
++      int rc;
++      int len;
++      char *unc, *ipaddr = NULL;
++
++      if (!server->hostname)
++              return -EINVAL;
++
++      len = strlen(server->hostname) + 3;
++
++      unc = kmalloc(len, GFP_KERNEL);
++      if (!unc) {
++              cifs_dbg(FYI, "%s: failed to create UNC path\n", __func__);
++              return -ENOMEM;
++      }
++      snprintf(unc, len, "\\\\%s", server->hostname);
++
++      rc = dns_resolve_server_name_to_ip(unc, &ipaddr);
++      kfree(unc);
++
++      if (rc < 0) {
++              cifs_dbg(FYI, "%s: failed to resolve server part of %s to IP: %d\n",
++                       __func__, server->hostname, rc);
++              return rc;
++      }
++
++      rc = cifs_convert_address((struct sockaddr *)&server->dstaddr, ipaddr,
++                                strlen(ipaddr));
++      kfree(ipaddr);
++
++      return !rc ? -1 : 0;
++}
++#else
++static inline int reconn_set_ipaddr(struct TCP_Server_Info *server)
++{
++      return 0;
++}
++#endif
++
++/*
+  * cifs tcp session reconnection
+  *
+  * mark tcp session as reconnecting so temporarily locked
+@@ -408,6 +456,11 @@ cifs_reconnect(struct TCP_Server_Info *s
+               rc = generic_ip_connect(server);
+               if (rc) {
+                       cifs_dbg(FYI, "reconnect error %d\n", rc);
++                      rc = reconn_set_ipaddr(server);
++                      if (rc) {
++                              cifs_dbg(FYI, "%s: failed to resolve hostname: %d\n",
++                                       __func__, rc);
++                      }
+                       mutex_unlock(&server->srv_mutex);
+                       msleep(3000);
+               } else {
diff --git a/queue-4.14/drivers-core-remove-glue-dirs-from-sysfs-earlier.patch b/queue-4.14/drivers-core-remove-glue-dirs-from-sysfs-earlier.patch
new file mode 100644 (file)
index 0000000..35f39d9
--- /dev/null
@@ -0,0 +1,86 @@
+From 726e41097920a73e4c7c33385dcc0debb1281e18 Mon Sep 17 00:00:00 2001
+From: Benjamin Herrenschmidt <benh@kernel.crashing.org>
+Date: Tue, 10 Jul 2018 10:29:10 +1000
+Subject: drivers: core: Remove glue dirs from sysfs earlier
+
+From: Benjamin Herrenschmidt <benh@kernel.crashing.org>
+
+commit 726e41097920a73e4c7c33385dcc0debb1281e18 upstream.
+
+For devices with a class, we create a "glue" directory between
+the parent device and the new device with the class name.
+
+This directory is never "explicitly" removed when empty however,
+this is left to the implicit sysfs removal done by kobject_release()
+when the object loses its last reference via kobject_put().
+
+This is problematic because as long as it's not been removed from
+sysfs, it is still present in the class kset and in sysfs directory
+structure.
+
+The presence in the class kset exposes a use after free bug fixed
+by the previous patch, but the presence in sysfs means that until
+the kobject is released, which can take a while (especially with
+kobject debugging), any attempt at re-creating such as binding a
+new device for that class/parent pair, will result in a sysfs
+duplicate file name error.
+
+This fixes it by instead doing an explicit kobject_del() when
+the glue dir is empty, by keeping track of the number of
+child devices of the gluedir.
+
+This is made easy by the fact that all glue dir operations are
+done with a global mutex, and there's already a function
+(cleanup_glue_dir) called in all the right places taking that
+mutex that can be enhanced for this. It appears that this was
+in fact the intent of the function, but the implementation was
+wrong.
+
+Signed-off-by: Benjamin Herrenschmidt <benh@kernel.crashing.org>
+Acked-by: Linus Torvalds <torvalds@linux-foundation.org>
+Cc: Guenter Roeck <groeck@google.com>
+Cc: Zubin Mithra <zsm@chromium.org>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ drivers/base/core.c     |    2 ++
+ include/linux/kobject.h |   17 +++++++++++++++++
+ 2 files changed, 19 insertions(+)
+
+--- a/drivers/base/core.c
++++ b/drivers/base/core.c
+@@ -1571,6 +1571,8 @@ static void cleanup_glue_dir(struct devi
+               return;
+       mutex_lock(&gdp_mutex);
++      if (!kobject_has_children(glue_dir))
++              kobject_del(glue_dir);
+       kobject_put(glue_dir);
+       mutex_unlock(&gdp_mutex);
+ }
+--- a/include/linux/kobject.h
++++ b/include/linux/kobject.h
+@@ -117,6 +117,23 @@ extern void kobject_put(struct kobject *
+ extern const void *kobject_namespace(struct kobject *kobj);
+ extern char *kobject_get_path(struct kobject *kobj, gfp_t flag);
++/**
++ * kobject_has_children - Returns whether a kobject has children.
++ * @kobj: the object to test
++ *
++ * This will return whether a kobject has other kobjects as children.
++ *
++ * It does NOT account for the presence of attribute files, only sub
++ * directories. It also assumes there is no concurrent addition or
++ * removal of such children, and thus relies on external locking.
++ */
++static inline bool kobject_has_children(struct kobject *kobj)
++{
++      WARN_ON_ONCE(kref_read(&kobj->kref) == 0);
++
++      return kobj->sd && kobj->sd->dir.subdirs;
++}
++
+ struct kobj_type {
+       void (*release)(struct kobject *kobj);
+       const struct sysfs_ops *sysfs_ops;
diff --git a/queue-4.14/md-raid5-fix-out-of-memory-during-raid-cache-recovery.patch b/queue-4.14/md-raid5-fix-out-of-memory-during-raid-cache-recovery.patch
new file mode 100644 (file)
index 0000000..ffbfe59
--- /dev/null
@@ -0,0 +1,125 @@
+From 483cbbeddd5fe2c80fd4141ff0748fa06c4ff146 Mon Sep 17 00:00:00 2001
+From: Alexei Naberezhnov <anaberezhnov@fb.com>
+Date: Tue, 27 Mar 2018 16:54:16 -0700
+Subject: md/raid5: fix 'out of memory' during raid cache recovery
+
+From: Alexei Naberezhnov <anaberezhnov@fb.com>
+
+commit 483cbbeddd5fe2c80fd4141ff0748fa06c4ff146 upstream.
+
+This fixes the case when md array assembly fails because of raid cache recovery
+unable to allocate a stripe, despite attempts to replay stripes and increase
+cache size. This happens because stripes released by r5c_recovery_replay_stripes
+and raid5_set_cache_size don't become available for allocation immediately.
+Released stripes first are placed on conf->released_stripes list and require
+md thread to merge them on conf->inactive_list before they can be allocated.
+
+Patch allows final allocation attempt during cache recovery to wait for
+new stripes to become available for allocation.
+
+Cc: linux-raid@vger.kernel.org
+Cc: Shaohua Li <shli@kernel.org>
+Cc: linux-stable <stable@vger.kernel.org> # 4.10+
+Fixes: b4c625c67362 ("md/r5cache: r5cache recovery: part 1")
+Signed-off-by: Alexei Naberezhnov <anaberezhnov@fb.com>
+Signed-off-by: Song Liu <songliubraving@fb.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+
+---
+ drivers/md/raid5-cache.c |   33 ++++++++++++++++++++++-----------
+ drivers/md/raid5.c       |    8 ++++++--
+ 2 files changed, 28 insertions(+), 13 deletions(-)
+
+--- a/drivers/md/raid5-cache.c
++++ b/drivers/md/raid5-cache.c
+@@ -1942,12 +1942,14 @@ out:
+ }
+ static struct stripe_head *
+-r5c_recovery_alloc_stripe(struct r5conf *conf,
+-                        sector_t stripe_sect)
++r5c_recovery_alloc_stripe(
++              struct r5conf *conf,
++              sector_t stripe_sect,
++              int noblock)
+ {
+       struct stripe_head *sh;
+-      sh = raid5_get_active_stripe(conf, stripe_sect, 0, 1, 0);
++      sh = raid5_get_active_stripe(conf, stripe_sect, 0, noblock, 0);
+       if (!sh)
+               return NULL;  /* no more stripe available */
+@@ -2157,7 +2159,7 @@ r5c_recovery_analyze_meta_block(struct r
+                                               stripe_sect);
+               if (!sh) {
+-                      sh = r5c_recovery_alloc_stripe(conf, stripe_sect);
++                      sh = r5c_recovery_alloc_stripe(conf, stripe_sect, 1);
+                       /*
+                        * cannot get stripe from raid5_get_active_stripe
+                        * try replay some stripes
+@@ -2166,20 +2168,29 @@ r5c_recovery_analyze_meta_block(struct r
+                               r5c_recovery_replay_stripes(
+                                       cached_stripe_list, ctx);
+                               sh = r5c_recovery_alloc_stripe(
+-                                      conf, stripe_sect);
++                                      conf, stripe_sect, 1);
+                       }
+                       if (!sh) {
++                              int new_size = conf->min_nr_stripes * 2;
+                               pr_debug("md/raid:%s: Increasing stripe cache size to %d to recovery data on journal.\n",
+                                       mdname(mddev),
+-                                      conf->min_nr_stripes * 2);
+-                              raid5_set_cache_size(mddev,
+-                                                   conf->min_nr_stripes * 2);
+-                              sh = r5c_recovery_alloc_stripe(conf,
+-                                                             stripe_sect);
++                                      new_size);
++                              ret = raid5_set_cache_size(mddev, new_size);
++                              if (conf->min_nr_stripes <= new_size / 2) {
++                                      pr_err("md/raid:%s: Cannot increase cache size, ret=%d, new_size=%d, min_nr_stripes=%d, max_nr_stripes=%d\n",
++                                              mdname(mddev),
++                                              ret,
++                                              new_size,
++                                              conf->min_nr_stripes,
++                                              conf->max_nr_stripes);
++                                      return -ENOMEM;
++                              }
++                              sh = r5c_recovery_alloc_stripe(
++                                      conf, stripe_sect, 0);
+                       }
+                       if (!sh) {
+                               pr_err("md/raid:%s: Cannot get enough stripes due to memory pressure. Recovery failed.\n",
+-                                     mdname(mddev));
++                                      mdname(mddev));
+                               return -ENOMEM;
+                       }
+                       list_add_tail(&sh->lru, cached_stripe_list);
+--- a/drivers/md/raid5.c
++++ b/drivers/md/raid5.c
+@@ -6336,6 +6336,7 @@ raid5_show_stripe_cache_size(struct mdde
+ int
+ raid5_set_cache_size(struct mddev *mddev, int size)
+ {
++      int result = 0;
+       struct r5conf *conf = mddev->private;
+       if (size <= 16 || size > 32768)
+@@ -6352,11 +6353,14 @@ raid5_set_cache_size(struct mddev *mddev
+       mutex_lock(&conf->cache_size_mutex);
+       while (size > conf->max_nr_stripes)
+-              if (!grow_one_stripe(conf, GFP_KERNEL))
++              if (!grow_one_stripe(conf, GFP_KERNEL)) {
++                      conf->min_nr_stripes = conf->max_nr_stripes;
++                      result = -ENOMEM;
+                       break;
++              }
+       mutex_unlock(&conf->cache_size_mutex);
+-      return 0;
++      return result;
+ }
+ EXPORT_SYMBOL(raid5_set_cache_size);
index d32610037572dc89c039dbeebff59780d497965e..7bea22557a2b7e4fcf57b39438f4e7b00fe92eee 100644 (file)
@@ -40,3 +40,6 @@ oom-oom_reaper-do-not-enqueue-same-task-twice.patch
 mm-oom-fix-use-after-free-in-oom_kill_process.patch
 mm-hwpoison-use-do_send_sig_info-instead-of-force_sig.patch
 mm-migrate-don-t-rely-on-__pagemovable-of-newpage-after-unlocking-it.patch
+md-raid5-fix-out-of-memory-during-raid-cache-recovery.patch
+cifs-always-resolve-hostname-before-reconnecting.patch
+drivers-core-remove-glue-dirs-from-sysfs-earlier.patch