4.3-stable patches

author Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Wed, 27 Jan 2016 06:28:48 +0000 (22:28 -0800)

committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>

Wed, 27 Jan 2016 06:28:48 +0000 (22:28 -0800)
author Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Wed, 27 Jan 2016 06:28:48 +0000 (22:28 -0800)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Wed, 27 Jan 2016 06:28:48 +0000 (22:28 -0800)
diff --git a/queue-4.3/addrconf-always-initialize-sysctl-table-data.patch b/queue-4.3/addrconf-always-initialize-sysctl-table-data.patch

new file mode 100644 (file)

index 0000000..76f6876
--- /dev/null
+++ b/queue-4.3/addrconf-always-initialize-sysctl-table-data.patch
@@ -0,0 +1,44 @@
+From foo@baz Tue Jan 26 21:35:02 PST 2016
+From: WANG Cong <xiyou.wangcong@gmail.com>
+Date: Mon, 21 Dec 2015 10:55:45 -0800
+Subject: addrconf: always initialize sysctl table data
+
+From: WANG Cong <xiyou.wangcong@gmail.com>
+
+[ Upstream commit 5449a5ca9bc27dd51a462de7ca0b1cd861cd2bd0 ]
+
+When sysctl performs restrict writes, it allows writing from
+a middle position of a sysctl file, which requires us to initialize
+the table data before calling proc_dostring() for the write case.
+
+Fixes: 3d1bec99320d ("ipv6: introduce secret_stable to ipv6_devconf")
+Reported-by: Sasha Levin <sasha.levin@oracle.com>
+Acked-by: Hannes Frederic Sowa <hannes@stressinduktion.org>
+Tested-by: Sasha Levin <sasha.levin@oracle.com>
+Signed-off-by: Cong Wang <xiyou.wangcong@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/ipv6/addrconf.c |   11 ++++-------
+ 1 file changed, 4 insertions(+), 7 deletions(-)
+
+--- a/net/ipv6/addrconf.c
++++ b/net/ipv6/addrconf.c
+@@ -5349,13 +5349,10 @@ static int addrconf_sysctl_stable_secret
+               goto out;
+       }
+ 
+-      if (!write) {
+-              err = snprintf(str, sizeof(str), "%pI6",
+-                             &secret->secret);
+-              if (err >= sizeof(str)) {
+-                      err = -EIO;
+-                      goto out;
+-              }
++      err = snprintf(str, sizeof(str), "%pI6", &secret->secret);
++      if (err >= sizeof(str)) {
++              err = -EIO;
++              goto out;
+       }
+ 
+       err = proc_dostring(&lctl, write, buffer, lenp, ppos);
diff --git a/queue-4.3/af_unix-fix-splice-bind-deadlock.patch b/queue-4.3/af_unix-fix-splice-bind-deadlock.patch

new file mode 100644 (file)

index 0000000..2969d34
--- /dev/null
+++ b/queue-4.3/af_unix-fix-splice-bind-deadlock.patch
@@ -0,0 +1,186 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Rainer Weikusat <rweikusat@mobileactivedefense.com>
+Date: Sun, 3 Jan 2016 18:56:38 +0000
+Subject: af_unix: Fix splice-bind deadlock
+
+From: Rainer Weikusat <rweikusat@mobileactivedefense.com>
+
+[ Upstream commit c845acb324aa85a39650a14e7696982ceea75dc1 ]
+
+On 2015/11/06, Dmitry Vyukov reported a deadlock involving the splice
+system call and AF_UNIX sockets,
+
+http://lists.openwall.net/netdev/2015/11/06/24
+
+The situation was analyzed as
+
+(a while ago) A: socketpair()
+B: splice() from a pipe to /mnt/regular_file
+       does sb_start_write() on /mnt
+C: try to freeze /mnt
+       wait for B to finish with /mnt
+A: bind() try to bind our socket to /mnt/new_socket_name
+       lock our socket, see it not bound yet
+       decide that it needs to create something in /mnt
+       try to do sb_start_write() on /mnt, block (it's
+       waiting for C).
+D: splice() from the same pipe to our socket
+       lock the pipe, see that socket is connected
+       try to lock the socket, block waiting for A
+B:     get around to actually feeding a chunk from
+       pipe to file, try to lock the pipe.  Deadlock.
+
+on 2015/11/10 by Al Viro,
+
+http://lists.openwall.net/netdev/2015/11/10/4
+
+The patch fixes this by removing the kern_path_create related code from
+unix_mknod and executing it as part of unix_bind prior to acquiring the
+readlock of the socket in question. This means that A (as used above)
+will sb_start_write on /mnt before it acquires the readlock, hence, it
+won't indirectly block B which first did a sb_start_write and then
+waited for a thread trying to acquire the readlock. Consequently, A
+being blocked by C waiting for B won't cause a deadlock anymore
+(effectively, both A and B acquire two locks in opposite order in the
+situation described above).
+
+Dmitry Vyukov(<dvyukov@google.com>) tested the original patch.
+
+Signed-off-by: Rainer Weikusat <rweikusat@mobileactivedefense.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/unix/af_unix.c |   68 +++++++++++++++++++++++++++++++----------------------
+ 1 file changed, 41 insertions(+), 27 deletions(-)
+
+--- a/net/unix/af_unix.c
++++ b/net/unix/af_unix.c
+@@ -952,32 +952,20 @@ fail:
+       return NULL;
+ }
+ 
+-static int unix_mknod(const char *sun_path, umode_t mode, struct path *res)
++static int unix_mknod(struct dentry *dentry, struct path *path, umode_t mode,
++                    struct path *res)
+ {
+-      struct dentry *dentry;
+-      struct path path;
+-      int err = 0;
+-      /*
+-       * Get the parent directory, calculate the hash for last
+-       * component.
+-       */
+-      dentry = kern_path_create(AT_FDCWD, sun_path, &path, 0);
+-      err = PTR_ERR(dentry);
+-      if (IS_ERR(dentry))
+-              return err;
+-
+-      /*
+-       * All right, let's create it.
+-       */
+-      err = security_path_mknod(&path, dentry, mode, 0);
++      int err;
++
++      err = security_path_mknod(path, dentry, mode, 0);
+       if (!err) {
+-              err = vfs_mknod(d_inode(path.dentry), dentry, mode, 0);
++              err = vfs_mknod(d_inode(path->dentry), dentry, mode, 0);
+               if (!err) {
+-                      res->mnt = mntget(path.mnt);
++                      res->mnt = mntget(path->mnt);
+                       res->dentry = dget(dentry);
+               }
+       }
+-      done_path_create(&path, dentry);
++
+       return err;
+ }
+ 
+@@ -988,10 +976,12 @@ static int unix_bind(struct socket *sock
+       struct unix_sock *u = unix_sk(sk);
+       struct sockaddr_un *sunaddr = (struct sockaddr_un *)uaddr;
+       char *sun_path = sunaddr->sun_path;
+-      int err;
++      int err, name_err;
+       unsigned int hash;
+       struct unix_address *addr;
+       struct hlist_head *list;
++      struct path path;
++      struct dentry *dentry;
+ 
+       err = -EINVAL;
+       if (sunaddr->sun_family != AF_UNIX)
+@@ -1007,14 +997,34 @@ static int unix_bind(struct socket *sock
+               goto out;
+       addr_len = err;
+ 
++      name_err = 0;
++      dentry = NULL;
++      if (sun_path[0]) {
++              /* Get the parent directory, calculate the hash for last
++               * component.
++               */
++              dentry = kern_path_create(AT_FDCWD, sun_path, &path, 0);
++
++              if (IS_ERR(dentry)) {
++                      /* delay report until after 'already bound' check */
++                      name_err = PTR_ERR(dentry);
++                      dentry = NULL;
++              }
++      }
++
+       err = mutex_lock_interruptible(&u->readlock);
+       if (err)
+-              goto out;
++              goto out_path;
+ 
+       err = -EINVAL;
+       if (u->addr)
+               goto out_up;
+ 
++      if (name_err) {
++              err = name_err == -EEXIST ? -EADDRINUSE : name_err;
++              goto out_up;
++      }
++
+       err = -ENOMEM;
+       addr = kmalloc(sizeof(*addr)+addr_len, GFP_KERNEL);
+       if (!addr)
+@@ -1025,11 +1035,11 @@ static int unix_bind(struct socket *sock
+       addr->hash = hash ^ sk->sk_type;
+       atomic_set(&addr->refcnt, 1);
+ 
+-      if (sun_path[0]) {
+-              struct path path;
++      if (dentry) {
++              struct path u_path;
+               umode_t mode = S_IFSOCK |
+                      (SOCK_INODE(sock)->i_mode & ~current_umask());
+-              err = unix_mknod(sun_path, mode, &path);
++              err = unix_mknod(dentry, &path, mode, &u_path);
+               if (err) {
+                       if (err == -EEXIST)
+                               err = -EADDRINUSE;
+@@ -1037,9 +1047,9 @@ static int unix_bind(struct socket *sock
+                       goto out_up;
+               }
+               addr->hash = UNIX_HASH_SIZE;
+-              hash = d_backing_inode(path.dentry)->i_ino & (UNIX_HASH_SIZE-1);
++              hash = d_backing_inode(dentry)->i_ino & (UNIX_HASH_SIZE - 1);
+               spin_lock(&unix_table_lock);
+-              u->path = path;
++              u->path = u_path;
+               list = &unix_socket_table[hash];
+       } else {
+               spin_lock(&unix_table_lock);
+@@ -1062,6 +1072,10 @@ out_unlock:
+       spin_unlock(&unix_table_lock);
+ out_up:
+       mutex_unlock(&u->readlock);
++out_path:
++      if (dentry)
++              done_path_create(&path, dentry);
++
+ out:
+       return err;
+ }
diff --git a/queue-4.3/batman-adv-avoid-recursive-call_rcu-for-batadv_bla_claim.patch b/queue-4.3/batman-adv-avoid-recursive-call_rcu-for-batadv_bla_claim.patch

new file mode 100644 (file)

index 0000000..b1435cc
--- /dev/null
+++ b/queue-4.3/batman-adv-avoid-recursive-call_rcu-for-batadv_bla_claim.patch
@@ -0,0 +1,61 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Sven Eckelmann <sven@narfation.org>
+Date: Thu, 14 Jan 2016 15:28:19 +0100
+Subject: batman-adv: Avoid recursive call_rcu for batadv_bla_claim
+
+From: Sven Eckelmann <sven@narfation.org>
+
+[ Upstream commit 63b399272294e7a939cde41792dca38c549f0484 ]
+
+The batadv_claim_free_ref function uses call_rcu to delay the free of the
+batadv_bla_claim object until no (already started) rcu_read_lock is enabled
+anymore. This makes sure that no context is still trying to access the
+object which should be removed. But batadv_bla_claim also contains a
+reference to backbone_gw which must be removed.
+
+The reference drop of backbone_gw was done in the call_rcu function
+batadv_claim_free_rcu but should actually be done in the
+batadv_claim_release function to avoid nested call_rcus. This is important
+because rcu_barrier (e.g. batadv_softif_free or batadv_exit) will not
+detect the inner call_rcu as relevant for its execution. Otherwise this
+barrier will most likely be inserted in the queue before the callback of
+the first call_rcu was executed. The caller of rcu_barrier will therefore
+continue to run before the inner call_rcu callback finished.
+
+Fixes: 23721387c409 ("batman-adv: add basic bridge loop avoidance code")
+Signed-off-by: Sven Eckelmann <sven@narfation.org>
+Acked-by: Simon Wunderlich <sw@simonwunderlich.de>
+Signed-off-by: Marek Lindner <mareklindner@neomailbox.ch>
+Signed-off-by: Antonio Quartulli <a@unstable.cc>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/batman-adv/bridge_loop_avoidance.c |   10 +++-------
+ 1 file changed, 3 insertions(+), 7 deletions(-)
+
+--- a/net/batman-adv/bridge_loop_avoidance.c
++++ b/net/batman-adv/bridge_loop_avoidance.c
+@@ -127,21 +127,17 @@ batadv_backbone_gw_free_ref(struct batad
+ }
+ 
+ /* finally deinitialize the claim */
+-static void batadv_claim_free_rcu(struct rcu_head *rcu)
++static void batadv_claim_release(struct batadv_bla_claim *claim)
+ {
+-      struct batadv_bla_claim *claim;
+-
+-      claim = container_of(rcu, struct batadv_bla_claim, rcu);
+-
+       batadv_backbone_gw_free_ref(claim->backbone_gw);
+-      kfree(claim);
++      kfree_rcu(claim, rcu);
+ }
+ 
+ /* free a claim, call claim_free_rcu if its the last reference */
+ static void batadv_claim_free_ref(struct batadv_bla_claim *claim)
+ {
+       if (atomic_dec_and_test(&claim->refcount))
+-              call_rcu(&claim->rcu, batadv_claim_free_rcu);
++              batadv_claim_release(claim);
+ }
+ 
+ /**
diff --git a/queue-4.3/batman-adv-avoid-recursive-call_rcu-for-batadv_nc_node.patch b/queue-4.3/batman-adv-avoid-recursive-call_rcu-for-batadv_nc_node.patch

new file mode 100644 (file)

index 0000000..75a6d05
--- /dev/null
+++ b/queue-4.3/batman-adv-avoid-recursive-call_rcu-for-batadv_nc_node.patch
@@ -0,0 +1,72 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Sven Eckelmann <sven@narfation.org>
+Date: Tue, 5 Jan 2016 12:06:19 +0100
+Subject: batman-adv: Avoid recursive call_rcu for batadv_nc_node
+
+From: Sven Eckelmann <sven@narfation.org>
+
+[ Upstream commit 44e8e7e91d6c7c7ab19688750f7257292640d1a0 ]
+
+The batadv_nc_node_free_ref function uses call_rcu to delay the free of the
+batadv_nc_node object until no (already started) rcu_read_lock is enabled
+anymore. This makes sure that no context is still trying to access the
+object which should be removed. But batadv_nc_node also contains a
+reference to orig_node which must be removed.
+
+The reference drop of orig_node was done in the call_rcu function
+batadv_nc_node_free_rcu but should actually be done in the
+batadv_nc_node_release function to avoid nested call_rcus. This is
+important because rcu_barrier (e.g. batadv_softif_free or batadv_exit) will
+not detect the inner call_rcu as relevant for its execution. Otherwise this
+barrier will most likely be inserted in the queue before the callback of
+the first call_rcu was executed. The caller of rcu_barrier will therefore
+continue to run before the inner call_rcu callback finished.
+
+Fixes: d56b1705e28c ("batman-adv: network coding - detect coding nodes and remove these after timeout")
+Signed-off-by: Sven Eckelmann <sven@narfation.org>
+Signed-off-by: Marek Lindner <mareklindner@neomailbox.ch>
+Signed-off-by: Antonio Quartulli <a@unstable.cc>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/batman-adv/network-coding.c |   19 ++++++++-----------
+ 1 file changed, 8 insertions(+), 11 deletions(-)
+
+--- a/net/batman-adv/network-coding.c
++++ b/net/batman-adv/network-coding.c
+@@ -203,28 +203,25 @@ void batadv_nc_init_orig(struct batadv_o
+ }
+ 
+ /**
+- * batadv_nc_node_free_rcu - rcu callback to free an nc node and remove
+- *  its refcount on the orig_node
+- * @rcu: rcu pointer of the nc node
++ * batadv_nc_node_release - release nc_node from lists and queue for free after
++ *  rcu grace period
++ * @nc_node: the nc node to free
+  */
+-static void batadv_nc_node_free_rcu(struct rcu_head *rcu)
++static void batadv_nc_node_release(struct batadv_nc_node *nc_node)
+ {
+-      struct batadv_nc_node *nc_node;
+-
+-      nc_node = container_of(rcu, struct batadv_nc_node, rcu);
+       batadv_orig_node_free_ref(nc_node->orig_node);
+-      kfree(nc_node);
++      kfree_rcu(nc_node, rcu);
+ }
+ 
+ /**
+- * batadv_nc_node_free_ref - decrements the nc node refcounter and possibly
+- * frees it
++ * batadv_nc_node_free_ref - decrement the nc node refcounter and possibly
++ *  release it
+  * @nc_node: the nc node to free
+  */
+ static void batadv_nc_node_free_ref(struct batadv_nc_node *nc_node)
+ {
+       if (atomic_dec_and_test(&nc_node->refcount))
+-              call_rcu(&nc_node->rcu, batadv_nc_node_free_rcu);
++              batadv_nc_node_release(nc_node);
+ }
+ 
+ /**
diff --git a/queue-4.3/batman-adv-drop-immediate-batadv_hard_iface-free-function.patch b/queue-4.3/batman-adv-drop-immediate-batadv_hard_iface-free-function.patch

new file mode 100644 (file)

index 0000000..c671e94
--- /dev/null
+++ b/queue-4.3/batman-adv-drop-immediate-batadv_hard_iface-free-function.patch
@@ -0,0 +1,95 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Sven Eckelmann <sven@narfation.org>
+Date: Tue, 5 Jan 2016 12:06:25 +0100
+Subject: batman-adv: Drop immediate batadv_hard_iface free function
+
+From: Sven Eckelmann <sven@narfation.org>
+
+[ Upstream commit b4d922cfc9c08318eeb77d53b7633740e6b0efb0 ]
+
+It is not allowed to free the memory of an object which is part of a list
+which is protected by rcu-read-side-critical sections without making sure
+that no other context is accessing the object anymore. This usually happens
+by removing the references to this object and then waiting until the rcu
+grace period is over and no one (allowedly) accesses it anymore.
+
+But the _now functions ignore this completely. They free the object
+directly even when a different context still tries to access it. This has
+to be avoided and thus these functions must be removed and all functions
+have to use batadv_hardif_free_ref.
+
+Fixes: 89652331c00f ("batman-adv: split tq information in neigh_node struct")
+Signed-off-by: Sven Eckelmann <sven@narfation.org>
+Signed-off-by: Marek Lindner <mareklindner@neomailbox.ch>
+Signed-off-by: Antonio Quartulli <a@unstable.cc>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/batman-adv/hard-interface.h |   12 ------------
+ net/batman-adv/originator.c     |   14 +++++++-------
+ 2 files changed, 7 insertions(+), 19 deletions(-)
+
+--- a/net/batman-adv/hard-interface.h
++++ b/net/batman-adv/hard-interface.h
+@@ -75,18 +75,6 @@ batadv_hardif_free_ref(struct batadv_har
+               call_rcu(&hard_iface->rcu, batadv_hardif_free_rcu);
+ }
+ 
+-/**
+- * batadv_hardif_free_ref_now - decrement the hard interface refcounter and
+- *  possibly free it (without rcu callback)
+- * @hard_iface: the hard interface to free
+- */
+-static inline void
+-batadv_hardif_free_ref_now(struct batadv_hard_iface *hard_iface)
+-{
+-      if (atomic_dec_and_test(&hard_iface->refcount))
+-              batadv_hardif_free_rcu(&hard_iface->rcu);
+-}
+-
+ static inline struct batadv_hard_iface *
+ batadv_primary_if_get_selected(struct batadv_priv *bat_priv)
+ {
+--- a/net/batman-adv/originator.c
++++ b/net/batman-adv/originator.c
+@@ -189,16 +189,16 @@ void batadv_neigh_ifinfo_free_ref(struct
+ 
+ /**
+  * batadv_neigh_node_free_rcu - free the neigh_node
+- * @rcu: rcu pointer of the neigh_node
++ * batadv_neigh_node_release - release neigh_node from lists and queue for
++ *  free after rcu grace period
++ * @neigh_node: neigh neighbor to free
+  */
+-static void batadv_neigh_node_free_rcu(struct rcu_head *rcu)
++static void batadv_neigh_node_release(struct batadv_neigh_node *neigh_node)
+ {
+       struct hlist_node *node_tmp;
+-      struct batadv_neigh_node *neigh_node;
+       struct batadv_neigh_ifinfo *neigh_ifinfo;
+       struct batadv_algo_ops *bao;
+ 
+-      neigh_node = container_of(rcu, struct batadv_neigh_node, rcu);
+       bao = neigh_node->orig_node->bat_priv->bat_algo_ops;
+ 
+       hlist_for_each_entry_safe(neigh_ifinfo, node_tmp,
+@@ -209,9 +209,9 @@ static void batadv_neigh_node_free_rcu(s
+       if (bao->bat_neigh_free)
+               bao->bat_neigh_free(neigh_node);
+ 
+-      batadv_hardif_free_ref_now(neigh_node->if_incoming);
++      batadv_hardif_free_ref(neigh_node->if_incoming);
+ 
+-      kfree(neigh_node);
++      kfree_rcu(neigh_node, rcu);
+ }
+ 
+ /**
+@@ -222,7 +222,7 @@ static void batadv_neigh_node_free_rcu(s
+ void batadv_neigh_node_free_ref(struct batadv_neigh_node *neigh_node)
+ {
+       if (atomic_dec_and_test(&neigh_node->refcount))
+-              call_rcu(&neigh_node->rcu, batadv_neigh_node_free_rcu);
++              batadv_neigh_node_release(neigh_node);
+ }
+ 
+ /**
diff --git a/queue-4.3/batman-adv-drop-immediate-batadv_neigh_node-free-function.patch b/queue-4.3/batman-adv-drop-immediate-batadv_neigh_node-free-function.patch

new file mode 100644 (file)

index 0000000..7f76634
--- /dev/null
+++ b/queue-4.3/batman-adv-drop-immediate-batadv_neigh_node-free-function.patch
@@ -0,0 +1,95 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Sven Eckelmann <sven@narfation.org>
+Date: Tue, 5 Jan 2016 12:06:22 +0100
+Subject: batman-adv: Drop immediate batadv_neigh_node free function
+
+From: Sven Eckelmann <sven@narfation.org>
+
+[ Upstream commit 2baa753c276f27f8e844637561ad597867aa6fb6 ]
+
+It is not allowed to free the memory of an object which is part of a list
+which is protected by rcu-read-side-critical sections without making sure
+that no other context is accessing the object anymore. This usually happens
+by removing the references to this object and then waiting until the rcu
+grace period is over and no one (allowedly) accesses it anymore.
+
+But the _now functions ignore this completely. They free the object
+directly even when a different context still tries to access it. This has
+to be avoided and thus these functions must be removed and all functions
+have to use batadv_neigh_node_free_ref.
+
+Fixes: 89652331c00f ("batman-adv: split tq information in neigh_node struct")
+Signed-off-by: Sven Eckelmann <sven@narfation.org>
+Signed-off-by: Marek Lindner <mareklindner@neomailbox.ch>
+Signed-off-by: Antonio Quartulli <a@unstable.cc>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/batman-adv/originator.c |   33 ++++++++++-----------------------
+ 1 file changed, 10 insertions(+), 23 deletions(-)
+
+--- a/net/batman-adv/originator.c
++++ b/net/batman-adv/originator.c
+@@ -229,20 +229,8 @@ static void batadv_neigh_node_free_rcu(s
+ }
+ 
+ /**
+- * batadv_neigh_node_free_ref_now - decrement the neighbors refcounter
+- *  and possibly free it (without rcu callback)
+- * @neigh_node: neigh neighbor to free
+- */
+-static void
+-batadv_neigh_node_free_ref_now(struct batadv_neigh_node *neigh_node)
+-{
+-      if (atomic_dec_and_test(&neigh_node->refcount))
+-              batadv_neigh_node_free_rcu(&neigh_node->rcu);
+-}
+-
+-/**
+  * batadv_neigh_node_free_ref - decrement the neighbors refcounter
+- *  and possibly free it
++ *  and possibly release it
+  * @neigh_node: neigh neighbor to free
+  */
+ void batadv_neigh_node_free_ref(struct batadv_neigh_node *neigh_node)
+@@ -532,24 +520,23 @@ out:
+ }
+ 
+ /**
+- * batadv_orig_ifinfo_free_rcu - free the orig_ifinfo object
+- * @rcu: rcu pointer of the orig_ifinfo object
++ * batadv_orig_ifinfo_release - release orig_ifinfo from lists and queue for
++ *  free after rcu grace period
++ * @orig_ifinfo: the orig_ifinfo object to release
+  */
+-static void batadv_orig_ifinfo_free_rcu(struct rcu_head *rcu)
++static void batadv_orig_ifinfo_release(struct batadv_orig_ifinfo *orig_ifinfo)
+ {
+-      struct batadv_orig_ifinfo *orig_ifinfo;
+       struct batadv_neigh_node *router;
+ 
+-      orig_ifinfo = container_of(rcu, struct batadv_orig_ifinfo, rcu);
+-
+       if (orig_ifinfo->if_outgoing != BATADV_IF_DEFAULT)
+-              batadv_hardif_free_ref_now(orig_ifinfo->if_outgoing);
++              batadv_hardif_free_ref(orig_ifinfo->if_outgoing);
+ 
+       /* this is the last reference to this object */
+       router = rcu_dereference_protected(orig_ifinfo->router, true);
+       if (router)
+-              batadv_neigh_node_free_ref_now(router);
+-      kfree(orig_ifinfo);
++              batadv_neigh_node_free_ref(router);
++
++      kfree_rcu(orig_ifinfo, rcu);
+ }
+ 
+ /**
+@@ -560,7 +547,7 @@ static void batadv_orig_ifinfo_free_rcu(
+ void batadv_orig_ifinfo_free_ref(struct batadv_orig_ifinfo *orig_ifinfo)
+ {
+       if (atomic_dec_and_test(&orig_ifinfo->refcount))
+-              call_rcu(&orig_ifinfo->rcu, batadv_orig_ifinfo_free_rcu);
++              batadv_orig_ifinfo_release(orig_ifinfo);
+ }
+ 
+ /**
diff --git a/queue-4.3/batman-adv-drop-immediate-batadv_orig_ifinfo-free-function.patch b/queue-4.3/batman-adv-drop-immediate-batadv_orig_ifinfo-free-function.patch

new file mode 100644 (file)

index 0000000..7dc7caa
--- /dev/null
+++ b/queue-4.3/batman-adv-drop-immediate-batadv_orig_ifinfo-free-function.patch
@@ -0,0 +1,139 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Sven Eckelmann <sven@narfation.org>
+Date: Tue, 5 Jan 2016 12:06:21 +0100
+Subject: batman-adv: Drop immediate batadv_orig_ifinfo free function
+
+From: Sven Eckelmann <sven@narfation.org>
+
+[ Upstream commit deed96605f5695cb945e0b3d79429581857a2b9d ]
+
+It is not allowed to free the memory of an object which is part of a list
+which is protected by rcu-read-side-critical sections without making sure
+that no other context is accessing the object anymore. This usually happens
+by removing the references to this object and then waiting until the rcu
+grace period is over and no one (allowedly) accesses it anymore.
+
+But the _now functions ignore this completely. They free the object
+directly even when a different context still tries to access it. This has
+to be avoided and thus these functions must be removed and all functions
+have to use batadv_orig_ifinfo_free_ref.
+
+Fixes: 7351a4822d42 ("batman-adv: split out router from orig_node")
+Signed-off-by: Sven Eckelmann <sven@narfation.org>
+Signed-off-by: Marek Lindner <mareklindner@neomailbox.ch>
+Signed-off-by: Antonio Quartulli <a@unstable.cc>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/batman-adv/originator.c |   59 +++++++++++++++++++++++---------------------
+ 1 file changed, 31 insertions(+), 28 deletions(-)
+
+--- a/net/batman-adv/originator.c
++++ b/net/batman-adv/originator.c
+@@ -553,76 +553,79 @@ static void batadv_orig_ifinfo_free_rcu(
+ }
+ 
+ /**
+- * batadv_orig_ifinfo_free_ref - decrement the refcounter and possibly free
+- *  the orig_ifinfo (without rcu callback)
++ * batadv_orig_ifinfo_free_ref - decrement the refcounter and possibly release
++ *  the orig_ifinfo
+  * @orig_ifinfo: the orig_ifinfo object to release
+  */
+-static void
+-batadv_orig_ifinfo_free_ref_now(struct batadv_orig_ifinfo *orig_ifinfo)
++void batadv_orig_ifinfo_free_ref(struct batadv_orig_ifinfo *orig_ifinfo)
+ {
+       if (atomic_dec_and_test(&orig_ifinfo->refcount))
+-              batadv_orig_ifinfo_free_rcu(&orig_ifinfo->rcu);
++              call_rcu(&orig_ifinfo->rcu, batadv_orig_ifinfo_free_rcu);
+ }
+ 
+ /**
+- * batadv_orig_ifinfo_free_ref - decrement the refcounter and possibly free
+- *  the orig_ifinfo
+- * @orig_ifinfo: the orig_ifinfo object to release
++ * batadv_orig_node_free_rcu - free the orig_node
++ * @rcu: rcu pointer of the orig_node
+  */
+-void batadv_orig_ifinfo_free_ref(struct batadv_orig_ifinfo *orig_ifinfo)
++static void batadv_orig_node_free_rcu(struct rcu_head *rcu)
+ {
+-      if (atomic_dec_and_test(&orig_ifinfo->refcount))
+-              call_rcu(&orig_ifinfo->rcu, batadv_orig_ifinfo_free_rcu);
++      struct batadv_orig_node *orig_node;
++
++      orig_node = container_of(rcu, struct batadv_orig_node, rcu);
++
++      batadv_mcast_purge_orig(orig_node);
++
++      batadv_frag_purge_orig(orig_node, NULL);
++
++      if (orig_node->bat_priv->bat_algo_ops->bat_orig_free)
++              orig_node->bat_priv->bat_algo_ops->bat_orig_free(orig_node);
++
++      kfree(orig_node->tt_buff);
++      kfree(orig_node);
+ }
+ 
+-static void batadv_orig_node_free_rcu(struct rcu_head *rcu)
++/**
++ * batadv_orig_node_release - release orig_node from lists and queue for
++ *  free after rcu grace period
++ * @orig_node: the orig node to free
++ */
++static void batadv_orig_node_release(struct batadv_orig_node *orig_node)
+ {
+       struct hlist_node *node_tmp;
+       struct batadv_neigh_node *neigh_node;
+-      struct batadv_orig_node *orig_node;
+       struct batadv_orig_ifinfo *orig_ifinfo;
+ 
+-      orig_node = container_of(rcu, struct batadv_orig_node, rcu);
+-
+       spin_lock_bh(&orig_node->neigh_list_lock);
+ 
+       /* for all neighbors towards this originator ... */
+       hlist_for_each_entry_safe(neigh_node, node_tmp,
+                                 &orig_node->neigh_list, list) {
+               hlist_del_rcu(&neigh_node->list);
+-              batadv_neigh_node_free_ref_now(neigh_node);
++              batadv_neigh_node_free_ref(neigh_node);
+       }
+ 
+       hlist_for_each_entry_safe(orig_ifinfo, node_tmp,
+                                 &orig_node->ifinfo_list, list) {
+               hlist_del_rcu(&orig_ifinfo->list);
+-              batadv_orig_ifinfo_free_ref_now(orig_ifinfo);
++              batadv_orig_ifinfo_free_ref(orig_ifinfo);
+       }
+       spin_unlock_bh(&orig_node->neigh_list_lock);
+ 
+-      batadv_mcast_purge_orig(orig_node);
+-
+       /* Free nc_nodes */
+       batadv_nc_purge_orig(orig_node->bat_priv, orig_node, NULL);
+ 
+-      batadv_frag_purge_orig(orig_node, NULL);
+-
+-      if (orig_node->bat_priv->bat_algo_ops->bat_orig_free)
+-              orig_node->bat_priv->bat_algo_ops->bat_orig_free(orig_node);
+-
+-      kfree(orig_node->tt_buff);
+-      kfree(orig_node);
++      call_rcu(&orig_node->rcu, batadv_orig_node_free_rcu);
+ }
+ 
+ /**
+  * batadv_orig_node_free_ref - decrement the orig node refcounter and possibly
+- * schedule an rcu callback for freeing it
++ *  release it
+  * @orig_node: the orig node to free
+  */
+ void batadv_orig_node_free_ref(struct batadv_orig_node *orig_node)
+ {
+       if (atomic_dec_and_test(&orig_node->refcount))
+-              call_rcu(&orig_node->rcu, batadv_orig_node_free_rcu);
++              batadv_orig_node_release(orig_node);
+ }
+ 
+ /**
diff --git a/queue-4.3/batman-adv-drop-immediate-neigh_ifinfo-free-function.patch b/queue-4.3/batman-adv-drop-immediate-neigh_ifinfo-free-function.patch

new file mode 100644 (file)

index 0000000..c903d55
--- /dev/null
+++ b/queue-4.3/batman-adv-drop-immediate-neigh_ifinfo-free-function.patch
@@ -0,0 +1,92 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Sven Eckelmann <sven@narfation.org>
+Date: Tue, 5 Jan 2016 12:06:24 +0100
+Subject: batman-adv: Drop immediate neigh_ifinfo free function
+
+From: Sven Eckelmann <sven@narfation.org>
+
+[ Upstream commit ae3e1e36e3cb6c686a7a2725af20ca86aa46d62a ]
+
+It is not allowed to free the memory of an object which is part of a list
+which is protected by rcu-read-side-critical sections without making sure
+that no other context is accessing the object anymore. This usually happens
+by removing the references to this object and then waiting until the rcu
+grace period is over and no one (allowedly) accesses it anymore.
+
+But the _now functions ignore this completely. They free the object
+directly even when a different context still tries to access it. This has
+to be avoided and thus these functions must be removed and all functions
+have to use batadv_neigh_ifinfo_free_ref.
+
+Fixes: 89652331c00f ("batman-adv: split tq information in neigh_node struct")
+Signed-off-by: Sven Eckelmann <sven@narfation.org>
+Signed-off-by: Marek Lindner <mareklindner@neomailbox.ch>
+Signed-off-by: Antonio Quartulli <a@unstable.cc>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/batman-adv/originator.c |   34 ++++++++++------------------------
+ 1 file changed, 10 insertions(+), 24 deletions(-)
+
+--- a/net/batman-adv/originator.c
++++ b/net/batman-adv/originator.c
+@@ -163,42 +163,28 @@ err:
+ }
+ 
+ /**
+- * batadv_neigh_ifinfo_free_rcu - free the neigh_ifinfo object
+- * @rcu: rcu pointer of the neigh_ifinfo object
+- */
+-static void batadv_neigh_ifinfo_free_rcu(struct rcu_head *rcu)
+-{
+-      struct batadv_neigh_ifinfo *neigh_ifinfo;
+-
+-      neigh_ifinfo = container_of(rcu, struct batadv_neigh_ifinfo, rcu);
+-
+-      if (neigh_ifinfo->if_outgoing != BATADV_IF_DEFAULT)
+-              batadv_hardif_free_ref_now(neigh_ifinfo->if_outgoing);
+-
+-      kfree(neigh_ifinfo);
+-}
+-
+-/**
+- * batadv_neigh_ifinfo_free_now - decrement the refcounter and possibly free
+- *  the neigh_ifinfo (without rcu callback)
++ * batadv_neigh_ifinfo_release - release neigh_ifinfo from lists and queue for
++ *  free after rcu grace period
+  * @neigh_ifinfo: the neigh_ifinfo object to release
+  */
+ static void
+-batadv_neigh_ifinfo_free_ref_now(struct batadv_neigh_ifinfo *neigh_ifinfo)
++batadv_neigh_ifinfo_release(struct batadv_neigh_ifinfo *neigh_ifinfo)
+ {
+-      if (atomic_dec_and_test(&neigh_ifinfo->refcount))
+-              batadv_neigh_ifinfo_free_rcu(&neigh_ifinfo->rcu);
++      if (neigh_ifinfo->if_outgoing != BATADV_IF_DEFAULT)
++              batadv_hardif_free_ref(neigh_ifinfo->if_outgoing);
++
++      kfree_rcu(neigh_ifinfo, rcu);
+ }
+ 
+ /**
+- * batadv_neigh_ifinfo_free_ref - decrement the refcounter and possibly free
++ * batadv_neigh_ifinfo_free_ref - decrement the refcounter and possibly release
+  *  the neigh_ifinfo
+  * @neigh_ifinfo: the neigh_ifinfo object to release
+  */
+ void batadv_neigh_ifinfo_free_ref(struct batadv_neigh_ifinfo *neigh_ifinfo)
+ {
+       if (atomic_dec_and_test(&neigh_ifinfo->refcount))
+-              call_rcu(&neigh_ifinfo->rcu, batadv_neigh_ifinfo_free_rcu);
++              batadv_neigh_ifinfo_release(neigh_ifinfo);
+ }
+ 
+ /**
+@@ -217,7 +203,7 @@ static void batadv_neigh_node_free_rcu(s
+ 
+       hlist_for_each_entry_safe(neigh_ifinfo, node_tmp,
+                                 &neigh_node->ifinfo_list, list) {
+-              batadv_neigh_ifinfo_free_ref_now(neigh_ifinfo);
++              batadv_neigh_ifinfo_free_ref(neigh_ifinfo);
+       }
+ 
+       if (bao->bat_neigh_free)
diff --git a/queue-4.3/batman-adv-drop-immediate-orig_node-free-function.patch b/queue-4.3/batman-adv-drop-immediate-orig_node-free-function.patch

new file mode 100644 (file)

index 0000000..f3ecfea
--- /dev/null
+++ b/queue-4.3/batman-adv-drop-immediate-orig_node-free-function.patch
@@ -0,0 +1,111 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Sven Eckelmann <sven@narfation.org>
+Date: Tue, 5 Jan 2016 12:06:20 +0100
+Subject: batman-adv: Drop immediate orig_node free function
+
+From: Sven Eckelmann <sven@narfation.org>
+
+[ Upstream commit 42eff6a617e23b691f8e4467f4687ed7245a92db ]
+
+It is not allowed to free the memory of an object which is part of a list
+which is protected by rcu-read-side-critical sections without making sure
+that no other context is accessing the object anymore. This usually happens
+by removing the references to this object and then waiting until the rcu
+grace period is over and no one can (legitimately) access it anymore.
+
+But the _now functions ignore this completely. They free the object
+directly even when a different context still tries to access it. This has
+to be avoided and thus these functions must be removed and all functions
+have to use batadv_orig_node_free_ref.
+
+Fixes: 72822225bd41 ("batman-adv: Fix rcu_barrier() miss due to double call_rcu() in TT code")
+Signed-off-by: Sven Eckelmann <sven@narfation.org>
+Signed-off-by: Marek Lindner <mareklindner@neomailbox.ch>
+Signed-off-by: Antonio Quartulli <a@unstable.cc>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/batman-adv/originator.c        |   11 -----------
+ net/batman-adv/originator.h        |    1 -
+ net/batman-adv/translation-table.c |   28 +++++++++++++---------------
+ 3 files changed, 13 insertions(+), 27 deletions(-)
+
+--- a/net/batman-adv/originator.c
++++ b/net/batman-adv/originator.c
+@@ -601,17 +601,6 @@ void batadv_orig_node_free_ref(struct ba
+               batadv_orig_node_release(orig_node);
+ }
+ 
+-/**
+- * batadv_orig_node_free_ref_now - decrement the orig node refcounter and
+- * possibly free it (without rcu callback)
+- * @orig_node: the orig node to free
+- */
+-void batadv_orig_node_free_ref_now(struct batadv_orig_node *orig_node)
+-{
+-      if (atomic_dec_and_test(&orig_node->refcount))
+-              batadv_orig_node_free_rcu(&orig_node->rcu);
+-}
+-
+ void batadv_originator_free(struct batadv_priv *bat_priv)
+ {
+       struct batadv_hashtable *hash = bat_priv->orig_hash;
+--- a/net/batman-adv/originator.h
++++ b/net/batman-adv/originator.h
+@@ -38,7 +38,6 @@ int batadv_originator_init(struct batadv
+ void batadv_originator_free(struct batadv_priv *bat_priv);
+ void batadv_purge_orig_ref(struct batadv_priv *bat_priv);
+ void batadv_orig_node_free_ref(struct batadv_orig_node *orig_node);
+-void batadv_orig_node_free_ref_now(struct batadv_orig_node *orig_node);
+ struct batadv_orig_node *batadv_orig_node_new(struct batadv_priv *bat_priv,
+                                             const u8 *addr);
+ struct batadv_neigh_node *
+--- a/net/batman-adv/translation-table.c
++++ b/net/batman-adv/translation-table.c
+@@ -238,20 +238,6 @@ int batadv_tt_global_hash_count(struct b
+       return count;
+ }
+ 
+-static void batadv_tt_orig_list_entry_free_rcu(struct rcu_head *rcu)
+-{
+-      struct batadv_tt_orig_list_entry *orig_entry;
+-
+-      orig_entry = container_of(rcu, struct batadv_tt_orig_list_entry, rcu);
+-
+-      /* We are in an rcu callback here, therefore we cannot use
+-       * batadv_orig_node_free_ref() and its call_rcu():
+-       * An rcu_barrier() wouldn't wait for that to finish
+-       */
+-      batadv_orig_node_free_ref_now(orig_entry->orig_node);
+-      kfree(orig_entry);
+-}
+-
+ /**
+  * batadv_tt_local_size_mod - change the size by v of the local table identified
+  *  by vid
+@@ -347,13 +333,25 @@ static void batadv_tt_global_size_dec(st
+       batadv_tt_global_size_mod(orig_node, vid, -1);
+ }
+ 
++/**
++ * batadv_tt_orig_list_entry_release - release tt orig entry from lists and
++ *  queue for free after rcu grace period
++ * @orig_entry: tt orig entry to be free'd
++ */
++static void
++batadv_tt_orig_list_entry_release(struct batadv_tt_orig_list_entry *orig_entry)
++{
++      batadv_orig_node_free_ref(orig_entry->orig_node);
++      kfree_rcu(orig_entry, rcu);
++}
++
+ static void
+ batadv_tt_orig_list_entry_free_ref(struct batadv_tt_orig_list_entry *orig_entry)
+ {
+       if (!atomic_dec_and_test(&orig_entry->refcount))
+               return;
+ 
+-      call_rcu(&orig_entry->rcu, batadv_tt_orig_list_entry_free_rcu);
++      batadv_tt_orig_list_entry_release(orig_entry);
+ }
+ 
+ /**
diff --git a/queue-4.3/bonding-prevent-ipv6-link-local-address-on-enslaved-devices.patch b/queue-4.3/bonding-prevent-ipv6-link-local-address-on-enslaved-devices.patch

new file mode 100644 (file)

index 0000000..6e1b99d
--- /dev/null
+++ b/queue-4.3/bonding-prevent-ipv6-link-local-address-on-enslaved-devices.patch
@@ -0,0 +1,58 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Karl Heiss <kheiss@gmail.com>
+Date: Mon, 11 Jan 2016 08:28:43 -0500
+Subject: bonding: Prevent IPv6 link local address on enslaved devices
+
+From: Karl Heiss <kheiss@gmail.com>
+
+[ Upstream commit 03d84a5f83a67e692af00a3d3901e7820e3e84d5 ]
+
+Commit 1f718f0f4f97 ("bonding: populate neighbour's private on enslave")
+undoes the fix provided by commit c2edacf80e15 ("bonding / ipv6: no addrconf
+for slaves separately from master") by effectively setting the slave flag
+after the slave has been opened.  If the slave comes up quickly enough, it
+will go through the IPv6 addrconf before the slave flag has been set and
+will get a link local IPv6 address.
+
+In order to ensure that addrconf knows to ignore the slave devices on state
+change, set IFF_SLAVE before dev_open() during bonding enslavement.
+
+Fixes: 1f718f0f4f97 ("bonding: populate neighbour's private on enslave")
+Signed-off-by: Karl Heiss <kheiss@gmail.com>
+Signed-off-by: Jay Vosburgh <jay.vosburgh@canonical.com>
+Reviewed-by: Jarod Wilson <jarod@redhat.com>
+Signed-off-by: Andy Gospodarek <gospo@cumulusnetworks.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/net/bonding/bond_main.c |    5 ++++-
+ 1 file changed, 4 insertions(+), 1 deletion(-)
+
+--- a/drivers/net/bonding/bond_main.c
++++ b/drivers/net/bonding/bond_main.c
+@@ -1207,7 +1207,6 @@ static int bond_master_upper_dev_link(st
+       err = netdev_master_upper_dev_link_private(slave_dev, bond_dev, slave);
+       if (err)
+               return err;
+-      slave_dev->flags |= IFF_SLAVE;
+       rtmsg_ifinfo(RTM_NEWLINK, slave_dev, IFF_SLAVE, GFP_KERNEL);
+       return 0;
+ }
+@@ -1465,6 +1464,9 @@ int bond_enslave(struct net_device *bond
+               }
+       }
+ 
++      /* set slave flag before open to prevent IPv6 addrconf */
++      slave_dev->flags |= IFF_SLAVE;
++
+       /* open the slave since the application closed it */
+       res = dev_open(slave_dev);
+       if (res) {
+@@ -1725,6 +1727,7 @@ err_close:
+       dev_close(slave_dev);
+ 
+ err_restore_mac:
++      slave_dev->flags &= ~IFF_SLAVE;
+       if (!bond->params.fail_over_mac ||
+           BOND_MODE(bond) != BOND_MODE_ACTIVEBACKUP) {
+               /* XXX TODO - fom follow mode needs to change master's
diff --git a/queue-4.3/bridge-fix-lockdep-addr_list_lock-false-positive-splat.patch b/queue-4.3/bridge-fix-lockdep-addr_list_lock-false-positive-splat.patch

new file mode 100644 (file)

index 0000000..e4bb215
--- /dev/null
+++ b/queue-4.3/bridge-fix-lockdep-addr_list_lock-false-positive-splat.patch
@@ -0,0 +1,133 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Nikolay Aleksandrov <nikolay@cumulusnetworks.com>
+Date: Fri, 15 Jan 2016 19:03:54 +0100
+Subject: bridge: fix lockdep addr_list_lock false positive splat
+
+From: Nikolay Aleksandrov <nikolay@cumulusnetworks.com>
+
+[ Upstream commit c6894dec8ea9ae05747124dce98b3b5c2e69b168 ]
+
+After promisc mode management was introduced a bridge device could do
+dev_set_promiscuity from its ndo_change_rx_flags() callback which in
+turn can be called after the bridge's addr_list_lock has been taken
+(e.g. by dev_uc_add). This causes a false positive lockdep splat because
+the port interfaces' addr_list_lock is taken when br_manage_promisc()
+runs after the bridge's addr list lock was already taken.
+To remove the false positive introduce a custom bridge addr_list_lock
+class and set it on bridge init.
+A simple way to reproduce this is with the following:
+$ brctl addbr br0
+$ ip l add l br0 br0.100 type vlan id 100
+$ ip l set br0 up
+$ ip l set br0.100 up
+$ echo 1 > /sys/class/net/br0/bridge/vlan_filtering
+$ brctl addif br0 eth0
+Splat:
+[   43.684325] =============================================
+[   43.684485] [ INFO: possible recursive locking detected ]
+[   43.684636] 4.4.0-rc8+ #54 Not tainted
+[   43.684755] ---------------------------------------------
+[   43.684906] brctl/1187 is trying to acquire lock:
+[   43.685047]  (_xmit_ETHER){+.....}, at: [<ffffffff8150169e>] dev_set_rx_mode+0x1e/0x40
+[   43.685460]  but task is already holding lock:
+[   43.685618]  (_xmit_ETHER){+.....}, at: [<ffffffff815072a7>] dev_uc_add+0x27/0x80
+[   43.686015]  other info that might help us debug this:
+[   43.686316]  Possible unsafe locking scenario:
+
+[   43.686743]        CPU0
+[   43.686967]        ----
+[   43.687197]   lock(_xmit_ETHER);
+[   43.687544]   lock(_xmit_ETHER);
+[   43.687886] *** DEADLOCK ***
+
+[   43.688438]  May be due to missing lock nesting notation
+
+[   43.688882] 2 locks held by brctl/1187:
+[   43.689134]  #0:  (rtnl_mutex){+.+.+.}, at: [<ffffffff81510317>] rtnl_lock+0x17/0x20
+[   43.689852]  #1:  (_xmit_ETHER){+.....}, at: [<ffffffff815072a7>] dev_uc_add+0x27/0x80
+[   43.690575] stack backtrace:
+[   43.690970] CPU: 0 PID: 1187 Comm: brctl Not tainted 4.4.0-rc8+ #54
+[   43.691270] Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS 1.8.1-20150318_183358- 04/01/2014
+[   43.691770]  ffffffff826a25c0 ffff8800369fb8e0 ffffffff81360ceb ffffffff826a25c0
+[   43.692425]  ffff8800369fb9b8 ffffffff810d0466 ffff8800369fb968 ffffffff81537139
+[   43.693071]  ffff88003a08c880 0000000000000000 00000000ffffffff 0000000002080020
+[   43.693709] Call Trace:
+[   43.693931]  [<ffffffff81360ceb>] dump_stack+0x4b/0x70
+[   43.694199]  [<ffffffff810d0466>] __lock_acquire+0x1e46/0x1e90
+[   43.694483]  [<ffffffff81537139>] ? netlink_broadcast_filtered+0x139/0x3e0
+[   43.694789]  [<ffffffff8153b5da>] ? nlmsg_notify+0x5a/0xc0
+[   43.695064]  [<ffffffff810d10f5>] lock_acquire+0xe5/0x1f0
+[   43.695340]  [<ffffffff8150169e>] ? dev_set_rx_mode+0x1e/0x40
+[   43.695623]  [<ffffffff815edea5>] _raw_spin_lock_bh+0x45/0x80
+[   43.695901]  [<ffffffff8150169e>] ? dev_set_rx_mode+0x1e/0x40
+[   43.696180]  [<ffffffff8150169e>] dev_set_rx_mode+0x1e/0x40
+[   43.696460]  [<ffffffff8150189c>] dev_set_promiscuity+0x3c/0x50
+[   43.696750]  [<ffffffffa0586845>] br_port_set_promisc+0x25/0x50 [bridge]
+[   43.697052]  [<ffffffffa05869aa>] br_manage_promisc+0x8a/0xe0 [bridge]
+[   43.697348]  [<ffffffffa05826ee>] br_dev_change_rx_flags+0x1e/0x20 [bridge]
+[   43.697655]  [<ffffffff81501532>] __dev_set_promiscuity+0x132/0x1f0
+[   43.697943]  [<ffffffff81501672>] __dev_set_rx_mode+0x82/0x90
+[   43.698223]  [<ffffffff815072de>] dev_uc_add+0x5e/0x80
+[   43.698498]  [<ffffffffa05b3c62>] vlan_device_event+0x542/0x650 [8021q]
+[   43.698798]  [<ffffffff8109886d>] notifier_call_chain+0x5d/0x80
+[   43.699083]  [<ffffffff810988b6>] raw_notifier_call_chain+0x16/0x20
+[   43.699374]  [<ffffffff814f456e>] call_netdevice_notifiers_info+0x6e/0x80
+[   43.699678]  [<ffffffff814f4596>] call_netdevice_notifiers+0x16/0x20
+[   43.699973]  [<ffffffffa05872be>] br_add_if+0x47e/0x4c0 [bridge]
+[   43.700259]  [<ffffffffa058801e>] add_del_if+0x6e/0x80 [bridge]
+[   43.700548]  [<ffffffffa0588b5f>] br_dev_ioctl+0xaf/0xc0 [bridge]
+[   43.700836]  [<ffffffff8151a7ac>] dev_ifsioc+0x30c/0x3c0
+[   43.701106]  [<ffffffff8151aac9>] dev_ioctl+0xf9/0x6f0
+[   43.701379]  [<ffffffff81254345>] ? mntput_no_expire+0x5/0x450
+[   43.701665]  [<ffffffff812543ee>] ? mntput_no_expire+0xae/0x450
+[   43.701947]  [<ffffffff814d7b02>] sock_do_ioctl+0x42/0x50
+[   43.702219]  [<ffffffff814d8175>] sock_ioctl+0x1e5/0x290
+[   43.702500]  [<ffffffff81242d0b>] do_vfs_ioctl+0x2cb/0x5c0
+[   43.702771]  [<ffffffff81243079>] SyS_ioctl+0x79/0x90
+[   43.703033]  [<ffffffff815eebb6>] entry_SYSCALL_64_fastpath+0x16/0x7a
+
+CC: Vlad Yasevich <vyasevic@redhat.com>
+CC: Stephen Hemminger <stephen@networkplumber.org>
+CC: Bridge list <bridge@lists.linux-foundation.org>
+CC: Andy Gospodarek <gospo@cumulusnetworks.com>
+CC: Roopa Prabhu <roopa@cumulusnetworks.com>
+Fixes: 2796d0c648c9 ("bridge: Automatically manage port promiscuous mode.")
+Reported-by: Andy Gospodarek <gospo@cumulusnetworks.com>
+Signed-off-by: Nikolay Aleksandrov <nikolay@cumulusnetworks.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/bridge/br_device.c |    8 ++++++++
+ 1 file changed, 8 insertions(+)
+
+--- a/net/bridge/br_device.c
++++ b/net/bridge/br_device.c
+@@ -28,6 +28,8 @@
+ const struct nf_br_ops __rcu *nf_br_ops __read_mostly;
+ EXPORT_SYMBOL_GPL(nf_br_ops);
+ 
++static struct lock_class_key bridge_netdev_addr_lock_key;
++
+ /* net device transmit always called with BH disabled */
+ netdev_tx_t br_dev_xmit(struct sk_buff *skb, struct net_device *dev)
+ {
+@@ -87,6 +89,11 @@ out:
+       return NETDEV_TX_OK;
+ }
+ 
++static void br_set_lockdep_class(struct net_device *dev)
++{
++      lockdep_set_class(&dev->addr_list_lock, &bridge_netdev_addr_lock_key);
++}
++
+ static int br_dev_init(struct net_device *dev)
+ {
+       struct net_bridge *br = netdev_priv(dev);
+@@ -99,6 +106,7 @@ static int br_dev_init(struct net_device
+       err = br_vlan_init(br);
+       if (err)
+               free_percpu(br->stats);
++      br_set_lockdep_class(dev);
+ 
+       return err;
+ }
diff --git a/queue-4.3/bridge-only-call-sbin-bridge-stp-for-the-initial-network-namespace.patch b/queue-4.3/bridge-only-call-sbin-bridge-stp-for-the-initial-network-namespace.patch

new file mode 100644 (file)

index 0000000..c75c8cd
--- /dev/null
+++ b/queue-4.3/bridge-only-call-sbin-bridge-stp-for-the-initial-network-namespace.patch
@@ -0,0 +1,45 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Hannes Frederic Sowa <hannes@stressinduktion.org>
+Date: Tue, 5 Jan 2016 10:46:00 +0100
+Subject: bridge: Only call /sbin/bridge-stp for the initial network namespace
+
+From: Hannes Frederic Sowa <hannes@stressinduktion.org>
+
+[ Upstream commit ff62198553e43cdffa9d539f6165d3e83f8a42bc ]
+
+[I stole this patch from Eric Biederman. He wrote:]
+
+> There is no defined mechanism to pass network namespace information
+> into /sbin/bridge-stp therefore don't even try to invoke it except
+> for bridge devices in the initial network namespace.
+>
+> It is possible for unprivileged users to cause /sbin/bridge-stp to be
+> invoked for any network device name which if /sbin/bridge-stp does not
+> guard against unreasonable arguments or being invoked twice on the
+> same network device could cause problems.
+
+[Hannes: changed patch to use net_eq()]
+
+Cc: Eric W. Biederman <ebiederm@xmission.com>
+Signed-off-by: Eric W. Biederman <ebiederm@xmission.com>
+Signed-off-by: Hannes Frederic Sowa <hannes@stressinduktion.org>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/bridge/br_stp_if.c |    5 ++++-
+ 1 file changed, 4 insertions(+), 1 deletion(-)
+
+--- a/net/bridge/br_stp_if.c
++++ b/net/bridge/br_stp_if.c
+@@ -130,7 +130,10 @@ static void br_stp_start(struct net_brid
+       char *envp[] = { NULL };
+       struct net_bridge_port *p;
+ 
+-      r = call_usermodehelper(BR_STP_PROG, argv, envp, UMH_WAIT_PROC);
++      if (net_eq(dev_net(br->dev), &init_net))
++              r = call_usermodehelper(BR_STP_PROG, argv, envp, UMH_WAIT_PROC);
++      else
++              r = -ENOENT;
+ 
+       spin_lock_bh(&br->lock);
+ 
diff --git a/queue-4.3/connector-bump-skb-users-before-callback-invocation.patch b/queue-4.3/connector-bump-skb-users-before-callback-invocation.patch

new file mode 100644 (file)

index 0000000..92bd189
--- /dev/null
+++ b/queue-4.3/connector-bump-skb-users-before-callback-invocation.patch
@@ -0,0 +1,54 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Florian Westphal <fw@strlen.de>
+Date: Thu, 31 Dec 2015 14:26:33 +0100
+Subject: connector: bump skb->users before callback invocation
+
+From: Florian Westphal <fw@strlen.de>
+
+[ Upstream commit 55285bf09427c5abf43ee1d54e892f352092b1f1 ]
+
+Dmitry reports a memleak with a syzkaller program.
+The problem is that connector bumps the skb usecount but might not invoke the callback.
+
+So move skb_get to where we invoke the callback.
+
+Reported-by: Dmitry Vyukov <dvyukov@google.com>
+Signed-off-by: Florian Westphal <fw@strlen.de>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/connector/connector.c |   11 +++--------
+ 1 file changed, 3 insertions(+), 8 deletions(-)
+
+--- a/drivers/connector/connector.c
++++ b/drivers/connector/connector.c
+@@ -178,26 +178,21 @@ static int cn_call_callback(struct sk_bu
+  *
+  * It checks skb, netlink header and msg sizes, and calls callback helper.
+  */
+-static void cn_rx_skb(struct sk_buff *__skb)
++static void cn_rx_skb(struct sk_buff *skb)
+ {
+       struct nlmsghdr *nlh;
+-      struct sk_buff *skb;
+       int len, err;
+ 
+-      skb = skb_get(__skb);
+-
+       if (skb->len >= NLMSG_HDRLEN) {
+               nlh = nlmsg_hdr(skb);
+               len = nlmsg_len(nlh);
+ 
+               if (len < (int)sizeof(struct cn_msg) ||
+                   skb->len < nlh->nlmsg_len ||
+-                  len > CONNECTOR_MAX_MSG_SIZE) {
+-                      kfree_skb(skb);
++                  len > CONNECTOR_MAX_MSG_SIZE)
+                       return;
+-              }
+ 
+-              err = cn_call_callback(skb);
++              err = cn_call_callback(skb_get(skb));
+               if (err < 0)
+                       kfree_skb(skb);
+       }
diff --git a/queue-4.3/dwc_eth_qos-fix-dma-address-for-multi-fragment-skbs.patch b/queue-4.3/dwc_eth_qos-fix-dma-address-for-multi-fragment-skbs.patch

new file mode 100644 (file)

index 0000000..b3358e3
--- /dev/null
+++ b/queue-4.3/dwc_eth_qos-fix-dma-address-for-multi-fragment-skbs.patch
@@ -0,0 +1,31 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Lars Persson <lars.persson@axis.com>
+Date: Tue, 12 Jan 2016 15:28:13 +0100
+Subject: dwc_eth_qos: Fix dma address for multi-fragment skbs
+
+From: Lars Persson <lars.persson@axis.com>
+
+[ Upstream commit d461873272169a3fc3a8d155d7b1c92e9d97b419 ]
+
+The offset inside the fragment was not used for the dma address and
+silent data corruption resulted because TSO makes the checksum match.
+
+Fixes: 077742dac2c7 ("dwc_eth_qos: Add support for Synopsys DWC Ethernet QoS")
+Signed-off-by: Lars Persson <larper@axis.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/net/ethernet/synopsys/dwc_eth_qos.c |    2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/drivers/net/ethernet/synopsys/dwc_eth_qos.c
++++ b/drivers/net/ethernet/synopsys/dwc_eth_qos.c
+@@ -2107,7 +2107,7 @@ static int dwceqos_tx_frags(struct sk_bu
+                       dd = &lp->tx_descs[lp->tx_next];
+ 
+                       /* Set DMA Descriptor fields */
+-                      dd->des0 = dma_handle;
++                      dd->des0 = dma_handle + consumed_size;
+                       dd->des1 = 0;
+                       dd->des2 = dma_size;
+ 
diff --git a/queue-4.3/ipv6-addrlabel-fix-ip6addrlbl_get.patch b/queue-4.3/ipv6-addrlabel-fix-ip6addrlbl_get.patch

new file mode 100644 (file)

index 0000000..c5d1c3b
--- /dev/null
+++ b/queue-4.3/ipv6-addrlabel-fix-ip6addrlbl_get.patch
@@ -0,0 +1,36 @@
+From foo@baz Tue Jan 26 21:35:02 PST 2016
+From: Andrey Ryabinin <aryabinin@virtuozzo.com>
+Date: Mon, 21 Dec 2015 12:54:45 +0300
+Subject: ipv6/addrlabel: fix ip6addrlbl_get()
+
+From: Andrey Ryabinin <aryabinin@virtuozzo.com>
+
+[ Upstream commit e459dfeeb64008b2d23bdf600f03b3605dbb8152 ]
+
+ip6addrlbl_get() has never worked. If ip6addrlbl_hold() succeeded,
+ip6addrlbl_get() will exit with '-ESRCH'. If ip6addrlbl_hold() failed,
+ip6addrlbl_get() will use an about-to-be-freed ip6addrlbl_entry pointer.
+
+Fix this by inverting ip6addrlbl_hold() check.
+
+Fixes: 2a8cc6c89039 ("[IPV6] ADDRCONF: Support RFC3484 configurable address selection policy table.")
+Signed-off-by: Andrey Ryabinin <aryabinin@virtuozzo.com>
+Reviewed-by: Cong Wang <cwang@twopensource.com>
+Acked-by: YOSHIFUJI Hideaki <yoshfuji@linux-ipv6.org>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/ipv6/addrlabel.c |    2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/net/ipv6/addrlabel.c
++++ b/net/ipv6/addrlabel.c
+@@ -552,7 +552,7 @@ static int ip6addrlbl_get(struct sk_buff
+ 
+       rcu_read_lock();
+       p = __ipv6_addr_label(net, addr, ipv6_addr_type(addr), ifal->ifal_index);
+-      if (p && ip6addrlbl_hold(p))
++      if (p && !ip6addrlbl_hold(p))
+               p = NULL;
+       lseq = ip6addrlbl_table.seq;
+       rcu_read_unlock();
diff --git a/queue-4.3/ipv6-tcp-add-rcu-locking-in-tcp_v6_send_synack.patch b/queue-4.3/ipv6-tcp-add-rcu-locking-in-tcp_v6_send_synack.patch

new file mode 100644 (file)

index 0000000..bfc8ee9
--- /dev/null
+++ b/queue-4.3/ipv6-tcp-add-rcu-locking-in-tcp_v6_send_synack.patch
@@ -0,0 +1,35 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Eric Dumazet <edumazet@google.com>
+Date: Fri, 8 Jan 2016 09:35:51 -0800
+Subject: ipv6: tcp: add rcu locking in tcp_v6_send_synack()
+
+From: Eric Dumazet <edumazet@google.com>
+
+[ Upstream commit 3e4006f0b86a5ae5eb0e8215f9a9e1db24506977 ]
+
+When first SYNACK is sent, we already hold rcu_read_lock(), but this
+is not true if a SYNACK is retransmitted, as a timer (soft) interrupt
+does not hold rcu_read_lock()
+
+Fixes: 45f6fad84cc30 ("ipv6: add complete rcu protection around np->opt")
+Reported-by: Dave Jones <davej@codemonkey.org.uk>
+Signed-off-by: Eric Dumazet <edumazet@google.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/ipv6/tcp_ipv6.c |    2 ++
+ 1 file changed, 2 insertions(+)
+
+--- a/net/ipv6/tcp_ipv6.c
++++ b/net/ipv6/tcp_ipv6.c
+@@ -462,8 +462,10 @@ static int tcp_v6_send_synack(struct soc
+                       fl6->flowlabel = ip6_flowlabel(ipv6_hdr(ireq->pktopts));
+ 
+               skb_set_queue_mapping(skb, queue_mapping);
++              rcu_read_lock();
+               err = ip6_xmit(sk, skb, fl6, rcu_dereference(np->opt),
+                              np->tclass);
++              rcu_read_unlock();
+               err = net_xmit_eval(err);
+       }
+ 
diff --git a/queue-4.3/ipv6-update-skb-csum-when-ce-mark-is-propagated.patch b/queue-4.3/ipv6-update-skb-csum-when-ce-mark-is-propagated.patch

new file mode 100644 (file)

index 0000000..40056d7
--- /dev/null
+++ b/queue-4.3/ipv6-update-skb-csum-when-ce-mark-is-propagated.patch
@@ -0,0 +1,74 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Eric Dumazet <edumazet@google.com>
+Date: Fri, 15 Jan 2016 04:56:56 -0800
+Subject: ipv6: update skb->csum when CE mark is propagated
+
+From: Eric Dumazet <edumazet@google.com>
+
+[ Upstream commit 34ae6a1aa0540f0f781dd265366036355fdc8930 ]
+
+When a tunnel decapsulates the outer header, it has to comply
+with RFC 6040 and eventually propagate CE mark into inner header.
+
+It turns out IP6_ECN_set_ce() does not correctly update skb->csum
+for CHECKSUM_COMPLETE packets, triggering infamous "hw csum failure"
+messages and stack traces.
+
+Signed-off-by: Eric Dumazet <edumazet@google.com>
+Acked-by: Herbert Xu <herbert@gondor.apana.org.au>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ include/net/inet_ecn.h       |   19 ++++++++++++++++---
+ net/ipv6/xfrm6_mode_tunnel.c |    2 +-
+ 2 files changed, 17 insertions(+), 4 deletions(-)
+
+--- a/include/net/inet_ecn.h
++++ b/include/net/inet_ecn.h
+@@ -111,11 +111,24 @@ static inline void ipv4_copy_dscp(unsign
+ 
+ struct ipv6hdr;
+ 
+-static inline int IP6_ECN_set_ce(struct ipv6hdr *iph)
++/* Note:
++ * IP_ECN_set_ce() has to tweak IPV4 checksum when setting CE,
++ * meaning both changes have no effect on skb->csum if/when CHECKSUM_COMPLETE
++ * In IPv6 case, no checksum compensates the change in IPv6 header,
++ * so we have to update skb->csum.
++ */
++static inline int IP6_ECN_set_ce(struct sk_buff *skb, struct ipv6hdr *iph)
+ {
++      __be32 from, to;
++
+       if (INET_ECN_is_not_ect(ipv6_get_dsfield(iph)))
+               return 0;
+-      *(__be32*)iph |= htonl(INET_ECN_CE << 20);
++
++      from = *(__be32 *)iph;
++      to = from | htonl(INET_ECN_CE << 20);
++      *(__be32 *)iph = to;
++      if (skb->ip_summed == CHECKSUM_COMPLETE)
++              skb->csum = csum_add(csum_sub(skb->csum, from), to);
+       return 1;
+ }
+ 
+@@ -142,7 +155,7 @@ static inline int INET_ECN_set_ce(struct
+       case cpu_to_be16(ETH_P_IPV6):
+               if (skb_network_header(skb) + sizeof(struct ipv6hdr) <=
+                   skb_tail_pointer(skb))
+-                      return IP6_ECN_set_ce(ipv6_hdr(skb));
++                      return IP6_ECN_set_ce(skb, ipv6_hdr(skb));
+               break;
+       }
+ 
+--- a/net/ipv6/xfrm6_mode_tunnel.c
++++ b/net/ipv6/xfrm6_mode_tunnel.c
+@@ -23,7 +23,7 @@ static inline void ipip6_ecn_decapsulate
+       struct ipv6hdr *inner_iph = ipipv6_hdr(skb);
+ 
+       if (INET_ECN_is_ce(XFRM_MODE_SKB_CB(skb)->tos))
+-              IP6_ECN_set_ce(inner_iph);
++              IP6_ECN_set_ce(skb, inner_iph);
+ }
+ 
+ /* Add encapsulation header.
diff --git a/queue-4.3/isdn_ppp-add-checks-for-allocation-failure-in-isdn_ppp_open.patch b/queue-4.3/isdn_ppp-add-checks-for-allocation-failure-in-isdn_ppp_open.patch

new file mode 100644 (file)

index 0000000..fecc2dd
--- /dev/null
+++ b/queue-4.3/isdn_ppp-add-checks-for-allocation-failure-in-isdn_ppp_open.patch
@@ -0,0 +1,40 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Ben Hutchings <ben@decadent.org.uk>
+Date: Sun, 1 Nov 2015 16:21:24 +0000
+Subject: isdn_ppp: Add checks for allocation failure in isdn_ppp_open()
+
+From: Ben Hutchings <ben@decadent.org.uk>
+
+[ Upstream commit 0baa57d8dc32db78369d8b5176ef56c5e2e18ab3 ]
+
+Compile-tested only.
+
+Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/isdn/i4l/isdn_ppp.c |    6 ++++++
+ 1 file changed, 6 insertions(+)
+
+--- a/drivers/isdn/i4l/isdn_ppp.c
++++ b/drivers/isdn/i4l/isdn_ppp.c
+@@ -301,6 +301,8 @@ isdn_ppp_open(int min, struct file *file
+       is->compflags = 0;
+ 
+       is->reset = isdn_ppp_ccp_reset_alloc(is);
++      if (!is->reset)
++              return -ENOMEM;
+ 
+       is->lp = NULL;
+       is->mp_seqno = 0;       /* MP sequence number */
+@@ -320,6 +322,10 @@ isdn_ppp_open(int min, struct file *file
+        * VJ header compression init
+        */
+       is->slcomp = slhc_init(16, 16); /* not necessary for 2. link in bundle */
++      if (!is->slcomp) {
++              isdn_ppp_ccp_reset_free(is);
++              return -ENOMEM;
++      }
+ #endif
+ #ifdef CONFIG_IPPP_FILTER
+       is->pass_filter = NULL;
diff --git a/queue-4.3/net-bpf-reject-invalid-shifts.patch b/queue-4.3/net-bpf-reject-invalid-shifts.patch

new file mode 100644 (file)

index 0000000..7f8d901
--- /dev/null
+++ b/queue-4.3/net-bpf-reject-invalid-shifts.patch
@@ -0,0 +1,59 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Rabin Vincent <rabin@rab.in>
+Date: Tue, 12 Jan 2016 20:17:08 +0100
+Subject: net: bpf: reject invalid shifts
+
+From: Rabin Vincent <rabin@rab.in>
+
+[ Upstream commit 229394e8e62a4191d592842cf67e80c62a492937 ]
+
+On ARM64, a BUG() is triggered in the eBPF JIT if a filter with a
+constant shift that can't be encoded in the immediate field of the
+UBFM/SBFM instructions is passed to the JIT.  Since these shift
+amounts, which are negative or >= regsize, are invalid, reject them in
+the eBPF verifier and the classic BPF filter checker, for all
+architectures.
+
+Signed-off-by: Rabin Vincent <rabin@rab.in>
+Acked-by: Alexei Starovoitov <ast@kernel.org>
+Acked-by: Daniel Borkmann <daniel@iogearbox.net>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ kernel/bpf/verifier.c |   10 ++++++++++
+ net/core/filter.c     |    5 +++++
+ 2 files changed, 15 insertions(+)
+
+--- a/kernel/bpf/verifier.c
++++ b/kernel/bpf/verifier.c
+@@ -1058,6 +1058,16 @@ static int check_alu_op(struct reg_state
+                       return -EINVAL;
+               }
+ 
++              if ((opcode == BPF_LSH || opcode == BPF_RSH ||
++                   opcode == BPF_ARSH) && BPF_SRC(insn->code) == BPF_K) {
++                      int size = BPF_CLASS(insn->code) == BPF_ALU64 ? 64 : 32;
++
++                      if (insn->imm < 0 || insn->imm >= size) {
++                              verbose("invalid shift %d\n", insn->imm);
++                              return -EINVAL;
++                      }
++              }
++
+               /* pattern match 'bpf_add Rx, imm' instruction */
+               if (opcode == BPF_ADD && BPF_CLASS(insn->code) == BPF_ALU64 &&
+                   regs[insn->dst_reg].type == FRAME_PTR &&
+--- a/net/core/filter.c
++++ b/net/core/filter.c
+@@ -781,6 +781,11 @@ static int bpf_check_classic(const struc
+                       if (ftest->k == 0)
+                               return -EINVAL;
+                       break;
++              case BPF_ALU | BPF_LSH | BPF_K:
++              case BPF_ALU | BPF_RSH | BPF_K:
++                      if (ftest->k >= 32)
++                              return -EINVAL;
++                      break;
+               case BPF_LD | BPF_MEM:
+               case BPF_LDX | BPF_MEM:
+               case BPF_ST:
diff --git a/queue-4.3/net-cdc_ncm-avoid-changing-rx-tx-buffers-on-mtu-changes.patch b/queue-4.3/net-cdc_ncm-avoid-changing-rx-tx-buffers-on-mtu-changes.patch

new file mode 100644 (file)

index 0000000..39f9810
--- /dev/null
+++ b/queue-4.3/net-cdc_ncm-avoid-changing-rx-tx-buffers-on-mtu-changes.patch
@@ -0,0 +1,112 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: =?UTF-8?q?Bj=C3=B8rn=20Mork?= <bjorn@mork.no>
+Date: Wed, 23 Dec 2015 13:42:43 +0100
+Subject: net: cdc_ncm: avoid changing RX/TX buffers on MTU changes
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+From: =?UTF-8?q?Bj=C3=B8rn=20Mork?= <bjorn@mork.no>
+
+[ Upstream commit 1dfddff5fcd869fcab0c52fafae099dfa435a935 ]
+
+NCM buffer sizes are negotiated with the device independently of
+the network device MTU.  The RX buffers are allocated by the
+usbnet framework based on the rx_urb_size value set by cdc_ncm. A
+single RX buffer can hold a number of MTU sized packets.
+
+The default usbnet change_mtu ndo only modifies rx_urb_size if it
+is equal to hard_mtu.  And the cdc_ncm driver will set rx_urb_size
+and hard_mtu independently of each other, based on dwNtbInMaxSize
+and dwNtbOutMaxSize respectively. It was therefore assumed that
+usbnet_change_mtu() would never touch rx_urb_size.  This failed to
+consider the case where dwNtbInMaxSize and dwNtbOutMaxSize happen
+to be equal.
+
+Fix by implementing an NCM specific change_mtu ndo, modifying the
+netdev MTU without touching the buffer size settings.
+
+Signed-off-by: Bjørn Mork <bjorn@mork.no>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/net/usb/cdc_mbim.c  |    2 +-
+ drivers/net/usb/cdc_ncm.c   |   31 +++++++++++++++++++++++++++++++
+ include/linux/usb/cdc_ncm.h |    1 +
+ 3 files changed, 33 insertions(+), 1 deletion(-)
+
+--- a/drivers/net/usb/cdc_mbim.c
++++ b/drivers/net/usb/cdc_mbim.c
+@@ -100,7 +100,7 @@ static const struct net_device_ops cdc_m
+       .ndo_stop             = usbnet_stop,
+       .ndo_start_xmit       = usbnet_start_xmit,
+       .ndo_tx_timeout       = usbnet_tx_timeout,
+-      .ndo_change_mtu       = usbnet_change_mtu,
++      .ndo_change_mtu       = cdc_ncm_change_mtu,
+       .ndo_set_mac_address  = eth_mac_addr,
+       .ndo_validate_addr    = eth_validate_addr,
+       .ndo_vlan_rx_add_vid  = cdc_mbim_rx_add_vid,
+--- a/drivers/net/usb/cdc_ncm.c
++++ b/drivers/net/usb/cdc_ncm.c
+@@ -41,6 +41,7 @@
+ #include <linux/module.h>
+ #include <linux/netdevice.h>
+ #include <linux/ctype.h>
++#include <linux/etherdevice.h>
+ #include <linux/ethtool.h>
+ #include <linux/workqueue.h>
+ #include <linux/mii.h>
+@@ -689,6 +690,33 @@ static void cdc_ncm_free(struct cdc_ncm_
+       kfree(ctx);
+ }
+ 
++/* we need to override the usbnet change_mtu ndo for two reasons:
++ *  - respect the negotiated maximum datagram size
++ *  - avoid unwanted changes to rx and tx buffers
++ */
++int cdc_ncm_change_mtu(struct net_device *net, int new_mtu)
++{
++      struct usbnet *dev = netdev_priv(net);
++      struct cdc_ncm_ctx *ctx = (struct cdc_ncm_ctx *)dev->data[0];
++      int maxmtu = ctx->max_datagram_size - cdc_ncm_eth_hlen(dev);
++
++      if (new_mtu <= 0 || new_mtu > maxmtu)
++              return -EINVAL;
++      net->mtu = new_mtu;
++      return 0;
++}
++EXPORT_SYMBOL_GPL(cdc_ncm_change_mtu);
++
++static const struct net_device_ops cdc_ncm_netdev_ops = {
++      .ndo_open            = usbnet_open,
++      .ndo_stop            = usbnet_stop,
++      .ndo_start_xmit      = usbnet_start_xmit,
++      .ndo_tx_timeout      = usbnet_tx_timeout,
++      .ndo_change_mtu      = cdc_ncm_change_mtu,
++      .ndo_set_mac_address = eth_mac_addr,
++      .ndo_validate_addr   = eth_validate_addr,
++};
++
+ int cdc_ncm_bind_common(struct usbnet *dev, struct usb_interface *intf, u8 data_altsetting, int drvflags)
+ {
+       const struct usb_cdc_union_desc *union_desc = NULL;
+@@ -874,6 +902,9 @@ advance:
+       /* add our sysfs attrs */
+       dev->net->sysfs_groups[0] = &cdc_ncm_sysfs_attr_group;
+ 
++      /* must handle MTU changes */
++      dev->net->netdev_ops = &cdc_ncm_netdev_ops;
++
+       return 0;
+ 
+ error2:
+--- a/include/linux/usb/cdc_ncm.h
++++ b/include/linux/usb/cdc_ncm.h
+@@ -138,6 +138,7 @@ struct cdc_ncm_ctx {
+ };
+ 
+ u8 cdc_ncm_select_altsetting(struct usb_interface *intf);
++int cdc_ncm_change_mtu(struct net_device *net, int new_mtu);
+ int cdc_ncm_bind_common(struct usbnet *dev, struct usb_interface *intf, u8 data_altsetting, int drvflags);
+ void cdc_ncm_unbind(struct usbnet *dev, struct usb_interface *intf);
+ struct sk_buff *cdc_ncm_fill_tx_frame(struct usbnet *dev, struct sk_buff *skb, __le32 sign);
diff --git a/queue-4.3/net-filter-make-jits-zero-a-for-skf_ad_alu_xor_x.patch b/queue-4.3/net-filter-make-jits-zero-a-for-skf_ad_alu_xor_x.patch

new file mode 100644 (file)

index 0000000..736bc2d
--- /dev/null
+++ b/queue-4.3/net-filter-make-jits-zero-a-for-skf_ad_alu_xor_x.patch
@@ -0,0 +1,189 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Rabin Vincent <rabin@rab.in>
+Date: Tue, 5 Jan 2016 16:23:07 +0100
+Subject: net: filter: make JITs zero A for SKF_AD_ALU_XOR_X
+
+From: Rabin Vincent <rabin@rab.in>
+
+[ Upstream commit 55795ef5469290f89f04e12e662ded604909e462 ]
+
+The SKF_AD_ALU_XOR_X ancillary is not like the other ancillary data
+instructions since it XORs A with X while all the others replace A with
+some loaded value.  All the BPF JITs fail to clear A if this is used as
+the first instruction in a filter.  This was found using american fuzzy
+lop.
+
+Add a helper to determine if A needs to be cleared given the first
+instruction in a filter, and use this in the JITs.  Except for ARM, the
+rest have only been compile-tested.
+
+Fixes: 3480593131e0 ("net: filter: get rid of BPF_S_* enum")
+Signed-off-by: Rabin Vincent <rabin@rab.in>
+Acked-by: Daniel Borkmann <daniel@iogearbox.net>
+Acked-by: Alexei Starovoitov <ast@kernel.org>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ arch/arm/net/bpf_jit_32.c       |   16 +---------------
+ arch/mips/net/bpf_jit.c         |   16 +---------------
+ arch/powerpc/net/bpf_jit_comp.c |   13 ++-----------
+ arch/sparc/net/bpf_jit_comp.c   |   17 ++---------------
+ include/linux/filter.h          |   19 +++++++++++++++++++
+ 5 files changed, 25 insertions(+), 56 deletions(-)
+
+--- a/arch/arm/net/bpf_jit_32.c
++++ b/arch/arm/net/bpf_jit_32.c
+@@ -182,19 +182,6 @@ static inline int mem_words_used(struct
+       return fls(ctx->seen & SEEN_MEM);
+ }
+ 
+-static inline bool is_load_to_a(u16 inst)
+-{
+-      switch (inst) {
+-      case BPF_LD | BPF_W | BPF_LEN:
+-      case BPF_LD | BPF_W | BPF_ABS:
+-      case BPF_LD | BPF_H | BPF_ABS:
+-      case BPF_LD | BPF_B | BPF_ABS:
+-              return true;
+-      default:
+-              return false;
+-      }
+-}
+-
+ static void jit_fill_hole(void *area, unsigned int size)
+ {
+       u32 *ptr;
+@@ -206,7 +193,6 @@ static void jit_fill_hole(void *area, un
+ static void build_prologue(struct jit_ctx *ctx)
+ {
+       u16 reg_set = saved_regs(ctx);
+-      u16 first_inst = ctx->skf->insns[0].code;
+       u16 off;
+ 
+ #ifdef CONFIG_FRAME_POINTER
+@@ -236,7 +222,7 @@ static void build_prologue(struct jit_ct
+               emit(ARM_MOV_I(r_X, 0), ctx);
+ 
+       /* do not leak kernel data to userspace */
+-      if ((first_inst != (BPF_RET | BPF_K)) && !(is_load_to_a(first_inst)))
++      if (bpf_needs_clear_a(&ctx->skf->insns[0]))
+               emit(ARM_MOV_I(r_A, 0), ctx);
+ 
+       /* stack space for the BPF_MEM words */
+--- a/arch/mips/net/bpf_jit.c
++++ b/arch/mips/net/bpf_jit.c
+@@ -521,19 +521,6 @@ static inline u16 align_sp(unsigned int
+       return num;
+ }
+ 
+-static bool is_load_to_a(u16 inst)
+-{
+-      switch (inst) {
+-      case BPF_LD | BPF_W | BPF_LEN:
+-      case BPF_LD | BPF_W | BPF_ABS:
+-      case BPF_LD | BPF_H | BPF_ABS:
+-      case BPF_LD | BPF_B | BPF_ABS:
+-              return true;
+-      default:
+-              return false;
+-      }
+-}
+-
+ static void save_bpf_jit_regs(struct jit_ctx *ctx, unsigned offset)
+ {
+       int i = 0, real_off = 0;
+@@ -614,7 +601,6 @@ static unsigned int get_stack_depth(stru
+ 
+ static void build_prologue(struct jit_ctx *ctx)
+ {
+-      u16 first_inst = ctx->skf->insns[0].code;
+       int sp_off;
+ 
+       /* Calculate the total offset for the stack pointer */
+@@ -641,7 +627,7 @@ static void build_prologue(struct jit_ct
+               emit_jit_reg_move(r_X, r_zero, ctx);
+ 
+       /* Do not leak kernel data to userspace */
+-      if ((first_inst != (BPF_RET | BPF_K)) && !(is_load_to_a(first_inst)))
++      if (bpf_needs_clear_a(&ctx->skf->insns[0]))
+               emit_jit_reg_move(r_A, r_zero, ctx);
+ }
+ 
+--- a/arch/powerpc/net/bpf_jit_comp.c
++++ b/arch/powerpc/net/bpf_jit_comp.c
+@@ -78,18 +78,9 @@ static void bpf_jit_build_prologue(struc
+               PPC_LI(r_X, 0);
+       }
+ 
+-      switch (filter[0].code) {
+-      case BPF_RET | BPF_K:
+-      case BPF_LD | BPF_W | BPF_LEN:
+-      case BPF_LD | BPF_W | BPF_ABS:
+-      case BPF_LD | BPF_H | BPF_ABS:
+-      case BPF_LD | BPF_B | BPF_ABS:
+-              /* first instruction sets A register (or is RET 'constant') */
+-              break;
+-      default:
+-              /* make sure we dont leak kernel information to user */
++      /* make sure we dont leak kernel information to user */
++      if (bpf_needs_clear_a(&filter[0]))
+               PPC_LI(r_A, 0);
+-      }
+ }
+ 
+ static void bpf_jit_build_epilogue(u32 *image, struct codegen_context *ctx)
+--- a/arch/sparc/net/bpf_jit_comp.c
++++ b/arch/sparc/net/bpf_jit_comp.c
+@@ -420,22 +420,9 @@ void bpf_jit_compile(struct bpf_prog *fp
+               }
+               emit_reg_move(O7, r_saved_O7);
+ 
+-              switch (filter[0].code) {
+-              case BPF_RET | BPF_K:
+-              case BPF_LD | BPF_W | BPF_LEN:
+-              case BPF_LD | BPF_W | BPF_ABS:
+-              case BPF_LD | BPF_H | BPF_ABS:
+-              case BPF_LD | BPF_B | BPF_ABS:
+-                      /* The first instruction sets the A register (or is
+-                       * a "RET 'constant'")
+-                       */
+-                      break;
+-              default:
+-                      /* Make sure we dont leak kernel information to the
+-                       * user.
+-                       */
++              /* Make sure we dont leak kernel information to the user. */
++              if (bpf_needs_clear_a(&filter[0]))
+                       emit_clear(r_A); /* A = 0 */
+-              }
+ 
+               for (i = 0; i < flen; i++) {
+                       unsigned int K = filter[i].k;
+--- a/include/linux/filter.h
++++ b/include/linux/filter.h
+@@ -459,6 +459,25 @@ static inline void bpf_jit_free(struct b
+ 
+ #define BPF_ANC               BIT(15)
+ 
++static inline bool bpf_needs_clear_a(const struct sock_filter *first)
++{
++      switch (first->code) {
++      case BPF_RET | BPF_K:
++      case BPF_LD | BPF_W | BPF_LEN:
++              return false;
++
++      case BPF_LD | BPF_W | BPF_ABS:
++      case BPF_LD | BPF_H | BPF_ABS:
++      case BPF_LD | BPF_B | BPF_ABS:
++              if (first->k == SKF_AD_OFF + SKF_AD_ALU_XOR_X)
++                      return true;
++              return false;
++
++      default:
++              return true;
++      }
++}
++
+ static inline u16 bpf_anc_helper(const struct sock_filter *ftest)
+ {
+       BUG_ON(ftest->code & BPF_ANC);
diff --git a/queue-4.3/net-mlx5_core-fix-trimming-down-irq-number.patch b/queue-4.3/net-mlx5_core-fix-trimming-down-irq-number.patch

new file mode 100644 (file)

index 0000000..e6ff0d9
--- /dev/null
+++ b/queue-4.3/net-mlx5_core-fix-trimming-down-irq-number.patch
@@ -0,0 +1,124 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Doron Tsur <doront@mellanox.com>
+Date: Sun, 17 Jan 2016 11:25:47 +0200
+Subject: net/mlx5_core: Fix trimming down IRQ number
+
+From: Doron Tsur <doront@mellanox.com>
+
+[ Upstream commit 0b6e26ce89391327d955a756a7823272238eb867 ]
+
+With several ConnectX-4 cards installed on a server, one may receive
+irqn > 255 from the kernel API, which we mistakenly trim to 8bit.
+
+This causes EQ creation failure with the following stack trace:
+[<ffffffff812a11f4>] dump_stack+0x48/0x64
+[<ffffffff810ace21>] __setup_irq+0x3a1/0x4f0
+[<ffffffff810ad7e0>] request_threaded_irq+0x120/0x180
+[<ffffffffa0923660>] ? mlx5_eq_int+0x450/0x450 [mlx5_core]
+[<ffffffffa0922f64>] mlx5_create_map_eq+0x1e4/0x2b0 [mlx5_core]
+[<ffffffffa091de01>] alloc_comp_eqs+0xb1/0x180 [mlx5_core]
+[<ffffffffa091ea99>] mlx5_dev_init+0x5e9/0x6e0 [mlx5_core]
+[<ffffffffa091ec29>] init_one+0x99/0x1c0 [mlx5_core]
+[<ffffffff812e2afc>] local_pci_probe+0x4c/0xa0
+
+Fix it by changing the irqn type from u8 to unsigned int to
+support values > 255.
+
+Fixes: 61d0e73e0a5a ('net/mlx5_core: Use the the real irqn in eq->irqn')
+Reported-by: Jiri Pirko <jiri@mellanox.com>
+Signed-off-by: Doron Tsur <doront@mellanox.com>
+Signed-off-by: Matan Barak <matanb@mellanox.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/infiniband/hw/mlx5/cq.c                   |    2 +-
+ drivers/net/ethernet/mellanox/mlx5/core/en_main.c |    6 +++---
+ drivers/net/ethernet/mellanox/mlx5/core/main.c    |    3 ++-
+ include/linux/mlx5/cq.h                           |    2 +-
+ include/linux/mlx5/driver.h                       |    5 +++--
+ 5 files changed, 10 insertions(+), 8 deletions(-)
+
+--- a/drivers/infiniband/hw/mlx5/cq.c
++++ b/drivers/infiniband/hw/mlx5/cq.c
+@@ -756,7 +756,7 @@ struct ib_cq *mlx5_ib_create_cq(struct i
+       int uninitialized_var(index);
+       int uninitialized_var(inlen);
+       int cqe_size;
+-      int irqn;
++      unsigned int irqn;
+       int eqn;
+       int err;
+ 
+--- a/drivers/net/ethernet/mellanox/mlx5/core/en_main.c
++++ b/drivers/net/ethernet/mellanox/mlx5/core/en_main.c
+@@ -746,7 +746,7 @@ static int mlx5e_create_cq(struct mlx5e_
+       struct mlx5_core_dev *mdev = priv->mdev;
+       struct mlx5_core_cq *mcq = &cq->mcq;
+       int eqn_not_used;
+-      int irqn;
++      unsigned int irqn;
+       int err;
+       u32 i;
+ 
+@@ -800,7 +800,7 @@ static int mlx5e_enable_cq(struct mlx5e_
+       void *in;
+       void *cqc;
+       int inlen;
+-      int irqn_not_used;
++      unsigned int irqn_not_used;
+       int eqn;
+       int err;
+ 
+@@ -1498,7 +1498,7 @@ static int mlx5e_create_drop_cq(struct m
+       struct mlx5_core_dev *mdev = priv->mdev;
+       struct mlx5_core_cq *mcq = &cq->mcq;
+       int eqn_not_used;
+-      int irqn;
++      unsigned int irqn;
+       int err;
+ 
+       err = mlx5_cqwq_create(mdev, &param->wq, param->cqc, &cq->wq,
+--- a/drivers/net/ethernet/mellanox/mlx5/core/main.c
++++ b/drivers/net/ethernet/mellanox/mlx5/core/main.c
+@@ -520,7 +520,8 @@ static void mlx5_irq_clear_affinity_hint
+               mlx5_irq_clear_affinity_hint(mdev, i);
+ }
+ 
+-int mlx5_vector2eqn(struct mlx5_core_dev *dev, int vector, int *eqn, int *irqn)
++int mlx5_vector2eqn(struct mlx5_core_dev *dev, int vector, int *eqn,
++                  unsigned int *irqn)
+ {
+       struct mlx5_eq_table *table = &dev->priv.eq_table;
+       struct mlx5_eq *eq, *n;
+--- a/include/linux/mlx5/cq.h
++++ b/include/linux/mlx5/cq.h
+@@ -45,7 +45,7 @@ struct mlx5_core_cq {
+       atomic_t                refcount;
+       struct completion       free;
+       unsigned                vector;
+-      int                     irqn;
++      unsigned int            irqn;
+       void (*comp)            (struct mlx5_core_cq *);
+       void (*event)           (struct mlx5_core_cq *, enum mlx5_event);
+       struct mlx5_uar        *uar;
+--- a/include/linux/mlx5/driver.h
++++ b/include/linux/mlx5/driver.h
+@@ -303,7 +303,7 @@ struct mlx5_eq {
+       u32                     cons_index;
+       struct mlx5_buf         buf;
+       int                     size;
+-      u8                      irqn;
++      unsigned int            irqn;
+       u8                      eqn;
+       int                     nent;
+       u64                     mask;
+@@ -738,7 +738,8 @@ int mlx5_create_map_eq(struct mlx5_core_
+ int mlx5_destroy_unmap_eq(struct mlx5_core_dev *dev, struct mlx5_eq *eq);
+ int mlx5_start_eqs(struct mlx5_core_dev *dev);
+ int mlx5_stop_eqs(struct mlx5_core_dev *dev);
+-int mlx5_vector2eqn(struct mlx5_core_dev *dev, int vector, int *eqn, int *irqn);
++int mlx5_vector2eqn(struct mlx5_core_dev *dev, int vector, int *eqn,
++                  unsigned int *irqn);
+ int mlx5_core_attach_mcg(struct mlx5_core_dev *dev, union ib_gid *mgid, u32 qpn);
+ int mlx5_core_detach_mcg(struct mlx5_core_dev *dev, union ib_gid *mgid, u32 qpn);
+ 
diff --git a/queue-4.3/net-pktgen-fix-null-ptr-deref-in-skb-allocation.patch b/queue-4.3/net-pktgen-fix-null-ptr-deref-in-skb-allocation.patch

new file mode 100644 (file)

index 0000000..46626ce
--- /dev/null
+++ b/queue-4.3/net-pktgen-fix-null-ptr-deref-in-skb-allocation.patch
@@ -0,0 +1,33 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: John Fastabend <john.fastabend@gmail.com>
+Date: Sun, 10 Jan 2016 21:38:44 -0800
+Subject: net: pktgen: fix null ptr deref in skb allocation
+
+From: John Fastabend <john.fastabend@gmail.com>
+
+[ Upstream commit 3de03596dfeee48bc803c1d1a6daf60a459929f3 ]
+
+Fix possible null pointer dereference that may occur when calling
+skb_reserve() on a null skb.
+
+Fixes: 879c7220e82 ("net: pktgen: Observe needed_headroom of the device")
+Signed-off-by: John Fastabend <john.r.fastabend@intel.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/core/pktgen.c |    4 +++-
+ 1 file changed, 3 insertions(+), 1 deletion(-)
+
+--- a/net/core/pktgen.c
++++ b/net/core/pktgen.c
+@@ -2787,7 +2787,9 @@ static struct sk_buff *pktgen_alloc_skb(
+       } else {
+                skb = __netdev_alloc_skb(dev, size, GFP_NOWAIT);
+       }
+-      skb_reserve(skb, LL_RESERVED_SPACE(dev));
++
++      if (likely(skb))
++              skb_reserve(skb, LL_RESERVED_SPACE(dev));
+ 
+       return skb;
+ }
diff --git a/queue-4.3/net-possible-use-after-free-in-dst_release.patch b/queue-4.3/net-possible-use-after-free-in-dst_release.patch

new file mode 100644 (file)

index 0000000..d36c57f
--- /dev/null
+++ b/queue-4.3/net-possible-use-after-free-in-dst_release.patch
@@ -0,0 +1,41 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Francesco Ruggeri <fruggeri@aristanetworks.com>
+Date: Wed, 6 Jan 2016 00:18:48 -0800
+Subject: net: possible use after free in dst_release
+
+From: Francesco Ruggeri <fruggeri@aristanetworks.com>
+
+[ Upstream commit 07a5d38453599052aff0877b16bb9c1585f08609 ]
+
+dst_release should not access dst->flags after decrementing
+__refcnt to 0. The dst_entry may be in dst_busy_list and
+dst_gc_task may dst_destroy it before dst_release gets a chance
+to access dst->flags.
+
+Fixes: d69bbf88c8d0 ("net: fix a race in dst_release()")
+Fixes: 27b75c95f10d ("net: avoid RCU for NOCACHE dst")
+Signed-off-by: Francesco Ruggeri <fruggeri@arista.com>
+Acked-by: Eric Dumazet <edumazet@google.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/core/dst.c |    3 ++-
+ 1 file changed, 2 insertions(+), 1 deletion(-)
+
+--- a/net/core/dst.c
++++ b/net/core/dst.c
+@@ -301,12 +301,13 @@ void dst_release(struct dst_entry *dst)
+ {
+       if (dst) {
+               int newrefcnt;
++              unsigned short nocache = dst->flags & DST_NOCACHE;
+ 
+               newrefcnt = atomic_dec_return(&dst->__refcnt);
+               if (unlikely(newrefcnt < 0))
+                       net_warn_ratelimited("%s: dst:%p refcnt:%d\n",
+                                            __func__, dst, newrefcnt);
+-              if (!newrefcnt && unlikely(dst->flags & DST_NOCACHE))
++              if (!newrefcnt && unlikely(nocache))
+                       call_rcu(&dst->rcu_head, dst_destroy_rcu);
+       }
+ }
diff --git a/queue-4.3/net-preserve-ip-control-block-during-gso-segmentation.patch b/queue-4.3/net-preserve-ip-control-block-during-gso-segmentation.patch

new file mode 100644 (file)

index 0000000..e56d89c
--- /dev/null
+++ b/queue-4.3/net-preserve-ip-control-block-during-gso-segmentation.patch
@@ -0,0 +1,107 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Konstantin Khlebnikov <koct9i@gmail.com>
+Date: Fri, 8 Jan 2016 15:21:46 +0300
+Subject: net: preserve IP control block during GSO segmentation
+
+From: Konstantin Khlebnikov <koct9i@gmail.com>
+
+[ Upstream commit 9207f9d45b0ad071baa128e846d7e7ed85016df3 ]
+
+skb_gso_segment() uses the skb control block during segmentation.
+This patch adds 32 bytes of room for the previous control block, which
+will be copied into all resulting segments.
+
+This patch fixes a kernel crash when fragmenting forwarded packets.
+Fragmentation requires a valid IP CB in the skb for clearing IP options.
+Also remove the custom save/restore in the ovs code, which is now redundant.
+
+Signed-off-by: Konstantin Khlebnikov <koct9i@gmail.com>
+Link: http://lkml.kernel.org/r/CALYGNiP-0MZ-FExV2HutTvE9U-QQtkKSoE--KN=JQE5STYsjAA@mail.gmail.com
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ include/linux/skbuff.h     |    3 ++-
+ net/core/dev.c             |    5 +++++
+ net/ipv4/ip_output.c       |    1 +
+ net/openvswitch/datapath.c |    5 +----
+ net/xfrm/xfrm_output.c     |    2 ++
+ 5 files changed, 11 insertions(+), 5 deletions(-)
+
+--- a/include/linux/skbuff.h
++++ b/include/linux/skbuff.h
+@@ -3437,7 +3437,8 @@ struct skb_gso_cb {
+       int     encap_level;
+       __u16   csum_start;
+ };
+-#define SKB_GSO_CB(skb) ((struct skb_gso_cb *)(skb)->cb)
++#define SKB_SGO_CB_OFFSET     32
++#define SKB_GSO_CB(skb) ((struct skb_gso_cb *)((skb)->cb + SKB_SGO_CB_OFFSET))
+ 
+ static inline int skb_tnl_header_len(const struct sk_buff *inner_skb)
+ {
+--- a/net/core/dev.c
++++ b/net/core/dev.c
+@@ -2539,6 +2539,8 @@ static inline bool skb_needs_check(struc
+  *
+  *    It may return NULL if the skb requires no segmentation.  This is
+  *    only possible when GSO is used for verifying header integrity.
++ *
++ *    Segmentation preserves SKB_SGO_CB_OFFSET bytes of previous skb cb.
+  */
+ struct sk_buff *__skb_gso_segment(struct sk_buff *skb,
+                                 netdev_features_t features, bool tx_path)
+@@ -2553,6 +2555,9 @@ struct sk_buff *__skb_gso_segment(struct
+                       return ERR_PTR(err);
+       }
+ 
++      BUILD_BUG_ON(SKB_SGO_CB_OFFSET +
++                   sizeof(*SKB_GSO_CB(skb)) > sizeof(skb->cb));
++
+       SKB_GSO_CB(skb)->mac_offset = skb_headroom(skb);
+       SKB_GSO_CB(skb)->encap_level = 0;
+ 
+--- a/net/ipv4/ip_output.c
++++ b/net/ipv4/ip_output.c
+@@ -240,6 +240,7 @@ static int ip_finish_output_gso(struct s
+        * from host network stack.
+        */
+       features = netif_skb_features(skb);
++      BUILD_BUG_ON(sizeof(*IPCB(skb)) > SKB_SGO_CB_OFFSET);
+       segs = skb_gso_segment(skb, features & ~NETIF_F_GSO_MASK);
+       if (IS_ERR_OR_NULL(segs)) {
+               kfree_skb(skb);
+--- a/net/openvswitch/datapath.c
++++ b/net/openvswitch/datapath.c
+@@ -337,12 +337,10 @@ static int queue_gso_packets(struct data
+       unsigned short gso_type = skb_shinfo(skb)->gso_type;
+       struct sw_flow_key later_key;
+       struct sk_buff *segs, *nskb;
+-      struct ovs_skb_cb ovs_cb;
+       int err;
+ 
+-      ovs_cb = *OVS_CB(skb);
++      BUILD_BUG_ON(sizeof(*OVS_CB(skb)) > SKB_SGO_CB_OFFSET);
+       segs = __skb_gso_segment(skb, NETIF_F_SG, false);
+-      *OVS_CB(skb) = ovs_cb;
+       if (IS_ERR(segs))
+               return PTR_ERR(segs);
+       if (segs == NULL)
+@@ -360,7 +358,6 @@ static int queue_gso_packets(struct data
+       /* Queue all of the segments. */
+       skb = segs;
+       do {
+-              *OVS_CB(skb) = ovs_cb;
+               if (gso_type & SKB_GSO_UDP && skb != segs)
+                       key = &later_key;
+ 
+--- a/net/xfrm/xfrm_output.c
++++ b/net/xfrm/xfrm_output.c
+@@ -165,6 +165,8 @@ static int xfrm_output_gso(struct sock *
+ {
+       struct sk_buff *segs;
+ 
++      BUILD_BUG_ON(sizeof(*IPCB(skb)) > SKB_SGO_CB_OFFSET);
++      BUILD_BUG_ON(sizeof(*IP6CB(skb)) > SKB_SGO_CB_OFFSET);
+       segs = skb_gso_segment(skb, 0);
+       kfree_skb(skb);
+       if (IS_ERR(segs))
diff --git a/queue-4.3/net-sched-fix-missing-free-per-cpu-on-qstats.patch b/queue-4.3/net-sched-fix-missing-free-per-cpu-on-qstats.patch

new file mode 100644 (file)

index 0000000..fadaf18
--- /dev/null
+++ b/queue-4.3/net-sched-fix-missing-free-per-cpu-on-qstats.patch
@@ -0,0 +1,36 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: John Fastabend <john.fastabend@gmail.com>
+Date: Tue, 5 Jan 2016 09:11:36 -0800
+Subject: net: sched: fix missing free per cpu on qstats
+
+From: John Fastabend <john.fastabend@gmail.com>
+
+[ Upstream commit 73c20a8b7245273125cfe92c4b46e6fdb568a801 ]
+
+When a qdisc is using per cpu stats (currently just the ingress
+qdisc) only the bstats are being freed. This patch also frees the qstats.
+
+Fixes: b0ab6f92752b9f9d8 ("net: sched: enable per cpu qstats")
+Signed-off-by: John Fastabend <john.r.fastabend@intel.com>
+Acked-by: Eric Dumazet <edumazet@google.com>
+Acked-by: Daniel Borkmann <daniel@iogearbox.net>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/sched/sch_generic.c |    4 +++-
+ 1 file changed, 3 insertions(+), 1 deletion(-)
+
+--- a/net/sched/sch_generic.c
++++ b/net/sched/sch_generic.c
+@@ -658,8 +658,10 @@ static void qdisc_rcu_free(struct rcu_he
+ {
+       struct Qdisc *qdisc = container_of(head, struct Qdisc, rcu_head);
+ 
+-      if (qdisc_is_percpu_stats(qdisc))
++      if (qdisc_is_percpu_stats(qdisc)) {
+               free_percpu(qdisc->cpu_bstats);
++              free_percpu(qdisc->cpu_qstats);
++      }
+ 
+       kfree((char *) qdisc - qdisc->padded);
+ }
diff --git a/queue-4.3/net-sctp-prevent-writes-to-cookie_hmac_alg-from-accessing-invalid-memory.patch b/queue-4.3/net-sctp-prevent-writes-to-cookie_hmac_alg-from-accessing-invalid-memory.patch

new file mode 100644 (file)

index 0000000..c4cf317
--- /dev/null
+++ b/queue-4.3/net-sctp-prevent-writes-to-cookie_hmac_alg-from-accessing-invalid-memory.patch
@@ -0,0 +1,34 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Sasha Levin <sasha.levin@oracle.com>
+Date: Thu, 7 Jan 2016 14:52:43 -0500
+Subject: net: sctp: prevent writes to cookie_hmac_alg from accessing invalid memory
+
+From: Sasha Levin <sasha.levin@oracle.com>
+
+[ Upstream commit 320f1a4a175e7cd5d3f006f92b4d4d3e2cbb7bb5 ]
+
+proc_dostring() needs an initialized destination string, while the one
+provided in proc_sctp_do_hmac_alg() contains stack garbage.
+
+Thus, writing to cookie_hmac_alg would strlen() that garbage and end up
+accessing invalid memory.
+
+Fixes: 3c68198e7 ("sctp: Make hmac algorithm selection for cookie generation dynamic")
+Signed-off-by: Sasha Levin <sasha.levin@oracle.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/sctp/sysctl.c |    2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/net/sctp/sysctl.c
++++ b/net/sctp/sysctl.c
+@@ -320,7 +320,7 @@ static int proc_sctp_do_hmac_alg(struct
+       struct ctl_table tbl;
+       bool changed = false;
+       char *none = "none";
+-      char tmp[8];
++      char tmp[8] = {0};
+       int ret;
+ 
+       memset(&tbl, 0, sizeof(struct ctl_table));
diff --git a/queue-4.3/openvswitch-correct-encoding-of-set-tunnel-action-attributes.patch b/queue-4.3/openvswitch-correct-encoding-of-set-tunnel-action-attributes.patch

new file mode 100644 (file)

index 0000000..e4a8277
--- /dev/null
+++ b/queue-4.3/openvswitch-correct-encoding-of-set-tunnel-action-attributes.patch
@@ -0,0 +1,37 @@
+From foo@baz Tue Jan 26 21:35:02 PST 2016
+From: Simon Horman <simon.horman@netronome.com>
+Date: Fri, 18 Dec 2015 19:43:15 +0900
+Subject: openvswitch: correct encoding of set tunnel action attributes
+
+From: Simon Horman <simon.horman@netronome.com>
+
+[ Upstream commit e905eabc90a5b787d8708df164543ee295bea5f2 ]
+
+In a set action tunnel attributes should be encoded in a
+nested action.
+
+I noticed this because ovs-dpctl was reporting an error
+when dumping flows due to the incorrect encoding of tunnel attributes
+in a set action.
+
+Fixes: fc4099f17240 ("openvswitch: Fix egress tunnel info.")
+Signed-off-by: Simon Horman <simon.horman@netronome.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/openvswitch/flow_netlink.c |    4 +++-
+ 1 file changed, 3 insertions(+), 1 deletion(-)
+
+--- a/net/openvswitch/flow_netlink.c
++++ b/net/openvswitch/flow_netlink.c
+@@ -2382,7 +2382,9 @@ static int set_action_to_attr(const stru
+               if (!start)
+                       return -EMSGSIZE;
+ 
+-              err = ovs_nla_put_tunnel_info(skb, tun_info);
++              err =  ipv4_tun_to_nlattr(skb, &tun_info->key,
++                                        ip_tunnel_info_opts(tun_info),
++                                        tun_info->options_len);
+               if (err)
+                       return err;
+               nla_nest_end(skb, start);
diff --git a/queue-4.3/phonet-properly-unshare-skbs-in-phonet_rcv.patch b/queue-4.3/phonet-properly-unshare-skbs-in-phonet_rcv.patch

new file mode 100644 (file)

index 0000000..4338a7f
--- /dev/null
+++ b/queue-4.3/phonet-properly-unshare-skbs-in-phonet_rcv.patch
@@ -0,0 +1,45 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Eric Dumazet <edumazet@google.com>
+Date: Tue, 12 Jan 2016 08:58:00 -0800
+Subject: phonet: properly unshare skbs in phonet_rcv()
+
+From: Eric Dumazet <edumazet@google.com>
+
+[ Upstream commit 7aaed57c5c2890634cfadf725173c7c68ea4cb4f ]
+
+Ivaylo Dimitrov reported a regression caused by commit 7866a621043f
+("dev: add per net_device packet type chains").
+
+skb->dev becomes NULL and we crash in __netif_receive_skb_core().
+
+Before the above commit, different kinds of bugs or corruption could happen
+without a major crash.
+
+But the root cause is that phonet_rcv() can queue skb without checking
+if skb is shared or not.
+
+Many thanks to Ivaylo Dimitrov for his help, diagnosis and tests.
+
+Reported-by: Ivaylo Dimitrov <ivo.g.dimitrov.75@gmail.com>
+Tested-by: Ivaylo Dimitrov <ivo.g.dimitrov.75@gmail.com>
+Signed-off-by: Eric Dumazet <edumazet@google.com>
+Cc: Remi Denis-Courmont <courmisch@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/phonet/af_phonet.c |    4 ++++
+ 1 file changed, 4 insertions(+)
+
+--- a/net/phonet/af_phonet.c
++++ b/net/phonet/af_phonet.c
+@@ -377,6 +377,10 @@ static int phonet_rcv(struct sk_buff *sk
+       struct sockaddr_pn sa;
+       u16 len;
+ 
++      skb = skb_share_check(skb, GFP_ATOMIC);
++      if (!skb)
++              return NET_RX_DROP;
++
+       /* check we have at least a full Phonet header */
+       if (!pskb_pull(skb, sizeof(struct phonethdr)))
+               goto out;
diff --git a/queue-4.3/ppp-slip-validate-vj-compression-slot-parameters-completely.patch b/queue-4.3/ppp-slip-validate-vj-compression-slot-parameters-completely.patch

new file mode 100644 (file)

index 0000000..e260932
--- /dev/null
+++ b/queue-4.3/ppp-slip-validate-vj-compression-slot-parameters-completely.patch
@@ -0,0 +1,133 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Ben Hutchings <ben@decadent.org.uk>
+Date: Sun, 1 Nov 2015 16:22:53 +0000
+Subject: ppp, slip: Validate VJ compression slot parameters completely
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+From: Ben Hutchings <ben@decadent.org.uk>
+
+[ Upstream commit 4ab42d78e37a294ac7bc56901d563c642e03c4ae ]
+
+Currently slhc_init() treats out-of-range values of rslots and tslots
+as equivalent to 0, except that if tslots is too large it will
+dereference a null pointer (CVE-2015-7799).
+
+Add a range-check at the top of the function and make it return an
+ERR_PTR() on error instead of NULL.  Change the callers accordingly.
+
+Compile-tested only.
+
+Reported-by: 郭永刚 <guoyonggang@360.cn>
+References: http://article.gmane.org/gmane.comp.security.oss.general/17908
+Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/isdn/i4l/isdn_ppp.c   |   10 ++++------
+ drivers/net/ppp/ppp_generic.c |    6 ++----
+ drivers/net/slip/slhc.c       |   12 ++++++++----
+ drivers/net/slip/slip.c       |    2 +-
+ 4 files changed, 15 insertions(+), 15 deletions(-)
+
+--- a/drivers/isdn/i4l/isdn_ppp.c
++++ b/drivers/isdn/i4l/isdn_ppp.c
+@@ -322,9 +322,9 @@ isdn_ppp_open(int min, struct file *file
+        * VJ header compression init
+        */
+       is->slcomp = slhc_init(16, 16); /* not necessary for 2. link in bundle */
+-      if (!is->slcomp) {
++      if (IS_ERR(is->slcomp)) {
+               isdn_ppp_ccp_reset_free(is);
+-              return -ENOMEM;
++              return PTR_ERR(is->slcomp);
+       }
+ #endif
+ #ifdef CONFIG_IPPP_FILTER
+@@ -573,10 +573,8 @@ isdn_ppp_ioctl(int min, struct file *fil
+                       is->maxcid = val;
+ #ifdef CONFIG_ISDN_PPP_VJ
+                       sltmp = slhc_init(16, val);
+-                      if (!sltmp) {
+-                              printk(KERN_ERR "ippp, can't realloc slhc struct\n");
+-                              return -ENOMEM;
+-                      }
++                      if (IS_ERR(sltmp))
++                              return PTR_ERR(sltmp);
+                       if (is->slcomp)
+                               slhc_free(is->slcomp);
+                       is->slcomp = sltmp;
+--- a/drivers/net/ppp/ppp_generic.c
++++ b/drivers/net/ppp/ppp_generic.c
+@@ -721,10 +721,8 @@ static long ppp_ioctl(struct file *file,
+                       val &= 0xffff;
+               }
+               vj = slhc_init(val2+1, val+1);
+-              if (!vj) {
+-                      netdev_err(ppp->dev,
+-                                 "PPP: no memory (VJ compressor)\n");
+-                      err = -ENOMEM;
++              if (IS_ERR(vj)) {
++                      err = PTR_ERR(vj);
+                       break;
+               }
+               ppp_lock(ppp);
+--- a/drivers/net/slip/slhc.c
++++ b/drivers/net/slip/slhc.c
+@@ -84,8 +84,9 @@ static long decode(unsigned char **cpp);
+ static unsigned char * put16(unsigned char *cp, unsigned short x);
+ static unsigned short pull16(unsigned char **cpp);
+ 
+-/* Initialize compression data structure
++/* Allocate compression data structure
+  *    slots must be in range 0 to 255 (zero meaning no compression)
++ * Returns pointer to structure or ERR_PTR() on error.
+  */
+ struct slcompress *
+ slhc_init(int rslots, int tslots)
+@@ -94,11 +95,14 @@ slhc_init(int rslots, int tslots)
+       register struct cstate *ts;
+       struct slcompress *comp;
+ 
++      if (rslots < 0 || rslots > 255 || tslots < 0 || tslots > 255)
++              return ERR_PTR(-EINVAL);
++
+       comp = kzalloc(sizeof(struct slcompress), GFP_KERNEL);
+       if (! comp)
+               goto out_fail;
+ 
+-      if ( rslots > 0  &&  rslots < 256 ) {
++      if (rslots > 0) {
+               size_t rsize = rslots * sizeof(struct cstate);
+               comp->rstate = kzalloc(rsize, GFP_KERNEL);
+               if (! comp->rstate)
+@@ -106,7 +110,7 @@ slhc_init(int rslots, int tslots)
+               comp->rslot_limit = rslots - 1;
+       }
+ 
+-      if ( tslots > 0  &&  tslots < 256 ) {
++      if (tslots > 0) {
+               size_t tsize = tslots * sizeof(struct cstate);
+               comp->tstate = kzalloc(tsize, GFP_KERNEL);
+               if (! comp->tstate)
+@@ -141,7 +145,7 @@ out_free2:
+ out_free:
+       kfree(comp);
+ out_fail:
+-      return NULL;
++      return ERR_PTR(-ENOMEM);
+ }
+ 
+ 
+--- a/drivers/net/slip/slip.c
++++ b/drivers/net/slip/slip.c
+@@ -164,7 +164,7 @@ static int sl_alloc_bufs(struct slip *sl
+       if (cbuff == NULL)
+               goto err_exit;
+       slcomp = slhc_init(16, 16);
+-      if (slcomp == NULL)
++      if (IS_ERR(slcomp))
+               goto err_exit;
+ #endif
+       spin_lock_bh(&sl->lock);
diff --git a/queue-4.3/sched-cls_flower-set-key-address-type-when-present.patch b/queue-4.3/sched-cls_flower-set-key-address-type-when-present.patch

new file mode 100644 (file)

index 0000000..deb9803
--- /dev/null
+++ b/queue-4.3/sched-cls_flower-set-key-address-type-when-present.patch
@@ -0,0 +1,61 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Jamal Hadi Salim <jhs@mojatatu.com>
+Date: Sun, 10 Jan 2016 11:47:01 -0500
+Subject: sched,cls_flower: set key address type when present
+
+From: Jamal Hadi Salim <jhs@mojatatu.com>
+
+[ Upstream commit 66530bdf85eb1d72a0c399665e09a2c2298501c6 ]
+
+Only when user space passes the addresses should we consider their
+presence.
+
+Signed-off-by: Jamal Hadi Salim <jhs@mojatatu.com>
+Acked-by: Jiri Pirko <jiri@resnulli.us>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/sched/cls_flower.c |   10 ++++++++--
+ 1 file changed, 8 insertions(+), 2 deletions(-)
+
+--- a/net/sched/cls_flower.c
++++ b/net/sched/cls_flower.c
+@@ -252,23 +252,28 @@ static int fl_set_key(struct net *net, s
+       fl_set_key_val(tb, key->eth.src, TCA_FLOWER_KEY_ETH_SRC,
+                      mask->eth.src, TCA_FLOWER_KEY_ETH_SRC_MASK,
+                      sizeof(key->eth.src));
++
+       fl_set_key_val(tb, &key->basic.n_proto, TCA_FLOWER_KEY_ETH_TYPE,
+                      &mask->basic.n_proto, TCA_FLOWER_UNSPEC,
+                      sizeof(key->basic.n_proto));
++
+       if (key->basic.n_proto == htons(ETH_P_IP) ||
+           key->basic.n_proto == htons(ETH_P_IPV6)) {
+               fl_set_key_val(tb, &key->basic.ip_proto, TCA_FLOWER_KEY_IP_PROTO,
+                              &mask->basic.ip_proto, TCA_FLOWER_UNSPEC,
+                              sizeof(key->basic.ip_proto));
+       }
+-      if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV4_ADDRS) {
++
++      if (tb[TCA_FLOWER_KEY_IPV4_SRC] || tb[TCA_FLOWER_KEY_IPV4_DST]) {
++              key->control.addr_type = FLOW_DISSECTOR_KEY_IPV4_ADDRS;
+               fl_set_key_val(tb, &key->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC,
+                              &mask->ipv4.src, TCA_FLOWER_KEY_IPV4_SRC_MASK,
+                              sizeof(key->ipv4.src));
+               fl_set_key_val(tb, &key->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST,
+                              &mask->ipv4.dst, TCA_FLOWER_KEY_IPV4_DST_MASK,
+                              sizeof(key->ipv4.dst));
+-      } else if (key->control.addr_type == FLOW_DISSECTOR_KEY_IPV6_ADDRS) {
++      } else if (tb[TCA_FLOWER_KEY_IPV6_SRC] || tb[TCA_FLOWER_KEY_IPV6_DST]) {
++              key->control.addr_type = FLOW_DISSECTOR_KEY_IPV6_ADDRS;
+               fl_set_key_val(tb, &key->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC,
+                              &mask->ipv6.src, TCA_FLOWER_KEY_IPV6_SRC_MASK,
+                              sizeof(key->ipv6.src));
+@@ -276,6 +281,7 @@ static int fl_set_key(struct net *net, s
+                              &mask->ipv6.dst, TCA_FLOWER_KEY_IPV6_DST_MASK,
+                              sizeof(key->ipv6.dst));
+       }
++
+       if (key->basic.ip_proto == IPPROTO_TCP) {
+               fl_set_key_val(tb, &key->tp.src, TCA_FLOWER_KEY_TCP_SRC,
+                              &mask->tp.src, TCA_FLOWER_UNSPEC,
diff --git a/queue-4.3/sctp-sctp-should-release-assoc-when-sctp_make_abort_user-return-null-in-sctp_close.patch b/queue-4.3/sctp-sctp-should-release-assoc-when-sctp_make_abort_user-return-null-in-sctp_close.patch

new file mode 100644 (file)

index 0000000..0b618ee
--- /dev/null
+++ b/queue-4.3/sctp-sctp-should-release-assoc-when-sctp_make_abort_user-return-null-in-sctp_close.patch
@@ -0,0 +1,69 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Xin Long <lucien.xin@gmail.com>
+Date: Tue, 29 Dec 2015 17:49:25 +0800
+Subject: sctp: sctp should release assoc when sctp_make_abort_user return NULL in sctp_close
+
+From: Xin Long <lucien.xin@gmail.com>
+
+[ Upstream commit 068d8bd338e855286aea54e70d1c101569284b21 ]
+
+In sctp_close, sctp_make_abort_user may return NULL because of memory
+allocation failure. If this happens, it will bypass any state change
+and never free the assoc. The assoc has no chance to be freed and it
+will be kept in memory with the state it had even after the socket is
+closed by sctp_close().
+
+So if sctp_make_abort_user fails to allocate memory, we should abort
+the asoc via sctp_primitive_ABORT as well. As the comment in
+sctp_sf_cookie_wait_prm_abort and sctp_sf_do_9_1_prm_abort says,
+"Even if we can't send the ABORT due to low memory delete the TCB.
+This is a departure from our typical NOMEM handling".
+
+But then the chunk is NULL (low memory) and the SCTP_CMD_REPLY cmd would
+dereference the chunk pointer and crash the system. So we should add the
+SCTP_CMD_REPLY cmd only when the chunk is not NULL, just like the other
+places that add the SCTP_CMD_REPLY cmd.
+
+Signed-off-by: Xin Long <lucien.xin@gmail.com>
+Acked-by: Marcelo Ricardo Leitner <marcelo.leitner@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/sctp/sm_statefuns.c |    6 ++++--
+ net/sctp/socket.c       |    3 +--
+ 2 files changed, 5 insertions(+), 4 deletions(-)
+
+--- a/net/sctp/sm_statefuns.c
++++ b/net/sctp/sm_statefuns.c
+@@ -4829,7 +4829,8 @@ sctp_disposition_t sctp_sf_do_9_1_prm_ab
+ 
+       retval = SCTP_DISPOSITION_CONSUME;
+ 
+-      sctp_add_cmd_sf(commands, SCTP_CMD_REPLY, SCTP_CHUNK(abort));
++      if (abort)
++              sctp_add_cmd_sf(commands, SCTP_CMD_REPLY, SCTP_CHUNK(abort));
+ 
+       /* Even if we can't send the ABORT due to low memory delete the
+        * TCB.  This is a departure from our typical NOMEM handling.
+@@ -4966,7 +4967,8 @@ sctp_disposition_t sctp_sf_cookie_wait_p
+                       SCTP_TO(SCTP_EVENT_TIMEOUT_T1_INIT));
+       retval = SCTP_DISPOSITION_CONSUME;
+ 
+-      sctp_add_cmd_sf(commands, SCTP_CMD_REPLY, SCTP_CHUNK(abort));
++      if (abort)
++              sctp_add_cmd_sf(commands, SCTP_CMD_REPLY, SCTP_CHUNK(abort));
+ 
+       sctp_add_cmd_sf(commands, SCTP_CMD_NEW_STATE,
+                       SCTP_STATE(SCTP_STATE_CLOSED));
+--- a/net/sctp/socket.c
++++ b/net/sctp/socket.c
+@@ -1513,8 +1513,7 @@ static void sctp_close(struct sock *sk,
+                       struct sctp_chunk *chunk;
+ 
+                       chunk = sctp_make_abort_user(asoc, NULL, 0);
+-                      if (chunk)
+-                              sctp_primitive_ABORT(net, asoc, chunk);
++                      sctp_primitive_ABORT(net, asoc, chunk);
+               } else
+                       sctp_primitive_SHUTDOWN(net, asoc, NULL);
+       }
diff --git a/queue-4.3/series b/queue-4.3/series

index df5eb674c1879b56b8b5b1298366bfdbdc090e04..9b20d14b098c1b3839476ff65701434cba863a29 100644 (file)
--- a/queue-4.3/series
+++ b/queue-4.3/series
@@ -80,3 +80,43 @@ usb-ipaq.c-fix-a-timeout-loop.patch
  usb-cp210x-add-id-for-elv-marble-sound-board-1.patch
  usb-core-lpm-fix-usb3_hardware_lpm-sysfs-node.patch
  xhci-refuse-loading-if-nousb-is-used.patch
+openvswitch-correct-encoding-of-set-tunnel-action-attributes.patch
+utf-8-q-veth-20don-e2-80-99t-20modify-20ip-5fsum-utf-8-q-med-20doing-20so-20treats-20packets-20with-20bad-20checksums-utf-8-q-20as-20good.patch
+ipv6-addrlabel-fix-ip6addrlbl_get.patch
+addrconf-always-initialize-sysctl-table-data.patch
+net-cdc_ncm-avoid-changing-rx-tx-buffers-on-mtu-changes.patch
+sctp-sctp-should-release-assoc-when-sctp_make_abort_user-return-null-in-sctp_close.patch
+connector-bump-skb-users-before-callback-invocation.patch
+af_unix-fix-splice-bind-deadlock.patch
+unix-properly-account-for-fds-passed-over-unix-sockets.patch
+bridge-only-call-sbin-bridge-stp-for-the-initial-network-namespace.patch
+net-filter-make-jits-zero-a-for-skf_ad_alu_xor_x.patch
+net-sched-fix-missing-free-per-cpu-on-qstats.patch
+net-possible-use-after-free-in-dst_release.patch
+tcp-fix-zero-cwnd-in-tcp_cwnd_reduction.patch
+vxlan-fix-test-which-detect-duplicate-vxlan-iface.patch
+net-sctp-prevent-writes-to-cookie_hmac_alg-from-accessing-invalid-memory.patch
+ipv6-tcp-add-rcu-locking-in-tcp_v6_send_synack.patch
+tcp_yeah-don-t-set-ssthresh-below-2.patch
+sched-cls_flower-set-key-address-type-when-present.patch
+net-pktgen-fix-null-ptr-deref-in-skb-allocation.patch
+udp-disallow-ufo-for-sockets-with-so_no_check-option.patch
+net-preserve-ip-control-block-during-gso-segmentation.patch
+bonding-prevent-ipv6-link-local-address-on-enslaved-devices.patch
+dwc_eth_qos-fix-dma-address-for-multi-fragment-skbs.patch
+phonet-properly-unshare-skbs-in-phonet_rcv.patch
+net-bpf-reject-invalid-shifts.patch
+ipv6-update-skb-csum-when-ce-mark-is-propagated.patch
+bridge-fix-lockdep-addr_list_lock-false-positive-splat.patch
+isdn_ppp-add-checks-for-allocation-failure-in-isdn_ppp_open.patch
+ppp-slip-validate-vj-compression-slot-parameters-completely.patch
+batman-adv-avoid-recursive-call_rcu-for-batadv_bla_claim.patch
+batman-adv-avoid-recursive-call_rcu-for-batadv_nc_node.patch
+batman-adv-drop-immediate-batadv_orig_ifinfo-free-function.patch
+batman-adv-drop-immediate-batadv_neigh_node-free-function.patch
+batman-adv-drop-immediate-neigh_ifinfo-free-function.patch
+batman-adv-drop-immediate-batadv_hard_iface-free-function.patch
+batman-adv-drop-immediate-orig_node-free-function.patch
+net-mlx5_core-fix-trimming-down-irq-number.patch
+team-replace-rcu_read_lock-with-a-mutex-in-team_vlan_rx_kill_vid.patch
+xfrm-dst_entries_init-per-net-dst_ops.patch
diff --git a/queue-4.3/tcp-fix-zero-cwnd-in-tcp_cwnd_reduction.patch b/queue-4.3/tcp-fix-zero-cwnd-in-tcp_cwnd_reduction.patch

new file mode 100644 (file)

index 0000000..1c69934
--- /dev/null
+++ b/queue-4.3/tcp-fix-zero-cwnd-in-tcp_cwnd_reduction.patch
@@ -0,0 +1,63 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Yuchung Cheng <ycheng@google.com>
+Date: Wed, 6 Jan 2016 12:42:38 -0800
+Subject: tcp: fix zero cwnd in tcp_cwnd_reduction
+
+From: Yuchung Cheng <ycheng@google.com>
+
+[ Upstream commit 8b8a321ff72c785ed5e8b4cf6eda20b35d427390 ]
+
+Patch 3759824da87b ("tcp: PRR uses CRB mode by default and SS mode
+conditionally") introduced a bug that cwnd may become 0 when both
+inflight and sndcnt are 0 (cwnd = inflight + sndcnt). This may lead
+to a div-by-zero if the connection starts another cwnd reduction
+phase by setting tp->prior_cwnd to the current cwnd (0) in
+tcp_init_cwnd_reduction().
+
+To prevent this we skip PRR operation when nothing is acked or
+sacked. Then cwnd must be positive in all cases as long as ssthresh
+is positive:
+
+1) The proportional reduction mode
+   inflight > ssthresh > 0
+
+2) The reduction bound mode
+  a) inflight == ssthresh > 0
+
+  b) inflight < ssthresh
+     sndcnt > 0 since newly_acked_sacked > 0 and inflight < ssthresh
+
+Therefore in all cases inflight and sndcnt can not both be 0.
+We check invalid tp->prior_cwnd to avoid potential div0 bugs.
+
+In reality this bug is triggered only with a sequence of less common
+events.  For example, the connection is terminating an ECN-triggered
+cwnd reduction with an inflight 0, then it receives reordered/old
+ACKs or DSACKs from prior transmission (which acks nothing). Or the
+connection is in fast recovery stage that marks everything lost,
+but fails to retransmit due to local issues, then receives data
+packets from other end which acks nothing.
+
+Fixes: 3759824da87b ("tcp: PRR uses CRB mode by default and SS mode conditionally")
+Reported-by: Oleksandr Natalenko <oleksandr@natalenko.name>
+Signed-off-by: Yuchung Cheng <ycheng@google.com>
+Signed-off-by: Neal Cardwell <ncardwell@google.com>
+Signed-off-by: Eric Dumazet <edumazet@google.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/ipv4/tcp_input.c |    3 +++
+ 1 file changed, 3 insertions(+)
+
+--- a/net/ipv4/tcp_input.c
++++ b/net/ipv4/tcp_input.c
+@@ -2525,6 +2525,9 @@ static void tcp_cwnd_reduction(struct so
+       int newly_acked_sacked = prior_unsacked -
+                                (tp->packets_out - tp->sacked_out);
+ 
++      if (newly_acked_sacked <= 0 || WARN_ON_ONCE(!tp->prior_cwnd))
++              return;
++
+       tp->prr_delivered += newly_acked_sacked;
+       if (delta < 0) {
+               u64 dividend = (u64)tp->snd_ssthresh * tp->prr_delivered +
diff --git a/queue-4.3/tcp_yeah-don-t-set-ssthresh-below-2.patch b/queue-4.3/tcp_yeah-don-t-set-ssthresh-below-2.patch

new file mode 100644 (file)

index 0000000..99a544c
--- /dev/null
+++ b/queue-4.3/tcp_yeah-don-t-set-ssthresh-below-2.patch
@@ -0,0 +1,46 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Neal Cardwell <ncardwell@google.com>
+Date: Mon, 11 Jan 2016 13:42:43 -0500
+Subject: tcp_yeah: don't set ssthresh below 2
+
+From: Neal Cardwell <ncardwell@google.com>
+
+[ Upstream commit 83d15e70c4d8909d722c0d64747d8fb42e38a48f ]
+
+For tcp_yeah, use an ssthresh floor of 2, the same floor used by Reno
+and CUBIC, per RFC 5681 (equation 4).
+
+tcp_yeah_ssthresh() was sometimes returning a 0 or negative ssthresh
+value if the intended reduction is as big or bigger than the current
+cwnd. Congestion control modules should never return a zero or
+negative ssthresh. A zero ssthresh generally results in a zero cwnd,
+causing the connection to stall. A negative ssthresh value will be
+interpreted as a u32 and will set a target cwnd for PRR near 4
+billion.
+
+Oleksandr Natalenko reported that a system using tcp_yeah with ECN
+could see a warning about a prior_cwnd of 0 in
+tcp_cwnd_reduction(). Testing verified that this was due to
+tcp_yeah_ssthresh() misbehaving in this way.
+
+Reported-by: Oleksandr Natalenko <oleksandr@natalenko.name>
+Signed-off-by: Neal Cardwell <ncardwell@google.com>
+Signed-off-by: Yuchung Cheng <ycheng@google.com>
+Signed-off-by: Eric Dumazet <edumazet@google.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/ipv4/tcp_yeah.c |    2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/net/ipv4/tcp_yeah.c
++++ b/net/ipv4/tcp_yeah.c
+@@ -219,7 +219,7 @@ static u32 tcp_yeah_ssthresh(struct sock
+       yeah->fast_count = 0;
+       yeah->reno_count = max(yeah->reno_count>>1, 2U);
+ 
+-      return tp->snd_cwnd - reduction;
++      return max_t(int, tp->snd_cwnd - reduction, 2);
+ }
+ 
+ static struct tcp_congestion_ops tcp_yeah __read_mostly = {
diff --git a/queue-4.3/team-replace-rcu_read_lock-with-a-mutex-in-team_vlan_rx_kill_vid.patch b/queue-4.3/team-replace-rcu_read_lock-with-a-mutex-in-team_vlan_rx_kill_vid.patch

new file mode 100644 (file)

index 0000000..f9ec32e
--- /dev/null
+++ b/queue-4.3/team-replace-rcu_read_lock-with-a-mutex-in-team_vlan_rx_kill_vid.patch
@@ -0,0 +1,39 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Ido Schimmel <idosch@mellanox.com>
+Date: Mon, 18 Jan 2016 17:30:22 +0200
+Subject: team: Replace rcu_read_lock with a mutex in team_vlan_rx_kill_vid
+
+From: Ido Schimmel <idosch@mellanox.com>
+
+[ Upstream commit 60a6531bfe49555581ccd65f66a350cc5693fcde ]
+
+We can't be within an RCU read-side critical section when deleting
+VLANs, as underlying drivers might sleep during the hardware operation.
+Therefore, replace the RCU critical section with a mutex. This is
+consistent with team_vlan_rx_add_vid.
+
+Fixes: 3d249d4ca7d0 ("net: introduce ethernet teaming device")
+Acked-by: Jiri Pirko <jiri@mellanox.com>
+Signed-off-by: Ido Schimmel <idosch@mellanox.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/net/team/team.c |    6 +++---
+ 1 file changed, 3 insertions(+), 3 deletions(-)
+
+--- a/drivers/net/team/team.c
++++ b/drivers/net/team/team.c
+@@ -1845,10 +1845,10 @@ static int team_vlan_rx_kill_vid(struct
+       struct team *team = netdev_priv(dev);
+       struct team_port *port;
+ 
+-      rcu_read_lock();
+-      list_for_each_entry_rcu(port, &team->port_list, list)
++      mutex_lock(&team->lock);
++      list_for_each_entry(port, &team->port_list, list)
+               vlan_vid_del(port->dev, proto, vid);
+-      rcu_read_unlock();
++      mutex_unlock(&team->lock);
+ 
+       return 0;
+ }
diff --git a/queue-4.3/udp-disallow-ufo-for-sockets-with-so_no_check-option.patch b/queue-4.3/udp-disallow-ufo-for-sockets-with-so_no_check-option.patch

new file mode 100644 (file)

index 0000000..3644069
--- /dev/null
+++ b/queue-4.3/udp-disallow-ufo-for-sockets-with-so_no_check-option.patch
@@ -0,0 +1,51 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: =?UTF-8?q?Michal=20Kube=C4=8Dek?= <mkubecek@suse.cz>
+Date: Mon, 11 Jan 2016 07:50:30 +0100
+Subject: udp: disallow UFO for sockets with SO_NO_CHECK option
+
+From: =?UTF-8?q?Michal=20Kube=C4=8Dek?= <mkubecek@suse.cz>
+
+[ Upstream commit 40ba330227ad00b8c0cdf2f425736ff9549cc423 ]
+
+Commit acf8dd0a9d0b ("udp: only allow UFO for packets from SOCK_DGRAM
+sockets") disallows UFO for packets sent from raw sockets. We need to do
+the same for SOCK_DGRAM sockets with the SO_NO_CHECK option, albeit for
+a slightly different reason: while such a socket would override the
+CHECKSUM_PARTIAL set by ip_ufo_append_data(), gso_size is still set and
+a bad offloading flags warning is triggered in __skb_gso_segment().
+
+In the IPv6 case, SO_NO_CHECK option is ignored but we need to disallow
+UFO for packets sent by sockets with UDP_NO_CHECK6_TX option.
+
+Signed-off-by: Michal Kubecek <mkubecek@suse.cz>
+Tested-by: Shannon Nelson <shannon.nelson@intel.com>
+Acked-by: Hannes Frederic Sowa <hannes@stressinduktion.org>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/ipv4/ip_output.c  |    2 +-
+ net/ipv6/ip6_output.c |    2 +-
+ 2 files changed, 2 insertions(+), 2 deletions(-)
+
+--- a/net/ipv4/ip_output.c
++++ b/net/ipv4/ip_output.c
+@@ -918,7 +918,7 @@ static int __ip_append_data(struct sock
+       if (((length > mtu) || (skb && skb_is_gso(skb))) &&
+           (sk->sk_protocol == IPPROTO_UDP) &&
+           (rt->dst.dev->features & NETIF_F_UFO) && !rt->dst.header_len &&
+-          (sk->sk_type == SOCK_DGRAM)) {
++          (sk->sk_type == SOCK_DGRAM) && !sk->sk_no_check_tx) {
+               err = ip_ufo_append_data(sk, queue, getfrag, from, length,
+                                        hh_len, fragheaderlen, transhdrlen,
+                                        maxfraglen, flags);
+--- a/net/ipv6/ip6_output.c
++++ b/net/ipv6/ip6_output.c
+@@ -1345,7 +1345,7 @@ emsgsize:
+            (skb && skb_is_gso(skb))) &&
+           (sk->sk_protocol == IPPROTO_UDP) &&
+           (rt->dst.dev->features & NETIF_F_UFO) &&
+-          (sk->sk_type == SOCK_DGRAM)) {
++          (sk->sk_type == SOCK_DGRAM) && !udp_get_no_check6_tx(sk)) {
+               err = ip6_ufo_append_data(sk, queue, getfrag, from, length,
+                                         hh_len, fragheaderlen,
+                                         transhdrlen, mtu, flags, fl6);
diff --git a/queue-4.3/unix-properly-account-for-fds-passed-over-unix-sockets.patch b/queue-4.3/unix-properly-account-for-fds-passed-over-unix-sockets.patch

new file mode 100644 (file)

index 0000000..03a3a42
--- /dev/null
+++ b/queue-4.3/unix-properly-account-for-fds-passed-over-unix-sockets.patch
@@ -0,0 +1,136 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: willy tarreau <w@1wt.eu>
+Date: Sun, 10 Jan 2016 07:54:56 +0100
+Subject: unix: properly account for FDs passed over unix sockets
+
+From: willy tarreau <w@1wt.eu>
+
+[ Upstream commit 712f4aad406bb1ed67f3f98d04c044191f0ff593 ]
+
+It is possible for a process to allocate and accumulate far more FDs than
+the process' limit by sending them over a unix socket then closing them
+to keep the process' fd count low.
+
+This change addresses this problem by keeping track of the number of FDs
+in flight per user and preventing non-privileged processes from having
+more FDs in flight than their configured FD limit.
+
+Reported-by: socketpair@gmail.com
+Reported-by: Tetsuo Handa <penguin-kernel@I-love.SAKURA.ne.jp>
+Mitigates: CVE-2013-4312 (Linux 2.0+)
+Suggested-by: Linus Torvalds <torvalds@linux-foundation.org>
+Acked-by: Hannes Frederic Sowa <hannes@stressinduktion.org>
+Signed-off-by: Willy Tarreau <w@1wt.eu>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ include/linux/sched.h |    1 +
+ net/unix/af_unix.c    |   24 ++++++++++++++++++++----
+ net/unix/garbage.c    |   13 ++++++++-----
+ 3 files changed, 29 insertions(+), 9 deletions(-)
+
+--- a/include/linux/sched.h
++++ b/include/linux/sched.h
+@@ -830,6 +830,7 @@ struct user_struct {
+       unsigned long mq_bytes; /* How many bytes can be allocated to mqueue? */
+ #endif
+       unsigned long locked_shm; /* How many pages of mlocked shm ? */
++      unsigned long unix_inflight;    /* How many files in flight in unix sockets */
+ 
+ #ifdef CONFIG_KEYS
+       struct key *uid_keyring;        /* UID specific keyring */
+--- a/net/unix/af_unix.c
++++ b/net/unix/af_unix.c
+@@ -1512,6 +1512,21 @@ static void unix_destruct_scm(struct sk_
+       sock_wfree(skb);
+ }
+ 
++/*
++ * The "user->unix_inflight" variable is protected by the garbage
++ * collection lock, and we just read it locklessly here. If you go
++ * over the limit, there might be a tiny race in actually noticing
++ * it across threads. Tough.
++ */
++static inline bool too_many_unix_fds(struct task_struct *p)
++{
++      struct user_struct *user = current_user();
++
++      if (unlikely(user->unix_inflight > task_rlimit(p, RLIMIT_NOFILE)))
++              return !capable(CAP_SYS_RESOURCE) && !capable(CAP_SYS_ADMIN);
++      return false;
++}
++
+ #define MAX_RECURSION_LEVEL 4
+ 
+ static int unix_attach_fds(struct scm_cookie *scm, struct sk_buff *skb)
+@@ -1520,6 +1535,9 @@ static int unix_attach_fds(struct scm_co
+       unsigned char max_level = 0;
+       int unix_sock_count = 0;
+ 
++      if (too_many_unix_fds(current))
++              return -ETOOMANYREFS;
++
+       for (i = scm->fp->count - 1; i >= 0; i--) {
+               struct sock *sk = unix_get_socket(scm->fp->fp[i]);
+ 
+@@ -1541,10 +1559,8 @@ static int unix_attach_fds(struct scm_co
+       if (!UNIXCB(skb).fp)
+               return -ENOMEM;
+ 
+-      if (unix_sock_count) {
+-              for (i = scm->fp->count - 1; i >= 0; i--)
+-                      unix_inflight(scm->fp->fp[i]);
+-      }
++      for (i = scm->fp->count - 1; i >= 0; i--)
++              unix_inflight(scm->fp->fp[i]);
+       return max_level;
+ }
+ 
+--- a/net/unix/garbage.c
++++ b/net/unix/garbage.c
+@@ -120,11 +120,11 @@ void unix_inflight(struct file *fp)
+ {
+       struct sock *s = unix_get_socket(fp);
+ 
++      spin_lock(&unix_gc_lock);
++
+       if (s) {
+               struct unix_sock *u = unix_sk(s);
+ 
+-              spin_lock(&unix_gc_lock);
+-
+               if (atomic_long_inc_return(&u->inflight) == 1) {
+                       BUG_ON(!list_empty(&u->link));
+                       list_add_tail(&u->link, &gc_inflight_list);
+@@ -132,25 +132,28 @@ void unix_inflight(struct file *fp)
+                       BUG_ON(list_empty(&u->link));
+               }
+               unix_tot_inflight++;
+-              spin_unlock(&unix_gc_lock);
+       }
++      fp->f_cred->user->unix_inflight++;
++      spin_unlock(&unix_gc_lock);
+ }
+ 
+ void unix_notinflight(struct file *fp)
+ {
+       struct sock *s = unix_get_socket(fp);
+ 
++      spin_lock(&unix_gc_lock);
++
+       if (s) {
+               struct unix_sock *u = unix_sk(s);
+ 
+-              spin_lock(&unix_gc_lock);
+               BUG_ON(list_empty(&u->link));
+ 
+               if (atomic_long_dec_and_test(&u->inflight))
+                       list_del_init(&u->link);
+               unix_tot_inflight--;
+-              spin_unlock(&unix_gc_lock);
+       }
++      fp->f_cred->user->unix_inflight--;
++      spin_unlock(&unix_gc_lock);
+ }
+ 
+ static void scan_inflight(struct sock *x, void (*func)(struct unix_sock *),
diff --git a/queue-4.3/utf-8-q-veth-20don-e2-80-99t-20modify-20ip-5fsum-utf-8-q-med-20doing-20so-20treats-20packets-20with-20bad-20checksums-utf-8-q-20as-20good.patch b/queue-4.3/utf-8-q-veth-20don-e2-80-99t-20modify-20ip-5fsum-utf-8-q-med-20doing-20so-20treats-20packets-20with-20bad-20checksums-utf-8-q-20as-20good.patch

new file mode 100644 (file)

index 0000000..9394485
--- /dev/null
+++ b/queue-4.3/utf-8-q-veth-20don-e2-80-99t-20modify-20ip-5fsum-utf-8-q-med-20doing-20so-20treats-20packets-20with-20bad-20checksums-utf-8-q-20as-20good.patch
@@ -0,0 +1,72 @@
+From foo@baz Tue Jan 26 21:35:02 PST 2016
+From: Vijay Pandurangan <vijayp@vijayp.ca>
+Date: Fri, 18 Dec 2015 14:34:59 -0500
+Subject: =?UTF-8?q?veth:=20don=E2=80=99t=20modify=20ip=5Fsum?= =?UTF-8?q?med;=20doing=20so=20treats=20packets=20with=20bad=20checksums?= =?UTF-8?q?=20as=20good.?=
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+From: Vijay Pandurangan <vijayp@vijayp.ca>
+
+[ Upstream commit ce8c839b74e3017996fad4e1b7ba2e2625ede82f ]
+
+Packets that arrive from real hardware devices have ip_summed ==
+CHECKSUM_UNNECESSARY if the hardware verified the checksums, or
+CHECKSUM_NONE if the packet is bad or it was unable to verify it. The
+current version of veth will replace CHECKSUM_NONE with
+CHECKSUM_UNNECESSARY, which causes corrupt packets routed from hardware to
+a veth device to be delivered to the application. This caused applications
+at Twitter to receive corrupt data when network hardware was corrupting
+packets.
+
+We believe this was added as an optimization to skip computing and
+verifying checksums for communication between containers. However, locally
+generated packets have ip_summed == CHECKSUM_PARTIAL, so the code as
+written does nothing for them. As far as we can tell, after removing this
+code, these packets are transmitted from one stack to another unmodified
+(tcpdump shows invalid checksums on both sides, as expected), and they are
+delivered correctly to applications. We didn’t test every possible network
+configuration, but we tried a few common ones such as bridging containers,
+using NAT between the host and a container, and routing from hardware
+devices to containers. We have effectively deployed this in production at
+Twitter (by disabling RX checksum offloading on veth devices).
+
+This code dates back to the first version of the driver, commit
+<e314dbdc1c0dc6a548ecf> ("[NET]: Virtual ethernet device driver"), so I
+suspect this bug occurred mostly because the driver API has evolved
+significantly since then. Commit <0b7967503dc97864f283a> ("net/veth: Fix
+packet checksumming") (in December 2010) fixed this for packets that get
+created locally and sent to hardware devices, by not changing
+CHECKSUM_PARTIAL. However, the same issue still occurs for packets coming
+in from hardware devices.
+
+Co-authored-by: Evan Jones <ej@evanjones.ca>
+Signed-off-by: Evan Jones <ej@evanjones.ca>
+Cc: Nicolas Dichtel <nicolas.dichtel@6wind.com>
+Cc: Phil Sutter <phil@nwl.cc>
+Cc: Toshiaki Makita <makita.toshiaki@lab.ntt.co.jp>
+Cc: netdev@vger.kernel.org
+Cc: linux-kernel@vger.kernel.org
+Signed-off-by: Vijay Pandurangan <vijayp@vijayp.ca>
+Acked-by: Cong Wang <cwang@twopensource.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/net/veth.c |    6 ------
+ 1 file changed, 6 deletions(-)
+
+--- a/drivers/net/veth.c
++++ b/drivers/net/veth.c
+@@ -117,12 +117,6 @@ static netdev_tx_t veth_xmit(struct sk_b
+               kfree_skb(skb);
+               goto drop;
+       }
+-      /* don't change ip_summed == CHECKSUM_PARTIAL, as that
+-       * will cause bad checksum on forwarded packets
+-       */
+-      if (skb->ip_summed == CHECKSUM_NONE &&
+-          rcv->features & NETIF_F_RXCSUM)
+-              skb->ip_summed = CHECKSUM_UNNECESSARY;
+ 
+       if (likely(dev_forward_skb(rcv, skb) == NET_RX_SUCCESS)) {
+               struct pcpu_vstats *stats = this_cpu_ptr(dev->vstats);
diff --git a/queue-4.3/vxlan-fix-test-which-detect-duplicate-vxlan-iface.patch b/queue-4.3/vxlan-fix-test-which-detect-duplicate-vxlan-iface.patch

new file mode 100644 (file)

index 0000000..400e830
--- /dev/null
+++ b/queue-4.3/vxlan-fix-test-which-detect-duplicate-vxlan-iface.patch
@@ -0,0 +1,62 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Nicolas Dichtel <nicolas.dichtel@6wind.com>
+Date: Thu, 7 Jan 2016 11:26:53 +0100
+Subject: vxlan: fix test which detect duplicate vxlan iface
+
+From: Nicolas Dichtel <nicolas.dichtel@6wind.com>
+
+[ Upstream commit 07b9b37c227cb8d88d478b4a9c5634fee514ede1 ]
+
+When a vxlan interface is created, the driver checks that there is not
+another vxlan interface with the same properties. To do this, it checks
+the existing vxlan udp socket. Since commit 1c51a9159dde, the creation of
+the vxlan socket is done only when the interface is set up, thus it breaks
+that test.
+
+Example:
+$ ip l a vxlan10 type vxlan id 10 group 239.0.0.10 dev eth0 dstport 0
+$ ip l a vxlan11 type vxlan id 10 group 239.0.0.10 dev eth0 dstport 0
+$ ip -br l | grep vxlan
+vxlan10          DOWN           f2:55:1c:6a:fb:00 <BROADCAST,MULTICAST>
+vxlan11          DOWN           7a:cb:b9:38:59:0d <BROADCAST,MULTICAST>
+
+Instead of checking sockets, let's loop over the vxlan iface list.
+
+Fixes: 1c51a9159dde ("vxlan: fix race caused by dropping rtnl_unlock")
+Reported-by: Thomas Faivre <thomas.faivre@6wind.com>
+Signed-off-by: Nicolas Dichtel <nicolas.dichtel@6wind.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/net/vxlan.c |   12 +++++++++---
+ 1 file changed, 9 insertions(+), 3 deletions(-)
+
+--- a/drivers/net/vxlan.c
++++ b/drivers/net/vxlan.c
+@@ -2660,7 +2660,7 @@ static int vxlan_dev_configure(struct ne
+                              struct vxlan_config *conf)
+ {
+       struct vxlan_net *vn = net_generic(src_net, vxlan_net_id);
+-      struct vxlan_dev *vxlan = netdev_priv(dev);
++      struct vxlan_dev *vxlan = netdev_priv(dev), *tmp;
+       struct vxlan_rdst *dst = &vxlan->default_dst;
+       int err;
+       bool use_ipv6 = false;
+@@ -2725,9 +2725,15 @@ static int vxlan_dev_configure(struct ne
+       if (!vxlan->cfg.age_interval)
+               vxlan->cfg.age_interval = FDB_AGE_DEFAULT;
+ 
+-      if (vxlan_find_vni(src_net, conf->vni, use_ipv6 ? AF_INET6 : AF_INET,
+-                         vxlan->cfg.dst_port, vxlan->flags))
++      list_for_each_entry(tmp, &vn->vxlan_list, next) {
++              if (tmp->cfg.vni == conf->vni &&
++                  (tmp->default_dst.remote_ip.sa.sa_family == AF_INET6 ||
++                   tmp->cfg.saddr.sa.sa_family == AF_INET6) == use_ipv6 &&
++                  tmp->cfg.dst_port == vxlan->cfg.dst_port &&
++                  (tmp->flags & VXLAN_F_RCV_FLAGS) ==
++                  (vxlan->flags & VXLAN_F_RCV_FLAGS))
+               return -EEXIST;
++      }
+ 
+       dev->ethtool_ops = &vxlan_ethtool_ops;
+ 
diff --git a/queue-4.3/xfrm-dst_entries_init-per-net-dst_ops.patch b/queue-4.3/xfrm-dst_entries_init-per-net-dst_ops.patch

new file mode 100644 (file)

index 0000000..7e8e106
--- /dev/null
+++ b/queue-4.3/xfrm-dst_entries_init-per-net-dst_ops.patch
@@ -0,0 +1,332 @@
+From foo@baz Tue Jan 26 21:35:03 PST 2016
+From: Dan Streetman <dan.streetman@canonical.com>
+Date: Thu, 29 Oct 2015 09:51:16 -0400
+Subject: xfrm: dst_entries_init() per-net dst_ops
+
+From: Dan Streetman <dan.streetman@canonical.com>
+
+[ Upstream commit a8a572a6b5f2a79280d6e302cb3c1cb1fbaeb3e8 ]
+
+Remove the dst_entries_init/destroy calls for xfrm4 and xfrm6 dst_ops
+templates; their dst_entries counters will never be used.  Move the
+xfrm dst_ops initialization from the common xfrm/xfrm_policy.c to
+xfrm4/xfrm4_policy.c and xfrm6/xfrm6_policy.c, and call dst_entries_init
+and dst_entries_destroy for each net namespace.
+
+The ipv4 and ipv6 xfrms each create a dst_ops template, and perform
+dst_entries_init on the templates.  The template values are copied to each
+net namespace's xfrm.xfrm*_dst_ops.  The problem there is that the dst_ops
+pcpuc_entries field is a percpu counter and cannot be used correctly by
+simply copying it to another object.
+
+The result of this is a very subtle bug; changes to the dst entries
+counter from one net namespace may sometimes get applied to a different
+net namespace dst entries counter.  This is because of how the percpu
+counter works; it has a main count field as well as a pointer to the
+percpu variables.  Each net namespace maintains its own main count
+variable, but all point to one set of percpu variables.  When any net
+namespace happens to change one of the percpu variables to outside its
+small batch range, its count is moved to the net namespace's main count
+variable.  So with multiple net namespaces operating concurrently, the
+dst_ops entries counter can stray from the actual value that it should
+be; if counts are consistently moved from one net namespace to another
+(which my testing showed is likely), then one net namespace winds up
+with a negative dst_ops count while another winds up with a continually
+increasing count, eventually reaching its gc_thresh limit, which causes
+all new traffic on the net namespace to fail with -ENOBUFS.
+
+Signed-off-by: Dan Streetman <dan.streetman@canonical.com>
+Signed-off-by: Dan Streetman <ddstreet@ieee.org>
+Signed-off-by: Steffen Klassert <steffen.klassert@secunet.com>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/ipv4/xfrm4_policy.c |   46 +++++++++++++++++++++++++++++++++--------
+ net/ipv6/xfrm6_policy.c |   53 ++++++++++++++++++++++++++++++++++--------------
+ net/xfrm/xfrm_policy.c  |   38 ----------------------------------
+ 3 files changed, 75 insertions(+), 62 deletions(-)
+
+--- a/net/ipv4/xfrm4_policy.c
++++ b/net/ipv4/xfrm4_policy.c
+@@ -236,7 +236,7 @@ static void xfrm4_dst_ifdown(struct dst_
+       xfrm_dst_ifdown(dst, dev);
+ }
+ 
+-static struct dst_ops xfrm4_dst_ops = {
++static struct dst_ops xfrm4_dst_ops_template = {
+       .family =               AF_INET,
+       .gc =                   xfrm4_garbage_collect,
+       .update_pmtu =          xfrm4_update_pmtu,
+@@ -250,7 +250,7 @@ static struct dst_ops xfrm4_dst_ops = {
+ 
+ static struct xfrm_policy_afinfo xfrm4_policy_afinfo = {
+       .family =               AF_INET,
+-      .dst_ops =              &xfrm4_dst_ops,
++      .dst_ops =              &xfrm4_dst_ops_template,
+       .dst_lookup =           xfrm4_dst_lookup,
+       .get_saddr =            xfrm4_get_saddr,
+       .decode_session =       _decode_session4,
+@@ -272,7 +272,7 @@ static struct ctl_table xfrm4_policy_tab
+       { }
+ };
+ 
+-static int __net_init xfrm4_net_init(struct net *net)
++static int __net_init xfrm4_net_sysctl_init(struct net *net)
+ {
+       struct ctl_table *table;
+       struct ctl_table_header *hdr;
+@@ -300,7 +300,7 @@ err_alloc:
+       return -ENOMEM;
+ }
+ 
+-static void __net_exit xfrm4_net_exit(struct net *net)
++static void __net_exit xfrm4_net_sysctl_exit(struct net *net)
+ {
+       struct ctl_table *table;
+ 
+@@ -312,12 +312,44 @@ static void __net_exit xfrm4_net_exit(st
+       if (!net_eq(net, &init_net))
+               kfree(table);
+ }
++#else /* CONFIG_SYSCTL */
++static int inline xfrm4_net_sysctl_init(struct net *net)
++{
++      return 0;
++}
++
++static void inline xfrm4_net_sysctl_exit(struct net *net)
++{
++}
++#endif
++
++static int __net_init xfrm4_net_init(struct net *net)
++{
++      int ret;
++
++      memcpy(&net->xfrm.xfrm4_dst_ops, &xfrm4_dst_ops_template,
++             sizeof(xfrm4_dst_ops_template));
++      ret = dst_entries_init(&net->xfrm.xfrm4_dst_ops);
++      if (ret)
++              return ret;
++
++      ret = xfrm4_net_sysctl_init(net);
++      if (ret)
++              dst_entries_destroy(&net->xfrm.xfrm4_dst_ops);
++
++      return ret;
++}
++
++static void __net_exit xfrm4_net_exit(struct net *net)
++{
++      xfrm4_net_sysctl_exit(net);
++      dst_entries_destroy(&net->xfrm.xfrm4_dst_ops);
++}
+ 
+ static struct pernet_operations __net_initdata xfrm4_net_ops = {
+       .init   = xfrm4_net_init,
+       .exit   = xfrm4_net_exit,
+ };
+-#endif
+ 
+ static void __init xfrm4_policy_init(void)
+ {
+@@ -326,13 +358,9 @@ static void __init xfrm4_policy_init(voi
+ 
+ void __init xfrm4_init(void)
+ {
+-      dst_entries_init(&xfrm4_dst_ops);
+-
+       xfrm4_state_init();
+       xfrm4_policy_init();
+       xfrm4_protocol_init();
+-#ifdef CONFIG_SYSCTL
+       register_pernet_subsys(&xfrm4_net_ops);
+-#endif
+ }
+ 
+--- a/net/ipv6/xfrm6_policy.c
++++ b/net/ipv6/xfrm6_policy.c
+@@ -281,7 +281,7 @@ static void xfrm6_dst_ifdown(struct dst_
+       xfrm_dst_ifdown(dst, dev);
+ }
+ 
+-static struct dst_ops xfrm6_dst_ops = {
++static struct dst_ops xfrm6_dst_ops_template = {
+       .family =               AF_INET6,
+       .gc =                   xfrm6_garbage_collect,
+       .update_pmtu =          xfrm6_update_pmtu,
+@@ -295,7 +295,7 @@ static struct dst_ops xfrm6_dst_ops = {
+ 
+ static struct xfrm_policy_afinfo xfrm6_policy_afinfo = {
+       .family =               AF_INET6,
+-      .dst_ops =              &xfrm6_dst_ops,
++      .dst_ops =              &xfrm6_dst_ops_template,
+       .dst_lookup =           xfrm6_dst_lookup,
+       .get_saddr =            xfrm6_get_saddr,
+       .decode_session =       _decode_session6,
+@@ -327,7 +327,7 @@ static struct ctl_table xfrm6_policy_tab
+       { }
+ };
+ 
+-static int __net_init xfrm6_net_init(struct net *net)
++static int __net_init xfrm6_net_sysctl_init(struct net *net)
+ {
+       struct ctl_table *table;
+       struct ctl_table_header *hdr;
+@@ -355,7 +355,7 @@ err_alloc:
+       return -ENOMEM;
+ }
+ 
+-static void __net_exit xfrm6_net_exit(struct net *net)
++static void __net_exit xfrm6_net_sysctl_exit(struct net *net)
+ {
+       struct ctl_table *table;
+ 
+@@ -367,24 +367,52 @@ static void __net_exit xfrm6_net_exit(st
+       if (!net_eq(net, &init_net))
+               kfree(table);
+ }
++#else /* CONFIG_SYSCTL */
++static int inline xfrm6_net_sysctl_init(struct net *net)
++{
++      return 0;
++}
++
++static void inline xfrm6_net_sysctl_exit(struct net *net)
++{
++}
++#endif
++
++static int __net_init xfrm6_net_init(struct net *net)
++{
++      int ret;
++
++      memcpy(&net->xfrm.xfrm6_dst_ops, &xfrm6_dst_ops_template,
++             sizeof(xfrm6_dst_ops_template));
++      ret = dst_entries_init(&net->xfrm.xfrm6_dst_ops);
++      if (ret)
++              return ret;
++
++      ret = xfrm6_net_sysctl_init(net);
++      if (ret)
++              dst_entries_destroy(&net->xfrm.xfrm6_dst_ops);
++
++      return ret;
++}
++
++static void __net_exit xfrm6_net_exit(struct net *net)
++{
++      xfrm6_net_sysctl_exit(net);
++      dst_entries_destroy(&net->xfrm.xfrm6_dst_ops);
++}
+ 
+ static struct pernet_operations xfrm6_net_ops = {
+       .init   = xfrm6_net_init,
+       .exit   = xfrm6_net_exit,
+ };
+-#endif
+ 
+ int __init xfrm6_init(void)
+ {
+       int ret;
+ 
+-      dst_entries_init(&xfrm6_dst_ops);
+-
+       ret = xfrm6_policy_init();
+-      if (ret) {
+-              dst_entries_destroy(&xfrm6_dst_ops);
++      if (ret)
+               goto out;
+-      }
+       ret = xfrm6_state_init();
+       if (ret)
+               goto out_policy;
+@@ -393,9 +421,7 @@ int __init xfrm6_init(void)
+       if (ret)
+               goto out_state;
+ 
+-#ifdef CONFIG_SYSCTL
+       register_pernet_subsys(&xfrm6_net_ops);
+-#endif
+ out:
+       return ret;
+ out_state:
+@@ -407,11 +433,8 @@ out_policy:
+ 
+ void xfrm6_fini(void)
+ {
+-#ifdef CONFIG_SYSCTL
+       unregister_pernet_subsys(&xfrm6_net_ops);
+-#endif
+       xfrm6_protocol_fini();
+       xfrm6_policy_fini();
+       xfrm6_state_fini();
+-      dst_entries_destroy(&xfrm6_dst_ops);
+ }
+--- a/net/xfrm/xfrm_policy.c
++++ b/net/xfrm/xfrm_policy.c
+@@ -2807,7 +2807,6 @@ static struct neighbour *xfrm_neigh_look
+ 
+ int xfrm_policy_register_afinfo(struct xfrm_policy_afinfo *afinfo)
+ {
+-      struct net *net;
+       int err = 0;
+       if (unlikely(afinfo == NULL))
+               return -EINVAL;
+@@ -2838,26 +2837,6 @@ int xfrm_policy_register_afinfo(struct x
+       }
+       spin_unlock(&xfrm_policy_afinfo_lock);
+ 
+-      rtnl_lock();
+-      for_each_net(net) {
+-              struct dst_ops *xfrm_dst_ops;
+-
+-              switch (afinfo->family) {
+-              case AF_INET:
+-                      xfrm_dst_ops = &net->xfrm.xfrm4_dst_ops;
+-                      break;
+-#if IS_ENABLED(CONFIG_IPV6)
+-              case AF_INET6:
+-                      xfrm_dst_ops = &net->xfrm.xfrm6_dst_ops;
+-                      break;
+-#endif
+-              default:
+-                      BUG();
+-              }
+-              *xfrm_dst_ops = *afinfo->dst_ops;
+-      }
+-      rtnl_unlock();
+-
+       return err;
+ }
+ EXPORT_SYMBOL(xfrm_policy_register_afinfo);
+@@ -2893,22 +2872,6 @@ int xfrm_policy_unregister_afinfo(struct
+ }
+ EXPORT_SYMBOL(xfrm_policy_unregister_afinfo);
+ 
+-static void __net_init xfrm_dst_ops_init(struct net *net)
+-{
+-      struct xfrm_policy_afinfo *afinfo;
+-
+-      rcu_read_lock();
+-      afinfo = rcu_dereference(xfrm_policy_afinfo[AF_INET]);
+-      if (afinfo)
+-              net->xfrm.xfrm4_dst_ops = *afinfo->dst_ops;
+-#if IS_ENABLED(CONFIG_IPV6)
+-      afinfo = rcu_dereference(xfrm_policy_afinfo[AF_INET6]);
+-      if (afinfo)
+-              net->xfrm.xfrm6_dst_ops = *afinfo->dst_ops;
+-#endif
+-      rcu_read_unlock();
+-}
+-
+ static int xfrm_dev_event(struct notifier_block *this, unsigned long event, void *ptr)
+ {
+       struct net_device *dev = netdev_notifier_info_to_dev(ptr);
+@@ -3057,7 +3020,6 @@ static int __net_init xfrm_net_init(stru
+       rv = xfrm_policy_init(net);
+       if (rv < 0)
+               goto out_policy;
+-      xfrm_dst_ops_init(net);
+       rv = xfrm_sysctl_init(net);
+       if (rv < 0)
+               goto out_sysctl;
author	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Wed, 27 Jan 2016 06:28:48 +0000 (22:28 -0800)
committer	Greg Kroah-Hartman <gregkh@linuxfoundation.org>
	Wed, 27 Jan 2016 06:28:48 +0000 (22:28 -0800)
queue-4.3/addrconf-always-initialize-sysctl-table-data.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/af_unix-fix-splice-bind-deadlock.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/batman-adv-avoid-recursive-call_rcu-for-batadv_bla_claim.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/batman-adv-avoid-recursive-call_rcu-for-batadv_nc_node.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/batman-adv-drop-immediate-batadv_hard_iface-free-function.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/batman-adv-drop-immediate-batadv_neigh_node-free-function.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/batman-adv-drop-immediate-batadv_orig_ifinfo-free-function.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/batman-adv-drop-immediate-neigh_ifinfo-free-function.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/batman-adv-drop-immediate-orig_node-free-function.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/bonding-prevent-ipv6-link-local-address-on-enslaved-devices.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/bridge-fix-lockdep-addr_list_lock-false-positive-splat.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/bridge-only-call-sbin-bridge-stp-for-the-initial-network-namespace.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/connector-bump-skb-users-before-callback-invocation.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/dwc_eth_qos-fix-dma-address-for-multi-fragment-skbs.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/ipv6-addrlabel-fix-ip6addrlbl_get.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/ipv6-tcp-add-rcu-locking-in-tcp_v6_send_synack.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/ipv6-update-skb-csum-when-ce-mark-is-propagated.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/isdn_ppp-add-checks-for-allocation-failure-in-isdn_ppp_open.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/net-bpf-reject-invalid-shifts.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/net-cdc_ncm-avoid-changing-rx-tx-buffers-on-mtu-changes.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/net-filter-make-jits-zero-a-for-skf_ad_alu_xor_x.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/net-mlx5_core-fix-trimming-down-irq-number.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/net-pktgen-fix-null-ptr-deref-in-skb-allocation.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/net-possible-use-after-free-in-dst_release.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/net-preserve-ip-control-block-during-gso-segmentation.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/net-sched-fix-missing-free-per-cpu-on-qstats.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/net-sctp-prevent-writes-to-cookie_hmac_alg-from-accessing-invalid-memory.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/openvswitch-correct-encoding-of-set-tunnel-action-attributes.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/phonet-properly-unshare-skbs-in-phonet_rcv.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/ppp-slip-validate-vj-compression-slot-parameters-completely.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/sched-cls_flower-set-key-address-type-when-present.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/sctp-sctp-should-release-assoc-when-sctp_make_abort_user-return-null-in-sctp_close.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/series		patch \| blob \| blame \| history
queue-4.3/tcp-fix-zero-cwnd-in-tcp_cwnd_reduction.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/tcp_yeah-don-t-set-ssthresh-below-2.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/team-replace-rcu_read_lock-with-a-mutex-in-team_vlan_rx_kill_vid.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/udp-disallow-ufo-for-sockets-with-so_no_check-option.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/unix-properly-account-for-fds-passed-over-unix-sockets.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/utf-8-q-veth-20don-e2-80-99t-20modify-20ip-5fsum-utf-8-q-med-20doing-20so-20treats-20packets-20with-20bad-20checksums-utf-8-q-20as-20good.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/vxlan-fix-test-which-detect-duplicate-vxlan-iface.patch	[new file with mode: 0644]	patch \| blob
queue-4.3/xfrm-dst_entries_init-per-net-dst_ops.patch	[new file with mode: 0644]	patch \| blob