git.ipfire.org Git - thirdparty/kernel/stable-queue.git/commitdiff
3.0-stable patches
author Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Sun, 16 Sep 2012 15:38:05 +0000 (08:38 -0700)
committer Greg Kroah-Hartman <gregkh@linuxfoundation.org>
Sun, 16 Sep 2012 15:38:05 +0000 (08:38 -0700)
added patches:
af_packet-remove-bug-statement-in-tpacket_destruct_skb.patch
atm-fix-info-leak-in-getsockopt-so_atmpvc.patch
atm-fix-info-leak-via-getsockname.patch
bluetooth-hci-fix-info-leak-in-getsockopt-hci_filter.patch
bluetooth-hci-fix-info-leak-via-getsockname.patch
bluetooth-l2cap-fix-info-leak-via-getsockname.patch
bluetooth-rfcomm-fix-info-leak-in-getsockopt-bt_security.patch
bluetooth-rfcomm-fix-info-leak-in-ioctl-rfcommgetdevlist.patch
bluetooth-rfcomm-fix-info-leak-via-getsockname.patch
dccp-fix-info-leak-via-getsockopt-dccp_sockopt_ccid_tx_info.patch
ipv6-addrconf-avoid-calling-netdevice-notifiers-with-rcu-read-side-lock.patch
ipvs-fix-info-leak-in-getsockopt-ip_vs_so_get_timeout.patch
isdnloop-fix-and-simplify-isdnloop_init.patch
l2tp-avoid-to-use-synchronize_rcu-in-tunnel-free-function.patch
llc-fix-info-leak-via-getsockname.patch
net-allow-driver-to-limit-number-of-gso-segments-per-skb.patch
net-core-fix-potential-memory-leak-in-dev_set_alias.patch
net-fix-info-leak-in-compat-dev_ifconf.patch
net-ipv4-ipmr_expire_timer-causes-crash-when-removing-net-namespace.patch
netlink-fix-possible-spoofing-from-non-root-processes.patch
net_sched-gact-fix-potential-panic-in-tcf_gact.patch
sfc-fix-maximum-number-of-tso-segments-and-minimum-tx-queue-size.patch
tcp-apply-device-tso-segment-limit-earlier.patch

24 files changed:
queue-3.0/af_packet-remove-bug-statement-in-tpacket_destruct_skb.patch [new file with mode: 0644]
queue-3.0/atm-fix-info-leak-in-getsockopt-so_atmpvc.patch [new file with mode: 0644]
queue-3.0/atm-fix-info-leak-via-getsockname.patch [new file with mode: 0644]
queue-3.0/bluetooth-hci-fix-info-leak-in-getsockopt-hci_filter.patch [new file with mode: 0644]
queue-3.0/bluetooth-hci-fix-info-leak-via-getsockname.patch [new file with mode: 0644]
queue-3.0/bluetooth-l2cap-fix-info-leak-via-getsockname.patch [new file with mode: 0644]
queue-3.0/bluetooth-rfcomm-fix-info-leak-in-getsockopt-bt_security.patch [new file with mode: 0644]
queue-3.0/bluetooth-rfcomm-fix-info-leak-in-ioctl-rfcommgetdevlist.patch [new file with mode: 0644]
queue-3.0/bluetooth-rfcomm-fix-info-leak-via-getsockname.patch [new file with mode: 0644]
queue-3.0/dccp-fix-info-leak-via-getsockopt-dccp_sockopt_ccid_tx_info.patch [new file with mode: 0644]
queue-3.0/ipv6-addrconf-avoid-calling-netdevice-notifiers-with-rcu-read-side-lock.patch [new file with mode: 0644]
queue-3.0/ipvs-fix-info-leak-in-getsockopt-ip_vs_so_get_timeout.patch [new file with mode: 0644]
queue-3.0/isdnloop-fix-and-simplify-isdnloop_init.patch [new file with mode: 0644]
queue-3.0/l2tp-avoid-to-use-synchronize_rcu-in-tunnel-free-function.patch [new file with mode: 0644]
queue-3.0/llc-fix-info-leak-via-getsockname.patch [new file with mode: 0644]
queue-3.0/net-allow-driver-to-limit-number-of-gso-segments-per-skb.patch [new file with mode: 0644]
queue-3.0/net-core-fix-potential-memory-leak-in-dev_set_alias.patch [new file with mode: 0644]
queue-3.0/net-fix-info-leak-in-compat-dev_ifconf.patch [new file with mode: 0644]
queue-3.0/net-ipv4-ipmr_expire_timer-causes-crash-when-removing-net-namespace.patch [new file with mode: 0644]
queue-3.0/net_sched-gact-fix-potential-panic-in-tcf_gact.patch [new file with mode: 0644]
queue-3.0/netlink-fix-possible-spoofing-from-non-root-processes.patch [new file with mode: 0644]
queue-3.0/series [new file with mode: 0644]
queue-3.0/sfc-fix-maximum-number-of-tso-segments-and-minimum-tx-queue-size.patch [new file with mode: 0644]
queue-3.0/tcp-apply-device-tso-segment-limit-earlier.patch [new file with mode: 0644]

diff --git a/queue-3.0/af_packet-remove-bug-statement-in-tpacket_destruct_skb.patch b/queue-3.0/af_packet-remove-bug-statement-in-tpacket_destruct_skb.patch
new file mode 100644 (file)
index 0000000..d47ae8d
--- /dev/null
@@ -0,0 +1,49 @@
+From 99ee7c1952b5cd7992f17c866f5bcce87bc64551 Mon Sep 17 00:00:00 2001
+From: "danborkmann@iogearbox.net" <danborkmann@iogearbox.net>
+Date: Fri, 10 Aug 2012 22:48:54 +0000
+Subject: af_packet: remove BUG statement in tpacket_destruct_skb
+
+
+From: "danborkmann@iogearbox.net" <danborkmann@iogearbox.net>
+
+[ Upstream commit 7f5c3e3a80e6654cf48dfba7cf94f88c6b505467 ]
+
+Here's a quote of the comment about the BUG macro from asm-generic/bug.h:
+
+ Don't use BUG() or BUG_ON() unless there's really no way out; one
+ example might be detecting data structure corruption in the middle
+ of an operation that can't be backed out of.  If the (sub)system
+ can somehow continue operating, perhaps with reduced functionality,
+ it's probably not BUG-worthy.
+
+ If you're tempted to BUG(), think again:  is completely giving up
+ really the *only* solution?  There are usually better options, where
+ users don't need to reboot ASAP and can mostly shut down cleanly.
+
+In our case, the status flag of a ring buffer slot is managed from both sides,
+the kernel space and the user space. This means that even though the kernel
+side might work as expected, user space can misbehave and change this flag
+in the window between send(2) being triggered (when the flag is changed to
+TP_STATUS_SENDING) and the given skb being destructed some time later. This
+will then hit the BUG macro. As David suggested, the best solution is to simply
+remove this statement since it cannot be used for kernel side internal
+consistency checks. I've tested it and the system still behaves /stable/ in
+this case, so in accordance with the above comment, we should rather remove it.
+
+Signed-off-by: Daniel Borkmann <daniel.borkmann@tik.ee.ethz.ch>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/packet/af_packet.c |    1 -
+ 1 file changed, 1 deletion(-)
+
+--- a/net/packet/af_packet.c
++++ b/net/packet/af_packet.c
+@@ -866,7 +866,6 @@ static void tpacket_destruct_skb(struct
+       if (likely(po->tx_ring.pg_vec)) {
+               ph = skb_shinfo(skb)->destructor_arg;
+-              BUG_ON(__packet_get_status(po, ph) != TP_STATUS_SENDING);
+               BUG_ON(atomic_read(&po->tx_ring.pending) == 0);
+               atomic_dec(&po->tx_ring.pending);
+               __packet_set_status(po, ph, TP_STATUS_AVAILABLE);
diff --git a/queue-3.0/atm-fix-info-leak-in-getsockopt-so_atmpvc.patch b/queue-3.0/atm-fix-info-leak-in-getsockopt-so_atmpvc.patch
new file mode 100644 (file)
index 0000000..f47a74e
--- /dev/null
@@ -0,0 +1,31 @@
+From afbc8123713afc04b4a919b7352d99dec64f8fa7 Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:44 +0000
+Subject: atm: fix info leak in getsockopt(SO_ATMPVC)
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit e862f1a9b7df4e8196ebec45ac62295138aa3fc2 ]
+
+The ATM code fails to initialize the two padding bytes of struct
+sockaddr_atmpvc inserted for alignment. Add an explicit memset(0)
+before filling the structure to avoid the info leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/atm/common.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/atm/common.c
++++ b/net/atm/common.c
+@@ -784,6 +784,7 @@ int vcc_getsockopt(struct socket *sock,
+               if (!vcc->dev || !test_bit(ATM_VF_ADDR, &vcc->flags))
+                       return -ENOTCONN;
++              memset(&pvc, 0, sizeof(pvc));
+               pvc.sap_family = AF_ATMPVC;
+               pvc.sap_addr.itf = vcc->dev->number;
+               pvc.sap_addr.vpi = vcc->vpi;
diff --git a/queue-3.0/atm-fix-info-leak-via-getsockname.patch b/queue-3.0/atm-fix-info-leak-via-getsockname.patch
new file mode 100644 (file)
index 0000000..5b479be
--- /dev/null
@@ -0,0 +1,31 @@
+From 17bb47570557f353777df0db20ce1613a0034031 Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:45 +0000
+Subject: atm: fix info leak via getsockname()
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit 3c0c5cfdcd4d69ffc4b9c0907cec99039f30a50a ]
+
+The ATM code fails to initialize the two padding bytes of struct
+sockaddr_atmpvc inserted for alignment. Add an explicit memset(0)
+before filling the structure to avoid the info leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/atm/pvc.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/atm/pvc.c
++++ b/net/atm/pvc.c
+@@ -94,6 +94,7 @@ static int pvc_getname(struct socket *so
+               return -ENOTCONN;
+       *sockaddr_len = sizeof(struct sockaddr_atmpvc);
+       addr = (struct sockaddr_atmpvc *)sockaddr;
++      memset(addr, 0, sizeof(*addr));
+       addr->sap_family = AF_ATMPVC;
+       addr->sap_addr.itf = vcc->dev->number;
+       addr->sap_addr.vpi = vcc->vpi;
diff --git a/queue-3.0/bluetooth-hci-fix-info-leak-in-getsockopt-hci_filter.patch b/queue-3.0/bluetooth-hci-fix-info-leak-in-getsockopt-hci_filter.patch
new file mode 100644 (file)
index 0000000..add77a1
--- /dev/null
@@ -0,0 +1,35 @@
+From b81b8de67f7259c448f200bc816e3585a0ad78d5 Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:46 +0000
+Subject: Bluetooth: HCI - Fix info leak in getsockopt(HCI_FILTER)
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit e15ca9a0ef9a86f0477530b0f44a725d67f889ee ]
+
+The HCI code fails to initialize the two padding bytes of struct
+hci_ufilter before copying it to userland, thereby leaking two
+bytes of kernel stack. Add an explicit memset(0) before filling the
+structure to avoid the info leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Cc: Marcel Holtmann <marcel@holtmann.org>
+Cc: Gustavo Padovan <gustavo@padovan.org>
+Cc: Johan Hedberg <johan.hedberg@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/bluetooth/hci_sock.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/bluetooth/hci_sock.c
++++ b/net/bluetooth/hci_sock.c
+@@ -644,6 +644,7 @@ static int hci_sock_setsockopt(struct so
+               {
+                       struct hci_filter *f = &hci_pi(sk)->filter;
++                      memset(&uf, 0, sizeof(uf));
+                       uf.type_mask = f->type_mask;
+                       uf.opcode    = f->opcode;
+                       uf.event_mask[0] = *((u32 *) f->event_mask + 0);
diff --git a/queue-3.0/bluetooth-hci-fix-info-leak-via-getsockname.patch b/queue-3.0/bluetooth-hci-fix-info-leak-via-getsockname.patch
new file mode 100644 (file)
index 0000000..9dd1733
--- /dev/null
@@ -0,0 +1,35 @@
+From bf45c49b2fa65b5422f48ee2d4846a93c79e309e Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:47 +0000
+Subject: Bluetooth: HCI - Fix info leak via getsockname()
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit 3f68ba07b1da811bf383b4b701b129bfcb2e4988 ]
+
+The HCI code fails to initialize the hci_channel member of struct
+sockaddr_hci and therefore leaks two bytes of kernel stack via the
+getsockname() syscall. Initialize hci_channel with 0 to avoid the
+info leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Cc: Marcel Holtmann <marcel@holtmann.org>
+Cc: Gustavo Padovan <gustavo@padovan.org>
+Cc: Johan Hedberg <johan.hedberg@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/bluetooth/hci_sock.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/bluetooth/hci_sock.c
++++ b/net/bluetooth/hci_sock.c
+@@ -432,6 +432,7 @@ static int hci_sock_getname(struct socke
+       *addr_len = sizeof(*haddr);
+       haddr->hci_family = AF_BLUETOOTH;
+       haddr->hci_dev    = hdev->id;
++      haddr->hci_channel= 0;
+       release_sock(sk);
+       return 0;
diff --git a/queue-3.0/bluetooth-l2cap-fix-info-leak-via-getsockname.patch b/queue-3.0/bluetooth-l2cap-fix-info-leak-via-getsockname.patch
new file mode 100644 (file)
index 0000000..1037f99
--- /dev/null
@@ -0,0 +1,35 @@
+From dfd50a3a0c221b6d99c223dc7f0c654d814403eb Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:51 +0000
+Subject: Bluetooth: L2CAP - Fix info leak via getsockname()
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit 792039c73cf176c8e39a6e8beef2c94ff46522ed ]
+
+The L2CAP code fails to initialize the l2_bdaddr_type member of struct
+sockaddr_l2 and the padding byte added for alignment. It therefore leaks
+two bytes of kernel stack via the getsockname() syscall. Add an explicit
+memset(0) before filling the structure to avoid the info leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Cc: Marcel Holtmann <marcel@holtmann.org>
+Cc: Gustavo Padovan <gustavo@padovan.org>
+Cc: Johan Hedberg <johan.hedberg@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/bluetooth/l2cap_sock.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/bluetooth/l2cap_sock.c
++++ b/net/bluetooth/l2cap_sock.c
+@@ -329,6 +329,7 @@ static int l2cap_sock_getname(struct soc
+       BT_DBG("sock %p, sk %p", sock, sk);
++      memset(la, 0, sizeof(struct sockaddr_l2));
+       addr->sa_family = AF_BLUETOOTH;
+       *len = sizeof(struct sockaddr_l2);
diff --git a/queue-3.0/bluetooth-rfcomm-fix-info-leak-in-getsockopt-bt_security.patch b/queue-3.0/bluetooth-rfcomm-fix-info-leak-in-getsockopt-bt_security.patch
new file mode 100644 (file)
index 0000000..f0d687a
--- /dev/null
@@ -0,0 +1,35 @@
+From b22d8822829c34cff9b4ab4b1a556b5c2955e879 Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:48 +0000
+Subject: Bluetooth: RFCOMM - Fix info leak in getsockopt(BT_SECURITY)
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit 9ad2de43f1aee7e7274a4e0d41465489299e344b ]
+
+The RFCOMM code fails to initialize the key_size member of struct
+bt_security before copying it to userland, thereby leaking one
+byte of kernel stack. Initialize key_size with 0 to avoid the info
+leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Cc: Marcel Holtmann <marcel@holtmann.org>
+Cc: Gustavo Padovan <gustavo@padovan.org>
+Cc: Johan Hedberg <johan.hedberg@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/bluetooth/rfcomm/sock.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/bluetooth/rfcomm/sock.c
++++ b/net/bluetooth/rfcomm/sock.c
+@@ -834,6 +834,7 @@ static int rfcomm_sock_getsockopt(struct
+               }
+               sec.level = rfcomm_pi(sk)->sec_level;
++              sec.key_size = 0;
+               len = min_t(unsigned int, len, sizeof(sec));
+               if (copy_to_user(optval, (char *) &sec, len))
diff --git a/queue-3.0/bluetooth-rfcomm-fix-info-leak-in-ioctl-rfcommgetdevlist.patch b/queue-3.0/bluetooth-rfcomm-fix-info-leak-in-ioctl-rfcommgetdevlist.patch
new file mode 100644 (file)
index 0000000..9f9d144
--- /dev/null
@@ -0,0 +1,39 @@
+From c95564400d94f488f167b3d71472e2c28ca38980 Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:49 +0000
+Subject: Bluetooth: RFCOMM - Fix info leak in ioctl(RFCOMMGETDEVLIST)
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit f9432c5ec8b1e9a09b9b0e5569e3c73db8de432a ]
+
+The RFCOMM code fails to initialize the two padding bytes of struct
+rfcomm_dev_list_req inserted for alignment before copying it to
+userland. Additionally there are two padding bytes in each instance of
+struct rfcomm_dev_info. The ioctl() therefore discloses two bytes plus
+dev_num times two bytes of uninitialized kernel heap memory.
+
+Allocate the memory using kzalloc() to fix this issue.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Cc: Marcel Holtmann <marcel@holtmann.org>
+Cc: Gustavo Padovan <gustavo@padovan.org>
+Cc: Johan Hedberg <johan.hedberg@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/bluetooth/rfcomm/tty.c |    2 +-
+ 1 file changed, 1 insertion(+), 1 deletion(-)
+
+--- a/net/bluetooth/rfcomm/tty.c
++++ b/net/bluetooth/rfcomm/tty.c
+@@ -471,7 +471,7 @@ static int rfcomm_get_dev_list(void __us
+       size = sizeof(*dl) + dev_num * sizeof(*di);
+-      dl = kmalloc(size, GFP_KERNEL);
++      dl = kzalloc(size, GFP_KERNEL);
+       if (!dl)
+               return -ENOMEM;
diff --git a/queue-3.0/bluetooth-rfcomm-fix-info-leak-via-getsockname.patch b/queue-3.0/bluetooth-rfcomm-fix-info-leak-via-getsockname.patch
new file mode 100644 (file)
index 0000000..e08d130
--- /dev/null
@@ -0,0 +1,35 @@
+From a159893d86bfe008021b59c12ea3d925d0bbbc44 Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:50 +0000
+Subject: Bluetooth: RFCOMM - Fix info leak via getsockname()
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit 9344a972961d1a6d2c04d9008b13617bcb6ec2ef ]
+
+The RFCOMM code fails to initialize the trailing padding byte of struct
+sockaddr_rc added for alignment. It therefore leaks one byte of kernel stack
+via the getsockname() syscall. Add an explicit memset(0) before filling
+the structure to avoid the info leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Cc: Marcel Holtmann <marcel@holtmann.org>
+Cc: Gustavo Padovan <gustavo@padovan.org>
+Cc: Johan Hedberg <johan.hedberg@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/bluetooth/rfcomm/sock.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/bluetooth/rfcomm/sock.c
++++ b/net/bluetooth/rfcomm/sock.c
+@@ -544,6 +544,7 @@ static int rfcomm_sock_getname(struct so
+       BT_DBG("sock %p, sk %p", sock, sk);
++      memset(sa, 0, sizeof(*sa));
+       sa->rc_family  = AF_BLUETOOTH;
+       sa->rc_channel = rfcomm_pi(sk)->channel;
+       if (peer)
diff --git a/queue-3.0/dccp-fix-info-leak-via-getsockopt-dccp_sockopt_ccid_tx_info.patch b/queue-3.0/dccp-fix-info-leak-via-getsockopt-dccp_sockopt_ccid_tx_info.patch
new file mode 100644 (file)
index 0000000..a1a5e44
--- /dev/null
@@ -0,0 +1,34 @@
+From 364ab5ea1e68f84e054e851b3506eef5de5f3521 Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:55 +0000
+Subject: dccp: fix info leak via getsockopt(DCCP_SOCKOPT_CCID_TX_INFO)
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit 7b07f8eb75aa3097cdfd4f6eac3da49db787381d ]
+
+The CCID3 code fails to initialize the trailing padding bytes of struct
+tfrc_tx_info added for alignment on 64 bit architectures. It therefore
+potentially leaks four bytes of kernel stack via the getsockopt() syscall.
+Add an explicit memset(0) before filling the structure to avoid the
+info leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Cc: Gerrit Renker <gerrit@erg.abdn.ac.uk>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/dccp/ccids/ccid3.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/dccp/ccids/ccid3.c
++++ b/net/dccp/ccids/ccid3.c
+@@ -532,6 +532,7 @@ static int ccid3_hc_tx_getsockopt(struct
+       case DCCP_SOCKOPT_CCID_TX_INFO:
+               if (len < sizeof(tfrc))
+                       return -EINVAL;
++              memset(&tfrc, 0, sizeof(tfrc));
+               tfrc.tfrctx_x      = hc->tx_x;
+               tfrc.tfrctx_x_recv = hc->tx_x_recv;
+               tfrc.tfrctx_x_calc = hc->tx_x_calc;
diff --git a/queue-3.0/ipv6-addrconf-avoid-calling-netdevice-notifiers-with-rcu-read-side-lock.patch b/queue-3.0/ipv6-addrconf-avoid-calling-netdevice-notifiers-with-rcu-read-side-lock.patch
new file mode 100644 (file)
index 0000000..39c0a3a
--- /dev/null
@@ -0,0 +1,73 @@
+From d5dd8d18457e05047515bdd59bf8ab586286ce2b Mon Sep 17 00:00:00 2001
+From: Ben Hutchings <bhutchings@solarflare.com>
+Date: Tue, 14 Aug 2012 08:54:51 +0000
+Subject: ipv6: addrconf: Avoid calling netdevice notifiers with RCU read-side lock
+
+
+From: Ben Hutchings <bhutchings@solarflare.com>
+
+[ Upstream commit 4acd4945cd1e1f92b20d14e349c6c6a52acbd42d ]
+
+Cong Wang reports that lockdep detected suspicious RCU usage while
+enabling IPV6 forwarding:
+
+ [ 1123.310275] ===============================
+ [ 1123.442202] [ INFO: suspicious RCU usage. ]
+ [ 1123.558207] 3.6.0-rc1+ #109 Not tainted
+ [ 1123.665204] -------------------------------
+ [ 1123.768254] include/linux/rcupdate.h:430 Illegal context switch in RCU read-side critical section!
+ [ 1123.992320]
+ [ 1123.992320] other info that might help us debug this:
+ [ 1123.992320]
+ [ 1124.307382]
+ [ 1124.307382] rcu_scheduler_active = 1, debug_locks = 0
+ [ 1124.522220] 2 locks held by sysctl/5710:
+ [ 1124.648364]  #0:  (rtnl_mutex){+.+.+.}, at: [<ffffffff81768498>] rtnl_trylock+0x15/0x17
+ [ 1124.882211]  #1:  (rcu_read_lock){.+.+.+}, at: [<ffffffff81871df8>] rcu_lock_acquire+0x0/0x29
+ [ 1125.085209]
+ [ 1125.085209] stack backtrace:
+ [ 1125.332213] Pid: 5710, comm: sysctl Not tainted 3.6.0-rc1+ #109
+ [ 1125.441291] Call Trace:
+ [ 1125.545281]  [<ffffffff8109d915>] lockdep_rcu_suspicious+0x109/0x112
+ [ 1125.667212]  [<ffffffff8107c240>] rcu_preempt_sleep_check+0x45/0x47
+ [ 1125.781838]  [<ffffffff8107c260>] __might_sleep+0x1e/0x19b
+[...]
+ [ 1127.445223]  [<ffffffff81757ac5>] call_netdevice_notifiers+0x4a/0x4f
+[...]
+ [ 1127.772188]  [<ffffffff8175e125>] dev_disable_lro+0x32/0x6b
+ [ 1127.885174]  [<ffffffff81872d26>] dev_forward_change+0x30/0xcb
+ [ 1128.013214]  [<ffffffff818738c4>] addrconf_forward_change+0x85/0xc5
+[...]
+
+addrconf_forward_change() uses RCU iteration over the netdev list,
+which is unnecessary since it already holds the RTNL lock.  We also
+cannot reasonably require netdevice notifier functions not to sleep.
+
+Reported-by: Cong Wang <amwang@redhat.com>
+Signed-off-by: Ben Hutchings <bhutchings@solarflare.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/ipv6/addrconf.c |    4 +---
+ 1 file changed, 1 insertion(+), 3 deletions(-)
+
+--- a/net/ipv6/addrconf.c
++++ b/net/ipv6/addrconf.c
+@@ -492,8 +492,7 @@ static void addrconf_forward_change(stru
+       struct net_device *dev;
+       struct inet6_dev *idev;
+-      rcu_read_lock();
+-      for_each_netdev_rcu(net, dev) {
++      for_each_netdev(net, dev) {
+               idev = __in6_dev_get(dev);
+               if (idev) {
+                       int changed = (!idev->cnf.forwarding) ^ (!newf);
+@@ -502,7 +501,6 @@ static void addrconf_forward_change(stru
+                               dev_forward_change(idev);
+               }
+       }
+-      rcu_read_unlock();
+ }
+ static int addrconf_fixup_forwarding(struct ctl_table *table, int *p, int old)
diff --git a/queue-3.0/ipvs-fix-info-leak-in-getsockopt-ip_vs_so_get_timeout.patch b/queue-3.0/ipvs-fix-info-leak-in-getsockopt-ip_vs_so_get_timeout.patch
new file mode 100644 (file)
index 0000000..f7c37ca
--- /dev/null
@@ -0,0 +1,36 @@
+From 65c66eff54c1ddcc661037de47b17118d6141e0b Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:56 +0000
+Subject: ipvs: fix info leak in getsockopt(IP_VS_SO_GET_TIMEOUT)
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit 2d8a041b7bfe1097af21441cb77d6af95f4f4680 ]
+
+If at least one of CONFIG_IP_VS_PROTO_TCP or CONFIG_IP_VS_PROTO_UDP is
+not set, __ip_vs_get_timeouts() does not fully initialize the structure
+that gets copied to userland and therefore leaks up to 12 bytes of kernel
+stack. Add an explicit memset(0) before passing the structure to
+__ip_vs_get_timeouts() to avoid the info leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Cc: Wensong Zhang <wensong@linux-vs.org>
+Cc: Simon Horman <horms@verge.net.au>
+Cc: Julian Anastasov <ja@ssi.bg>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/netfilter/ipvs/ip_vs_ctl.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/netfilter/ipvs/ip_vs_ctl.c
++++ b/net/netfilter/ipvs/ip_vs_ctl.c
+@@ -2675,6 +2675,7 @@ do_ip_vs_get_ctl(struct sock *sk, int cm
+       {
+               struct ip_vs_timeout_user t;
++              memset(&t, 0, sizeof(t));
+               __ip_vs_get_timeouts(net, &t);
+               if (copy_to_user(user, &t, sizeof(t)) != 0)
+                       ret = -EFAULT;
diff --git a/queue-3.0/isdnloop-fix-and-simplify-isdnloop_init.patch b/queue-3.0/isdnloop-fix-and-simplify-isdnloop_init.patch
new file mode 100644 (file)
index 0000000..1de40c6
--- /dev/null
@@ -0,0 +1,60 @@
+From 85c8437c750422264d24b874a6336f315a5aa90e Mon Sep 17 00:00:00 2001
+From: Wu Fengguang <fengguang.wu@intel.com>
+Date: Thu, 2 Aug 2012 23:10:01 +0000
+Subject: isdnloop: fix and simplify isdnloop_init()
+
+
+From: Wu Fengguang <fengguang.wu@intel.com>
+
+[ Upstream commit 77f00f6324cb97cf1df6f9c4aaeea6ada23abdb2 ]
+
+Fix a buffer overflow bug by removing the revision and printk.
+
+[   22.016214] isdnloop-ISDN-driver Rev 1.11.6.7
+[   22.097508] isdnloop: (loop0) virtual card added
+[   22.174400] Kernel panic - not syncing: stack-protector: Kernel stack is corrupted in: ffffffff83244972
+[   22.174400]
+[   22.436157] Pid: 1, comm: swapper Not tainted 3.5.0-bisect-00018-gfa8bbb1-dirty #129
+[   22.624071] Call Trace:
+[   22.720558]  [<ffffffff832448c3>] ? CallcNew+0x56/0x56
+[   22.815248]  [<ffffffff8222b623>] panic+0x110/0x329
+[   22.914330]  [<ffffffff83244972>] ? isdnloop_init+0xaf/0xb1
+[   23.014800]  [<ffffffff832448c3>] ? CallcNew+0x56/0x56
+[   23.090763]  [<ffffffff8108e24b>] __stack_chk_fail+0x2b/0x30
+[   23.185748]  [<ffffffff83244972>] isdnloop_init+0xaf/0xb1
+
+Signed-off-by: Fengguang Wu <fengguang.wu@intel.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/isdn/isdnloop/isdnloop.c |   12 ------------
+ 1 file changed, 12 deletions(-)
+
+--- a/drivers/isdn/isdnloop/isdnloop.c
++++ b/drivers/isdn/isdnloop/isdnloop.c
+@@ -16,7 +16,6 @@
+ #include <linux/sched.h>
+ #include "isdnloop.h"
+-static char *revision = "$Revision: 1.11.6.7 $";
+ static char *isdnloop_id = "loop0";
+ MODULE_DESCRIPTION("ISDN4Linux: Pseudo Driver that simulates an ISDN card");
+@@ -1494,17 +1493,6 @@ isdnloop_addcard(char *id1)
+ static int __init
+ isdnloop_init(void)
+ {
+-      char *p;
+-      char rev[10];
+-
+-      if ((p = strchr(revision, ':'))) {
+-              strcpy(rev, p + 1);
+-              p = strchr(rev, '$');
+-              *p = 0;
+-      } else
+-              strcpy(rev, " ??? ");
+-      printk(KERN_NOTICE "isdnloop-ISDN-driver Rev%s\n", rev);
+-
+       if (isdnloop_id)
+               return (isdnloop_addcard(isdnloop_id));
diff --git a/queue-3.0/l2tp-avoid-to-use-synchronize_rcu-in-tunnel-free-function.patch b/queue-3.0/l2tp-avoid-to-use-synchronize_rcu-in-tunnel-free-function.patch
new file mode 100644 (file)
index 0000000..f4c1c5b
--- /dev/null
@@ -0,0 +1,46 @@
+From 592a4c6134912f90957f7ce2de4223c013b14054 Mon Sep 17 00:00:00 2001
+From: "xeb@mail.ru" <xeb@mail.ru>
+Date: Fri, 24 Aug 2012 01:07:38 +0000
+Subject: l2tp: avoid to use synchronize_rcu in tunnel free function
+
+
+From: "xeb@mail.ru" <xeb@mail.ru>
+
+[ Upstream commit 99469c32f79a32d8481f87be0d3c66dad286f4ec ]
+
+Avoid using synchronize_rcu() in l2tp_tunnel_free() because the context may
+be atomic.
+
+Signed-off-by: Dmitry Kozlov <xeb@mail.ru>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/l2tp/l2tp_core.c |    3 +--
+ net/l2tp/l2tp_core.h |    1 +
+ 2 files changed, 2 insertions(+), 2 deletions(-)
+
+--- a/net/l2tp/l2tp_core.c
++++ b/net/l2tp/l2tp_core.c
+@@ -1252,11 +1252,10 @@ static void l2tp_tunnel_free(struct l2tp
+       /* Remove from tunnel list */
+       spin_lock_bh(&pn->l2tp_tunnel_list_lock);
+       list_del_rcu(&tunnel->list);
++      kfree_rcu(tunnel, rcu);
+       spin_unlock_bh(&pn->l2tp_tunnel_list_lock);
+-      synchronize_rcu();
+       atomic_dec(&l2tp_tunnel_count);
+-      kfree(tunnel);
+ }
+ /* Create a socket for the tunnel, if one isn't set up by
+--- a/net/l2tp/l2tp_core.h
++++ b/net/l2tp/l2tp_core.h
+@@ -157,6 +157,7 @@ struct l2tp_tunnel_cfg {
+ struct l2tp_tunnel {
+       int                     magic;          /* Should be L2TP_TUNNEL_MAGIC */
++      struct rcu_head rcu;
+       rwlock_t                hlist_lock;     /* protect session_hlist */
+       struct hlist_head       session_hlist[L2TP_HASH_SIZE];
+                                               /* hashed list of sessions,
diff --git a/queue-3.0/llc-fix-info-leak-via-getsockname.patch b/queue-3.0/llc-fix-info-leak-via-getsockname.patch
new file mode 100644 (file)
index 0000000..2d9899b
--- /dev/null
@@ -0,0 +1,46 @@
+From 0615de68e439c8b73ce9665558e50c28c4b02224 Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:53 +0000
+Subject: llc: fix info leak via getsockname()
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit 3592aaeb80290bda0f2cf0b5456c97bfc638b192 ]
+
+The LLC code wrongly returns 0, i.e. "success", when the socket is
+zapped. Together with the uninitialized uaddrlen pointer argument from
+sys_getsockname this leads to an arbitrary memory leak of up to 128
+bytes of kernel stack via the getsockname() syscall.
+
+Return an error instead when the socket is zapped to prevent the info
+leak. Also remove the unnecessary memset(0). We don't directly write to
+the memory pointed to by uaddr but memcpy() a local structure at the end of
+the function that is properly initialized.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Cc: Arnaldo Carvalho de Melo <acme@ghostprotocols.net>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/llc/af_llc.c |    3 +--
+ 1 file changed, 1 insertion(+), 2 deletions(-)
+
+--- a/net/llc/af_llc.c
++++ b/net/llc/af_llc.c
+@@ -966,14 +966,13 @@ static int llc_ui_getname(struct socket
+       struct sockaddr_llc sllc;
+       struct sock *sk = sock->sk;
+       struct llc_sock *llc = llc_sk(sk);
+-      int rc = 0;
++      int rc = -EBADF;
+       memset(&sllc, 0, sizeof(sllc));
+       lock_sock(sk);
+       if (sock_flag(sk, SOCK_ZAPPED))
+               goto out;
+       *uaddrlen = sizeof(sllc);
+-      memset(uaddr, 0, *uaddrlen);
+       if (peer) {
+               rc = -ENOTCONN;
+               if (sk->sk_state != TCP_ESTABLISHED)
diff --git a/queue-3.0/net-allow-driver-to-limit-number-of-gso-segments-per-skb.patch b/queue-3.0/net-allow-driver-to-limit-number-of-gso-segments-per-skb.patch
new file mode 100644 (file)
index 0000000..1f68632
--- /dev/null
@@ -0,0 +1,69 @@
+From bada1aad00ffb0c25c5bba14e5d40e8e34e35915 Mon Sep 17 00:00:00 2001
+From: Ben Hutchings <bhutchings@solarflare.com>
+Date: Mon, 30 Jul 2012 15:57:00 +0000
+Subject: net: Allow driver to limit number of GSO segments per skb
+
+
+From: Ben Hutchings <bhutchings@solarflare.com>
+
+[ Upstream commit 30b678d844af3305cda5953467005cebb5d7b687 ]
+
+A peer (or local user) may cause TCP to use a nominal MSS of as little
+as 88 (actual MSS of 76 with timestamps).  Given that we have a
+sufficiently prodigious local sender and the peer ACKs quickly enough,
+it is nevertheless possible to grow the window for such a connection
+to the point that we will try to send just under 64K at once.  This
+results in a single skb that expands to 861 segments.
+
+In some drivers with TSO support, such an skb will require hundreds of
+DMA descriptors; a substantial fraction of a TX ring or even more than
+a full ring.  The TX queue selected for the skb may stall and trigger
+the TX watchdog repeatedly (since the problem skb will be retried
+after the TX reset).  This particularly affects sfc, for which the
+issue is designated as CVE-2012-3412.
+
+Therefore:
+1. Add the field net_device::gso_max_segs holding the device-specific
+   limit.
+2. In netif_skb_features(), if the number of segments is too high then
+   mask out GSO features to force fall back to software GSO.
+
+Signed-off-by: Ben Hutchings <bhutchings@solarflare.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ include/linux/netdevice.h |    2 ++
+ net/core/dev.c            |    4 ++++
+ 2 files changed, 6 insertions(+)
+
+--- a/include/linux/netdevice.h
++++ b/include/linux/netdevice.h
+@@ -1329,6 +1329,8 @@ struct net_device {
+       /* for setting kernel sock attribute on TCP connection setup */
+ #define GSO_MAX_SIZE          65536
+       unsigned int            gso_max_size;
++#define GSO_MAX_SEGS          65535
++      u16                     gso_max_segs;
+ #ifdef CONFIG_DCB
+       /* Data Center Bridging netlink ops */
+--- a/net/core/dev.c
++++ b/net/core/dev.c
+@@ -2050,6 +2050,9 @@ u32 netif_skb_features(struct sk_buff *s
+       __be16 protocol = skb->protocol;
+       u32 features = skb->dev->features;
++      if (skb_shinfo(skb)->gso_segs > skb->dev->gso_max_segs)
++              features &= ~NETIF_F_GSO_MASK;
++
+       if (protocol == htons(ETH_P_8021Q)) {
+               struct vlan_ethhdr *veh = (struct vlan_ethhdr *)skb->data;
+               protocol = veh->h_vlan_encapsulated_proto;
+@@ -5870,6 +5873,7 @@ struct net_device *alloc_netdev_mqs(int
+       dev_net_set(dev, &init_net);
+       dev->gso_max_size = GSO_MAX_SIZE;
++      dev->gso_max_segs = GSO_MAX_SEGS;
+       INIT_LIST_HEAD(&dev->ethtool_ntuple_list.list);
+       dev->ethtool_ntuple_list.count = 0;
diff --git a/queue-3.0/net-core-fix-potential-memory-leak-in-dev_set_alias.patch b/queue-3.0/net-core-fix-potential-memory-leak-in-dev_set_alias.patch
new file mode 100644 (file)
index 0000000..66d089f
--- /dev/null
@@ -0,0 +1,45 @@
+From 373fcfd23b12b5acbe14973c14f8d49922a55611 Mon Sep 17 00:00:00 2001
+From: Alexey Khoroshilov <khoroshilov@ispras.ru>
+Date: Wed, 8 Aug 2012 00:33:25 +0000
+Subject: net/core: Fix potential memory leak in dev_set_alias()
+
+
+From: Alexey Khoroshilov <khoroshilov@ispras.ru>
+
+[ Upstream commit 7364e445f62825758fa61195d237a5b8ecdd06ec ]
+
+Do not leak memory by updating pointer with potentially NULL realloc return value.
+
+Found by Linux Driver Verification project (linuxtesting.org).
+
+Signed-off-by: Alexey Khoroshilov <khoroshilov@ispras.ru>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/core/dev.c |    7 +++++--
+ 1 file changed, 5 insertions(+), 2 deletions(-)
+
+--- a/net/core/dev.c
++++ b/net/core/dev.c
+@@ -1045,6 +1045,8 @@ rollback:
+  */
+ int dev_set_alias(struct net_device *dev, const char *alias, size_t len)
+ {
++      char *new_ifalias;
++
+       ASSERT_RTNL();
+       if (len >= IFALIASZ)
+@@ -1058,9 +1060,10 @@ int dev_set_alias(struct net_device *dev
+               return 0;
+       }
+-      dev->ifalias = krealloc(dev->ifalias, len + 1, GFP_KERNEL);
+-      if (!dev->ifalias)
++      new_ifalias = krealloc(dev->ifalias, len + 1, GFP_KERNEL);
++      if (!new_ifalias)
+               return -ENOMEM;
++      dev->ifalias = new_ifalias;
+       strlcpy(dev->ifalias, alias, len+1);
+       return len;
diff --git a/queue-3.0/net-fix-info-leak-in-compat-dev_ifconf.patch b/queue-3.0/net-fix-info-leak-in-compat-dev_ifconf.patch
new file mode 100644 (file)
index 0000000..5c9ea65
--- /dev/null
@@ -0,0 +1,33 @@
+From 55e3efd6a689c14169fe4d59993f1a6287bebd74 Mon Sep 17 00:00:00 2001
+From: Mathias Krause <minipli@googlemail.com>
+Date: Wed, 15 Aug 2012 11:31:57 +0000
+Subject: net: fix info leak in compat dev_ifconf()
+
+
+From: Mathias Krause <minipli@googlemail.com>
+
+[ Upstream commit 43da5f2e0d0c69ded3d51907d9552310a6b545e8 ]
+
+The implementation of dev_ifconf() for the compat ioctl interface uses
+an intermediate ifc structure allocated in userland for the duration of
+the syscall. However, it fails to initialize the padding bytes inserted
+for alignment and therefore leaks four bytes of kernel stack. Add an
+explicit memset(0) before filling the structure to avoid the info leak.
+
+Signed-off-by: Mathias Krause <minipli@googlemail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/socket.c |    1 +
+ 1 file changed, 1 insertion(+)
+
+--- a/net/socket.c
++++ b/net/socket.c
+@@ -2645,6 +2645,7 @@ static int dev_ifconf(struct net *net, s
+       if (copy_from_user(&ifc32, uifc32, sizeof(struct compat_ifconf)))
+               return -EFAULT;
++      memset(&ifc, 0, sizeof(ifc));
+       if (ifc32.ifcbuf == 0) {
+               ifc32.ifc_len = 0;
+               ifc.ifc_len = 0;
diff --git a/queue-3.0/net-ipv4-ipmr_expire_timer-causes-crash-when-removing-net-namespace.patch b/queue-3.0/net-ipv4-ipmr_expire_timer-causes-crash-when-removing-net-namespace.patch
new file mode 100644 (file)
index 0000000..1cf873e
--- /dev/null
@@ -0,0 +1,84 @@
+From 26b869b60755a4c9b25175808ba8fe983388ea4c Mon Sep 17 00:00:00 2001
+From: Francesco Ruggeri <fruggeri@aristanetworks.com>
+Date: Fri, 24 Aug 2012 07:38:35 +0000
+Subject: net: ipv4: ipmr_expire_timer causes crash when removing net namespace
+
+
+From: Francesco Ruggeri <fruggeri@aristanetworks.com>
+
+[ Upstream commit acbb219d5f53821b2d0080d047800410c0420ea1 ]
+
+When tearing down a net namespace, ipv4 mr_table structures are freed
+without first deactivating their timers. This can result in a crash in
+run_timer_softirq.
+This patch mimics the corresponding behaviour in ipv6.
+Locking and synchronization seem to be adequate.
+We are about to kfree mrt, so existing code should already make sure that
+no other references to mrt are pending or can be created by incoming traffic.
+The functions invoked here do not cause new references to mrt or other
+race conditions to be created.
+Invoking del_timer_sync guarantees that ipmr_expire_timer is inactive.
+Both ipmr_expire_process (whose completion we may have to wait for in
+del_timer_sync) and mroute_clean_tables internally use mfc_unres_lock
+or other synchronizations when needed, and they both only modify mrt.
+
+Tested in Linux 3.4.8.
+
+Signed-off-by: Francesco Ruggeri <fruggeri@aristanetworks.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/ipv4/ipmr.c |   14 ++++++++++++--
+ 1 file changed, 12 insertions(+), 2 deletions(-)
+
+--- a/net/ipv4/ipmr.c
++++ b/net/ipv4/ipmr.c
+@@ -124,6 +124,8 @@ static DEFINE_SPINLOCK(mfc_unres_lock);
+ static struct kmem_cache *mrt_cachep __read_mostly;
+ static struct mr_table *ipmr_new_table(struct net *net, u32 id);
++static void ipmr_free_table(struct mr_table *mrt);
++
+ static int ip_mr_forward(struct net *net, struct mr_table *mrt,
+                        struct sk_buff *skb, struct mfc_cache *cache,
+                        int local);
+@@ -131,6 +133,7 @@ static int ipmr_cache_report(struct mr_t
+                            struct sk_buff *pkt, vifi_t vifi, int assert);
+ static int __ipmr_fill_mroute(struct mr_table *mrt, struct sk_buff *skb,
+                             struct mfc_cache *c, struct rtmsg *rtm);
++static void mroute_clean_tables(struct mr_table *mrt);
+ static void ipmr_expire_process(unsigned long arg);
+ #ifdef CONFIG_IP_MROUTE_MULTIPLE_TABLES
+@@ -271,7 +274,7 @@ static void __net_exit ipmr_rules_exit(s
+       list_for_each_entry_safe(mrt, next, &net->ipv4.mr_tables, list) {
+               list_del(&mrt->list);
+-              kfree(mrt);
++              ipmr_free_table(mrt);
+       }
+       fib_rules_unregister(net->ipv4.mr_rules_ops);
+ }
+@@ -299,7 +302,7 @@ static int __net_init ipmr_rules_init(st
+ static void __net_exit ipmr_rules_exit(struct net *net)
+ {
+-      kfree(net->ipv4.mrt);
++      ipmr_free_table(net->ipv4.mrt);
+ }
+ #endif
+@@ -336,6 +339,13 @@ static struct mr_table *ipmr_new_table(s
+       return mrt;
+ }
++static void ipmr_free_table(struct mr_table *mrt)
++{
++      del_timer_sync(&mrt->ipmr_expire_timer);
++      mroute_clean_tables(mrt);
++      kfree(mrt);
++}
++
+ /* Service routines creating virtual interfaces: DVMRP tunnels and PIMREG */
+ static void ipmr_del_tunnel(struct net_device *dev, struct vifctl *v)
diff --git a/queue-3.0/net_sched-gact-fix-potential-panic-in-tcf_gact.patch b/queue-3.0/net_sched-gact-fix-potential-panic-in-tcf_gact.patch
new file mode 100644 (file)
index 0000000..846bd7d
--- /dev/null
@@ -0,0 +1,68 @@
+From 620b32f84744b22e857a827f758814f40a458bf7 Mon Sep 17 00:00:00 2001
+From: Hiroaki SHIMODA <shimoda.hiroaki@gmail.com>
+Date: Fri, 3 Aug 2012 19:57:52 +0900
+Subject: net_sched: gact: Fix potential panic in tcf_gact().
+
+
+From: Hiroaki SHIMODA <shimoda.hiroaki@gmail.com>
+
+[ Upstream commit 696ecdc10622d86541f2e35cc16e15b6b3b1b67e ]
+
+The gact_rand array is indexed by gact->tcfg_ptype, whose value
+is assumed to be less than MAX_RAND, but no range check is
+performed.
+
+So add a check in tcf_gact_init(). And in tcf_gact(), we can
+reduce a branch.
+
+Signed-off-by: Hiroaki SHIMODA <shimoda.hiroaki@gmail.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/sched/act_gact.c |   14 +++++++++++---
+ 1 file changed, 11 insertions(+), 3 deletions(-)
+
+--- a/net/sched/act_gact.c
++++ b/net/sched/act_gact.c
+@@ -67,6 +67,9 @@ static int tcf_gact_init(struct nlattr *
+       struct tcf_common *pc;
+       int ret = 0;
+       int err;
++#ifdef CONFIG_GACT_PROB
++      struct tc_gact_p *p_parm = NULL;
++#endif
+       if (nla == NULL)
+               return -EINVAL;
+@@ -82,6 +85,12 @@ static int tcf_gact_init(struct nlattr *
+ #ifndef CONFIG_GACT_PROB
+       if (tb[TCA_GACT_PROB] != NULL)
+               return -EOPNOTSUPP;
++#else
++      if (tb[TCA_GACT_PROB]) {
++              p_parm = nla_data(tb[TCA_GACT_PROB]);
++              if (p_parm->ptype >= MAX_RAND)
++                      return -EINVAL;
++      }
+ #endif
+       pc = tcf_hash_check(parm->index, a, bind, &gact_hash_info);
+@@ -103,8 +112,7 @@ static int tcf_gact_init(struct nlattr *
+       spin_lock_bh(&gact->tcf_lock);
+       gact->tcf_action = parm->action;
+ #ifdef CONFIG_GACT_PROB
+-      if (tb[TCA_GACT_PROB] != NULL) {
+-              struct tc_gact_p *p_parm = nla_data(tb[TCA_GACT_PROB]);
++      if (p_parm) {
+               gact->tcfg_paction = p_parm->paction;
+               gact->tcfg_pval    = p_parm->pval;
+               gact->tcfg_ptype   = p_parm->ptype;
+@@ -132,7 +140,7 @@ static int tcf_gact(struct sk_buff *skb,
+       spin_lock(&gact->tcf_lock);
+ #ifdef CONFIG_GACT_PROB
+-      if (gact->tcfg_ptype && gact_rand[gact->tcfg_ptype] != NULL)
++      if (gact->tcfg_ptype)
+               action = gact_rand[gact->tcfg_ptype](gact);
+       else
+               action = gact->tcf_action;
diff --git a/queue-3.0/netlink-fix-possible-spoofing-from-non-root-processes.patch b/queue-3.0/netlink-fix-possible-spoofing-from-non-root-processes.patch
new file mode 100644 (file)
index 0000000..47aa9dd
--- /dev/null
@@ -0,0 +1,74 @@
+From 66f43e643dc3e35b1895d6d13eca8c2c4ec9f52a Mon Sep 17 00:00:00 2001
+From: Pablo Neira Ayuso <pablo@netfilter.org>
+Date: Thu, 23 Aug 2012 02:09:11 +0000
+Subject: netlink: fix possible spoofing from non-root processes
+
+
+From: Pablo Neira Ayuso <pablo@netfilter.org>
+
+[ Upstream commit 20e1db19db5d6b9e4e83021595eab0dc8f107bef ]
+
+Non-root user-space processes can send Netlink messages to other
+processes that are well-known for being subscribed to Netlink
+asynchronous notifications. This allows an illegitimate non-root
+process to send forged messages to Netlink subscribers.
+
+The userspace process usually verifies the legitimate origin in
+two ways:
+
+a) Socket credentials. If UID != 0, then the message comes from
+   some illegitimate process and the message needs to be dropped.
+
+b) Netlink portID. In general, portID == 0 means that the origin
+   of the messages comes from the kernel. Thus, discarding any
+   message not coming from the kernel.
+
+However, ctnetlink sets the portID in event messages that have
+been triggered by some user-space process, e.g. the conntrack utility.
+So other processes subscribed to ctnetlink events, e.g. conntrackd,
+know that the event was triggered by some user-space action.
+
+Neither of the two ways to discard illegitimate messages coming
+from non-root processes can help for ctnetlink.
+
+This patch adds capability validation in case that dst_pid is set
+in netlink_sendmsg(). This approach is aggressive since existing
+applications using any Netlink bus to deliver messages between
+two user-space processes will break. Note that the exception is
+NETLINK_USERSOCK, since it is reserved for netlink-to-netlink
+userspace communication.
+
+Still, if anyone wants their Netlink bus to allow netlink-to-netlink
+userspace communication, they can set NL_NONROOT_SEND. However, by
+default, I don't think it makes sense to allow NETLINK_ROUTE to be used
+for communication between two processes exchanging arbitrary information
+that is not related to link/neighbouring/routing. They should be using
+NETLINK_USERSOCK instead for that.
+
+Signed-off-by: Pablo Neira Ayuso <pablo@netfilter.org>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ net/netlink/af_netlink.c |    4 +++-
+ 1 file changed, 3 insertions(+), 1 deletion(-)
+
+--- a/net/netlink/af_netlink.c
++++ b/net/netlink/af_netlink.c
+@@ -1345,7 +1345,8 @@ static int netlink_sendmsg(struct kiocb
+               dst_pid = addr->nl_pid;
+               dst_group = ffs(addr->nl_groups);
+               err =  -EPERM;
+-              if (dst_group && !netlink_capable(sock, NL_NONROOT_SEND))
++              if ((dst_group || dst_pid) &&
++                  !netlink_capable(sock, NL_NONROOT_SEND))
+                       goto out;
+       } else {
+               dst_pid = nlk->dst_pid;
+@@ -2098,6 +2099,7 @@ static void __init netlink_add_usersock_
+       rcu_assign_pointer(nl_table[NETLINK_USERSOCK].listeners, listeners);
+       nl_table[NETLINK_USERSOCK].module = THIS_MODULE;
+       nl_table[NETLINK_USERSOCK].registered = 1;
++      nl_table[NETLINK_USERSOCK].nl_nonroot = NL_NONROOT_SEND;
+       netlink_table_ungrab();
+ }
diff --git a/queue-3.0/series b/queue-3.0/series
new file mode 100644 (file)
index 0000000..90fba4c
--- /dev/null
@@ -0,0 +1,23 @@
+net-allow-driver-to-limit-number-of-gso-segments-per-skb.patch
+sfc-fix-maximum-number-of-tso-segments-and-minimum-tx-queue-size.patch
+tcp-apply-device-tso-segment-limit-earlier.patch
+net_sched-gact-fix-potential-panic-in-tcf_gact.patch
+isdnloop-fix-and-simplify-isdnloop_init.patch
+net-core-fix-potential-memory-leak-in-dev_set_alias.patch
+af_packet-remove-bug-statement-in-tpacket_destruct_skb.patch
+ipv6-addrconf-avoid-calling-netdevice-notifiers-with-rcu-read-side-lock.patch
+atm-fix-info-leak-in-getsockopt-so_atmpvc.patch
+atm-fix-info-leak-via-getsockname.patch
+bluetooth-hci-fix-info-leak-in-getsockopt-hci_filter.patch
+bluetooth-hci-fix-info-leak-via-getsockname.patch
+bluetooth-rfcomm-fix-info-leak-in-getsockopt-bt_security.patch
+bluetooth-rfcomm-fix-info-leak-in-ioctl-rfcommgetdevlist.patch
+bluetooth-rfcomm-fix-info-leak-via-getsockname.patch
+bluetooth-l2cap-fix-info-leak-via-getsockname.patch
+llc-fix-info-leak-via-getsockname.patch
+dccp-fix-info-leak-via-getsockopt-dccp_sockopt_ccid_tx_info.patch
+ipvs-fix-info-leak-in-getsockopt-ip_vs_so_get_timeout.patch
+net-fix-info-leak-in-compat-dev_ifconf.patch
+netlink-fix-possible-spoofing-from-non-root-processes.patch
+l2tp-avoid-to-use-synchronize_rcu-in-tunnel-free-function.patch
+net-ipv4-ipmr_expire_timer-causes-crash-when-removing-net-namespace.patch
diff --git a/queue-3.0/sfc-fix-maximum-number-of-tso-segments-and-minimum-tx-queue-size.patch b/queue-3.0/sfc-fix-maximum-number-of-tso-segments-and-minimum-tx-queue-size.patch
new file mode 100644 (file)
index 0000000..869e882
--- /dev/null
@@ -0,0 +1,165 @@
+From 374fddbf0d6e4b4c8b7863052faf8d02337c9947 Mon Sep 17 00:00:00 2001
+From: Ben Hutchings <bhutchings@solarflare.com>
+Date: Mon, 30 Jul 2012 15:57:44 +0000
+Subject: sfc: Fix maximum number of TSO segments and minimum TX queue size
+
+
+From: Ben Hutchings <bhutchings@solarflare.com>
+
+[ Upstream commit 7e6d06f0de3f74ca929441add094518ae332257c ]
+
+Currently an skb requiring TSO may not fit within a minimum-size TX
+queue.  The TX queue selected for the skb may stall and trigger the TX
+watchdog repeatedly (since the problem skb will be retried after the
+TX reset).  This issue is designated as CVE-2012-3412.
+
+Set the maximum number of TSO segments for our devices to 100.  This
+should make no difference to behaviour unless the actual MSS is less
+than about 700.  Increase the minimum TX queue size accordingly to
+allow for 2 worst-case skbs, so that there will definitely be space
+to add an skb after we wake a queue.
+
+To avoid invalidating existing configurations, change
+efx_ethtool_set_ringparam() to fix up values that are too small rather
+than returning -EINVAL.
+
+Signed-off-by: Ben Hutchings <bhutchings@solarflare.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ drivers/net/sfc/efx.c     |    6 ++++++
+ drivers/net/sfc/efx.h     |   14 ++++++++++----
+ drivers/net/sfc/ethtool.c |   16 +++++++++++-----
+ drivers/net/sfc/nic.h     |    5 +++++
+ drivers/net/sfc/tx.c      |   19 +++++++++++++++++++
+ 5 files changed, 51 insertions(+), 9 deletions(-)
+
+--- a/drivers/net/sfc/efx.c
++++ b/drivers/net/sfc/efx.c
+@@ -1383,6 +1383,11 @@ static int efx_probe_all(struct efx_nic
+               goto fail2;
+       }
++      BUILD_BUG_ON(EFX_DEFAULT_DMAQ_SIZE < EFX_RXQ_MIN_ENT);
++      if (WARN_ON(EFX_DEFAULT_DMAQ_SIZE < EFX_TXQ_MIN_ENT(efx))) {
++              rc = -EINVAL;
++              goto fail3;
++      }
+       efx->rxq_entries = efx->txq_entries = EFX_DEFAULT_DMAQ_SIZE;
+       rc = efx_probe_channels(efx);
+       if (rc)
+@@ -1942,6 +1947,7 @@ static int efx_register_netdev(struct ef
+       net_dev->irq = efx->pci_dev->irq;
+       net_dev->netdev_ops = &efx_netdev_ops;
+       SET_ETHTOOL_OPS(net_dev, &efx_ethtool_ops);
++      net_dev->gso_max_segs = EFX_TSO_MAX_SEGS;
+       /* Clear MAC statistics */
+       efx->mac_op->update_stats(efx);
+--- a/drivers/net/sfc/efx.h
++++ b/drivers/net/sfc/efx.h
+@@ -38,6 +38,7 @@ extern netdev_tx_t
+ efx_enqueue_skb(struct efx_tx_queue *tx_queue, struct sk_buff *skb);
+ extern void efx_xmit_done(struct efx_tx_queue *tx_queue, unsigned int index);
+ extern int efx_setup_tc(struct net_device *net_dev, u8 num_tc);
++extern unsigned int efx_tx_max_skb_descs(struct efx_nic *efx);
+ /* RX */
+ extern int efx_probe_rx_queue(struct efx_rx_queue *rx_queue);
+@@ -60,10 +61,15 @@ extern void efx_schedule_slow_fill(struc
+ #define EFX_MAX_EVQ_SIZE 16384UL
+ #define EFX_MIN_EVQ_SIZE 512UL
+-/* The smallest [rt]xq_entries that the driver supports. Callers of
+- * efx_wake_queue() assume that they can subsequently send at least one
+- * skb. Falcon/A1 may require up to three descriptors per skb_frag. */
+-#define EFX_MIN_RING_SIZE (roundup_pow_of_two(2 * 3 * MAX_SKB_FRAGS))
++/* Maximum number of TCP segments we support for soft-TSO */
++#define EFX_TSO_MAX_SEGS      100
++
++/* The smallest [rt]xq_entries that the driver supports.  RX minimum
++ * is a bit arbitrary.  For TX, we must have space for at least 2
++ * TSO skbs.
++ */
++#define EFX_RXQ_MIN_ENT               128U
++#define EFX_TXQ_MIN_ENT(efx)  (2 * efx_tx_max_skb_descs(efx))
+ /* Filters */
+ extern int efx_probe_filters(struct efx_nic *efx);
+--- a/drivers/net/sfc/ethtool.c
++++ b/drivers/net/sfc/ethtool.c
+@@ -677,21 +677,27 @@ static int efx_ethtool_set_ringparam(str
+                                    struct ethtool_ringparam *ring)
+ {
+       struct efx_nic *efx = netdev_priv(net_dev);
++      u32 txq_entries;
+       if (ring->rx_mini_pending || ring->rx_jumbo_pending ||
+           ring->rx_pending > EFX_MAX_DMAQ_SIZE ||
+           ring->tx_pending > EFX_MAX_DMAQ_SIZE)
+               return -EINVAL;
+-      if (ring->rx_pending < EFX_MIN_RING_SIZE ||
+-          ring->tx_pending < EFX_MIN_RING_SIZE) {
++      if (ring->rx_pending < EFX_RXQ_MIN_ENT) {
+               netif_err(efx, drv, efx->net_dev,
+-                        "TX and RX queues cannot be smaller than %ld\n",
+-                        EFX_MIN_RING_SIZE);
++                        "RX queues cannot be smaller than %u\n",
++                        EFX_RXQ_MIN_ENT);
+               return -EINVAL;
+       }
+-      return efx_realloc_channels(efx, ring->rx_pending, ring->tx_pending);
++      txq_entries = max(ring->tx_pending, EFX_TXQ_MIN_ENT(efx));
++      if (txq_entries != ring->tx_pending)
++              netif_warn(efx, drv, efx->net_dev,
++                         "increasing TX queue size to minimum of %u\n",
++                         txq_entries);
++
++      return efx_realloc_channels(efx, ring->rx_pending, txq_entries);
+ }
+ static int efx_ethtool_set_pauseparam(struct net_device *net_dev,
+--- a/drivers/net/sfc/nic.h
++++ b/drivers/net/sfc/nic.h
+@@ -65,6 +65,11 @@ enum {
+ #define FALCON_GMAC_LOOPBACKS                 \
+       (1 << LOOPBACK_GMAC)
++/* Alignment of PCIe DMA boundaries (4KB) */
++#define EFX_PAGE_SIZE 4096
++/* Size and alignment of buffer table entries (same) */
++#define EFX_BUF_SIZE  EFX_PAGE_SIZE
++
+ /**
+  * struct falcon_board_type - board operations and type information
+  * @id: Board type id, as found in NVRAM
+--- a/drivers/net/sfc/tx.c
++++ b/drivers/net/sfc/tx.c
+@@ -115,6 +115,25 @@ efx_max_tx_len(struct efx_nic *efx, dma_
+       return len;
+ }
++unsigned int efx_tx_max_skb_descs(struct efx_nic *efx)
++{
++      /* Header and payload descriptor for each output segment, plus
++       * one for every input fragment boundary within a segment
++       */
++      unsigned int max_descs = EFX_TSO_MAX_SEGS * 2 + MAX_SKB_FRAGS;
++
++      /* Possibly one more per segment for the alignment workaround */
++      if (EFX_WORKAROUND_5391(efx))
++              max_descs += EFX_TSO_MAX_SEGS;
++
++      /* Possibly more for PCIe page boundaries within input fragments */
++      if (PAGE_SIZE > EFX_PAGE_SIZE)
++              max_descs += max_t(unsigned int, MAX_SKB_FRAGS,
++                                 DIV_ROUND_UP(GSO_MAX_SIZE, EFX_PAGE_SIZE));
++
++      return max_descs;
++}
++
+ /*
+  * Add a socket buffer to a TX queue
+  *
diff --git a/queue-3.0/tcp-apply-device-tso-segment-limit-earlier.patch b/queue-3.0/tcp-apply-device-tso-segment-limit-earlier.patch
new file mode 100644 (file)
index 0000000..2488e9a
--- /dev/null
@@ -0,0 +1,130 @@
+From 07f3d99da23489cb5315774d29ddd1ea885ad64f Mon Sep 17 00:00:00 2001
+From: Ben Hutchings <bhutchings@solarflare.com>
+Date: Mon, 30 Jul 2012 16:11:42 +0000
+Subject: tcp: Apply device TSO segment limit earlier
+
+
+From: Ben Hutchings <bhutchings@solarflare.com>
+
+[ Upstream commit 1485348d2424e1131ea42efc033cbd9366462b01 ]
+
+Cache the device gso_max_segs in sock::sk_gso_max_segs and use it to
+limit the size of TSO skbs.  This avoids the need to fall back to
+software GSO for local TCP senders.
+
+Signed-off-by: Ben Hutchings <bhutchings@solarflare.com>
+Signed-off-by: David S. Miller <davem@davemloft.net>
+Signed-off-by: Greg Kroah-Hartman <gregkh@linuxfoundation.org>
+---
+ include/net/sock.h    |    2 ++
+ net/core/sock.c       |    1 +
+ net/ipv4/tcp.c        |    4 +++-
+ net/ipv4/tcp_cong.c   |    3 ++-
+ net/ipv4/tcp_output.c |   21 ++++++++++++---------
+ 5 files changed, 20 insertions(+), 11 deletions(-)
+
+--- a/include/net/sock.h
++++ b/include/net/sock.h
+@@ -194,6 +194,7 @@ struct sock_common {
+   *   @sk_route_nocaps: forbidden route capabilities (e.g NETIF_F_GSO_MASK)
+   *   @sk_gso_type: GSO type (e.g. %SKB_GSO_TCPV4)
+   *   @sk_gso_max_size: Maximum GSO segment size to build
++  *   @sk_gso_max_segs: Maximum number of GSO segments
+   *   @sk_lingertime: %SO_LINGER l_linger setting
+   *   @sk_backlog: always used with the per-socket spinlock held
+   *   @sk_callback_lock: used with the callbacks in the end of this struct
+@@ -310,6 +311,7 @@ struct sock {
+       int                     sk_route_nocaps;
+       int                     sk_gso_type;
+       unsigned int            sk_gso_max_size;
++      u16                     sk_gso_max_segs;
+       int                     sk_rcvlowat;
+       unsigned long           sk_lingertime;
+       struct sk_buff_head     sk_error_queue;
+--- a/net/core/sock.c
++++ b/net/core/sock.c
+@@ -1312,6 +1312,7 @@ void sk_setup_caps(struct sock *sk, stru
+               } else {
+                       sk->sk_route_caps |= NETIF_F_SG | NETIF_F_HW_CSUM;
+                       sk->sk_gso_max_size = dst->dev->gso_max_size;
++                      sk->sk_gso_max_segs = dst->dev->gso_max_segs;
+               }
+       }
+ }
+--- a/net/ipv4/tcp.c
++++ b/net/ipv4/tcp.c
+@@ -739,7 +739,9 @@ static unsigned int tcp_xmit_size_goal(s
+                          old_size_goal + mss_now > xmit_size_goal)) {
+                       xmit_size_goal = old_size_goal;
+               } else {
+-                      tp->xmit_size_goal_segs = xmit_size_goal / mss_now;
++                      tp->xmit_size_goal_segs =
++                              min_t(u16, xmit_size_goal / mss_now,
++                                    sk->sk_gso_max_segs);
+                       xmit_size_goal = tp->xmit_size_goal_segs * mss_now;
+               }
+       }
+--- a/net/ipv4/tcp_cong.c
++++ b/net/ipv4/tcp_cong.c
+@@ -290,7 +290,8 @@ int tcp_is_cwnd_limited(const struct soc
+       left = tp->snd_cwnd - in_flight;
+       if (sk_can_gso(sk) &&
+           left * sysctl_tcp_tso_win_divisor < tp->snd_cwnd &&
+-          left * tp->mss_cache < sk->sk_gso_max_size)
++          left * tp->mss_cache < sk->sk_gso_max_size &&
++          left < sk->sk_gso_max_segs)
+               return 1;
+       return left <= tcp_max_burst(tp);
+ }
+--- a/net/ipv4/tcp_output.c
++++ b/net/ipv4/tcp_output.c
+@@ -1310,21 +1310,21 @@ static void tcp_cwnd_validate(struct soc
+  * when we would be allowed to send the split-due-to-Nagle skb fully.
+  */
+ static unsigned int tcp_mss_split_point(struct sock *sk, struct sk_buff *skb,
+-                                      unsigned int mss_now, unsigned int cwnd)
++                                      unsigned int mss_now, unsigned int max_segs)
+ {
+       struct tcp_sock *tp = tcp_sk(sk);
+-      u32 needed, window, cwnd_len;
++      u32 needed, window, max_len;
+       window = tcp_wnd_end(tp) - TCP_SKB_CB(skb)->seq;
+-      cwnd_len = mss_now * cwnd;
++      max_len = mss_now * max_segs;
+-      if (likely(cwnd_len <= window && skb != tcp_write_queue_tail(sk)))
+-              return cwnd_len;
++      if (likely(max_len <= window && skb != tcp_write_queue_tail(sk)))
++              return max_len;
+       needed = min(skb->len, window);
+-      if (cwnd_len <= needed)
+-              return cwnd_len;
++      if (max_len <= needed)
++              return max_len;
+       return needed - needed % mss_now;
+ }
+@@ -1551,7 +1551,8 @@ static int tcp_tso_should_defer(struct s
+       limit = min(send_win, cong_win);
+       /* If a full-sized TSO skb can be sent, do it. */
+-      if (limit >= sk->sk_gso_max_size)
++      if (limit >= min_t(unsigned int, sk->sk_gso_max_size,
++                         sk->sk_gso_max_segs * tp->mss_cache))
+               goto send_now;
+       /* Middle in queue won't get any more data, full sendable already? */
+@@ -1777,7 +1778,9 @@ static int tcp_write_xmit(struct sock *s
+               limit = mss_now;
+               if (tso_segs > 1 && !tcp_urg_mode(tp))
+                       limit = tcp_mss_split_point(sk, skb, mss_now,
+-                                                  cwnd_quota);
++                                                  min_t(unsigned int,
++                                                        cwnd_quota,
++                                                        sk->sk_gso_max_segs));
+               if (skb->len > limit &&
+                   unlikely(tso_fragment(sk, skb, limit, mss_now, gfp)))