--- /dev/null
+Subject: cxgb3 - manage private iSCSI IP addresses
+From: Karen Xie <kxie@chelsio.com>
+References: FATE#304154,bnc#433500
+
+The accelerated iSCSI traffic uses a private IP address unknown to the OS.
+Create a per port sysfs entry to pass an IP address to the NIC driver,
+and a control call for the iSCSI driver to grab it.
+The IP address is required in both drivers to manage ARP requests and connection set up.
+
+Signed-off-by: Karen Xie <kxie@chelsio.com>
+Signed-off-by: Chandra Seetharaman <sekharan@us.ibm.com>
+Signed-off-by: Hannes Reinecke <hare@suse.de>
+
+---
+---
+ drivers/net/cxgb3/adapter.h | 1
+ drivers/net/cxgb3/cxgb3_ctl_defs.h | 9 ++++
+ drivers/net/cxgb3/cxgb3_main.c | 46 +++++++++++++++++++++++++
+ drivers/net/cxgb3/cxgb3_offload.c | 45 +++++++++++++++++-------
+ drivers/net/cxgb3/sge.c | 68 ++++++++++++++++++++++++++++++++++---
+ 5 files changed, 152 insertions(+), 17 deletions(-)
+
+--- a/drivers/net/cxgb3/adapter.h
++++ b/drivers/net/cxgb3/adapter.h
+@@ -64,6 +64,7 @@ struct port_info {
+ struct link_config link_config;
+ struct net_device_stats netstats;
+ int activity;
++ __be32 iscsi_ipv4addr;
+ };
+
+ enum { /* adapter flags */
+--- a/drivers/net/cxgb3/cxgb3_ctl_defs.h
++++ b/drivers/net/cxgb3/cxgb3_ctl_defs.h
+@@ -57,6 +57,9 @@ enum {
+ RDMA_GET_MIB = 19,
+
+ GET_RX_PAGE_INFO = 50,
++
++ GET_ISCSI_IPV4ADDR = 51,
++ SET_ISCSI_IPV4ADDR = 52,
+ };
+
+ /*
+@@ -86,6 +89,12 @@ struct iff_mac {
+ u16 vlan_tag;
+ };
+
++/* Structure used to request a port's iSCSI IPv4 address */
++struct iscsi_ipv4addr {
++ struct net_device *dev; /* the net_device */
++ __be32 ipv4addr; /* the return iSCSI IPv4 address */
++};
++
+ struct pci_dev;
+
+ /*
+--- a/drivers/net/cxgb3/cxgb3_main.c
++++ b/drivers/net/cxgb3/cxgb3_main.c
+@@ -44,6 +44,7 @@
+ #include <linux/rtnetlink.h>
+ #include <linux/firmware.h>
+ #include <linux/log2.h>
++#include <linux/inet.h>
+ #include <asm/uaccess.h>
+
+ #include "common.h"
+@@ -688,6 +689,47 @@ static struct attribute *offload_attrs[]
+
+ static struct attribute_group offload_attr_group = {.attrs = offload_attrs };
+
++static ssize_t iscsi_ipv4addr_attr_show(struct device *d, char *buf)
++{
++ struct port_info *pi = netdev_priv(to_net_dev(d));
++
++ __be32 a = pi->iscsi_ipv4addr;
++ return sprintf(buf, NIPQUAD_FMT "\n", NIPQUAD(a));
++}
++
++static ssize_t iscsi_ipv4addr_attr_store(struct device *d,
++ const char *buf, size_t len)
++{
++ struct port_info *pi = netdev_priv(to_net_dev(d));
++
++ pi->iscsi_ipv4addr = in_aton(buf);
++ return len;
++}
++
++#define ISCSI_IPADDR_ATTR(name) \
++static ssize_t show_##name(struct device *d, struct device_attribute *attr, \
++ char *buf) \
++{ \
++ return iscsi_ipv4addr_attr_show(d, buf); \
++} \
++static ssize_t store_##name(struct device *d, struct device_attribute *attr, \
++ const char *buf, size_t len) \
++{ \
++ return iscsi_ipv4addr_attr_store(d, buf, len); \
++} \
++static DEVICE_ATTR(name, S_IRUGO | S_IWUSR, show_##name, store_##name)
++
++ISCSI_IPADDR_ATTR(iscsi_ipv4addr);
++
++static struct attribute *iscsi_offload_attrs[] = {
++ &dev_attr_iscsi_ipv4addr.attr,
++ NULL
++};
++
++static struct attribute_group iscsi_offload_attr_group = {
++ .attrs = iscsi_offload_attrs
++};
++
+ /*
+ * Sends an sk_buff to an offload queue driver
+ * after dealing with any active network taps.
+@@ -1079,6 +1121,7 @@ static int cxgb_open(struct net_device *
+ if (err)
+ printk(KERN_WARNING
+ "Could not initialize offload capabilities\n");
++ sysfs_create_group(&dev->dev.kobj, &iscsi_offload_attr_group);
+ }
+
+ link_start(dev);
+@@ -1101,6 +1144,9 @@ static int cxgb_close(struct net_device
+ netif_carrier_off(dev);
+ t3_mac_disable(&pi->mac, MAC_DIRECTION_TX | MAC_DIRECTION_RX);
+
++ if (is_offload(adapter) && !ofld_disable)
++ sysfs_remove_group(&dev->dev.kobj, &iscsi_offload_attr_group);
++
+ spin_lock(&adapter->work_lock); /* sync with update task */
+ clear_bit(pi->port_id, &adapter->open_device_map);
+ spin_unlock(&adapter->work_lock);
+--- a/drivers/net/cxgb3/cxgb3_offload.c
++++ b/drivers/net/cxgb3/cxgb3_offload.c
+@@ -182,7 +182,9 @@ static struct net_device *get_iff_from_m
+ static int cxgb_ulp_iscsi_ctl(struct adapter *adapter, unsigned int req,
+ void *data)
+ {
++ int i;
+ int ret = 0;
++ unsigned int val = 0;
+ struct ulp_iscsi_info *uiip = data;
+
+ switch (req) {
+@@ -191,31 +193,36 @@ static int cxgb_ulp_iscsi_ctl(struct ada
+ uiip->llimit = t3_read_reg(adapter, A_ULPRX_ISCSI_LLIMIT);
+ uiip->ulimit = t3_read_reg(adapter, A_ULPRX_ISCSI_ULIMIT);
+ uiip->tagmask = t3_read_reg(adapter, A_ULPRX_ISCSI_TAGMASK);
++ val = t3_read_reg(adapter, A_ULPRX_ISCSI_PSZ);
++ for (i = 0; i < 4; i++, val >>= 8)
++ uiip->pgsz_factor[i] = val & 0xFF;
+ /*
+ * On tx, the iscsi pdu has to be <= tx page size and has to
+ * fit into the Tx PM FIFO.
+ */
+ uiip->max_txsz = min(adapter->params.tp.tx_pg_size,
+ t3_read_reg(adapter, A_PM1_TX_CFG) >> 17);
+- /* on rx, the iscsi pdu has to be < rx page size and the
+- whole pdu + cpl headers has to fit into one sge buffer */
+- uiip->max_rxsz = min_t(unsigned int,
+- adapter->params.tp.rx_pg_size,
+- (adapter->sge.qs[0].fl[1].buf_size -
+- sizeof(struct cpl_rx_data) * 2 -
+- sizeof(struct cpl_rx_data_ddp)));
++ /*
++ * on rx, the iscsi pdu has to be < rx page size and the
++ * the max rx data length programmed in TP
++ */
++ uiip->max_rxsz = min(adapter->params.tp.rx_pg_size,
++ ((t3_read_reg(adapter, A_TP_PARA_REG2))
++ >> S_MAXRXDATA) & M_MAXRXDATA);
+ break;
+ case ULP_ISCSI_SET_PARAMS:
+ t3_write_reg(adapter, A_ULPRX_ISCSI_TAGMASK, uiip->tagmask);
+ /* set MaxRxData and MaxCoalesceSize to 16224 */
+ t3_write_reg(adapter, A_TP_PARA_REG2, 0x3f603f60);
+ /* program the ddp page sizes */
+- {
+- int i;
+- unsigned int val = 0;
+- for (i = 0; i < 4; i++)
+- val |= (uiip->pgsz_factor[i] & 0xF) << (8 * i);
+- if (val)
++ for (val = 0, i = 0; i < 4; i++)
++ val |= (uiip->pgsz_factor[i] & 0xF) << (8 * i);
++ if (val && (val != t3_read_reg(adapter, A_ULPRX_ISCSI_PSZ))) {
++ printk(KERN_INFO
++ "%s, setting iscsi pgsz 0x%x, %u,%u,%u,%u.\n",
++ adapter->name, val, uiip->pgsz_factor[0],
++ uiip->pgsz_factor[1], uiip->pgsz_factor[2],
++ uiip->pgsz_factor[3]);
+ t3_write_reg(adapter, A_ULPRX_ISCSI_PSZ, val);
+ }
+ break;
+@@ -407,6 +414,18 @@ static int cxgb_offload_ctl(struct t3cde
+ rx_page_info->page_size = tp->rx_pg_size;
+ rx_page_info->num = tp->rx_num_pgs;
+ break;
++ case GET_ISCSI_IPV4ADDR: {
++ struct iscsi_ipv4addr *p = data;
++ struct port_info *pi = netdev_priv(p->dev);
++ p->ipv4addr = pi->iscsi_ipv4addr;
++ break;
++ }
++ case SET_ISCSI_IPV4ADDR: {
++ struct iscsi_ipv4addr *p = data;
++ struct port_info *pi = netdev_priv(p->dev);
++ pi->iscsi_ipv4addr = p->ipv4addr;
++ break;
++ }
+ default:
+ return -EOPNOTSUPP;
+ }
+--- a/drivers/net/cxgb3/sge.c
++++ b/drivers/net/cxgb3/sge.c
+@@ -36,6 +36,7 @@
+ #include <linux/ip.h>
+ #include <linux/tcp.h>
+ #include <linux/dma-mapping.h>
++#include <net/arp.h>
+ #include "common.h"
+ #include "regs.h"
+ #include "sge_defs.h"
+@@ -1856,6 +1857,53 @@ static void restart_tx(struct sge_qset *
+ }
+
+ /**
++ * cxgb3_arp_process - process an ARP request probing a private IP address
++ * @adapter: the adapter
++ * @skb: the skbuff containing the ARP request
++ *
++ * Check if the ARP request is probing the private IP address
++ * dedicated to iSCSI, generate an ARP reply if so.
++ */
++static void cxgb3_arp_process(struct adapter *adapter, struct sk_buff *skb)
++{
++ struct net_device *dev = skb->dev;
++ struct port_info *pi;
++ struct arphdr *arp;
++ unsigned char *arp_ptr;
++ unsigned char *sha;
++ __be32 sip, tip;
++
++ if (!dev)
++ return;
++
++ skb_reset_network_header(skb);
++ arp = arp_hdr(skb);
++
++ if (arp->ar_op != htons(ARPOP_REQUEST))
++ return;
++
++ arp_ptr = (unsigned char *)(arp + 1);
++ sha = arp_ptr;
++ arp_ptr += dev->addr_len;
++ memcpy(&sip, arp_ptr, sizeof(sip));
++ arp_ptr += sizeof(sip);
++ arp_ptr += dev->addr_len;
++ memcpy(&tip, arp_ptr, sizeof(tip));
++
++ pi = netdev_priv(dev);
++ if (tip != pi->iscsi_ipv4addr)
++ return;
++
++ arp_send(ARPOP_REPLY, ETH_P_ARP, sip, dev, tip, sha,
++ dev->dev_addr, sha);
++}
++
++static inline int is_arp(struct sk_buff *skb)
++{
++ return skb->protocol == htons(ETH_P_ARP);
++}
++
++/**
+ * rx_eth - process an ingress ethernet packet
+ * @adap: the adapter
+ * @rq: the response queue that received the packet
+@@ -1879,7 +1927,7 @@ static void rx_eth(struct adapter *adap,
+ pi = netdev_priv(skb->dev);
+ if (pi->rx_csum_offload && p->csum_valid && p->csum == htons(0xffff) &&
+ !p->fragment) {
+- rspq_to_qset(rq)->port_stats[SGE_PSTAT_RX_CSUM_GOOD]++;
++ qs->port_stats[SGE_PSTAT_RX_CSUM_GOOD]++;
+ skb->ip_summed = CHECKSUM_UNNECESSARY;
+ } else
+ skb->ip_summed = CHECKSUM_NONE;
+@@ -1894,16 +1942,28 @@ static void rx_eth(struct adapter *adap,
+ grp,
+ ntohs(p->vlan),
+ p);
+- else
++ else {
++ if (unlikely(pi->iscsi_ipv4addr &&
++ is_arp(skb))) {
++ unsigned short vtag = ntohs(p->vlan) &
++ VLAN_VID_MASK;
++ skb->dev = vlan_group_get_device(grp,
++ vtag);
++ cxgb3_arp_process(adap, skb);
++ }
+ __vlan_hwaccel_rx(skb, grp, ntohs(p->vlan),
+- rq->polling);
++ rq->polling);
++ }
+ else
+ dev_kfree_skb_any(skb);
+ } else if (rq->polling) {
+ if (lro)
+ lro_receive_skb(&qs->lro_mgr, skb, p);
+- else
++ else {
++ if (unlikely(pi->iscsi_ipv4addr && is_arp(skb)))
++ cxgb3_arp_process(adap, skb);
+ netif_receive_skb(skb);
++ }
+ } else
+ netif_rx(skb);
+ }