[PATCH 1/4] ibmveth: Enable TCP checksum offload

Jeff Garzik jeff at garzik.org
Thu Jul 19 08:32:48 EST 2007


Brian King wrote:
> This patchset enables TCP checksum offload support for IPV4
> on ibmveth. This completely eliminates the generation and checking of
> the checksum for packets that are completely virtual and never
> touch a physical network. A simple TCP_STREAM netperf run on
> a virtual network with maximum mtu set yielded a ~30% increase
> in throughput. This feature is enabled by default on systems that
> support it, but can be disabled with a module option.
> 
> Signed-off-by: Brian King <brking at linux.vnet.ibm.com>

This should be controllable purely via ethtool, rather than through a module option.


> diff -puN drivers/net/ibmveth.c~ibmveth_csum_offload drivers/net/ibmveth.c
> --- linux-2.6/drivers/net/ibmveth.c~ibmveth_csum_offload	2007-07-12 08:27:47.000000000 -0500
> +++ linux-2.6-bjking1/drivers/net/ibmveth.c	2007-07-12 09:35:55.000000000 -0500
> @@ -47,6 +47,8 @@
>  #include <linux/mm.h>
>  #include <linux/ethtool.h>
>  #include <linux/proc_fs.h>
> +#include <linux/in.h>
> +#include <linux/ip.h>
>  #include <asm/semaphore.h>
>  #include <asm/hvcall.h>
>  #include <asm/atomic.h>
> @@ -103,12 +105,15 @@ static struct proc_dir_entry *ibmveth_pr
>  
>  static const char ibmveth_driver_name[] = "ibmveth";
>  static const char ibmveth_driver_string[] = "IBM i/pSeries Virtual Ethernet Driver";
> +static unsigned int ibmveth_csum_offload = 1;
>  #define ibmveth_driver_version "1.03"
>  
>  MODULE_AUTHOR("Santiago Leon <santil at us.ibm.com>");
>  MODULE_DESCRIPTION("IBM i/pSeries Virtual Ethernet Driver");
>  MODULE_LICENSE("GPL");
>  MODULE_VERSION(ibmveth_driver_version);
> +module_param_named(csum_offload, ibmveth_csum_offload, uint, 0);
> +MODULE_PARM_DESC(csum_offload, "Checksum offload (0/1). Default: 1");
>  
>  /* simple methods of getting data from the current rxq entry */
>  static inline int ibmveth_rxq_pending_buffer(struct ibmveth_adapter *adapter)
> @@ -131,6 +136,11 @@ static inline int ibmveth_rxq_frame_leng
>  	return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].length);
>  }
>  
> +static inline int ibmveth_rxq_csum_good(struct ibmveth_adapter *adapter)
> +{
> +	return (adapter->rx_queue.queue_addr[adapter->rx_queue.index].csum_good);
> +}
> +
>  /* setup the initial settings for a buffer pool */
>  static void ibmveth_init_buffer_pool(struct ibmveth_buff_pool *pool, u32 pool_index, u32 pool_size, u32 buff_size, u32 pool_active)
>  {
> @@ -684,6 +694,24 @@ static int ibmveth_start_xmit(struct sk_
>  					desc[0].fields.length, DMA_TO_DEVICE);
>  	desc[0].fields.valid   = 1;
>  
> +	if (skb->ip_summed == CHECKSUM_PARTIAL &&
> +	    ip_hdr(skb)->protocol != IPPROTO_TCP && skb_checksum_help(skb)) {
> +		ibmveth_error_printk("tx: failed to checksum packet\n");
> +		tx_dropped++;
> +		goto out;
> +	}
> +
> +	if (skb->ip_summed == CHECKSUM_PARTIAL) {
> +		unsigned char *buf = skb_transport_header(skb) + skb->csum_offset;
> +
> +		desc[0].fields.no_csum = 1;
> +		desc[0].fields.csum_good = 1;
> +
> +		/* Need to zero out the checksum */
> +		buf[0] = 0;
> +		buf[1] = 0;
> +	}
> +
>  	if(dma_mapping_error(desc[0].fields.address)) {
>  		ibmveth_error_printk("tx: unable to map initial fragment\n");
>  		tx_map_failed++;
> @@ -702,6 +730,10 @@ static int ibmveth_start_xmit(struct sk_
>  				frag->size, DMA_TO_DEVICE);
>  		desc[curfrag+1].fields.length = frag->size;
>  		desc[curfrag+1].fields.valid  = 1;
> +		if (skb->ip_summed == CHECKSUM_PARTIAL) {
> +			desc[curfrag+1].fields.no_csum = 1;
> +			desc[curfrag+1].fields.csum_good = 1;
> +		}
>  
>  		if(dma_mapping_error(desc[curfrag+1].fields.address)) {
>  			ibmveth_error_printk("tx: unable to map fragment %d\n", curfrag);
> @@ -792,7 +824,11 @@ static int ibmveth_poll(struct net_devic
>  			} else {
>  				int length = ibmveth_rxq_frame_length(adapter);
>  				int offset = ibmveth_rxq_frame_offset(adapter);
> +				int csum_good = ibmveth_rxq_csum_good(adapter);
> +
>  				skb = ibmveth_rxq_get_buffer(adapter);
> +				if (csum_good)
> +					skb->ip_summed = CHECKSUM_UNNECESSARY;
>  
>  				ibmveth_rxq_harvest_buffer(adapter);
>  
> @@ -962,8 +998,10 @@ static void ibmveth_poll_controller(stru
>  static int __devinit ibmveth_probe(struct vio_dev *dev, const struct vio_device_id *id)
>  {
>  	int rc, i;
> +	long ret;
>  	struct net_device *netdev;
>  	struct ibmveth_adapter *adapter = NULL;
> +	union ibmveth_illan_attributes set_attr, ret_attr;
>  
>  	unsigned char *mac_addr_p;
>  	unsigned int *mcastFilterSize_p;
> @@ -1058,6 +1096,26 @@ static int __devinit ibmveth_probe(struc
>  
>  	ibmveth_debug_printk("registering netdev...\n");
>  
> +	if (ibmveth_csum_offload) {
> +		ret = h_illan_attributes(dev->unit_address, 0, 0, &ret_attr.desc);
> +
> +		if (ret == H_SUCCESS && !ret_attr.fields.active_trunk &&
> +		    !ret_attr.fields.trunk_priority &&
> +		    ret_attr.fields.csum_offload_padded_pkt_support) {
> +			set_attr.desc = 0;
> +			set_attr.fields.tcp_csum_offload_ipv4 = 1;
> +
> +			ret = h_illan_attributes(dev->unit_address, 0, set_attr.desc,
> +						 &ret_attr.desc);
> +
> +			if (ret == H_SUCCESS)
> +				netdev->features |= NETIF_F_IP_CSUM;
> +			else
> +				ret = h_illan_attributes(dev->unit_address, set_attr.desc,
> +							 0, &ret_attr.desc);
> +		}
> +	}
> +
>  	rc = register_netdev(netdev);
>  
>  	if(rc) {
> diff -puN drivers/net/ibmveth.h~ibmveth_csum_offload drivers/net/ibmveth.h
> --- linux-2.6/drivers/net/ibmveth.h~ibmveth_csum_offload	2007-07-12 08:27:47.000000000 -0500
> +++ linux-2.6-bjking1/drivers/net/ibmveth.h	2007-07-12 09:32:54.000000000 -0500
> @@ -67,6 +67,21 @@ static inline long h_send_logical_lan(un
>  	return rc;
>  }
>  
> +static inline long h_illan_attributes(unsigned long unit_address,
> +				      unsigned long reset_mask, unsigned long set_mask,
> +				      unsigned long *ret_attributes)
> +{
> +	long rc;
> +	unsigned long retbuf[PLPAR_HCALL_BUFSIZE];
> +
> +	rc = plpar_hcall(H_ILLAN_ATTRIBUTES, retbuf, unit_address,
> +			 reset_mask, set_mask);
> +
> +	*ret_attributes = retbuf[0];
> +
> +	return rc;
> +}
> +
>  #define h_multicast_ctrl(ua, cmd, mac) \
>    plpar_hcall_norets(H_MULTICAST_CTRL, ua, cmd, mac)
>  
> @@ -144,7 +159,9 @@ struct ibmveth_adapter {
>  struct ibmveth_buf_desc_fields {
>      u32 valid : 1;
>      u32 toggle : 1;
> -    u32 reserved : 6;
> +    u32 reserved : 4;
> +    u32 no_csum : 1;
> +    u32 csum_good : 1;
>      u32 length : 24;
>      u32 address;
>  };
> @@ -154,10 +171,30 @@ union ibmveth_buf_desc {
>      struct ibmveth_buf_desc_fields fields;
>  };
>  
> +struct ibmveth_illan_attributes_fields {
> +	u32 reserved;
> +	u32 reserved2 : 18;
> +	u32 csum_offload_padded_pkt_support : 1;
> +	u32 reserved3 : 1;
> +	u32 trunk_priority : 4;
> +	u32 reserved4 : 5;
> +	u32 tcp_csum_offload_ipv6 : 1;
> +	u32 tcp_csum_offload_ipv4 : 1;
> +	u32 active_trunk : 1;
> +};
> +
> +union ibmveth_illan_attributes {
> +	u64 desc;
> +	struct ibmveth_illan_attributes_fields fields;
> +};
> +
>  struct ibmveth_rx_q_entry {
>      u16 toggle : 1;
>      u16 valid : 1;
> -    u16 reserved : 14;
> +    u16 reserved : 4;
> +    u16 no_csum : 1;
> +    u16 csum_good : 1;
> +    u16 reserved2 : 8;
>      u16 offset;

As a general rule, it would be nice to start moving away from bitfields
in this driver.




More information about the Linuxppc-dev mailing list