1f7917c00SJeff Kirsher /* 2f7917c00SJeff Kirsher * This file is part of the Chelsio T4 Ethernet driver for Linux. 3f7917c00SJeff Kirsher * 4f7917c00SJeff Kirsher * Copyright (c) 2003-2010 Chelsio Communications, Inc. All rights reserved. 5f7917c00SJeff Kirsher * 6f7917c00SJeff Kirsher * This software is available to you under a choice of one of two 7f7917c00SJeff Kirsher * licenses. You may choose to be licensed under the terms of the GNU 8f7917c00SJeff Kirsher * General Public License (GPL) Version 2, available from the file 9f7917c00SJeff Kirsher * COPYING in the main directory of this source tree, or the 10f7917c00SJeff Kirsher * OpenIB.org BSD license below: 11f7917c00SJeff Kirsher * 12f7917c00SJeff Kirsher * Redistribution and use in source and binary forms, with or 13f7917c00SJeff Kirsher * without modification, are permitted provided that the following 14f7917c00SJeff Kirsher * conditions are met: 15f7917c00SJeff Kirsher * 16f7917c00SJeff Kirsher * - Redistributions of source code must retain the above 17f7917c00SJeff Kirsher * copyright notice, this list of conditions and the following 18f7917c00SJeff Kirsher * disclaimer. 19f7917c00SJeff Kirsher * 20f7917c00SJeff Kirsher * - Redistributions in binary form must reproduce the above 21f7917c00SJeff Kirsher * copyright notice, this list of conditions and the following 22f7917c00SJeff Kirsher * disclaimer in the documentation and/or other materials 23f7917c00SJeff Kirsher * provided with the distribution. 24f7917c00SJeff Kirsher * 25f7917c00SJeff Kirsher * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 26f7917c00SJeff Kirsher * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 27f7917c00SJeff Kirsher * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 28f7917c00SJeff Kirsher * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 29f7917c00SJeff Kirsher * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 30f7917c00SJeff Kirsher * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 31f7917c00SJeff Kirsher * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 32f7917c00SJeff Kirsher * SOFTWARE. 33f7917c00SJeff Kirsher */ 34f7917c00SJeff Kirsher 35f7917c00SJeff Kirsher #include <linux/skbuff.h> 36f7917c00SJeff Kirsher #include <linux/netdevice.h> 37f7917c00SJeff Kirsher #include <linux/etherdevice.h> 38f7917c00SJeff Kirsher #include <linux/if_vlan.h> 39f7917c00SJeff Kirsher #include <linux/ip.h> 40f7917c00SJeff Kirsher #include <linux/dma-mapping.h> 41f7917c00SJeff Kirsher #include <linux/jiffies.h> 42f7917c00SJeff Kirsher #include <linux/prefetch.h> 43ee40fa06SPaul Gortmaker #include <linux/export.h> 44f7917c00SJeff Kirsher #include <net/ipv6.h> 45f7917c00SJeff Kirsher #include <net/tcp.h> 46f7917c00SJeff Kirsher #include "cxgb4.h" 47f7917c00SJeff Kirsher #include "t4_regs.h" 48f7917c00SJeff Kirsher #include "t4_msg.h" 49f7917c00SJeff Kirsher #include "t4fw_api.h" 50f7917c00SJeff Kirsher 51f7917c00SJeff Kirsher /* 52f7917c00SJeff Kirsher * Rx buffer size. We use largish buffers if possible but settle for single 53f7917c00SJeff Kirsher * pages under memory shortage. 
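 * With the usual 4KB pages the #else branch below gives FL_PG_ORDER == 4,
 * i.e. 64KB Free List buffers; when PAGE_SHIFT >= 16 an order-0 page is
 * already at least 64KB, so order 0 is used.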
54f7917c00SJeff Kirsher */ 55f7917c00SJeff Kirsher #if PAGE_SHIFT >= 16 56f7917c00SJeff Kirsher # define FL_PG_ORDER 0 57f7917c00SJeff Kirsher #else 58f7917c00SJeff Kirsher # define FL_PG_ORDER (16 - PAGE_SHIFT) 59f7917c00SJeff Kirsher #endif 60f7917c00SJeff Kirsher 61f7917c00SJeff Kirsher /* RX_PULL_LEN should be <= RX_COPY_THRES */ 62f7917c00SJeff Kirsher #define RX_COPY_THRES 256 63f7917c00SJeff Kirsher #define RX_PULL_LEN 128 64f7917c00SJeff Kirsher 65f7917c00SJeff Kirsher /* 66f7917c00SJeff Kirsher * Main body length for sk_buffs used for Rx Ethernet packets with fragments. 67f7917c00SJeff Kirsher * Should be >= RX_PULL_LEN but possibly bigger to give pskb_may_pull some room. 68f7917c00SJeff Kirsher */ 69f7917c00SJeff Kirsher #define RX_PKT_SKB_LEN 512 70f7917c00SJeff Kirsher 71f7917c00SJeff Kirsher /* 72f7917c00SJeff Kirsher * Max number of Tx descriptors we clean up at a time. Should be modest as 73f7917c00SJeff Kirsher * freeing skbs isn't cheap and it happens while holding locks. We just need 74f7917c00SJeff Kirsher * to free packets faster than they arrive, we eventually catch up and keep 75f7917c00SJeff Kirsher * the amortized cost reasonable. Must be >= 2 * TXQ_STOP_THRES. 76f7917c00SJeff Kirsher */ 77f7917c00SJeff Kirsher #define MAX_TX_RECLAIM 16 78f7917c00SJeff Kirsher 79f7917c00SJeff Kirsher /* 80f7917c00SJeff Kirsher * Max number of Rx buffers we replenish at a time. Again keep this modest, 81f7917c00SJeff Kirsher * allocating buffers isn't cheap either. 82f7917c00SJeff Kirsher */ 83f7917c00SJeff Kirsher #define MAX_RX_REFILL 16U 84f7917c00SJeff Kirsher 85f7917c00SJeff Kirsher /* 86f7917c00SJeff Kirsher * Period of the Rx queue check timer. This timer is infrequent as it has 87f7917c00SJeff Kirsher * something to do only when the system experiences severe memory shortage. 88f7917c00SJeff Kirsher */ 89f7917c00SJeff Kirsher #define RX_QCHECK_PERIOD (HZ / 2) 90f7917c00SJeff Kirsher 91f7917c00SJeff Kirsher /* 92f7917c00SJeff Kirsher * Period of the Tx queue check timer. 93f7917c00SJeff Kirsher */ 94f7917c00SJeff Kirsher #define TX_QCHECK_PERIOD (HZ / 2) 95f7917c00SJeff Kirsher 960f4d201fSKumar Sanghvi /* SGE Hung Ingress DMA Threshold Warning time (in Hz) and Warning Repeat Rate 970f4d201fSKumar Sanghvi * (in RX_QCHECK_PERIOD multiples). If we find one of the SGE Ingress DMA 980f4d201fSKumar Sanghvi * State Machines in the same state for this amount of time (in HZ) then we'll 990f4d201fSKumar Sanghvi * issue a warning about a potential hang. We'll repeat the warning as the 1000f4d201fSKumar Sanghvi * SGE Ingress DMA Channel appears to be hung every N RX_QCHECK_PERIODs till 1010f4d201fSKumar Sanghvi * the situation clears. If the situation clears, we'll note that as well. 1020f4d201fSKumar Sanghvi */ 1030f4d201fSKumar Sanghvi #define SGE_IDMA_WARN_THRESH (1 * HZ) 1040f4d201fSKumar Sanghvi #define SGE_IDMA_WARN_REPEAT (20 * RX_QCHECK_PERIOD) 1050f4d201fSKumar Sanghvi 106f7917c00SJeff Kirsher /* 107f7917c00SJeff Kirsher * Max number of Tx descriptors to be reclaimed by the Tx timer. 108f7917c00SJeff Kirsher */ 109f7917c00SJeff Kirsher #define MAX_TIMER_TX_RECLAIM 100 110f7917c00SJeff Kirsher 111f7917c00SJeff Kirsher /* 112f7917c00SJeff Kirsher * Timer index used when backing off due to memory shortage. 
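 * (This is simply the highest-numbered SGE timer index, SGE_NTIMERS - 1,
 * which is normally programmed with the longest holdoff value.)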
 */
#define NOMEM_TMR_IDX (SGE_NTIMERS - 1)

/*
 * An FL with <= FL_STARVE_THRES buffers is starving and a periodic timer will
 * attempt to refill it.
 */
#define FL_STARVE_THRES 4

/*
 * Suspend an Ethernet Tx queue with fewer available descriptors than this.
 * This is the same as calc_tx_descs() for a TSO packet with
 * nr_frags == MAX_SKB_FRAGS.
 */
#define ETHTXQ_STOP_THRES \
	(1 + DIV_ROUND_UP((3 * MAX_SKB_FRAGS) / 2 + (MAX_SKB_FRAGS & 1), 8))

/*
 * Suspension threshold for non-Ethernet Tx queues.  We require enough room
 * for a full sized WR.
 */
#define TXQ_STOP_THRES (SGE_MAX_WR_LEN / sizeof(struct tx_desc))

/*
 * Max Tx descriptor space we allow for an Ethernet packet to be inlined
 * into a WR.
 */
#define MAX_IMM_TX_PKT_LEN 128

/*
 * Max size of a WR sent through a control Tx queue.
 */
#define MAX_CTRL_WR_LEN SGE_MAX_WR_LEN

struct tx_sw_desc {		/* SW state per Tx descriptor */
	struct sk_buff *skb;
	struct ulptx_sgl *sgl;
};

struct rx_sw_desc {		/* SW state per Rx descriptor */
	struct page *page;
	dma_addr_t dma_addr;
};

/*
 * Rx buffer sizes for "useskbs" Free List buffers (one ingress packet per skb
 * buffer).  We currently only support two sizes for 1500- and 9000-byte MTUs.
 * We could easily support more but there doesn't seem to be much need for
 * that ...
 */
#define FL_MTU_SMALL 1500
#define FL_MTU_LARGE 9000

static inline unsigned int fl_mtu_bufsize(struct adapter *adapter,
					  unsigned int mtu)
{
	struct sge *s = &adapter->sge;

	return ALIGN(s->pktshift + ETH_HLEN + VLAN_HLEN + mtu, s->fl_align);
}

#define FL_MTU_SMALL_BUFSIZE(adapter) fl_mtu_bufsize(adapter, FL_MTU_SMALL)
#define FL_MTU_LARGE_BUFSIZE(adapter) fl_mtu_bufsize(adapter, FL_MTU_LARGE)

/*
 * Bits 0..3 of rx_sw_desc.dma_addr have special meaning.  The hardware uses
 * these to specify the buffer size as an index into the SGE Free List Buffer
 * Size register array.  We also use bit 4, when the buffer has been unmapped
 * for DMA, but this is of course never sent to the hardware and is only used
 * to prevent double unmappings.  All of the above requires that the Free List
 * Buffers which we allocate have the bottom 5 bits free (0) -- i.e. are
 * 32-byte or a power of 2 greater in alignment.  Since the SGE's minimal
 * Free List Buffer alignment is 32 bytes, this works out for us ...
 */
enum {
	RX_BUF_FLAGS     = 0x1f,   /* bottom five bits are special */
	RX_BUF_SIZE      = 0x0f,   /* bottom four bits are for buf sizes */
	RX_UNMAPPED_BUF  = 0x10,   /* buffer is not mapped */

	/*
	 * XXX We shouldn't depend on being able to use these indices.
	 * XXX Especially when some other Master PF has initialized the
	 * XXX adapter or we use the Firmware Configuration File.  We
	 * XXX should really search through the Host Buffer Size register
	 * XXX array for the appropriately sized buffer indices.
	 */
	RX_SMALL_PG_BUF  = 0x0,   /* small (PAGE_SIZE) page buffer */
	RX_LARGE_PG_BUF  = 0x1,   /* large (FL_PG_ORDER) page buffer */

	RX_SMALL_MTU_BUF = 0x2,   /* small MTU buffer */
	RX_LARGE_MTU_BUF = 0x3,   /* large MTU buffer */
};

static inline dma_addr_t get_buf_addr(const struct rx_sw_desc *d)
{
	return d->dma_addr & ~(dma_addr_t)RX_BUF_FLAGS;
}

static inline bool is_buf_mapped(const struct rx_sw_desc *d)
{
	return !(d->dma_addr & RX_UNMAPPED_BUF);
}

/**
 *	txq_avail - return the number of available slots in a Tx queue
 *	@q: the Tx queue
 *
 *	Returns the number of descriptors in a Tx queue available to write new
 *	packets.
 */
static inline unsigned int txq_avail(const struct sge_txq *q)
{
	return q->size - 1 - q->in_use;
}

/**
 *	fl_cap - return the capacity of a free-buffer list
 *	@fl: the FL
 *
 *	Returns the capacity of a free-buffer list.  The capacity is less than
 *	the size because one descriptor needs to be left unpopulated, otherwise
 *	HW will think the FL is empty.
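 *	For example, an FL created with 4096 buffer slots can be filled with at
 *	most 4088 buffers: the final 8-buffer descriptor is always left empty.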
235f7917c00SJeff Kirsher */ 236f7917c00SJeff Kirsher static inline unsigned int fl_cap(const struct sge_fl *fl) 237f7917c00SJeff Kirsher { 238f7917c00SJeff Kirsher return fl->size - 8; /* 1 descriptor = 8 buffers */ 239f7917c00SJeff Kirsher } 240f7917c00SJeff Kirsher 241f7917c00SJeff Kirsher static inline bool fl_starving(const struct sge_fl *fl) 242f7917c00SJeff Kirsher { 243f7917c00SJeff Kirsher return fl->avail - fl->pend_cred <= FL_STARVE_THRES; 244f7917c00SJeff Kirsher } 245f7917c00SJeff Kirsher 246f7917c00SJeff Kirsher static int map_skb(struct device *dev, const struct sk_buff *skb, 247f7917c00SJeff Kirsher dma_addr_t *addr) 248f7917c00SJeff Kirsher { 249f7917c00SJeff Kirsher const skb_frag_t *fp, *end; 250f7917c00SJeff Kirsher const struct skb_shared_info *si; 251f7917c00SJeff Kirsher 252f7917c00SJeff Kirsher *addr = dma_map_single(dev, skb->data, skb_headlen(skb), DMA_TO_DEVICE); 253f7917c00SJeff Kirsher if (dma_mapping_error(dev, *addr)) 254f7917c00SJeff Kirsher goto out_err; 255f7917c00SJeff Kirsher 256f7917c00SJeff Kirsher si = skb_shinfo(skb); 257f7917c00SJeff Kirsher end = &si->frags[si->nr_frags]; 258f7917c00SJeff Kirsher 259f7917c00SJeff Kirsher for (fp = si->frags; fp < end; fp++) { 260e91b0f24SIan Campbell *++addr = skb_frag_dma_map(dev, fp, 0, skb_frag_size(fp), 261e91b0f24SIan Campbell DMA_TO_DEVICE); 262f7917c00SJeff Kirsher if (dma_mapping_error(dev, *addr)) 263f7917c00SJeff Kirsher goto unwind; 264f7917c00SJeff Kirsher } 265f7917c00SJeff Kirsher return 0; 266f7917c00SJeff Kirsher 267f7917c00SJeff Kirsher unwind: 268f7917c00SJeff Kirsher while (fp-- > si->frags) 2699e903e08SEric Dumazet dma_unmap_page(dev, *--addr, skb_frag_size(fp), DMA_TO_DEVICE); 270f7917c00SJeff Kirsher 271f7917c00SJeff Kirsher dma_unmap_single(dev, addr[-1], skb_headlen(skb), DMA_TO_DEVICE); 272f7917c00SJeff Kirsher out_err: 273f7917c00SJeff Kirsher return -ENOMEM; 274f7917c00SJeff Kirsher } 275f7917c00SJeff Kirsher 276f7917c00SJeff Kirsher #ifdef CONFIG_NEED_DMA_MAP_STATE 277f7917c00SJeff Kirsher static void unmap_skb(struct device *dev, const struct sk_buff *skb, 278f7917c00SJeff Kirsher const dma_addr_t *addr) 279f7917c00SJeff Kirsher { 280f7917c00SJeff Kirsher const skb_frag_t *fp, *end; 281f7917c00SJeff Kirsher const struct skb_shared_info *si; 282f7917c00SJeff Kirsher 283f7917c00SJeff Kirsher dma_unmap_single(dev, *addr++, skb_headlen(skb), DMA_TO_DEVICE); 284f7917c00SJeff Kirsher 285f7917c00SJeff Kirsher si = skb_shinfo(skb); 286f7917c00SJeff Kirsher end = &si->frags[si->nr_frags]; 287f7917c00SJeff Kirsher for (fp = si->frags; fp < end; fp++) 2889e903e08SEric Dumazet dma_unmap_page(dev, *addr++, skb_frag_size(fp), DMA_TO_DEVICE); 289f7917c00SJeff Kirsher } 290f7917c00SJeff Kirsher 291f7917c00SJeff Kirsher /** 292f7917c00SJeff Kirsher * deferred_unmap_destructor - unmap a packet when it is freed 293f7917c00SJeff Kirsher * @skb: the packet 294f7917c00SJeff Kirsher * 295f7917c00SJeff Kirsher * This is the packet destructor used for Tx packets that need to remain 296f7917c00SJeff Kirsher * mapped until they are freed rather than until their Tx descriptors are 297f7917c00SJeff Kirsher * freed. 
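 *	The DMA addresses are expected to have been stashed at skb->head by the
 *	caller before this destructor is set; unmap_skb() above reads them from
 *	there.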
298f7917c00SJeff Kirsher */ 299f7917c00SJeff Kirsher static void deferred_unmap_destructor(struct sk_buff *skb) 300f7917c00SJeff Kirsher { 301f7917c00SJeff Kirsher unmap_skb(skb->dev->dev.parent, skb, (dma_addr_t *)skb->head); 302f7917c00SJeff Kirsher } 303f7917c00SJeff Kirsher #endif 304f7917c00SJeff Kirsher 305f7917c00SJeff Kirsher static void unmap_sgl(struct device *dev, const struct sk_buff *skb, 306f7917c00SJeff Kirsher const struct ulptx_sgl *sgl, const struct sge_txq *q) 307f7917c00SJeff Kirsher { 308f7917c00SJeff Kirsher const struct ulptx_sge_pair *p; 309f7917c00SJeff Kirsher unsigned int nfrags = skb_shinfo(skb)->nr_frags; 310f7917c00SJeff Kirsher 311f7917c00SJeff Kirsher if (likely(skb_headlen(skb))) 312f7917c00SJeff Kirsher dma_unmap_single(dev, be64_to_cpu(sgl->addr0), ntohl(sgl->len0), 313f7917c00SJeff Kirsher DMA_TO_DEVICE); 314f7917c00SJeff Kirsher else { 315f7917c00SJeff Kirsher dma_unmap_page(dev, be64_to_cpu(sgl->addr0), ntohl(sgl->len0), 316f7917c00SJeff Kirsher DMA_TO_DEVICE); 317f7917c00SJeff Kirsher nfrags--; 318f7917c00SJeff Kirsher } 319f7917c00SJeff Kirsher 320f7917c00SJeff Kirsher /* 321f7917c00SJeff Kirsher * the complexity below is because of the possibility of a wrap-around 322f7917c00SJeff Kirsher * in the middle of an SGL 323f7917c00SJeff Kirsher */ 324f7917c00SJeff Kirsher for (p = sgl->sge; nfrags >= 2; nfrags -= 2) { 325f7917c00SJeff Kirsher if (likely((u8 *)(p + 1) <= (u8 *)q->stat)) { 326f7917c00SJeff Kirsher unmap: dma_unmap_page(dev, be64_to_cpu(p->addr[0]), 327f7917c00SJeff Kirsher ntohl(p->len[0]), DMA_TO_DEVICE); 328f7917c00SJeff Kirsher dma_unmap_page(dev, be64_to_cpu(p->addr[1]), 329f7917c00SJeff Kirsher ntohl(p->len[1]), DMA_TO_DEVICE); 330f7917c00SJeff Kirsher p++; 331f7917c00SJeff Kirsher } else if ((u8 *)p == (u8 *)q->stat) { 332f7917c00SJeff Kirsher p = (const struct ulptx_sge_pair *)q->desc; 333f7917c00SJeff Kirsher goto unmap; 334f7917c00SJeff Kirsher } else if ((u8 *)p + 8 == (u8 *)q->stat) { 335f7917c00SJeff Kirsher const __be64 *addr = (const __be64 *)q->desc; 336f7917c00SJeff Kirsher 337f7917c00SJeff Kirsher dma_unmap_page(dev, be64_to_cpu(addr[0]), 338f7917c00SJeff Kirsher ntohl(p->len[0]), DMA_TO_DEVICE); 339f7917c00SJeff Kirsher dma_unmap_page(dev, be64_to_cpu(addr[1]), 340f7917c00SJeff Kirsher ntohl(p->len[1]), DMA_TO_DEVICE); 341f7917c00SJeff Kirsher p = (const struct ulptx_sge_pair *)&addr[2]; 342f7917c00SJeff Kirsher } else { 343f7917c00SJeff Kirsher const __be64 *addr = (const __be64 *)q->desc; 344f7917c00SJeff Kirsher 345f7917c00SJeff Kirsher dma_unmap_page(dev, be64_to_cpu(p->addr[0]), 346f7917c00SJeff Kirsher ntohl(p->len[0]), DMA_TO_DEVICE); 347f7917c00SJeff Kirsher dma_unmap_page(dev, be64_to_cpu(addr[0]), 348f7917c00SJeff Kirsher ntohl(p->len[1]), DMA_TO_DEVICE); 349f7917c00SJeff Kirsher p = (const struct ulptx_sge_pair *)&addr[1]; 350f7917c00SJeff Kirsher } 351f7917c00SJeff Kirsher } 352f7917c00SJeff Kirsher if (nfrags) { 353f7917c00SJeff Kirsher __be64 addr; 354f7917c00SJeff Kirsher 355f7917c00SJeff Kirsher if ((u8 *)p == (u8 *)q->stat) 356f7917c00SJeff Kirsher p = (const struct ulptx_sge_pair *)q->desc; 357f7917c00SJeff Kirsher addr = (u8 *)p + 16 <= (u8 *)q->stat ? 
p->addr[0] : 358f7917c00SJeff Kirsher *(const __be64 *)q->desc; 359f7917c00SJeff Kirsher dma_unmap_page(dev, be64_to_cpu(addr), ntohl(p->len[0]), 360f7917c00SJeff Kirsher DMA_TO_DEVICE); 361f7917c00SJeff Kirsher } 362f7917c00SJeff Kirsher } 363f7917c00SJeff Kirsher 364f7917c00SJeff Kirsher /** 365f7917c00SJeff Kirsher * free_tx_desc - reclaims Tx descriptors and their buffers 366f7917c00SJeff Kirsher * @adapter: the adapter 367f7917c00SJeff Kirsher * @q: the Tx queue to reclaim descriptors from 368f7917c00SJeff Kirsher * @n: the number of descriptors to reclaim 369f7917c00SJeff Kirsher * @unmap: whether the buffers should be unmapped for DMA 370f7917c00SJeff Kirsher * 371f7917c00SJeff Kirsher * Reclaims Tx descriptors from an SGE Tx queue and frees the associated 372f7917c00SJeff Kirsher * Tx buffers. Called with the Tx queue lock held. 373f7917c00SJeff Kirsher */ 374f7917c00SJeff Kirsher static void free_tx_desc(struct adapter *adap, struct sge_txq *q, 375f7917c00SJeff Kirsher unsigned int n, bool unmap) 376f7917c00SJeff Kirsher { 377f7917c00SJeff Kirsher struct tx_sw_desc *d; 378f7917c00SJeff Kirsher unsigned int cidx = q->cidx; 379f7917c00SJeff Kirsher struct device *dev = adap->pdev_dev; 380f7917c00SJeff Kirsher 381f7917c00SJeff Kirsher d = &q->sdesc[cidx]; 382f7917c00SJeff Kirsher while (n--) { 383f7917c00SJeff Kirsher if (d->skb) { /* an SGL is present */ 384f7917c00SJeff Kirsher if (unmap) 385f7917c00SJeff Kirsher unmap_sgl(dev, d->skb, d->sgl, q); 386f7917c00SJeff Kirsher kfree_skb(d->skb); 387f7917c00SJeff Kirsher d->skb = NULL; 388f7917c00SJeff Kirsher } 389f7917c00SJeff Kirsher ++d; 390f7917c00SJeff Kirsher if (++cidx == q->size) { 391f7917c00SJeff Kirsher cidx = 0; 392f7917c00SJeff Kirsher d = q->sdesc; 393f7917c00SJeff Kirsher } 394f7917c00SJeff Kirsher } 395f7917c00SJeff Kirsher q->cidx = cidx; 396f7917c00SJeff Kirsher } 397f7917c00SJeff Kirsher 398f7917c00SJeff Kirsher /* 399f7917c00SJeff Kirsher * Return the number of reclaimable descriptors in a Tx queue. 400f7917c00SJeff Kirsher */ 401f7917c00SJeff Kirsher static inline int reclaimable(const struct sge_txq *q) 402f7917c00SJeff Kirsher { 403f7917c00SJeff Kirsher int hw_cidx = ntohs(q->stat->cidx); 404f7917c00SJeff Kirsher hw_cidx -= q->cidx; 405f7917c00SJeff Kirsher return hw_cidx < 0 ? hw_cidx + q->size : hw_cidx; 406f7917c00SJeff Kirsher } 407f7917c00SJeff Kirsher 408f7917c00SJeff Kirsher /** 409f7917c00SJeff Kirsher * reclaim_completed_tx - reclaims completed Tx descriptors 410f7917c00SJeff Kirsher * @adap: the adapter 411f7917c00SJeff Kirsher * @q: the Tx queue to reclaim completed descriptors from 412f7917c00SJeff Kirsher * @unmap: whether the buffers should be unmapped for DMA 413f7917c00SJeff Kirsher * 414f7917c00SJeff Kirsher * Reclaims Tx descriptors that the SGE has indicated it has processed, 415f7917c00SJeff Kirsher * and frees the associated buffers if possible. Called with the Tx 416f7917c00SJeff Kirsher * queue locked. 417f7917c00SJeff Kirsher */ 418f7917c00SJeff Kirsher static inline void reclaim_completed_tx(struct adapter *adap, struct sge_txq *q, 419f7917c00SJeff Kirsher bool unmap) 420f7917c00SJeff Kirsher { 421f7917c00SJeff Kirsher int avail = reclaimable(q); 422f7917c00SJeff Kirsher 423f7917c00SJeff Kirsher if (avail) { 424f7917c00SJeff Kirsher /* 425f7917c00SJeff Kirsher * Limit the amount of clean up work we do at a time to keep 426f7917c00SJeff Kirsher * the Tx lock hold time O(1). 
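		 * In practice that means we free at most MAX_TX_RECLAIM (16)
		 * descriptors per call, even if more have already completed.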
427f7917c00SJeff Kirsher */ 428f7917c00SJeff Kirsher if (avail > MAX_TX_RECLAIM) 429f7917c00SJeff Kirsher avail = MAX_TX_RECLAIM; 430f7917c00SJeff Kirsher 431f7917c00SJeff Kirsher free_tx_desc(adap, q, avail, unmap); 432f7917c00SJeff Kirsher q->in_use -= avail; 433f7917c00SJeff Kirsher } 434f7917c00SJeff Kirsher } 435f7917c00SJeff Kirsher 43652367a76SVipul Pandya static inline int get_buf_size(struct adapter *adapter, 43752367a76SVipul Pandya const struct rx_sw_desc *d) 438f7917c00SJeff Kirsher { 43952367a76SVipul Pandya struct sge *s = &adapter->sge; 44052367a76SVipul Pandya unsigned int rx_buf_size_idx = d->dma_addr & RX_BUF_SIZE; 44152367a76SVipul Pandya int buf_size; 44252367a76SVipul Pandya 44352367a76SVipul Pandya switch (rx_buf_size_idx) { 44452367a76SVipul Pandya case RX_SMALL_PG_BUF: 44552367a76SVipul Pandya buf_size = PAGE_SIZE; 44652367a76SVipul Pandya break; 44752367a76SVipul Pandya 44852367a76SVipul Pandya case RX_LARGE_PG_BUF: 44952367a76SVipul Pandya buf_size = PAGE_SIZE << s->fl_pg_order; 45052367a76SVipul Pandya break; 45152367a76SVipul Pandya 45252367a76SVipul Pandya case RX_SMALL_MTU_BUF: 45352367a76SVipul Pandya buf_size = FL_MTU_SMALL_BUFSIZE(adapter); 45452367a76SVipul Pandya break; 45552367a76SVipul Pandya 45652367a76SVipul Pandya case RX_LARGE_MTU_BUF: 45752367a76SVipul Pandya buf_size = FL_MTU_LARGE_BUFSIZE(adapter); 45852367a76SVipul Pandya break; 45952367a76SVipul Pandya 46052367a76SVipul Pandya default: 46152367a76SVipul Pandya BUG_ON(1); 46252367a76SVipul Pandya } 46352367a76SVipul Pandya 46452367a76SVipul Pandya return buf_size; 465f7917c00SJeff Kirsher } 466f7917c00SJeff Kirsher 467f7917c00SJeff Kirsher /** 468f7917c00SJeff Kirsher * free_rx_bufs - free the Rx buffers on an SGE free list 469f7917c00SJeff Kirsher * @adap: the adapter 470f7917c00SJeff Kirsher * @q: the SGE free list to free buffers from 471f7917c00SJeff Kirsher * @n: how many buffers to free 472f7917c00SJeff Kirsher * 473f7917c00SJeff Kirsher * Release the next @n buffers on an SGE free-buffer Rx queue. The 474f7917c00SJeff Kirsher * buffers must be made inaccessible to HW before calling this function. 475f7917c00SJeff Kirsher */ 476f7917c00SJeff Kirsher static void free_rx_bufs(struct adapter *adap, struct sge_fl *q, int n) 477f7917c00SJeff Kirsher { 478f7917c00SJeff Kirsher while (n--) { 479f7917c00SJeff Kirsher struct rx_sw_desc *d = &q->sdesc[q->cidx]; 480f7917c00SJeff Kirsher 481f7917c00SJeff Kirsher if (is_buf_mapped(d)) 482f7917c00SJeff Kirsher dma_unmap_page(adap->pdev_dev, get_buf_addr(d), 48352367a76SVipul Pandya get_buf_size(adap, d), 48452367a76SVipul Pandya PCI_DMA_FROMDEVICE); 485f7917c00SJeff Kirsher put_page(d->page); 486f7917c00SJeff Kirsher d->page = NULL; 487f7917c00SJeff Kirsher if (++q->cidx == q->size) 488f7917c00SJeff Kirsher q->cidx = 0; 489f7917c00SJeff Kirsher q->avail--; 490f7917c00SJeff Kirsher } 491f7917c00SJeff Kirsher } 492f7917c00SJeff Kirsher 493f7917c00SJeff Kirsher /** 494f7917c00SJeff Kirsher * unmap_rx_buf - unmap the current Rx buffer on an SGE free list 495f7917c00SJeff Kirsher * @adap: the adapter 496f7917c00SJeff Kirsher * @q: the SGE free list 497f7917c00SJeff Kirsher * 498f7917c00SJeff Kirsher * Unmap the current buffer on an SGE free-buffer Rx queue. The 499f7917c00SJeff Kirsher * buffer must be made inaccessible to HW before calling this function. 500f7917c00SJeff Kirsher * 501f7917c00SJeff Kirsher * This is similar to @free_rx_bufs above but does not free the buffer. 
502f7917c00SJeff Kirsher * Do note that the FL still loses any further access to the buffer. 503f7917c00SJeff Kirsher */ 504f7917c00SJeff Kirsher static void unmap_rx_buf(struct adapter *adap, struct sge_fl *q) 505f7917c00SJeff Kirsher { 506f7917c00SJeff Kirsher struct rx_sw_desc *d = &q->sdesc[q->cidx]; 507f7917c00SJeff Kirsher 508f7917c00SJeff Kirsher if (is_buf_mapped(d)) 509f7917c00SJeff Kirsher dma_unmap_page(adap->pdev_dev, get_buf_addr(d), 51052367a76SVipul Pandya get_buf_size(adap, d), PCI_DMA_FROMDEVICE); 511f7917c00SJeff Kirsher d->page = NULL; 512f7917c00SJeff Kirsher if (++q->cidx == q->size) 513f7917c00SJeff Kirsher q->cidx = 0; 514f7917c00SJeff Kirsher q->avail--; 515f7917c00SJeff Kirsher } 516f7917c00SJeff Kirsher 517f7917c00SJeff Kirsher static inline void ring_fl_db(struct adapter *adap, struct sge_fl *q) 518f7917c00SJeff Kirsher { 5190a57a536SSantosh Rastapur u32 val; 520f7917c00SJeff Kirsher if (q->pend_cred >= 8) { 5210a57a536SSantosh Rastapur val = PIDX(q->pend_cred / 8); 522d14807ddSHariprasad Shenai if (!is_t4(adap->params.chip)) 5230a57a536SSantosh Rastapur val |= DBTYPE(1); 524f7917c00SJeff Kirsher wmb(); 525ce91a923SNaresh Kumar Inna t4_write_reg(adap, MYPF_REG(SGE_PF_KDOORBELL), DBPRIO(1) | 5260a57a536SSantosh Rastapur QID(q->cntxt_id) | val); 527f7917c00SJeff Kirsher q->pend_cred &= 7; 528f7917c00SJeff Kirsher } 529f7917c00SJeff Kirsher } 530f7917c00SJeff Kirsher 531f7917c00SJeff Kirsher static inline void set_rx_sw_desc(struct rx_sw_desc *sd, struct page *pg, 532f7917c00SJeff Kirsher dma_addr_t mapping) 533f7917c00SJeff Kirsher { 534f7917c00SJeff Kirsher sd->page = pg; 535f7917c00SJeff Kirsher sd->dma_addr = mapping; /* includes size low bits */ 536f7917c00SJeff Kirsher } 537f7917c00SJeff Kirsher 538f7917c00SJeff Kirsher /** 539f7917c00SJeff Kirsher * refill_fl - refill an SGE Rx buffer ring 540f7917c00SJeff Kirsher * @adap: the adapter 541f7917c00SJeff Kirsher * @q: the ring to refill 542f7917c00SJeff Kirsher * @n: the number of new buffers to allocate 543f7917c00SJeff Kirsher * @gfp: the gfp flags for the allocations 544f7917c00SJeff Kirsher * 545f7917c00SJeff Kirsher * (Re)populate an SGE free-buffer queue with up to @n new packet buffers, 546f7917c00SJeff Kirsher * allocated with the supplied gfp flags. The caller must assure that 547f7917c00SJeff Kirsher * @n does not exceed the queue's capacity. If afterwards the queue is 548f7917c00SJeff Kirsher * found critically low mark it as starving in the bitmap of starving FLs. 549f7917c00SJeff Kirsher * 550f7917c00SJeff Kirsher * Returns the number of buffers allocated. 
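 *	The returned count may be less than @n if page allocation or DMA mapping
 *	fails.  Note that ring_fl_db() only hands credits to the hardware in
 *	whole groups of 8 buffers, so a partial group stays in @q->pend_cred.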
551f7917c00SJeff Kirsher */ 552f7917c00SJeff Kirsher static unsigned int refill_fl(struct adapter *adap, struct sge_fl *q, int n, 553f7917c00SJeff Kirsher gfp_t gfp) 554f7917c00SJeff Kirsher { 55552367a76SVipul Pandya struct sge *s = &adap->sge; 556f7917c00SJeff Kirsher struct page *pg; 557f7917c00SJeff Kirsher dma_addr_t mapping; 558f7917c00SJeff Kirsher unsigned int cred = q->avail; 559f7917c00SJeff Kirsher __be64 *d = &q->desc[q->pidx]; 560f7917c00SJeff Kirsher struct rx_sw_desc *sd = &q->sdesc[q->pidx]; 561f7917c00SJeff Kirsher 5621f2149c1SEric Dumazet gfp |= __GFP_NOWARN | __GFP_COLD; 563f7917c00SJeff Kirsher 56452367a76SVipul Pandya if (s->fl_pg_order == 0) 56552367a76SVipul Pandya goto alloc_small_pages; 56652367a76SVipul Pandya 567f7917c00SJeff Kirsher /* 568f7917c00SJeff Kirsher * Prefer large buffers 569f7917c00SJeff Kirsher */ 570f7917c00SJeff Kirsher while (n) { 57152367a76SVipul Pandya pg = alloc_pages(gfp | __GFP_COMP, s->fl_pg_order); 572f7917c00SJeff Kirsher if (unlikely(!pg)) { 573f7917c00SJeff Kirsher q->large_alloc_failed++; 574f7917c00SJeff Kirsher break; /* fall back to single pages */ 575f7917c00SJeff Kirsher } 576f7917c00SJeff Kirsher 577f7917c00SJeff Kirsher mapping = dma_map_page(adap->pdev_dev, pg, 0, 57852367a76SVipul Pandya PAGE_SIZE << s->fl_pg_order, 579f7917c00SJeff Kirsher PCI_DMA_FROMDEVICE); 580f7917c00SJeff Kirsher if (unlikely(dma_mapping_error(adap->pdev_dev, mapping))) { 58152367a76SVipul Pandya __free_pages(pg, s->fl_pg_order); 582f7917c00SJeff Kirsher goto out; /* do not try small pages for this error */ 583f7917c00SJeff Kirsher } 58452367a76SVipul Pandya mapping |= RX_LARGE_PG_BUF; 585f7917c00SJeff Kirsher *d++ = cpu_to_be64(mapping); 586f7917c00SJeff Kirsher 587f7917c00SJeff Kirsher set_rx_sw_desc(sd, pg, mapping); 588f7917c00SJeff Kirsher sd++; 589f7917c00SJeff Kirsher 590f7917c00SJeff Kirsher q->avail++; 591f7917c00SJeff Kirsher if (++q->pidx == q->size) { 592f7917c00SJeff Kirsher q->pidx = 0; 593f7917c00SJeff Kirsher sd = q->sdesc; 594f7917c00SJeff Kirsher d = q->desc; 595f7917c00SJeff Kirsher } 596f7917c00SJeff Kirsher n--; 597f7917c00SJeff Kirsher } 598f7917c00SJeff Kirsher 59952367a76SVipul Pandya alloc_small_pages: 600f7917c00SJeff Kirsher while (n--) { 6010614002bSMel Gorman pg = __skb_alloc_page(gfp, NULL); 602f7917c00SJeff Kirsher if (unlikely(!pg)) { 603f7917c00SJeff Kirsher q->alloc_failed++; 604f7917c00SJeff Kirsher break; 605f7917c00SJeff Kirsher } 606f7917c00SJeff Kirsher 607f7917c00SJeff Kirsher mapping = dma_map_page(adap->pdev_dev, pg, 0, PAGE_SIZE, 608f7917c00SJeff Kirsher PCI_DMA_FROMDEVICE); 609f7917c00SJeff Kirsher if (unlikely(dma_mapping_error(adap->pdev_dev, mapping))) { 6101f2149c1SEric Dumazet put_page(pg); 611f7917c00SJeff Kirsher goto out; 612f7917c00SJeff Kirsher } 613f7917c00SJeff Kirsher *d++ = cpu_to_be64(mapping); 614f7917c00SJeff Kirsher 615f7917c00SJeff Kirsher set_rx_sw_desc(sd, pg, mapping); 616f7917c00SJeff Kirsher sd++; 617f7917c00SJeff Kirsher 618f7917c00SJeff Kirsher q->avail++; 619f7917c00SJeff Kirsher if (++q->pidx == q->size) { 620f7917c00SJeff Kirsher q->pidx = 0; 621f7917c00SJeff Kirsher sd = q->sdesc; 622f7917c00SJeff Kirsher d = q->desc; 623f7917c00SJeff Kirsher } 624f7917c00SJeff Kirsher } 625f7917c00SJeff Kirsher 626f7917c00SJeff Kirsher out: cred = q->avail - cred; 627f7917c00SJeff Kirsher q->pend_cred += cred; 628f7917c00SJeff Kirsher ring_fl_db(adap, q); 629f7917c00SJeff Kirsher 630f7917c00SJeff Kirsher if (unlikely(fl_starving(q))) { 631f7917c00SJeff Kirsher smp_wmb(); 632f7917c00SJeff Kirsher 
set_bit(q->cntxt_id - adap->sge.egr_start, 633f7917c00SJeff Kirsher adap->sge.starving_fl); 634f7917c00SJeff Kirsher } 635f7917c00SJeff Kirsher 636f7917c00SJeff Kirsher return cred; 637f7917c00SJeff Kirsher } 638f7917c00SJeff Kirsher 639f7917c00SJeff Kirsher static inline void __refill_fl(struct adapter *adap, struct sge_fl *fl) 640f7917c00SJeff Kirsher { 641f7917c00SJeff Kirsher refill_fl(adap, fl, min(MAX_RX_REFILL, fl_cap(fl) - fl->avail), 642f7917c00SJeff Kirsher GFP_ATOMIC); 643f7917c00SJeff Kirsher } 644f7917c00SJeff Kirsher 645f7917c00SJeff Kirsher /** 646f7917c00SJeff Kirsher * alloc_ring - allocate resources for an SGE descriptor ring 647f7917c00SJeff Kirsher * @dev: the PCI device's core device 648f7917c00SJeff Kirsher * @nelem: the number of descriptors 649f7917c00SJeff Kirsher * @elem_size: the size of each descriptor 650f7917c00SJeff Kirsher * @sw_size: the size of the SW state associated with each ring element 651f7917c00SJeff Kirsher * @phys: the physical address of the allocated ring 652f7917c00SJeff Kirsher * @metadata: address of the array holding the SW state for the ring 653f7917c00SJeff Kirsher * @stat_size: extra space in HW ring for status information 654f7917c00SJeff Kirsher * @node: preferred node for memory allocations 655f7917c00SJeff Kirsher * 656f7917c00SJeff Kirsher * Allocates resources for an SGE descriptor ring, such as Tx queues, 657f7917c00SJeff Kirsher * free buffer lists, or response queues. Each SGE ring requires 658f7917c00SJeff Kirsher * space for its HW descriptors plus, optionally, space for the SW state 659f7917c00SJeff Kirsher * associated with each HW entry (the metadata). The function returns 660f7917c00SJeff Kirsher * three values: the virtual address for the HW ring (the return value 661f7917c00SJeff Kirsher * of the function), the bus address of the HW ring, and the address 662f7917c00SJeff Kirsher * of the SW ring. 663f7917c00SJeff Kirsher */ 664f7917c00SJeff Kirsher static void *alloc_ring(struct device *dev, size_t nelem, size_t elem_size, 665f7917c00SJeff Kirsher size_t sw_size, dma_addr_t *phys, void *metadata, 666f7917c00SJeff Kirsher size_t stat_size, int node) 667f7917c00SJeff Kirsher { 668f7917c00SJeff Kirsher size_t len = nelem * elem_size + stat_size; 669f7917c00SJeff Kirsher void *s = NULL; 670f7917c00SJeff Kirsher void *p = dma_alloc_coherent(dev, len, phys, GFP_KERNEL); 671f7917c00SJeff Kirsher 672f7917c00SJeff Kirsher if (!p) 673f7917c00SJeff Kirsher return NULL; 674f7917c00SJeff Kirsher if (sw_size) { 675f7917c00SJeff Kirsher s = kzalloc_node(nelem * sw_size, GFP_KERNEL, node); 676f7917c00SJeff Kirsher 677f7917c00SJeff Kirsher if (!s) { 678f7917c00SJeff Kirsher dma_free_coherent(dev, len, p, *phys); 679f7917c00SJeff Kirsher return NULL; 680f7917c00SJeff Kirsher } 681f7917c00SJeff Kirsher } 682f7917c00SJeff Kirsher if (metadata) 683f7917c00SJeff Kirsher *(void **)metadata = s; 684f7917c00SJeff Kirsher memset(p, 0, len); 685f7917c00SJeff Kirsher return p; 686f7917c00SJeff Kirsher } 687f7917c00SJeff Kirsher 688f7917c00SJeff Kirsher /** 689f7917c00SJeff Kirsher * sgl_len - calculates the size of an SGL of the given capacity 690f7917c00SJeff Kirsher * @n: the number of SGL entries 691f7917c00SJeff Kirsher * 692f7917c00SJeff Kirsher * Calculates the number of flits needed for a scatter/gather list that 693f7917c00SJeff Kirsher * can hold the given number of entries. 
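 *	The ULPTX_SGL header holds the first entry in 2 flits and each further
 *	pair of entries needs 3 more (an unpaired last entry needs 2), so for
 *	example sgl_len(1) == 2, sgl_len(2) == 4, sgl_len(3) == 5 and
 *	sgl_len(5) == 8.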
694f7917c00SJeff Kirsher */ 695f7917c00SJeff Kirsher static inline unsigned int sgl_len(unsigned int n) 696f7917c00SJeff Kirsher { 697f7917c00SJeff Kirsher n--; 698f7917c00SJeff Kirsher return (3 * n) / 2 + (n & 1) + 2; 699f7917c00SJeff Kirsher } 700f7917c00SJeff Kirsher 701f7917c00SJeff Kirsher /** 702f7917c00SJeff Kirsher * flits_to_desc - returns the num of Tx descriptors for the given flits 703f7917c00SJeff Kirsher * @n: the number of flits 704f7917c00SJeff Kirsher * 705f7917c00SJeff Kirsher * Returns the number of Tx descriptors needed for the supplied number 706f7917c00SJeff Kirsher * of flits. 707f7917c00SJeff Kirsher */ 708f7917c00SJeff Kirsher static inline unsigned int flits_to_desc(unsigned int n) 709f7917c00SJeff Kirsher { 710f7917c00SJeff Kirsher BUG_ON(n > SGE_MAX_WR_LEN / 8); 711f7917c00SJeff Kirsher return DIV_ROUND_UP(n, 8); 712f7917c00SJeff Kirsher } 713f7917c00SJeff Kirsher 714f7917c00SJeff Kirsher /** 715f7917c00SJeff Kirsher * is_eth_imm - can an Ethernet packet be sent as immediate data? 716f7917c00SJeff Kirsher * @skb: the packet 717f7917c00SJeff Kirsher * 718f7917c00SJeff Kirsher * Returns whether an Ethernet packet is small enough to fit as 7190034b298SKumar Sanghvi * immediate data. Return value corresponds to headroom required. 720f7917c00SJeff Kirsher */ 721f7917c00SJeff Kirsher static inline int is_eth_imm(const struct sk_buff *skb) 722f7917c00SJeff Kirsher { 7230034b298SKumar Sanghvi int hdrlen = skb_shinfo(skb)->gso_size ? 7240034b298SKumar Sanghvi sizeof(struct cpl_tx_pkt_lso_core) : 0; 7250034b298SKumar Sanghvi 7260034b298SKumar Sanghvi hdrlen += sizeof(struct cpl_tx_pkt); 7270034b298SKumar Sanghvi if (skb->len <= MAX_IMM_TX_PKT_LEN - hdrlen) 7280034b298SKumar Sanghvi return hdrlen; 7290034b298SKumar Sanghvi return 0; 730f7917c00SJeff Kirsher } 731f7917c00SJeff Kirsher 732f7917c00SJeff Kirsher /** 733f7917c00SJeff Kirsher * calc_tx_flits - calculate the number of flits for a packet Tx WR 734f7917c00SJeff Kirsher * @skb: the packet 735f7917c00SJeff Kirsher * 736f7917c00SJeff Kirsher * Returns the number of flits needed for a Tx WR for the given Ethernet 737f7917c00SJeff Kirsher * packet, including the needed WR and CPL headers. 738f7917c00SJeff Kirsher */ 739f7917c00SJeff Kirsher static inline unsigned int calc_tx_flits(const struct sk_buff *skb) 740f7917c00SJeff Kirsher { 741f7917c00SJeff Kirsher unsigned int flits; 7420034b298SKumar Sanghvi int hdrlen = is_eth_imm(skb); 743f7917c00SJeff Kirsher 7440034b298SKumar Sanghvi if (hdrlen) 7450034b298SKumar Sanghvi return DIV_ROUND_UP(skb->len + hdrlen, sizeof(__be64)); 746f7917c00SJeff Kirsher 747f7917c00SJeff Kirsher flits = sgl_len(skb_shinfo(skb)->nr_frags + 1) + 4; 748f7917c00SJeff Kirsher if (skb_shinfo(skb)->gso_size) 749f7917c00SJeff Kirsher flits += 2; 750f7917c00SJeff Kirsher return flits; 751f7917c00SJeff Kirsher } 752f7917c00SJeff Kirsher 753f7917c00SJeff Kirsher /** 754f7917c00SJeff Kirsher * calc_tx_descs - calculate the number of Tx descriptors for a packet 755f7917c00SJeff Kirsher * @skb: the packet 756f7917c00SJeff Kirsher * 757f7917c00SJeff Kirsher * Returns the number of Tx descriptors needed for the given Ethernet 758f7917c00SJeff Kirsher * packet, including the needed WR and CPL headers. 
759f7917c00SJeff Kirsher */ 760f7917c00SJeff Kirsher static inline unsigned int calc_tx_descs(const struct sk_buff *skb) 761f7917c00SJeff Kirsher { 762f7917c00SJeff Kirsher return flits_to_desc(calc_tx_flits(skb)); 763f7917c00SJeff Kirsher } 764f7917c00SJeff Kirsher 765f7917c00SJeff Kirsher /** 766f7917c00SJeff Kirsher * write_sgl - populate a scatter/gather list for a packet 767f7917c00SJeff Kirsher * @skb: the packet 768f7917c00SJeff Kirsher * @q: the Tx queue we are writing into 769f7917c00SJeff Kirsher * @sgl: starting location for writing the SGL 770f7917c00SJeff Kirsher * @end: points right after the end of the SGL 771f7917c00SJeff Kirsher * @start: start offset into skb main-body data to include in the SGL 772f7917c00SJeff Kirsher * @addr: the list of bus addresses for the SGL elements 773f7917c00SJeff Kirsher * 774f7917c00SJeff Kirsher * Generates a gather list for the buffers that make up a packet. 775f7917c00SJeff Kirsher * The caller must provide adequate space for the SGL that will be written. 776f7917c00SJeff Kirsher * The SGL includes all of the packet's page fragments and the data in its 777f7917c00SJeff Kirsher * main body except for the first @start bytes. @sgl must be 16-byte 778f7917c00SJeff Kirsher * aligned and within a Tx descriptor with available space. @end points 779f7917c00SJeff Kirsher * right after the end of the SGL but does not account for any potential 780f7917c00SJeff Kirsher * wrap around, i.e., @end > @sgl. 781f7917c00SJeff Kirsher */ 782f7917c00SJeff Kirsher static void write_sgl(const struct sk_buff *skb, struct sge_txq *q, 783f7917c00SJeff Kirsher struct ulptx_sgl *sgl, u64 *end, unsigned int start, 784f7917c00SJeff Kirsher const dma_addr_t *addr) 785f7917c00SJeff Kirsher { 786f7917c00SJeff Kirsher unsigned int i, len; 787f7917c00SJeff Kirsher struct ulptx_sge_pair *to; 788f7917c00SJeff Kirsher const struct skb_shared_info *si = skb_shinfo(skb); 789f7917c00SJeff Kirsher unsigned int nfrags = si->nr_frags; 790f7917c00SJeff Kirsher struct ulptx_sge_pair buf[MAX_SKB_FRAGS / 2 + 1]; 791f7917c00SJeff Kirsher 792f7917c00SJeff Kirsher len = skb_headlen(skb) - start; 793f7917c00SJeff Kirsher if (likely(len)) { 794f7917c00SJeff Kirsher sgl->len0 = htonl(len); 795f7917c00SJeff Kirsher sgl->addr0 = cpu_to_be64(addr[0] + start); 796f7917c00SJeff Kirsher nfrags++; 797f7917c00SJeff Kirsher } else { 7989e903e08SEric Dumazet sgl->len0 = htonl(skb_frag_size(&si->frags[0])); 799f7917c00SJeff Kirsher sgl->addr0 = cpu_to_be64(addr[1]); 800f7917c00SJeff Kirsher } 801f7917c00SJeff Kirsher 802f7917c00SJeff Kirsher sgl->cmd_nsge = htonl(ULPTX_CMD(ULP_TX_SC_DSGL) | ULPTX_NSGE(nfrags)); 803f7917c00SJeff Kirsher if (likely(--nfrags == 0)) 804f7917c00SJeff Kirsher return; 805f7917c00SJeff Kirsher /* 806f7917c00SJeff Kirsher * Most of the complexity below deals with the possibility we hit the 807f7917c00SJeff Kirsher * end of the queue in the middle of writing the SGL. For this case 808f7917c00SJeff Kirsher * only we create the SGL in a temporary buffer and then copy it. 809f7917c00SJeff Kirsher */ 810f7917c00SJeff Kirsher to = (u8 *)end > (u8 *)q->stat ? 
		buf : sgl->sge;

	for (i = (nfrags != si->nr_frags); nfrags >= 2; nfrags -= 2, to++) {
		to->len[0] = cpu_to_be32(skb_frag_size(&si->frags[i]));
		to->len[1] = cpu_to_be32(skb_frag_size(&si->frags[++i]));
		to->addr[0] = cpu_to_be64(addr[i]);
		to->addr[1] = cpu_to_be64(addr[++i]);
	}
	if (nfrags) {
		to->len[0] = cpu_to_be32(skb_frag_size(&si->frags[i]));
		to->len[1] = cpu_to_be32(0);
		to->addr[0] = cpu_to_be64(addr[i + 1]);
	}
	if (unlikely((u8 *)end > (u8 *)q->stat)) {
		unsigned int part0 = (u8 *)q->stat - (u8 *)sgl->sge, part1;

		if (likely(part0))
			memcpy(sgl->sge, buf, part0);
		part1 = (u8 *)end - (u8 *)q->stat;
		memcpy(q->desc, (u8 *)buf + part0, part1);
		end = (void *)q->desc + part1;
	}
	if ((uintptr_t)end & 8)           /* 0-pad to multiple of 16 */
		*end = 0;
}

/* This function copies a 64-byte coalesced work request to memory-mapped
 * BAR2 space (user-space writes).  For a coalesced WR the SGE fetches the
 * data from this FIFO instead of from the host.
 */
static void cxgb_pio_copy(u64 __iomem *dst, u64 *src)
{
	int count = 8;

	while (count) {
		writeq(*src, dst);
		src++;
		dst++;
		count--;
	}
}

/**
 *	ring_tx_db - check and potentially ring a Tx queue's doorbell
 *	@adap: the adapter
 *	@q: the Tx queue
 *	@n: number of new descriptors to give to HW
 *
 *	Ring the doorbell for a Tx queue.
 */
static inline void ring_tx_db(struct adapter *adap, struct sge_txq *q, int n)
{
	unsigned int *wr, index;

	wmb();            /* write descriptors before telling HW */
	spin_lock(&q->db_lock);
	if (!q->db_disabled) {
		if (is_t4(adap->params.chip)) {
			t4_write_reg(adap, MYPF_REG(SGE_PF_KDOORBELL),
				     QID(q->cntxt_id) | PIDX(n));
		} else {
			if (n == 1) {
				index = q->pidx ?
(q->pidx - 1) : (q->size - 1); 87322adfe0aSSantosh Rastapur wr = (unsigned int *)&q->desc[index]; 87422adfe0aSSantosh Rastapur cxgb_pio_copy((u64 __iomem *) 87522adfe0aSSantosh Rastapur (adap->bar2 + q->udb + 64), 87622adfe0aSSantosh Rastapur (u64 *)wr); 87722adfe0aSSantosh Rastapur } else 87822adfe0aSSantosh Rastapur writel(n, adap->bar2 + q->udb + 8); 87922adfe0aSSantosh Rastapur wmb(); 88022adfe0aSSantosh Rastapur } 8813069ee9bSVipul Pandya } 8823069ee9bSVipul Pandya q->db_pidx = q->pidx; 8833069ee9bSVipul Pandya spin_unlock(&q->db_lock); 884f7917c00SJeff Kirsher } 885f7917c00SJeff Kirsher 886f7917c00SJeff Kirsher /** 887f7917c00SJeff Kirsher * inline_tx_skb - inline a packet's data into Tx descriptors 888f7917c00SJeff Kirsher * @skb: the packet 889f7917c00SJeff Kirsher * @q: the Tx queue where the packet will be inlined 890f7917c00SJeff Kirsher * @pos: starting position in the Tx queue where to inline the packet 891f7917c00SJeff Kirsher * 892f7917c00SJeff Kirsher * Inline a packet's contents directly into Tx descriptors, starting at 893f7917c00SJeff Kirsher * the given position within the Tx DMA ring. 894f7917c00SJeff Kirsher * Most of the complexity of this operation is dealing with wrap arounds 895f7917c00SJeff Kirsher * in the middle of the packet we want to inline. 896f7917c00SJeff Kirsher */ 897f7917c00SJeff Kirsher static void inline_tx_skb(const struct sk_buff *skb, const struct sge_txq *q, 898f7917c00SJeff Kirsher void *pos) 899f7917c00SJeff Kirsher { 900f7917c00SJeff Kirsher u64 *p; 901f7917c00SJeff Kirsher int left = (void *)q->stat - pos; 902f7917c00SJeff Kirsher 903f7917c00SJeff Kirsher if (likely(skb->len <= left)) { 904f7917c00SJeff Kirsher if (likely(!skb->data_len)) 905f7917c00SJeff Kirsher skb_copy_from_linear_data(skb, pos, skb->len); 906f7917c00SJeff Kirsher else 907f7917c00SJeff Kirsher skb_copy_bits(skb, 0, pos, skb->len); 908f7917c00SJeff Kirsher pos += skb->len; 909f7917c00SJeff Kirsher } else { 910f7917c00SJeff Kirsher skb_copy_bits(skb, 0, pos, left); 911f7917c00SJeff Kirsher skb_copy_bits(skb, left, q->desc, skb->len - left); 912f7917c00SJeff Kirsher pos = (void *)q->desc + (skb->len - left); 913f7917c00SJeff Kirsher } 914f7917c00SJeff Kirsher 915f7917c00SJeff Kirsher /* 0-pad to multiple of 16 */ 916f7917c00SJeff Kirsher p = PTR_ALIGN(pos, 8); 917f7917c00SJeff Kirsher if ((uintptr_t)p & 8) 918f7917c00SJeff Kirsher *p = 0; 919f7917c00SJeff Kirsher } 920f7917c00SJeff Kirsher 921f7917c00SJeff Kirsher /* 922f7917c00SJeff Kirsher * Figure out what HW csum a packet wants and return the appropriate control 923f7917c00SJeff Kirsher * bits. 
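 * Only TCP and UDP over plain IPv4 or IPv6 get a real checksum type; any
 * other protocol (including IPv6 packets with extension headers) falls back
 * to TXPKT_L4CSUM_DIS and relies on the receiver to catch bad packets.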
924f7917c00SJeff Kirsher */ 925f7917c00SJeff Kirsher static u64 hwcsum(const struct sk_buff *skb) 926f7917c00SJeff Kirsher { 927f7917c00SJeff Kirsher int csum_type; 928f7917c00SJeff Kirsher const struct iphdr *iph = ip_hdr(skb); 929f7917c00SJeff Kirsher 930f7917c00SJeff Kirsher if (iph->version == 4) { 931f7917c00SJeff Kirsher if (iph->protocol == IPPROTO_TCP) 932f7917c00SJeff Kirsher csum_type = TX_CSUM_TCPIP; 933f7917c00SJeff Kirsher else if (iph->protocol == IPPROTO_UDP) 934f7917c00SJeff Kirsher csum_type = TX_CSUM_UDPIP; 935f7917c00SJeff Kirsher else { 936f7917c00SJeff Kirsher nocsum: /* 937f7917c00SJeff Kirsher * unknown protocol, disable HW csum 938f7917c00SJeff Kirsher * and hope a bad packet is detected 939f7917c00SJeff Kirsher */ 940f7917c00SJeff Kirsher return TXPKT_L4CSUM_DIS; 941f7917c00SJeff Kirsher } 942f7917c00SJeff Kirsher } else { 943f7917c00SJeff Kirsher /* 944f7917c00SJeff Kirsher * this doesn't work with extension headers 945f7917c00SJeff Kirsher */ 946f7917c00SJeff Kirsher const struct ipv6hdr *ip6h = (const struct ipv6hdr *)iph; 947f7917c00SJeff Kirsher 948f7917c00SJeff Kirsher if (ip6h->nexthdr == IPPROTO_TCP) 949f7917c00SJeff Kirsher csum_type = TX_CSUM_TCPIP6; 950f7917c00SJeff Kirsher else if (ip6h->nexthdr == IPPROTO_UDP) 951f7917c00SJeff Kirsher csum_type = TX_CSUM_UDPIP6; 952f7917c00SJeff Kirsher else 953f7917c00SJeff Kirsher goto nocsum; 954f7917c00SJeff Kirsher } 955f7917c00SJeff Kirsher 956f7917c00SJeff Kirsher if (likely(csum_type >= TX_CSUM_TCPIP)) 957f7917c00SJeff Kirsher return TXPKT_CSUM_TYPE(csum_type) | 958f7917c00SJeff Kirsher TXPKT_IPHDR_LEN(skb_network_header_len(skb)) | 959f7917c00SJeff Kirsher TXPKT_ETHHDR_LEN(skb_network_offset(skb) - ETH_HLEN); 960f7917c00SJeff Kirsher else { 961f7917c00SJeff Kirsher int start = skb_transport_offset(skb); 962f7917c00SJeff Kirsher 963f7917c00SJeff Kirsher return TXPKT_CSUM_TYPE(csum_type) | TXPKT_CSUM_START(start) | 964f7917c00SJeff Kirsher TXPKT_CSUM_LOC(start + skb->csum_offset); 965f7917c00SJeff Kirsher } 966f7917c00SJeff Kirsher } 967f7917c00SJeff Kirsher 968f7917c00SJeff Kirsher static void eth_txq_stop(struct sge_eth_txq *q) 969f7917c00SJeff Kirsher { 970f7917c00SJeff Kirsher netif_tx_stop_queue(q->txq); 971f7917c00SJeff Kirsher q->q.stops++; 972f7917c00SJeff Kirsher } 973f7917c00SJeff Kirsher 974f7917c00SJeff Kirsher static inline void txq_advance(struct sge_txq *q, unsigned int n) 975f7917c00SJeff Kirsher { 976f7917c00SJeff Kirsher q->in_use += n; 977f7917c00SJeff Kirsher q->pidx += n; 978f7917c00SJeff Kirsher if (q->pidx >= q->size) 979f7917c00SJeff Kirsher q->pidx -= q->size; 980f7917c00SJeff Kirsher } 981f7917c00SJeff Kirsher 982f7917c00SJeff Kirsher /** 983f7917c00SJeff Kirsher * t4_eth_xmit - add a packet to an Ethernet Tx queue 984f7917c00SJeff Kirsher * @skb: the packet 985f7917c00SJeff Kirsher * @dev: the egress net device 986f7917c00SJeff Kirsher * 987f7917c00SJeff Kirsher * Add a packet to an SGE Ethernet Tx queue. Runs with softirqs disabled. 
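 *	The flow is: reclaim completed descriptors, check that the ring has
 *	room, build the work request (adding an LSO header for GSO packets),
 *	then either inline a small packet into the descriptors or attach a
 *	gather list, and finally advance the ring and ring the doorbell.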
988f7917c00SJeff Kirsher */ 989f7917c00SJeff Kirsher netdev_tx_t t4_eth_xmit(struct sk_buff *skb, struct net_device *dev) 990f7917c00SJeff Kirsher { 9910034b298SKumar Sanghvi int len; 992f7917c00SJeff Kirsher u32 wr_mid; 993f7917c00SJeff Kirsher u64 cntrl, *end; 994f7917c00SJeff Kirsher int qidx, credits; 995f7917c00SJeff Kirsher unsigned int flits, ndesc; 996f7917c00SJeff Kirsher struct adapter *adap; 997f7917c00SJeff Kirsher struct sge_eth_txq *q; 998f7917c00SJeff Kirsher const struct port_info *pi; 999f7917c00SJeff Kirsher struct fw_eth_tx_pkt_wr *wr; 1000f7917c00SJeff Kirsher struct cpl_tx_pkt_core *cpl; 1001f7917c00SJeff Kirsher const struct skb_shared_info *ssi; 1002f7917c00SJeff Kirsher dma_addr_t addr[MAX_SKB_FRAGS + 1]; 10030034b298SKumar Sanghvi bool immediate = false; 1004f7917c00SJeff Kirsher 1005f7917c00SJeff Kirsher /* 1006f7917c00SJeff Kirsher * The chip min packet length is 10 octets but play safe and reject 1007f7917c00SJeff Kirsher * anything shorter than an Ethernet header. 1008f7917c00SJeff Kirsher */ 1009f7917c00SJeff Kirsher if (unlikely(skb->len < ETH_HLEN)) { 1010f7917c00SJeff Kirsher out_free: dev_kfree_skb(skb); 1011f7917c00SJeff Kirsher return NETDEV_TX_OK; 1012f7917c00SJeff Kirsher } 1013f7917c00SJeff Kirsher 1014f7917c00SJeff Kirsher pi = netdev_priv(dev); 1015f7917c00SJeff Kirsher adap = pi->adapter; 1016f7917c00SJeff Kirsher qidx = skb_get_queue_mapping(skb); 1017f7917c00SJeff Kirsher q = &adap->sge.ethtxq[qidx + pi->first_qset]; 1018f7917c00SJeff Kirsher 1019f7917c00SJeff Kirsher reclaim_completed_tx(adap, &q->q, true); 1020f7917c00SJeff Kirsher 1021f7917c00SJeff Kirsher flits = calc_tx_flits(skb); 1022f7917c00SJeff Kirsher ndesc = flits_to_desc(flits); 1023f7917c00SJeff Kirsher credits = txq_avail(&q->q) - ndesc; 1024f7917c00SJeff Kirsher 1025f7917c00SJeff Kirsher if (unlikely(credits < 0)) { 1026f7917c00SJeff Kirsher eth_txq_stop(q); 1027f7917c00SJeff Kirsher dev_err(adap->pdev_dev, 1028f7917c00SJeff Kirsher "%s: Tx ring %u full while queue awake!\n", 1029f7917c00SJeff Kirsher dev->name, qidx); 1030f7917c00SJeff Kirsher return NETDEV_TX_BUSY; 1031f7917c00SJeff Kirsher } 1032f7917c00SJeff Kirsher 10330034b298SKumar Sanghvi if (is_eth_imm(skb)) 10340034b298SKumar Sanghvi immediate = true; 10350034b298SKumar Sanghvi 10360034b298SKumar Sanghvi if (!immediate && 1037f7917c00SJeff Kirsher unlikely(map_skb(adap->pdev_dev, skb, addr) < 0)) { 1038f7917c00SJeff Kirsher q->mapping_err++; 1039f7917c00SJeff Kirsher goto out_free; 1040f7917c00SJeff Kirsher } 1041f7917c00SJeff Kirsher 1042f7917c00SJeff Kirsher wr_mid = FW_WR_LEN16(DIV_ROUND_UP(flits, 2)); 1043f7917c00SJeff Kirsher if (unlikely(credits < ETHTXQ_STOP_THRES)) { 1044f7917c00SJeff Kirsher eth_txq_stop(q); 1045f7917c00SJeff Kirsher wr_mid |= FW_WR_EQUEQ | FW_WR_EQUIQ; 1046f7917c00SJeff Kirsher } 1047f7917c00SJeff Kirsher 1048f7917c00SJeff Kirsher wr = (void *)&q->q.desc[q->q.pidx]; 1049f7917c00SJeff Kirsher wr->equiq_to_len16 = htonl(wr_mid); 1050f7917c00SJeff Kirsher wr->r3 = cpu_to_be64(0); 1051f7917c00SJeff Kirsher end = (u64 *)wr + flits; 1052f7917c00SJeff Kirsher 10530034b298SKumar Sanghvi len = immediate ? 
skb->len : 0; 1054f7917c00SJeff Kirsher ssi = skb_shinfo(skb); 1055f7917c00SJeff Kirsher if (ssi->gso_size) { 1056f7917c00SJeff Kirsher struct cpl_tx_pkt_lso *lso = (void *)wr; 1057f7917c00SJeff Kirsher bool v6 = (ssi->gso_type & SKB_GSO_TCPV6) != 0; 1058f7917c00SJeff Kirsher int l3hdr_len = skb_network_header_len(skb); 1059f7917c00SJeff Kirsher int eth_xtra_len = skb_network_offset(skb) - ETH_HLEN; 1060f7917c00SJeff Kirsher 10610034b298SKumar Sanghvi len += sizeof(*lso); 1062f7917c00SJeff Kirsher wr->op_immdlen = htonl(FW_WR_OP(FW_ETH_TX_PKT_WR) | 10630034b298SKumar Sanghvi FW_WR_IMMDLEN(len)); 1064f7917c00SJeff Kirsher lso->c.lso_ctrl = htonl(LSO_OPCODE(CPL_TX_PKT_LSO) | 1065f7917c00SJeff Kirsher LSO_FIRST_SLICE | LSO_LAST_SLICE | 1066f7917c00SJeff Kirsher LSO_IPV6(v6) | 1067f7917c00SJeff Kirsher LSO_ETHHDR_LEN(eth_xtra_len / 4) | 1068f7917c00SJeff Kirsher LSO_IPHDR_LEN(l3hdr_len / 4) | 1069f7917c00SJeff Kirsher LSO_TCPHDR_LEN(tcp_hdr(skb)->doff)); 1070f7917c00SJeff Kirsher lso->c.ipid_ofst = htons(0); 1071f7917c00SJeff Kirsher lso->c.mss = htons(ssi->gso_size); 1072f7917c00SJeff Kirsher lso->c.seqno_offset = htonl(0); 1073f7917c00SJeff Kirsher lso->c.len = htonl(skb->len); 1074f7917c00SJeff Kirsher cpl = (void *)(lso + 1); 1075f7917c00SJeff Kirsher cntrl = TXPKT_CSUM_TYPE(v6 ? TX_CSUM_TCPIP6 : TX_CSUM_TCPIP) | 1076f7917c00SJeff Kirsher TXPKT_IPHDR_LEN(l3hdr_len) | 1077f7917c00SJeff Kirsher TXPKT_ETHHDR_LEN(eth_xtra_len); 1078f7917c00SJeff Kirsher q->tso++; 1079f7917c00SJeff Kirsher q->tx_cso += ssi->gso_segs; 1080f7917c00SJeff Kirsher } else { 1081ca71de6bSKumar Sanghvi len += sizeof(*cpl); 1082f7917c00SJeff Kirsher wr->op_immdlen = htonl(FW_WR_OP(FW_ETH_TX_PKT_WR) | 1083f7917c00SJeff Kirsher FW_WR_IMMDLEN(len)); 1084f7917c00SJeff Kirsher cpl = (void *)(wr + 1); 1085f7917c00SJeff Kirsher if (skb->ip_summed == CHECKSUM_PARTIAL) { 1086f7917c00SJeff Kirsher cntrl = hwcsum(skb) | TXPKT_IPCSUM_DIS; 1087f7917c00SJeff Kirsher q->tx_cso++; 1088f7917c00SJeff Kirsher } else 1089f7917c00SJeff Kirsher cntrl = TXPKT_L4CSUM_DIS | TXPKT_IPCSUM_DIS; 1090f7917c00SJeff Kirsher } 1091f7917c00SJeff Kirsher 1092f7917c00SJeff Kirsher if (vlan_tx_tag_present(skb)) { 1093f7917c00SJeff Kirsher q->vlan_ins++; 1094f7917c00SJeff Kirsher cntrl |= TXPKT_VLAN_VLD | TXPKT_VLAN(vlan_tx_tag_get(skb)); 1095f7917c00SJeff Kirsher } 1096f7917c00SJeff Kirsher 1097f7917c00SJeff Kirsher cpl->ctrl0 = htonl(TXPKT_OPCODE(CPL_TX_PKT_XT) | 1098f7917c00SJeff Kirsher TXPKT_INTF(pi->tx_chan) | TXPKT_PF(adap->fn)); 1099f7917c00SJeff Kirsher cpl->pack = htons(0); 1100f7917c00SJeff Kirsher cpl->len = htons(skb->len); 1101f7917c00SJeff Kirsher cpl->ctrl1 = cpu_to_be64(cntrl); 1102f7917c00SJeff Kirsher 11030034b298SKumar Sanghvi if (immediate) { 1104f7917c00SJeff Kirsher inline_tx_skb(skb, &q->q, cpl + 1); 1105f7917c00SJeff Kirsher dev_kfree_skb(skb); 1106f7917c00SJeff Kirsher } else { 1107f7917c00SJeff Kirsher int last_desc; 1108f7917c00SJeff Kirsher 1109f7917c00SJeff Kirsher write_sgl(skb, &q->q, (struct ulptx_sgl *)(cpl + 1), end, 0, 1110f7917c00SJeff Kirsher addr); 1111f7917c00SJeff Kirsher skb_orphan(skb); 1112f7917c00SJeff Kirsher 1113f7917c00SJeff Kirsher last_desc = q->q.pidx + ndesc - 1; 1114f7917c00SJeff Kirsher if (last_desc >= q->q.size) 1115f7917c00SJeff Kirsher last_desc -= q->q.size; 1116f7917c00SJeff Kirsher q->q.sdesc[last_desc].skb = skb; 1117f7917c00SJeff Kirsher q->q.sdesc[last_desc].sgl = (struct ulptx_sgl *)(cpl + 1); 1118f7917c00SJeff Kirsher } 1119f7917c00SJeff Kirsher 1120f7917c00SJeff Kirsher txq_advance(&q->q, 
ndesc); 1121f7917c00SJeff Kirsher 1122f7917c00SJeff Kirsher ring_tx_db(adap, &q->q, ndesc); 1123f7917c00SJeff Kirsher return NETDEV_TX_OK; 1124f7917c00SJeff Kirsher } 1125f7917c00SJeff Kirsher 1126f7917c00SJeff Kirsher /** 1127f7917c00SJeff Kirsher * reclaim_completed_tx_imm - reclaim completed control-queue Tx descs 1128f7917c00SJeff Kirsher * @q: the SGE control Tx queue 1129f7917c00SJeff Kirsher * 1130f7917c00SJeff Kirsher * This is a variant of reclaim_completed_tx() that is used for Tx queues 1131f7917c00SJeff Kirsher * that send only immediate data (presently just the control queues) and 1132f7917c00SJeff Kirsher * thus do not have any sk_buffs to release. 1133f7917c00SJeff Kirsher */ 1134f7917c00SJeff Kirsher static inline void reclaim_completed_tx_imm(struct sge_txq *q) 1135f7917c00SJeff Kirsher { 1136f7917c00SJeff Kirsher int hw_cidx = ntohs(q->stat->cidx); 1137f7917c00SJeff Kirsher int reclaim = hw_cidx - q->cidx; 1138f7917c00SJeff Kirsher 1139f7917c00SJeff Kirsher if (reclaim < 0) 1140f7917c00SJeff Kirsher reclaim += q->size; 1141f7917c00SJeff Kirsher 1142f7917c00SJeff Kirsher q->in_use -= reclaim; 1143f7917c00SJeff Kirsher q->cidx = hw_cidx; 1144f7917c00SJeff Kirsher } 1145f7917c00SJeff Kirsher 1146f7917c00SJeff Kirsher /** 1147f7917c00SJeff Kirsher * is_imm - check whether a packet can be sent as immediate data 1148f7917c00SJeff Kirsher * @skb: the packet 1149f7917c00SJeff Kirsher * 1150f7917c00SJeff Kirsher * Returns true if a packet can be sent as a WR with immediate data. 1151f7917c00SJeff Kirsher */ 1152f7917c00SJeff Kirsher static inline int is_imm(const struct sk_buff *skb) 1153f7917c00SJeff Kirsher { 1154f7917c00SJeff Kirsher return skb->len <= MAX_CTRL_WR_LEN; 1155f7917c00SJeff Kirsher } 1156f7917c00SJeff Kirsher 1157f7917c00SJeff Kirsher /** 1158f7917c00SJeff Kirsher * ctrlq_check_stop - check if a control queue is full and should stop 1159f7917c00SJeff Kirsher * @q: the queue 1160f7917c00SJeff Kirsher * @wr: most recent WR written to the queue 1161f7917c00SJeff Kirsher * 1162f7917c00SJeff Kirsher * Check if a control queue has become full and should be stopped. 1163f7917c00SJeff Kirsher * We clean up control queue descriptors very lazily, only when we are out. 1164f7917c00SJeff Kirsher * If the queue is still full after reclaiming any completed descriptors 1165f7917c00SJeff Kirsher * we suspend it and have the last WR wake it up. 1166f7917c00SJeff Kirsher */ 1167f7917c00SJeff Kirsher static void ctrlq_check_stop(struct sge_ctrl_txq *q, struct fw_wr_hdr *wr) 1168f7917c00SJeff Kirsher { 1169f7917c00SJeff Kirsher reclaim_completed_tx_imm(&q->q); 1170f7917c00SJeff Kirsher if (unlikely(txq_avail(&q->q) < TXQ_STOP_THRES)) { 1171f7917c00SJeff Kirsher wr->lo |= htonl(FW_WR_EQUEQ | FW_WR_EQUIQ); 1172f7917c00SJeff Kirsher q->q.stops++; 1173f7917c00SJeff Kirsher q->full = 1; 1174f7917c00SJeff Kirsher } 1175f7917c00SJeff Kirsher } 1176f7917c00SJeff Kirsher 1177f7917c00SJeff Kirsher /** 1178f7917c00SJeff Kirsher * ctrl_xmit - send a packet through an SGE control Tx queue 1179f7917c00SJeff Kirsher * @q: the control queue 1180f7917c00SJeff Kirsher * @skb: the packet 1181f7917c00SJeff Kirsher * 1182f7917c00SJeff Kirsher * Send a packet through an SGE control Tx queue. Packets sent through 1183f7917c00SJeff Kirsher * a control queue must fit entirely as immediate data. 
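 *
 *	Each Tx descriptor holds 8 flits (64 bytes on this hardware), so the
 *	descriptor count below is DIV_ROUND_UP(skb->len, sizeof(struct tx_desc));
 *	a 100-byte WR, for example, occupies two descriptors.  When the queue
 *	is already marked full the skb is put on @sendq with that count saved
 *	in skb->priority and %NET_XMIT_CN is returned; restart_ctrlq() later
 *	drains the backlog once descriptors have been reclaimed.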
1184f7917c00SJeff Kirsher */ 1185f7917c00SJeff Kirsher static int ctrl_xmit(struct sge_ctrl_txq *q, struct sk_buff *skb) 1186f7917c00SJeff Kirsher { 1187f7917c00SJeff Kirsher unsigned int ndesc; 1188f7917c00SJeff Kirsher struct fw_wr_hdr *wr; 1189f7917c00SJeff Kirsher 1190f7917c00SJeff Kirsher if (unlikely(!is_imm(skb))) { 1191f7917c00SJeff Kirsher WARN_ON(1); 1192f7917c00SJeff Kirsher dev_kfree_skb(skb); 1193f7917c00SJeff Kirsher return NET_XMIT_DROP; 1194f7917c00SJeff Kirsher } 1195f7917c00SJeff Kirsher 1196f7917c00SJeff Kirsher ndesc = DIV_ROUND_UP(skb->len, sizeof(struct tx_desc)); 1197f7917c00SJeff Kirsher spin_lock(&q->sendq.lock); 1198f7917c00SJeff Kirsher 1199f7917c00SJeff Kirsher if (unlikely(q->full)) { 1200f7917c00SJeff Kirsher skb->priority = ndesc; /* save for restart */ 1201f7917c00SJeff Kirsher __skb_queue_tail(&q->sendq, skb); 1202f7917c00SJeff Kirsher spin_unlock(&q->sendq.lock); 1203f7917c00SJeff Kirsher return NET_XMIT_CN; 1204f7917c00SJeff Kirsher } 1205f7917c00SJeff Kirsher 1206f7917c00SJeff Kirsher wr = (struct fw_wr_hdr *)&q->q.desc[q->q.pidx]; 1207f7917c00SJeff Kirsher inline_tx_skb(skb, &q->q, wr); 1208f7917c00SJeff Kirsher 1209f7917c00SJeff Kirsher txq_advance(&q->q, ndesc); 1210f7917c00SJeff Kirsher if (unlikely(txq_avail(&q->q) < TXQ_STOP_THRES)) 1211f7917c00SJeff Kirsher ctrlq_check_stop(q, wr); 1212f7917c00SJeff Kirsher 1213f7917c00SJeff Kirsher ring_tx_db(q->adap, &q->q, ndesc); 1214f7917c00SJeff Kirsher spin_unlock(&q->sendq.lock); 1215f7917c00SJeff Kirsher 1216f7917c00SJeff Kirsher kfree_skb(skb); 1217f7917c00SJeff Kirsher return NET_XMIT_SUCCESS; 1218f7917c00SJeff Kirsher } 1219f7917c00SJeff Kirsher 1220f7917c00SJeff Kirsher /** 1221f7917c00SJeff Kirsher * restart_ctrlq - restart a suspended control queue 1222f7917c00SJeff Kirsher * @data: the control queue to restart 1223f7917c00SJeff Kirsher * 1224f7917c00SJeff Kirsher * Resumes transmission on a suspended Tx control queue. 1225f7917c00SJeff Kirsher */ 1226f7917c00SJeff Kirsher static void restart_ctrlq(unsigned long data) 1227f7917c00SJeff Kirsher { 1228f7917c00SJeff Kirsher struct sk_buff *skb; 1229f7917c00SJeff Kirsher unsigned int written = 0; 1230f7917c00SJeff Kirsher struct sge_ctrl_txq *q = (struct sge_ctrl_txq *)data; 1231f7917c00SJeff Kirsher 1232f7917c00SJeff Kirsher spin_lock(&q->sendq.lock); 1233f7917c00SJeff Kirsher reclaim_completed_tx_imm(&q->q); 1234f7917c00SJeff Kirsher BUG_ON(txq_avail(&q->q) < TXQ_STOP_THRES); /* q should be empty */ 1235f7917c00SJeff Kirsher 1236f7917c00SJeff Kirsher while ((skb = __skb_dequeue(&q->sendq)) != NULL) { 1237f7917c00SJeff Kirsher struct fw_wr_hdr *wr; 1238f7917c00SJeff Kirsher unsigned int ndesc = skb->priority; /* previously saved */ 1239f7917c00SJeff Kirsher 1240f7917c00SJeff Kirsher /* 1241f7917c00SJeff Kirsher * Write descriptors and free skbs outside the lock to limit 1242f7917c00SJeff Kirsher * wait times. q->full is still set so new skbs will be queued. 
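		 * The doorbell is rung once more than 16 descriptors have
		 * accumulated and again at the end for any remainder.  If
		 * ctrlq_check_stop() suspends the queue again (q->q.stops
		 * changes), we retake the lock and bail out so the doorbell
		 * covers what has been written so far.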
1243f7917c00SJeff Kirsher */ 1244f7917c00SJeff Kirsher spin_unlock(&q->sendq.lock); 1245f7917c00SJeff Kirsher 1246f7917c00SJeff Kirsher wr = (struct fw_wr_hdr *)&q->q.desc[q->q.pidx]; 1247f7917c00SJeff Kirsher inline_tx_skb(skb, &q->q, wr); 1248f7917c00SJeff Kirsher kfree_skb(skb); 1249f7917c00SJeff Kirsher 1250f7917c00SJeff Kirsher written += ndesc; 1251f7917c00SJeff Kirsher txq_advance(&q->q, ndesc); 1252f7917c00SJeff Kirsher if (unlikely(txq_avail(&q->q) < TXQ_STOP_THRES)) { 1253f7917c00SJeff Kirsher unsigned long old = q->q.stops; 1254f7917c00SJeff Kirsher 1255f7917c00SJeff Kirsher ctrlq_check_stop(q, wr); 1256f7917c00SJeff Kirsher if (q->q.stops != old) { /* suspended anew */ 1257f7917c00SJeff Kirsher spin_lock(&q->sendq.lock); 1258f7917c00SJeff Kirsher goto ringdb; 1259f7917c00SJeff Kirsher } 1260f7917c00SJeff Kirsher } 1261f7917c00SJeff Kirsher if (written > 16) { 1262f7917c00SJeff Kirsher ring_tx_db(q->adap, &q->q, written); 1263f7917c00SJeff Kirsher written = 0; 1264f7917c00SJeff Kirsher } 1265f7917c00SJeff Kirsher spin_lock(&q->sendq.lock); 1266f7917c00SJeff Kirsher } 1267f7917c00SJeff Kirsher q->full = 0; 1268f7917c00SJeff Kirsher ringdb: if (written) 1269f7917c00SJeff Kirsher ring_tx_db(q->adap, &q->q, written); 1270f7917c00SJeff Kirsher spin_unlock(&q->sendq.lock); 1271f7917c00SJeff Kirsher } 1272f7917c00SJeff Kirsher 1273f7917c00SJeff Kirsher /** 1274f7917c00SJeff Kirsher * t4_mgmt_tx - send a management message 1275f7917c00SJeff Kirsher * @adap: the adapter 1276f7917c00SJeff Kirsher * @skb: the packet containing the management message 1277f7917c00SJeff Kirsher * 1278f7917c00SJeff Kirsher * Send a management message through control queue 0. 1279f7917c00SJeff Kirsher */ 1280f7917c00SJeff Kirsher int t4_mgmt_tx(struct adapter *adap, struct sk_buff *skb) 1281f7917c00SJeff Kirsher { 1282f7917c00SJeff Kirsher int ret; 1283f7917c00SJeff Kirsher 1284f7917c00SJeff Kirsher local_bh_disable(); 1285f7917c00SJeff Kirsher ret = ctrl_xmit(&adap->sge.ctrlq[0], skb); 1286f7917c00SJeff Kirsher local_bh_enable(); 1287f7917c00SJeff Kirsher return ret; 1288f7917c00SJeff Kirsher } 1289f7917c00SJeff Kirsher 1290f7917c00SJeff Kirsher /** 1291f7917c00SJeff Kirsher * is_ofld_imm - check whether a packet can be sent as immediate data 1292f7917c00SJeff Kirsher * @skb: the packet 1293f7917c00SJeff Kirsher * 1294f7917c00SJeff Kirsher * Returns true if a packet can be sent as an offload WR with immediate 1295f7917c00SJeff Kirsher * data. We currently use the same limit as for Ethernet packets. 1296f7917c00SJeff Kirsher */ 1297f7917c00SJeff Kirsher static inline int is_ofld_imm(const struct sk_buff *skb) 1298f7917c00SJeff Kirsher { 1299f7917c00SJeff Kirsher return skb->len <= MAX_IMM_TX_PKT_LEN; 1300f7917c00SJeff Kirsher } 1301f7917c00SJeff Kirsher 1302f7917c00SJeff Kirsher /** 1303f7917c00SJeff Kirsher * calc_tx_flits_ofld - calculate # of flits for an offload packet 1304f7917c00SJeff Kirsher * @skb: the packet 1305f7917c00SJeff Kirsher * 1306f7917c00SJeff Kirsher * Returns the number of flits needed for the given offload packet. 1307f7917c00SJeff Kirsher * These packets are already fully constructed and no additional headers 1308f7917c00SJeff Kirsher * will be added. 
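 *
 *	A flit is one 64-bit word.  Immediate packets need just
 *	DIV_ROUND_UP(skb->len, 8) flits; otherwise the pre-built headers
 *	(everything up to the transport header) are counted in flits and an
 *	SGL sized by sgl_len() is added for the page fragments, plus one more
 *	entry if a linear tail follows the headers.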
1309f7917c00SJeff Kirsher */ 1310f7917c00SJeff Kirsher static inline unsigned int calc_tx_flits_ofld(const struct sk_buff *skb) 1311f7917c00SJeff Kirsher { 1312f7917c00SJeff Kirsher unsigned int flits, cnt; 1313f7917c00SJeff Kirsher 1314f7917c00SJeff Kirsher if (is_ofld_imm(skb)) 1315f7917c00SJeff Kirsher return DIV_ROUND_UP(skb->len, 8); 1316f7917c00SJeff Kirsher 1317f7917c00SJeff Kirsher flits = skb_transport_offset(skb) / 8U; /* headers */ 1318f7917c00SJeff Kirsher cnt = skb_shinfo(skb)->nr_frags; 131915dd16c2SLi RongQing if (skb_tail_pointer(skb) != skb_transport_header(skb)) 1320f7917c00SJeff Kirsher cnt++; 1321f7917c00SJeff Kirsher return flits + sgl_len(cnt); 1322f7917c00SJeff Kirsher } 1323f7917c00SJeff Kirsher 1324f7917c00SJeff Kirsher /** 1325f7917c00SJeff Kirsher * txq_stop_maperr - stop a Tx queue due to I/O MMU exhaustion 1326f7917c00SJeff Kirsher * @adap: the adapter 1327f7917c00SJeff Kirsher * @q: the queue to stop 1328f7917c00SJeff Kirsher * 1329f7917c00SJeff Kirsher * Mark a Tx queue stopped due to I/O MMU exhaustion and resulting 1330f7917c00SJeff Kirsher * inability to map packets. A periodic timer attempts to restart 1331f7917c00SJeff Kirsher * queues so marked. 1332f7917c00SJeff Kirsher */ 1333f7917c00SJeff Kirsher static void txq_stop_maperr(struct sge_ofld_txq *q) 1334f7917c00SJeff Kirsher { 1335f7917c00SJeff Kirsher q->mapping_err++; 1336f7917c00SJeff Kirsher q->q.stops++; 1337f7917c00SJeff Kirsher set_bit(q->q.cntxt_id - q->adap->sge.egr_start, 1338f7917c00SJeff Kirsher q->adap->sge.txq_maperr); 1339f7917c00SJeff Kirsher } 1340f7917c00SJeff Kirsher 1341f7917c00SJeff Kirsher /** 1342f7917c00SJeff Kirsher * ofldtxq_stop - stop an offload Tx queue that has become full 1343f7917c00SJeff Kirsher * @q: the queue to stop 1344f7917c00SJeff Kirsher * @skb: the packet causing the queue to become full 1345f7917c00SJeff Kirsher * 1346f7917c00SJeff Kirsher * Stops an offload Tx queue that has become full and modifies the packet 1347f7917c00SJeff Kirsher * being written to request a wakeup. 1348f7917c00SJeff Kirsher */ 1349f7917c00SJeff Kirsher static void ofldtxq_stop(struct sge_ofld_txq *q, struct sk_buff *skb) 1350f7917c00SJeff Kirsher { 1351f7917c00SJeff Kirsher struct fw_wr_hdr *wr = (struct fw_wr_hdr *)skb->data; 1352f7917c00SJeff Kirsher 1353f7917c00SJeff Kirsher wr->lo |= htonl(FW_WR_EQUEQ | FW_WR_EQUIQ); 1354f7917c00SJeff Kirsher q->q.stops++; 1355f7917c00SJeff Kirsher q->full = 1; 1356f7917c00SJeff Kirsher } 1357f7917c00SJeff Kirsher 1358f7917c00SJeff Kirsher /** 1359f7917c00SJeff Kirsher * service_ofldq - restart a suspended offload queue 1360f7917c00SJeff Kirsher * @q: the offload queue 1361f7917c00SJeff Kirsher * 1362f7917c00SJeff Kirsher * Services an offload Tx queue by moving packets from its packet queue 1363f7917c00SJeff Kirsher * to the HW Tx ring. The function starts and ends with the queue locked. 1364f7917c00SJeff Kirsher */ 1365f7917c00SJeff Kirsher static void service_ofldq(struct sge_ofld_txq *q) 1366f7917c00SJeff Kirsher { 1367f7917c00SJeff Kirsher u64 *pos; 1368f7917c00SJeff Kirsher int credits; 1369f7917c00SJeff Kirsher struct sk_buff *skb; 1370f7917c00SJeff Kirsher unsigned int written = 0; 1371f7917c00SJeff Kirsher unsigned int flits, ndesc; 1372f7917c00SJeff Kirsher 1373f7917c00SJeff Kirsher while ((skb = skb_peek(&q->sendq)) != NULL && !q->full) { 1374f7917c00SJeff Kirsher /* 1375f7917c00SJeff Kirsher * We drop the lock but leave skb on sendq, thus retaining 1376f7917c00SJeff Kirsher * exclusive access to the state of the queue. 
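		 * Descriptors are written and the doorbell rung (whenever
		 * more than 32 descriptors have accumulated) before the lock
		 * is retaken; only then is the skb unlinked from sendq, and
		 * immediate-data skbs are freed since nothing references
		 * them afterwards.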
1377f7917c00SJeff Kirsher */ 1378f7917c00SJeff Kirsher spin_unlock(&q->sendq.lock); 1379f7917c00SJeff Kirsher 1380f7917c00SJeff Kirsher reclaim_completed_tx(q->adap, &q->q, false); 1381f7917c00SJeff Kirsher 1382f7917c00SJeff Kirsher flits = skb->priority; /* previously saved */ 1383f7917c00SJeff Kirsher ndesc = flits_to_desc(flits); 1384f7917c00SJeff Kirsher credits = txq_avail(&q->q) - ndesc; 1385f7917c00SJeff Kirsher BUG_ON(credits < 0); 1386f7917c00SJeff Kirsher if (unlikely(credits < TXQ_STOP_THRES)) 1387f7917c00SJeff Kirsher ofldtxq_stop(q, skb); 1388f7917c00SJeff Kirsher 1389f7917c00SJeff Kirsher pos = (u64 *)&q->q.desc[q->q.pidx]; 1390f7917c00SJeff Kirsher if (is_ofld_imm(skb)) 1391f7917c00SJeff Kirsher inline_tx_skb(skb, &q->q, pos); 1392f7917c00SJeff Kirsher else if (map_skb(q->adap->pdev_dev, skb, 1393f7917c00SJeff Kirsher (dma_addr_t *)skb->head)) { 1394f7917c00SJeff Kirsher txq_stop_maperr(q); 1395f7917c00SJeff Kirsher spin_lock(&q->sendq.lock); 1396f7917c00SJeff Kirsher break; 1397f7917c00SJeff Kirsher } else { 1398f7917c00SJeff Kirsher int last_desc, hdr_len = skb_transport_offset(skb); 1399f7917c00SJeff Kirsher 1400f7917c00SJeff Kirsher memcpy(pos, skb->data, hdr_len); 1401f7917c00SJeff Kirsher write_sgl(skb, &q->q, (void *)pos + hdr_len, 1402f7917c00SJeff Kirsher pos + flits, hdr_len, 1403f7917c00SJeff Kirsher (dma_addr_t *)skb->head); 1404f7917c00SJeff Kirsher #ifdef CONFIG_NEED_DMA_MAP_STATE 1405f7917c00SJeff Kirsher skb->dev = q->adap->port[0]; 1406f7917c00SJeff Kirsher skb->destructor = deferred_unmap_destructor; 1407f7917c00SJeff Kirsher #endif 1408f7917c00SJeff Kirsher last_desc = q->q.pidx + ndesc - 1; 1409f7917c00SJeff Kirsher if (last_desc >= q->q.size) 1410f7917c00SJeff Kirsher last_desc -= q->q.size; 1411f7917c00SJeff Kirsher q->q.sdesc[last_desc].skb = skb; 1412f7917c00SJeff Kirsher } 1413f7917c00SJeff Kirsher 1414f7917c00SJeff Kirsher txq_advance(&q->q, ndesc); 1415f7917c00SJeff Kirsher written += ndesc; 1416f7917c00SJeff Kirsher if (unlikely(written > 32)) { 1417f7917c00SJeff Kirsher ring_tx_db(q->adap, &q->q, written); 1418f7917c00SJeff Kirsher written = 0; 1419f7917c00SJeff Kirsher } 1420f7917c00SJeff Kirsher 1421f7917c00SJeff Kirsher spin_lock(&q->sendq.lock); 1422f7917c00SJeff Kirsher __skb_unlink(skb, &q->sendq); 1423f7917c00SJeff Kirsher if (is_ofld_imm(skb)) 1424f7917c00SJeff Kirsher kfree_skb(skb); 1425f7917c00SJeff Kirsher } 1426f7917c00SJeff Kirsher if (likely(written)) 1427f7917c00SJeff Kirsher ring_tx_db(q->adap, &q->q, written); 1428f7917c00SJeff Kirsher } 1429f7917c00SJeff Kirsher 1430f7917c00SJeff Kirsher /** 1431f7917c00SJeff Kirsher * ofld_xmit - send a packet through an offload queue 1432f7917c00SJeff Kirsher * @q: the Tx offload queue 1433f7917c00SJeff Kirsher * @skb: the packet 1434f7917c00SJeff Kirsher * 1435f7917c00SJeff Kirsher * Send an offload packet through an SGE offload queue. 
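 *
 *	The flit count is precomputed and saved in skb->priority so that a
 *	later restart need not recalculate it.  service_ofldq() is invoked
 *	only when this skb is the sole entry on @sendq; otherwise a servicer
 *	already draining the queue (or a later restart) will pick it up.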
1436f7917c00SJeff Kirsher */ 1437f7917c00SJeff Kirsher static int ofld_xmit(struct sge_ofld_txq *q, struct sk_buff *skb) 1438f7917c00SJeff Kirsher { 1439f7917c00SJeff Kirsher skb->priority = calc_tx_flits_ofld(skb); /* save for restart */ 1440f7917c00SJeff Kirsher spin_lock(&q->sendq.lock); 1441f7917c00SJeff Kirsher __skb_queue_tail(&q->sendq, skb); 1442f7917c00SJeff Kirsher if (q->sendq.qlen == 1) 1443f7917c00SJeff Kirsher service_ofldq(q); 1444f7917c00SJeff Kirsher spin_unlock(&q->sendq.lock); 1445f7917c00SJeff Kirsher return NET_XMIT_SUCCESS; 1446f7917c00SJeff Kirsher } 1447f7917c00SJeff Kirsher 1448f7917c00SJeff Kirsher /** 1449f7917c00SJeff Kirsher * restart_ofldq - restart a suspended offload queue 1450f7917c00SJeff Kirsher * @data: the offload queue to restart 1451f7917c00SJeff Kirsher * 1452f7917c00SJeff Kirsher * Resumes transmission on a suspended Tx offload queue. 1453f7917c00SJeff Kirsher */ 1454f7917c00SJeff Kirsher static void restart_ofldq(unsigned long data) 1455f7917c00SJeff Kirsher { 1456f7917c00SJeff Kirsher struct sge_ofld_txq *q = (struct sge_ofld_txq *)data; 1457f7917c00SJeff Kirsher 1458f7917c00SJeff Kirsher spin_lock(&q->sendq.lock); 1459f7917c00SJeff Kirsher q->full = 0; /* the queue actually is completely empty now */ 1460f7917c00SJeff Kirsher service_ofldq(q); 1461f7917c00SJeff Kirsher spin_unlock(&q->sendq.lock); 1462f7917c00SJeff Kirsher } 1463f7917c00SJeff Kirsher 1464f7917c00SJeff Kirsher /** 1465f7917c00SJeff Kirsher * skb_txq - return the Tx queue an offload packet should use 1466f7917c00SJeff Kirsher * @skb: the packet 1467f7917c00SJeff Kirsher * 1468f7917c00SJeff Kirsher * Returns the Tx queue an offload packet should use as indicated by bits 1469f7917c00SJeff Kirsher * 1-15 in the packet's queue_mapping. 1470f7917c00SJeff Kirsher */ 1471f7917c00SJeff Kirsher static inline unsigned int skb_txq(const struct sk_buff *skb) 1472f7917c00SJeff Kirsher { 1473f7917c00SJeff Kirsher return skb->queue_mapping >> 1; 1474f7917c00SJeff Kirsher } 1475f7917c00SJeff Kirsher 1476f7917c00SJeff Kirsher /** 1477f7917c00SJeff Kirsher * is_ctrl_pkt - return whether an offload packet is a control packet 1478f7917c00SJeff Kirsher * @skb: the packet 1479f7917c00SJeff Kirsher * 1480f7917c00SJeff Kirsher * Returns whether an offload packet should use an OFLD or a CTRL 1481f7917c00SJeff Kirsher * Tx queue as indicated by bit 0 in the packet's queue_mapping. 
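 *
 *	Together with skb_txq() this defines the queue_mapping encoding used
 *	by t4_ofld_send(): queue_mapping = (txq_index << 1) | is_ctrl, e.g.
 *	(3 << 1) | 0 selects offload queue 3 while (0 << 1) | 1 selects
 *	control queue 0.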
1482f7917c00SJeff Kirsher */ 1483f7917c00SJeff Kirsher static inline unsigned int is_ctrl_pkt(const struct sk_buff *skb) 1484f7917c00SJeff Kirsher { 1485f7917c00SJeff Kirsher return skb->queue_mapping & 1; 1486f7917c00SJeff Kirsher } 1487f7917c00SJeff Kirsher 1488f7917c00SJeff Kirsher static inline int ofld_send(struct adapter *adap, struct sk_buff *skb) 1489f7917c00SJeff Kirsher { 1490f7917c00SJeff Kirsher unsigned int idx = skb_txq(skb); 1491f7917c00SJeff Kirsher 14924fe44dd7SKumar Sanghvi if (unlikely(is_ctrl_pkt(skb))) { 14934fe44dd7SKumar Sanghvi /* Single ctrl queue is a requirement for LE workaround path */ 14944fe44dd7SKumar Sanghvi if (adap->tids.nsftids) 14954fe44dd7SKumar Sanghvi idx = 0; 1496f7917c00SJeff Kirsher return ctrl_xmit(&adap->sge.ctrlq[idx], skb); 14974fe44dd7SKumar Sanghvi } 1498f7917c00SJeff Kirsher return ofld_xmit(&adap->sge.ofldtxq[idx], skb); 1499f7917c00SJeff Kirsher } 1500f7917c00SJeff Kirsher 1501f7917c00SJeff Kirsher /** 1502f7917c00SJeff Kirsher * t4_ofld_send - send an offload packet 1503f7917c00SJeff Kirsher * @adap: the adapter 1504f7917c00SJeff Kirsher * @skb: the packet 1505f7917c00SJeff Kirsher * 1506f7917c00SJeff Kirsher * Sends an offload packet. We use the packet queue_mapping to select the 1507f7917c00SJeff Kirsher * appropriate Tx queue as follows: bit 0 indicates whether the packet 1508f7917c00SJeff Kirsher * should be sent as regular or control, bits 1-15 select the queue. 1509f7917c00SJeff Kirsher */ 1510f7917c00SJeff Kirsher int t4_ofld_send(struct adapter *adap, struct sk_buff *skb) 1511f7917c00SJeff Kirsher { 1512f7917c00SJeff Kirsher int ret; 1513f7917c00SJeff Kirsher 1514f7917c00SJeff Kirsher local_bh_disable(); 1515f7917c00SJeff Kirsher ret = ofld_send(adap, skb); 1516f7917c00SJeff Kirsher local_bh_enable(); 1517f7917c00SJeff Kirsher return ret; 1518f7917c00SJeff Kirsher } 1519f7917c00SJeff Kirsher 1520f7917c00SJeff Kirsher /** 1521f7917c00SJeff Kirsher * cxgb4_ofld_send - send an offload packet 1522f7917c00SJeff Kirsher * @dev: the net device 1523f7917c00SJeff Kirsher * @skb: the packet 1524f7917c00SJeff Kirsher * 1525f7917c00SJeff Kirsher * Sends an offload packet. This is an exported version of @t4_ofld_send, 1526f7917c00SJeff Kirsher * intended for ULDs. 
1527f7917c00SJeff Kirsher */ 1528f7917c00SJeff Kirsher int cxgb4_ofld_send(struct net_device *dev, struct sk_buff *skb) 1529f7917c00SJeff Kirsher { 1530f7917c00SJeff Kirsher return t4_ofld_send(netdev2adap(dev), skb); 1531f7917c00SJeff Kirsher } 1532f7917c00SJeff Kirsher EXPORT_SYMBOL(cxgb4_ofld_send); 1533f7917c00SJeff Kirsher 1534e91b0f24SIan Campbell static inline void copy_frags(struct sk_buff *skb, 1535f7917c00SJeff Kirsher const struct pkt_gl *gl, unsigned int offset) 1536f7917c00SJeff Kirsher { 1537e91b0f24SIan Campbell int i; 1538f7917c00SJeff Kirsher 1539f7917c00SJeff Kirsher /* usually there's just one frag */ 1540e91b0f24SIan Campbell __skb_fill_page_desc(skb, 0, gl->frags[0].page, 1541e91b0f24SIan Campbell gl->frags[0].offset + offset, 1542e91b0f24SIan Campbell gl->frags[0].size - offset); 1543e91b0f24SIan Campbell skb_shinfo(skb)->nr_frags = gl->nfrags; 1544e91b0f24SIan Campbell for (i = 1; i < gl->nfrags; i++) 1545e91b0f24SIan Campbell __skb_fill_page_desc(skb, i, gl->frags[i].page, 1546e91b0f24SIan Campbell gl->frags[i].offset, 1547e91b0f24SIan Campbell gl->frags[i].size); 1548f7917c00SJeff Kirsher 1549f7917c00SJeff Kirsher /* get a reference to the last page, we don't own it */ 1550e91b0f24SIan Campbell get_page(gl->frags[gl->nfrags - 1].page); 1551f7917c00SJeff Kirsher } 1552f7917c00SJeff Kirsher 1553f7917c00SJeff Kirsher /** 1554f7917c00SJeff Kirsher * cxgb4_pktgl_to_skb - build an sk_buff from a packet gather list 1555f7917c00SJeff Kirsher * @gl: the gather list 1556f7917c00SJeff Kirsher * @skb_len: size of sk_buff main body if it carries fragments 1557f7917c00SJeff Kirsher * @pull_len: amount of data to move to the sk_buff's main body 1558f7917c00SJeff Kirsher * 1559f7917c00SJeff Kirsher * Builds an sk_buff from the given packet gather list. Returns the 1560f7917c00SJeff Kirsher * sk_buff or %NULL if sk_buff allocation failed. 1561f7917c00SJeff Kirsher */ 1562f7917c00SJeff Kirsher struct sk_buff *cxgb4_pktgl_to_skb(const struct pkt_gl *gl, 1563f7917c00SJeff Kirsher unsigned int skb_len, unsigned int pull_len) 1564f7917c00SJeff Kirsher { 1565f7917c00SJeff Kirsher struct sk_buff *skb; 1566f7917c00SJeff Kirsher 1567f7917c00SJeff Kirsher /* 1568f7917c00SJeff Kirsher * Below we rely on RX_COPY_THRES being less than the smallest Rx buffer 1569f7917c00SJeff Kirsher * size, which is expected since buffers are at least PAGE_SIZEd. 1570f7917c00SJeff Kirsher * In this case packets up to RX_COPY_THRES have only one fragment. 
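	 * Packets up to RX_COPY_THRES are therefore copied whole into the
	 * skb's linear area; anything larger gets only @pull_len bytes
	 * copied and the remaining data attached as page fragments via
	 * copy_frags().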
1571f7917c00SJeff Kirsher */ 1572f7917c00SJeff Kirsher if (gl->tot_len <= RX_COPY_THRES) { 1573f7917c00SJeff Kirsher skb = dev_alloc_skb(gl->tot_len); 1574f7917c00SJeff Kirsher if (unlikely(!skb)) 1575f7917c00SJeff Kirsher goto out; 1576f7917c00SJeff Kirsher __skb_put(skb, gl->tot_len); 1577f7917c00SJeff Kirsher skb_copy_to_linear_data(skb, gl->va, gl->tot_len); 1578f7917c00SJeff Kirsher } else { 1579f7917c00SJeff Kirsher skb = dev_alloc_skb(skb_len); 1580f7917c00SJeff Kirsher if (unlikely(!skb)) 1581f7917c00SJeff Kirsher goto out; 1582f7917c00SJeff Kirsher __skb_put(skb, pull_len); 1583f7917c00SJeff Kirsher skb_copy_to_linear_data(skb, gl->va, pull_len); 1584f7917c00SJeff Kirsher 1585e91b0f24SIan Campbell copy_frags(skb, gl, pull_len); 1586f7917c00SJeff Kirsher skb->len = gl->tot_len; 1587f7917c00SJeff Kirsher skb->data_len = skb->len - pull_len; 1588f7917c00SJeff Kirsher skb->truesize += skb->data_len; 1589f7917c00SJeff Kirsher } 1590f7917c00SJeff Kirsher out: return skb; 1591f7917c00SJeff Kirsher } 1592f7917c00SJeff Kirsher EXPORT_SYMBOL(cxgb4_pktgl_to_skb); 1593f7917c00SJeff Kirsher 1594f7917c00SJeff Kirsher /** 1595f7917c00SJeff Kirsher * t4_pktgl_free - free a packet gather list 1596f7917c00SJeff Kirsher * @gl: the gather list 1597f7917c00SJeff Kirsher * 1598f7917c00SJeff Kirsher * Releases the pages of a packet gather list. We do not own the last 1599f7917c00SJeff Kirsher * page on the list and do not free it. 1600f7917c00SJeff Kirsher */ 1601f7917c00SJeff Kirsher static void t4_pktgl_free(const struct pkt_gl *gl) 1602f7917c00SJeff Kirsher { 1603f7917c00SJeff Kirsher int n; 1604e91b0f24SIan Campbell const struct page_frag *p; 1605f7917c00SJeff Kirsher 1606f7917c00SJeff Kirsher for (p = gl->frags, n = gl->nfrags - 1; n--; p++) 1607f7917c00SJeff Kirsher put_page(p->page); 1608f7917c00SJeff Kirsher } 1609f7917c00SJeff Kirsher 1610f7917c00SJeff Kirsher /* 1611f7917c00SJeff Kirsher * Process an MPS trace packet. Give it an unused protocol number so it won't 1612f7917c00SJeff Kirsher * be delivered to anyone and send it to the stack for capture. 
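 * The trace header (struct cpl_trace_pkt, or struct cpl_t5_trace_pkt on
 * non-T4 chips) is stripped and the skb is handed to netif_receive_skb()
 * with protocol 0xffff so that no protocol handler claims it.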
1613f7917c00SJeff Kirsher */ 1614f7917c00SJeff Kirsher static noinline int handle_trace_pkt(struct adapter *adap, 1615f7917c00SJeff Kirsher const struct pkt_gl *gl) 1616f7917c00SJeff Kirsher { 1617f7917c00SJeff Kirsher struct sk_buff *skb; 1618f7917c00SJeff Kirsher 1619f7917c00SJeff Kirsher skb = cxgb4_pktgl_to_skb(gl, RX_PULL_LEN, RX_PULL_LEN); 1620f7917c00SJeff Kirsher if (unlikely(!skb)) { 1621f7917c00SJeff Kirsher t4_pktgl_free(gl); 1622f7917c00SJeff Kirsher return 0; 1623f7917c00SJeff Kirsher } 1624f7917c00SJeff Kirsher 1625d14807ddSHariprasad Shenai if (is_t4(adap->params.chip)) 16260a57a536SSantosh Rastapur __skb_pull(skb, sizeof(struct cpl_trace_pkt)); 16270a57a536SSantosh Rastapur else 16280a57a536SSantosh Rastapur __skb_pull(skb, sizeof(struct cpl_t5_trace_pkt)); 16290a57a536SSantosh Rastapur 1630f7917c00SJeff Kirsher skb_reset_mac_header(skb); 1631f7917c00SJeff Kirsher skb->protocol = htons(0xffff); 1632f7917c00SJeff Kirsher skb->dev = adap->port[0]; 1633f7917c00SJeff Kirsher netif_receive_skb(skb); 1634f7917c00SJeff Kirsher return 0; 1635f7917c00SJeff Kirsher } 1636f7917c00SJeff Kirsher 1637f7917c00SJeff Kirsher static void do_gro(struct sge_eth_rxq *rxq, const struct pkt_gl *gl, 1638f7917c00SJeff Kirsher const struct cpl_rx_pkt *pkt) 1639f7917c00SJeff Kirsher { 164052367a76SVipul Pandya struct adapter *adapter = rxq->rspq.adap; 164152367a76SVipul Pandya struct sge *s = &adapter->sge; 1642f7917c00SJeff Kirsher int ret; 1643f7917c00SJeff Kirsher struct sk_buff *skb; 1644f7917c00SJeff Kirsher 1645f7917c00SJeff Kirsher skb = napi_get_frags(&rxq->rspq.napi); 1646f7917c00SJeff Kirsher if (unlikely(!skb)) { 1647f7917c00SJeff Kirsher t4_pktgl_free(gl); 1648f7917c00SJeff Kirsher rxq->stats.rx_drops++; 1649f7917c00SJeff Kirsher return; 1650f7917c00SJeff Kirsher } 1651f7917c00SJeff Kirsher 165252367a76SVipul Pandya copy_frags(skb, gl, s->pktshift); 165352367a76SVipul Pandya skb->len = gl->tot_len - s->pktshift; 1654f7917c00SJeff Kirsher skb->data_len = skb->len; 1655f7917c00SJeff Kirsher skb->truesize += skb->data_len; 1656f7917c00SJeff Kirsher skb->ip_summed = CHECKSUM_UNNECESSARY; 1657f7917c00SJeff Kirsher skb_record_rx_queue(skb, rxq->rspq.idx); 1658f7917c00SJeff Kirsher if (rxq->rspq.netdev->features & NETIF_F_RXHASH) 16598264989cSTom Herbert skb_set_hash(skb, (__force u32)pkt->rsshdr.hash_val, 16608264989cSTom Herbert PKT_HASH_TYPE_L3); 1661f7917c00SJeff Kirsher 1662f7917c00SJeff Kirsher if (unlikely(pkt->vlan_ex)) { 166386a9bad3SPatrick McHardy __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), ntohs(pkt->vlan)); 1664f7917c00SJeff Kirsher rxq->stats.vlan_ex++; 1665f7917c00SJeff Kirsher } 1666f7917c00SJeff Kirsher ret = napi_gro_frags(&rxq->rspq.napi); 1667f7917c00SJeff Kirsher if (ret == GRO_HELD) 1668f7917c00SJeff Kirsher rxq->stats.lro_pkts++; 1669f7917c00SJeff Kirsher else if (ret == GRO_MERGED || ret == GRO_MERGED_FREE) 1670f7917c00SJeff Kirsher rxq->stats.lro_merged++; 1671f7917c00SJeff Kirsher rxq->stats.pkts++; 1672f7917c00SJeff Kirsher rxq->stats.rx_cso++; 1673f7917c00SJeff Kirsher } 1674f7917c00SJeff Kirsher 1675f7917c00SJeff Kirsher /** 1676f7917c00SJeff Kirsher * t4_ethrx_handler - process an ingress ethernet packet 1677f7917c00SJeff Kirsher * @q: the response queue that received the packet 1678f7917c00SJeff Kirsher * @rsp: the response queue descriptor holding the RX_PKT message 1679f7917c00SJeff Kirsher * @si: the gather list of packet fragments 1680f7917c00SJeff Kirsher * 1681f7917c00SJeff Kirsher * Process an ingress ethernet packet and deliver it to the stack. 
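 *
 *	MPS trace packets are diverted to handle_trace_pkt().  TCP packets
 *	with a good checksum are fed to GRO via do_gro() when the device has
 *	GRO enabled; everything else is turned into an sk_buff with
 *	cxgb4_pktgl_to_skb(), has its checksum state and any VLAN tag set,
 *	and is passed to netif_receive_skb().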
1682f7917c00SJeff Kirsher */ 1683f7917c00SJeff Kirsher int t4_ethrx_handler(struct sge_rspq *q, const __be64 *rsp, 1684f7917c00SJeff Kirsher const struct pkt_gl *si) 1685f7917c00SJeff Kirsher { 1686f7917c00SJeff Kirsher bool csum_ok; 1687f7917c00SJeff Kirsher struct sk_buff *skb; 1688f7917c00SJeff Kirsher const struct cpl_rx_pkt *pkt; 1689f7917c00SJeff Kirsher struct sge_eth_rxq *rxq = container_of(q, struct sge_eth_rxq, rspq); 169052367a76SVipul Pandya struct sge *s = &q->adap->sge; 1691d14807ddSHariprasad Shenai int cpl_trace_pkt = is_t4(q->adap->params.chip) ? 16920a57a536SSantosh Rastapur CPL_TRACE_PKT : CPL_TRACE_PKT_T5; 1693f7917c00SJeff Kirsher 16940a57a536SSantosh Rastapur if (unlikely(*(u8 *)rsp == cpl_trace_pkt)) 1695f7917c00SJeff Kirsher return handle_trace_pkt(q->adap, si); 1696f7917c00SJeff Kirsher 1697f7917c00SJeff Kirsher pkt = (const struct cpl_rx_pkt *)rsp; 1698f7917c00SJeff Kirsher csum_ok = pkt->csum_calc && !pkt->err_vec; 1699f7917c00SJeff Kirsher if ((pkt->l2info & htonl(RXF_TCP)) && 1700f7917c00SJeff Kirsher (q->netdev->features & NETIF_F_GRO) && csum_ok && !pkt->ip_frag) { 1701f7917c00SJeff Kirsher do_gro(rxq, si, pkt); 1702f7917c00SJeff Kirsher return 0; 1703f7917c00SJeff Kirsher } 1704f7917c00SJeff Kirsher 1705f7917c00SJeff Kirsher skb = cxgb4_pktgl_to_skb(si, RX_PKT_SKB_LEN, RX_PULL_LEN); 1706f7917c00SJeff Kirsher if (unlikely(!skb)) { 1707f7917c00SJeff Kirsher t4_pktgl_free(si); 1708f7917c00SJeff Kirsher rxq->stats.rx_drops++; 1709f7917c00SJeff Kirsher return 0; 1710f7917c00SJeff Kirsher } 1711f7917c00SJeff Kirsher 171252367a76SVipul Pandya __skb_pull(skb, s->pktshift); /* remove ethernet header padding */ 1713f7917c00SJeff Kirsher skb->protocol = eth_type_trans(skb, q->netdev); 1714f7917c00SJeff Kirsher skb_record_rx_queue(skb, q->idx); 1715f7917c00SJeff Kirsher if (skb->dev->features & NETIF_F_RXHASH) 17168264989cSTom Herbert skb_set_hash(skb, (__force u32)pkt->rsshdr.hash_val, 17178264989cSTom Herbert PKT_HASH_TYPE_L3); 1718f7917c00SJeff Kirsher 1719f7917c00SJeff Kirsher rxq->stats.pkts++; 1720f7917c00SJeff Kirsher 1721f7917c00SJeff Kirsher if (csum_ok && (q->netdev->features & NETIF_F_RXCSUM) && 1722f7917c00SJeff Kirsher (pkt->l2info & htonl(RXF_UDP | RXF_TCP))) { 1723f7917c00SJeff Kirsher if (!pkt->ip_frag) { 1724f7917c00SJeff Kirsher skb->ip_summed = CHECKSUM_UNNECESSARY; 1725f7917c00SJeff Kirsher rxq->stats.rx_cso++; 1726f7917c00SJeff Kirsher } else if (pkt->l2info & htonl(RXF_IP)) { 1727f7917c00SJeff Kirsher __sum16 c = (__force __sum16)pkt->csum; 1728f7917c00SJeff Kirsher skb->csum = csum_unfold(c); 1729f7917c00SJeff Kirsher skb->ip_summed = CHECKSUM_COMPLETE; 1730f7917c00SJeff Kirsher rxq->stats.rx_cso++; 1731f7917c00SJeff Kirsher } 1732f7917c00SJeff Kirsher } else 1733f7917c00SJeff Kirsher skb_checksum_none_assert(skb); 1734f7917c00SJeff Kirsher 1735f7917c00SJeff Kirsher if (unlikely(pkt->vlan_ex)) { 173686a9bad3SPatrick McHardy __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), ntohs(pkt->vlan)); 1737f7917c00SJeff Kirsher rxq->stats.vlan_ex++; 1738f7917c00SJeff Kirsher } 1739f7917c00SJeff Kirsher netif_receive_skb(skb); 1740f7917c00SJeff Kirsher return 0; 1741f7917c00SJeff Kirsher } 1742f7917c00SJeff Kirsher 1743f7917c00SJeff Kirsher /** 1744f7917c00SJeff Kirsher * restore_rx_bufs - put back a packet's Rx buffers 1745f7917c00SJeff Kirsher * @si: the packet gather list 1746f7917c00SJeff Kirsher * @q: the SGE free list 1747f7917c00SJeff Kirsher * @frags: number of FL buffers to restore 1748f7917c00SJeff Kirsher * 1749f7917c00SJeff Kirsher * Puts back on an 
FL the Rx buffers associated with @si. The buffers 1750f7917c00SJeff Kirsher * have already been unmapped and are left unmapped, we mark them so to 1751f7917c00SJeff Kirsher * prevent further unmapping attempts. 1752f7917c00SJeff Kirsher * 1753f7917c00SJeff Kirsher * This function undoes a series of @unmap_rx_buf calls when we find out 1754f7917c00SJeff Kirsher * that the current packet can't be processed right away after all and we 1755f7917c00SJeff Kirsher * need to come back to it later. This is a very rare event and there's 1756f7917c00SJeff Kirsher * no effort to make this particularly efficient. 1757f7917c00SJeff Kirsher */ 1758f7917c00SJeff Kirsher static void restore_rx_bufs(const struct pkt_gl *si, struct sge_fl *q, 1759f7917c00SJeff Kirsher int frags) 1760f7917c00SJeff Kirsher { 1761f7917c00SJeff Kirsher struct rx_sw_desc *d; 1762f7917c00SJeff Kirsher 1763f7917c00SJeff Kirsher while (frags--) { 1764f7917c00SJeff Kirsher if (q->cidx == 0) 1765f7917c00SJeff Kirsher q->cidx = q->size - 1; 1766f7917c00SJeff Kirsher else 1767f7917c00SJeff Kirsher q->cidx--; 1768f7917c00SJeff Kirsher d = &q->sdesc[q->cidx]; 1769f7917c00SJeff Kirsher d->page = si->frags[frags].page; 1770f7917c00SJeff Kirsher d->dma_addr |= RX_UNMAPPED_BUF; 1771f7917c00SJeff Kirsher q->avail++; 1772f7917c00SJeff Kirsher } 1773f7917c00SJeff Kirsher } 1774f7917c00SJeff Kirsher 1775f7917c00SJeff Kirsher /** 1776f7917c00SJeff Kirsher * is_new_response - check if a response is newly written 1777f7917c00SJeff Kirsher * @r: the response descriptor 1778f7917c00SJeff Kirsher * @q: the response queue 1779f7917c00SJeff Kirsher * 1780f7917c00SJeff Kirsher * Returns true if a response descriptor contains a yet unprocessed 1781f7917c00SJeff Kirsher * response. 1782f7917c00SJeff Kirsher */ 1783f7917c00SJeff Kirsher static inline bool is_new_response(const struct rsp_ctrl *r, 1784f7917c00SJeff Kirsher const struct sge_rspq *q) 1785f7917c00SJeff Kirsher { 1786f7917c00SJeff Kirsher return RSPD_GEN(r->type_gen) == q->gen; 1787f7917c00SJeff Kirsher } 1788f7917c00SJeff Kirsher 1789f7917c00SJeff Kirsher /** 1790f7917c00SJeff Kirsher * rspq_next - advance to the next entry in a response queue 1791f7917c00SJeff Kirsher * @q: the queue 1792f7917c00SJeff Kirsher * 1793f7917c00SJeff Kirsher * Updates the state of a response queue to advance it to the next entry. 1794f7917c00SJeff Kirsher */ 1795f7917c00SJeff Kirsher static inline void rspq_next(struct sge_rspq *q) 1796f7917c00SJeff Kirsher { 1797f7917c00SJeff Kirsher q->cur_desc = (void *)q->cur_desc + q->iqe_len; 1798f7917c00SJeff Kirsher if (unlikely(++q->cidx == q->size)) { 1799f7917c00SJeff Kirsher q->cidx = 0; 1800f7917c00SJeff Kirsher q->gen ^= 1; 1801f7917c00SJeff Kirsher q->cur_desc = q->desc; 1802f7917c00SJeff Kirsher } 1803f7917c00SJeff Kirsher } 1804f7917c00SJeff Kirsher 1805f7917c00SJeff Kirsher /** 1806f7917c00SJeff Kirsher * process_responses - process responses from an SGE response queue 1807f7917c00SJeff Kirsher * @q: the ingress queue to process 1808f7917c00SJeff Kirsher * @budget: how many responses can be processed in this round 1809f7917c00SJeff Kirsher * 1810f7917c00SJeff Kirsher * Process responses from an SGE response queue up to the supplied budget. 1811f7917c00SJeff Kirsher * Responses include received packets as well as control messages from FW 1812f7917c00SJeff Kirsher * or HW. 1813f7917c00SJeff Kirsher * 1814f7917c00SJeff Kirsher * Additionally choose the interrupt holdoff time for the next interrupt 1815f7917c00SJeff Kirsher * on this queue.
If the system is under memory shortage use a fairly 1816f7917c00SJeff Kirsher * long delay to help recovery. 1817f7917c00SJeff Kirsher */ 1818f7917c00SJeff Kirsher static int process_responses(struct sge_rspq *q, int budget) 1819f7917c00SJeff Kirsher { 1820f7917c00SJeff Kirsher int ret, rsp_type; 1821f7917c00SJeff Kirsher int budget_left = budget; 1822f7917c00SJeff Kirsher const struct rsp_ctrl *rc; 1823f7917c00SJeff Kirsher struct sge_eth_rxq *rxq = container_of(q, struct sge_eth_rxq, rspq); 182452367a76SVipul Pandya struct adapter *adapter = q->adap; 182552367a76SVipul Pandya struct sge *s = &adapter->sge; 1826f7917c00SJeff Kirsher 1827f7917c00SJeff Kirsher while (likely(budget_left)) { 1828f7917c00SJeff Kirsher rc = (void *)q->cur_desc + (q->iqe_len - sizeof(*rc)); 1829f7917c00SJeff Kirsher if (!is_new_response(rc, q)) 1830f7917c00SJeff Kirsher break; 1831f7917c00SJeff Kirsher 1832f7917c00SJeff Kirsher rmb(); 1833f7917c00SJeff Kirsher rsp_type = RSPD_TYPE(rc->type_gen); 1834f7917c00SJeff Kirsher if (likely(rsp_type == RSP_TYPE_FLBUF)) { 1835e91b0f24SIan Campbell struct page_frag *fp; 1836f7917c00SJeff Kirsher struct pkt_gl si; 1837f7917c00SJeff Kirsher const struct rx_sw_desc *rsd; 1838f7917c00SJeff Kirsher u32 len = ntohl(rc->pldbuflen_qid), bufsz, frags; 1839f7917c00SJeff Kirsher 1840f7917c00SJeff Kirsher if (len & RSPD_NEWBUF) { 1841f7917c00SJeff Kirsher if (likely(q->offset > 0)) { 1842f7917c00SJeff Kirsher free_rx_bufs(q->adap, &rxq->fl, 1); 1843f7917c00SJeff Kirsher q->offset = 0; 1844f7917c00SJeff Kirsher } 1845f7917c00SJeff Kirsher len = RSPD_LEN(len); 1846f7917c00SJeff Kirsher } 1847f7917c00SJeff Kirsher si.tot_len = len; 1848f7917c00SJeff Kirsher 1849f7917c00SJeff Kirsher /* gather packet fragments */ 1850f7917c00SJeff Kirsher for (frags = 0, fp = si.frags; ; frags++, fp++) { 1851f7917c00SJeff Kirsher rsd = &rxq->fl.sdesc[rxq->fl.cidx]; 185252367a76SVipul Pandya bufsz = get_buf_size(adapter, rsd); 1853f7917c00SJeff Kirsher fp->page = rsd->page; 1854e91b0f24SIan Campbell fp->offset = q->offset; 1855e91b0f24SIan Campbell fp->size = min(bufsz, len); 1856e91b0f24SIan Campbell len -= fp->size; 1857f7917c00SJeff Kirsher if (!len) 1858f7917c00SJeff Kirsher break; 1859f7917c00SJeff Kirsher unmap_rx_buf(q->adap, &rxq->fl); 1860f7917c00SJeff Kirsher } 1861f7917c00SJeff Kirsher 1862f7917c00SJeff Kirsher /* 1863f7917c00SJeff Kirsher * Last buffer remains mapped so explicitly make it 1864f7917c00SJeff Kirsher * coherent for CPU access. 
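			 * The buffer is left mapped because q->offset simply
			 * advances within it and later packets may continue
			 * to land in the same buffer; a CPU cache sync is all
			 * that is needed before the handler reads the data.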
1865f7917c00SJeff Kirsher */ 1866f7917c00SJeff Kirsher dma_sync_single_for_cpu(q->adap->pdev_dev, 1867f7917c00SJeff Kirsher get_buf_addr(rsd), 1868e91b0f24SIan Campbell fp->size, DMA_FROM_DEVICE); 1869f7917c00SJeff Kirsher 1870f7917c00SJeff Kirsher si.va = page_address(si.frags[0].page) + 1871e91b0f24SIan Campbell si.frags[0].offset; 1872f7917c00SJeff Kirsher prefetch(si.va); 1873f7917c00SJeff Kirsher 1874f7917c00SJeff Kirsher si.nfrags = frags + 1; 1875f7917c00SJeff Kirsher ret = q->handler(q, q->cur_desc, &si); 1876f7917c00SJeff Kirsher if (likely(ret == 0)) 187752367a76SVipul Pandya q->offset += ALIGN(fp->size, s->fl_align); 1878f7917c00SJeff Kirsher else 1879f7917c00SJeff Kirsher restore_rx_bufs(&si, &rxq->fl, frags); 1880f7917c00SJeff Kirsher } else if (likely(rsp_type == RSP_TYPE_CPL)) { 1881f7917c00SJeff Kirsher ret = q->handler(q, q->cur_desc, NULL); 1882f7917c00SJeff Kirsher } else { 1883f7917c00SJeff Kirsher ret = q->handler(q, (const __be64 *)rc, CXGB4_MSG_AN); 1884f7917c00SJeff Kirsher } 1885f7917c00SJeff Kirsher 1886f7917c00SJeff Kirsher if (unlikely(ret)) { 1887f7917c00SJeff Kirsher /* couldn't process descriptor, back off for recovery */ 1888f7917c00SJeff Kirsher q->next_intr_params = QINTR_TIMER_IDX(NOMEM_TMR_IDX); 1889f7917c00SJeff Kirsher break; 1890f7917c00SJeff Kirsher } 1891f7917c00SJeff Kirsher 1892f7917c00SJeff Kirsher rspq_next(q); 1893f7917c00SJeff Kirsher budget_left--; 1894f7917c00SJeff Kirsher } 1895f7917c00SJeff Kirsher 1896f7917c00SJeff Kirsher if (q->offset >= 0 && rxq->fl.size - rxq->fl.avail >= 16) 1897f7917c00SJeff Kirsher __refill_fl(q->adap, &rxq->fl); 1898f7917c00SJeff Kirsher return budget - budget_left; 1899f7917c00SJeff Kirsher } 1900f7917c00SJeff Kirsher 1901f7917c00SJeff Kirsher /** 1902f7917c00SJeff Kirsher * napi_rx_handler - the NAPI handler for Rx processing 1903f7917c00SJeff Kirsher * @napi: the napi instance 1904f7917c00SJeff Kirsher * @budget: how many packets we can process in this round 1905f7917c00SJeff Kirsher * 1906f7917c00SJeff Kirsher * Handler for new data events when using NAPI. This does not need any 1907f7917c00SJeff Kirsher * locking or protection from interrupts as data interrupts are off at 1908f7917c00SJeff Kirsher * this point and other adapter interrupts do not interfere (the latter 1909f7917c00SJeff Kirsher * is not a concern at all with MSI-X as non-data interrupts then have 1910f7917c00SJeff Kirsher * a separate handler). 1911f7917c00SJeff Kirsher */ 1912f7917c00SJeff Kirsher static int napi_rx_handler(struct napi_struct *napi, int budget) 1913f7917c00SJeff Kirsher { 1914f7917c00SJeff Kirsher unsigned int params; 1915f7917c00SJeff Kirsher struct sge_rspq *q = container_of(napi, struct sge_rspq, napi); 1916f7917c00SJeff Kirsher int work_done = process_responses(q, budget); 1917f7917c00SJeff Kirsher 1918f7917c00SJeff Kirsher if (likely(work_done < budget)) { 1919f7917c00SJeff Kirsher napi_complete(napi); 1920f7917c00SJeff Kirsher params = q->next_intr_params; 1921f7917c00SJeff Kirsher q->next_intr_params = q->intr_params; 1922f7917c00SJeff Kirsher } else 1923f7917c00SJeff Kirsher params = QINTR_TIMER_IDX(7); 1924f7917c00SJeff Kirsher 1925f7917c00SJeff Kirsher t4_write_reg(q->adap, MYPF_REG(SGE_PF_GTS), CIDXINC(work_done) | 1926f7917c00SJeff Kirsher INGRESSQID((u32)q->cntxt_id) | SEINTARM(params)); 1927f7917c00SJeff Kirsher return work_done; 1928f7917c00SJeff Kirsher } 1929f7917c00SJeff Kirsher 1930f7917c00SJeff Kirsher /* 1931f7917c00SJeff Kirsher * The MSI-X interrupt handler for an SGE response queue.
1932f7917c00SJeff Kirsher */ 1933f7917c00SJeff Kirsher irqreturn_t t4_sge_intr_msix(int irq, void *cookie) 1934f7917c00SJeff Kirsher { 1935f7917c00SJeff Kirsher struct sge_rspq *q = cookie; 1936f7917c00SJeff Kirsher 1937f7917c00SJeff Kirsher napi_schedule(&q->napi); 1938f7917c00SJeff Kirsher return IRQ_HANDLED; 1939f7917c00SJeff Kirsher } 1940f7917c00SJeff Kirsher 1941f7917c00SJeff Kirsher /* 1942f7917c00SJeff Kirsher * Process the indirect interrupt entries in the interrupt queue and kick off 1943f7917c00SJeff Kirsher * NAPI for each queue that has generated an entry. 1944f7917c00SJeff Kirsher */ 1945f7917c00SJeff Kirsher static unsigned int process_intrq(struct adapter *adap) 1946f7917c00SJeff Kirsher { 1947f7917c00SJeff Kirsher unsigned int credits; 1948f7917c00SJeff Kirsher const struct rsp_ctrl *rc; 1949f7917c00SJeff Kirsher struct sge_rspq *q = &adap->sge.intrq; 1950f7917c00SJeff Kirsher 1951f7917c00SJeff Kirsher spin_lock(&adap->sge.intrq_lock); 1952f7917c00SJeff Kirsher for (credits = 0; ; credits++) { 1953f7917c00SJeff Kirsher rc = (void *)q->cur_desc + (q->iqe_len - sizeof(*rc)); 1954f7917c00SJeff Kirsher if (!is_new_response(rc, q)) 1955f7917c00SJeff Kirsher break; 1956f7917c00SJeff Kirsher 1957f7917c00SJeff Kirsher rmb(); 1958f7917c00SJeff Kirsher if (RSPD_TYPE(rc->type_gen) == RSP_TYPE_INTR) { 1959f7917c00SJeff Kirsher unsigned int qid = ntohl(rc->pldbuflen_qid); 1960f7917c00SJeff Kirsher 1961f7917c00SJeff Kirsher qid -= adap->sge.ingr_start; 1962f7917c00SJeff Kirsher napi_schedule(&adap->sge.ingr_map[qid]->napi); 1963f7917c00SJeff Kirsher } 1964f7917c00SJeff Kirsher 1965f7917c00SJeff Kirsher rspq_next(q); 1966f7917c00SJeff Kirsher } 1967f7917c00SJeff Kirsher 1968f7917c00SJeff Kirsher t4_write_reg(adap, MYPF_REG(SGE_PF_GTS), CIDXINC(credits) | 1969f7917c00SJeff Kirsher INGRESSQID(q->cntxt_id) | SEINTARM(q->intr_params)); 1970f7917c00SJeff Kirsher spin_unlock(&adap->sge.intrq_lock); 1971f7917c00SJeff Kirsher return credits; 1972f7917c00SJeff Kirsher } 1973f7917c00SJeff Kirsher 1974f7917c00SJeff Kirsher /* 1975f7917c00SJeff Kirsher * The MSI interrupt handler, which handles data events from SGE response queues 1976f7917c00SJeff Kirsher * as well as error and other async events as they all use the same MSI vector. 1977f7917c00SJeff Kirsher */ 1978f7917c00SJeff Kirsher static irqreturn_t t4_intr_msi(int irq, void *cookie) 1979f7917c00SJeff Kirsher { 1980f7917c00SJeff Kirsher struct adapter *adap = cookie; 1981f7917c00SJeff Kirsher 1982f7917c00SJeff Kirsher t4_slow_intr_handler(adap); 1983f7917c00SJeff Kirsher process_intrq(adap); 1984f7917c00SJeff Kirsher return IRQ_HANDLED; 1985f7917c00SJeff Kirsher } 1986f7917c00SJeff Kirsher 1987f7917c00SJeff Kirsher /* 1988f7917c00SJeff Kirsher * Interrupt handler for legacy INTx interrupts. 1989f7917c00SJeff Kirsher * Handles data events from SGE response queues as well as error and other 1990f7917c00SJeff Kirsher * async events as they all use the same interrupt line. 
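 * The write to PCIE_PF_CLI acknowledges (clears) the pending interrupt.
 * IRQ_NONE is returned when neither the slow-path handler nor the
 * interrupt queue had any work, since the INTx line may be shared.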
1991f7917c00SJeff Kirsher */ 1992f7917c00SJeff Kirsher static irqreturn_t t4_intr_intx(int irq, void *cookie) 1993f7917c00SJeff Kirsher { 1994f7917c00SJeff Kirsher struct adapter *adap = cookie; 1995f7917c00SJeff Kirsher 1996f7917c00SJeff Kirsher t4_write_reg(adap, MYPF_REG(PCIE_PF_CLI), 0); 1997f7917c00SJeff Kirsher if (t4_slow_intr_handler(adap) | process_intrq(adap)) 1998f7917c00SJeff Kirsher return IRQ_HANDLED; 1999f7917c00SJeff Kirsher return IRQ_NONE; /* probably shared interrupt */ 2000f7917c00SJeff Kirsher } 2001f7917c00SJeff Kirsher 2002f7917c00SJeff Kirsher /** 2003f7917c00SJeff Kirsher * t4_intr_handler - select the top-level interrupt handler 2004f7917c00SJeff Kirsher * @adap: the adapter 2005f7917c00SJeff Kirsher * 2006f7917c00SJeff Kirsher * Selects the top-level interrupt handler based on the type of interrupts 2007f7917c00SJeff Kirsher * (MSI-X, MSI, or INTx). 2008f7917c00SJeff Kirsher */ 2009f7917c00SJeff Kirsher irq_handler_t t4_intr_handler(struct adapter *adap) 2010f7917c00SJeff Kirsher { 2011f7917c00SJeff Kirsher if (adap->flags & USING_MSIX) 2012f7917c00SJeff Kirsher return t4_sge_intr_msix; 2013f7917c00SJeff Kirsher if (adap->flags & USING_MSI) 2014f7917c00SJeff Kirsher return t4_intr_msi; 2015f7917c00SJeff Kirsher return t4_intr_intx; 2016f7917c00SJeff Kirsher } 2017f7917c00SJeff Kirsher 2018f7917c00SJeff Kirsher static void sge_rx_timer_cb(unsigned long data) 2019f7917c00SJeff Kirsher { 2020f7917c00SJeff Kirsher unsigned long m; 20210f4d201fSKumar Sanghvi unsigned int i, idma_same_state_cnt[2]; 2022f7917c00SJeff Kirsher struct adapter *adap = (struct adapter *)data; 2023f7917c00SJeff Kirsher struct sge *s = &adap->sge; 2024f7917c00SJeff Kirsher 2025f7917c00SJeff Kirsher for (i = 0; i < ARRAY_SIZE(s->starving_fl); i++) 2026f7917c00SJeff Kirsher for (m = s->starving_fl[i]; m; m &= m - 1) { 2027f7917c00SJeff Kirsher struct sge_eth_rxq *rxq; 2028f7917c00SJeff Kirsher unsigned int id = __ffs(m) + i * BITS_PER_LONG; 2029f7917c00SJeff Kirsher struct sge_fl *fl = s->egr_map[id]; 2030f7917c00SJeff Kirsher 2031f7917c00SJeff Kirsher clear_bit(id, s->starving_fl); 2032f7917c00SJeff Kirsher smp_mb__after_clear_bit(); 2033f7917c00SJeff Kirsher 2034f7917c00SJeff Kirsher if (fl_starving(fl)) { 2035f7917c00SJeff Kirsher rxq = container_of(fl, struct sge_eth_rxq, fl); 2036f7917c00SJeff Kirsher if (napi_reschedule(&rxq->rspq.napi)) 2037f7917c00SJeff Kirsher fl->starving++; 2038f7917c00SJeff Kirsher else 2039f7917c00SJeff Kirsher set_bit(id, s->starving_fl); 2040f7917c00SJeff Kirsher } 2041f7917c00SJeff Kirsher } 2042f7917c00SJeff Kirsher 2043f7917c00SJeff Kirsher t4_write_reg(adap, SGE_DEBUG_INDEX, 13); 20440f4d201fSKumar Sanghvi idma_same_state_cnt[0] = t4_read_reg(adap, SGE_DEBUG_DATA_HIGH); 20450f4d201fSKumar Sanghvi idma_same_state_cnt[1] = t4_read_reg(adap, SGE_DEBUG_DATA_LOW); 2046f7917c00SJeff Kirsher 20470f4d201fSKumar Sanghvi for (i = 0; i < 2; i++) { 20480f4d201fSKumar Sanghvi u32 debug0, debug11; 20490f4d201fSKumar Sanghvi 20500f4d201fSKumar Sanghvi /* If the Ingress DMA Same State Counter ("timer") is less 20510f4d201fSKumar Sanghvi * than 1s, then we can reset our synthesized Stall Timer and 20520f4d201fSKumar Sanghvi * continue. If we have previously emitted warnings about a 20530f4d201fSKumar Sanghvi * potential stalled Ingress Queue, issue a note indicating 20540f4d201fSKumar Sanghvi * that the Ingress Queue has resumed forward progress. 
20550f4d201fSKumar Sanghvi */ 20560f4d201fSKumar Sanghvi if (idma_same_state_cnt[i] < s->idma_1s_thresh) { 20570f4d201fSKumar Sanghvi if (s->idma_stalled[i] >= SGE_IDMA_WARN_THRESH) 20580f4d201fSKumar Sanghvi CH_WARN(adap, "SGE idma%d, queue%u,resumed after %d sec\n", 20590f4d201fSKumar Sanghvi i, s->idma_qid[i], 20600f4d201fSKumar Sanghvi s->idma_stalled[i]/HZ); 20610f4d201fSKumar Sanghvi s->idma_stalled[i] = 0; 2062f7917c00SJeff Kirsher continue; 20630f4d201fSKumar Sanghvi } 20640f4d201fSKumar Sanghvi 20650f4d201fSKumar Sanghvi /* Synthesize an SGE Ingress DMA Same State Timer in the Hz 20660f4d201fSKumar Sanghvi * domain. The first time we get here it'll be because we 20670f4d201fSKumar Sanghvi * passed the 1s Threshold; each additional time it'll be 20680f4d201fSKumar Sanghvi * because the RX Timer Callback is being fired on its regular 20690f4d201fSKumar Sanghvi * schedule. 20700f4d201fSKumar Sanghvi * 20710f4d201fSKumar Sanghvi * If the stall is below our Potential Hung Ingress Queue 20720f4d201fSKumar Sanghvi * Warning Threshold, continue. 20730f4d201fSKumar Sanghvi */ 20740f4d201fSKumar Sanghvi if (s->idma_stalled[i] == 0) 20750f4d201fSKumar Sanghvi s->idma_stalled[i] = HZ; 20760f4d201fSKumar Sanghvi else 20770f4d201fSKumar Sanghvi s->idma_stalled[i] += RX_QCHECK_PERIOD; 20780f4d201fSKumar Sanghvi 20790f4d201fSKumar Sanghvi if (s->idma_stalled[i] < SGE_IDMA_WARN_THRESH) 20800f4d201fSKumar Sanghvi continue; 20810f4d201fSKumar Sanghvi 20820f4d201fSKumar Sanghvi /* We'll issue a warning every SGE_IDMA_WARN_REPEAT Hz */ 20830f4d201fSKumar Sanghvi if (((s->idma_stalled[i] - HZ) % SGE_IDMA_WARN_REPEAT) != 0) 20840f4d201fSKumar Sanghvi continue; 20850f4d201fSKumar Sanghvi 20860f4d201fSKumar Sanghvi /* Read and save the SGE IDMA State and Queue ID information. 20870f4d201fSKumar Sanghvi * We do this every time in case it changes across time ... 
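			 * SGE_DEBUG_INDEX 0 exposes the per-channel IDMA state
			 * (6 bits at a 9-bit stride) and index 11 the queue ID
			 * (16 bits per channel); the shifts below decode the
			 * channel of interest from the low debug word.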
20880f4d201fSKumar Sanghvi */ 20890f4d201fSKumar Sanghvi t4_write_reg(adap, SGE_DEBUG_INDEX, 0); 20900f4d201fSKumar Sanghvi debug0 = t4_read_reg(adap, SGE_DEBUG_DATA_LOW); 20910f4d201fSKumar Sanghvi s->idma_state[i] = (debug0 >> (i * 9)) & 0x3f; 20920f4d201fSKumar Sanghvi 2093f7917c00SJeff Kirsher t4_write_reg(adap, SGE_DEBUG_INDEX, 11); 20940f4d201fSKumar Sanghvi debug11 = t4_read_reg(adap, SGE_DEBUG_DATA_LOW); 20950f4d201fSKumar Sanghvi s->idma_qid[i] = (debug11 >> (i * 16)) & 0xffff; 20960f4d201fSKumar Sanghvi 20970f4d201fSKumar Sanghvi CH_WARN(adap, "SGE idma%u, queue%u, maybe stuck state%u %dsecs (debug0=%#x, debug11=%#x)\n", 20980f4d201fSKumar Sanghvi i, s->idma_qid[i], s->idma_state[i], 20990f4d201fSKumar Sanghvi s->idma_stalled[i]/HZ, debug0, debug11); 21000f4d201fSKumar Sanghvi t4_sge_decode_idma_state(adap, s->idma_state[i]); 21010f4d201fSKumar Sanghvi } 2102f7917c00SJeff Kirsher 2103f7917c00SJeff Kirsher mod_timer(&s->rx_timer, jiffies + RX_QCHECK_PERIOD); 2104f7917c00SJeff Kirsher } 2105f7917c00SJeff Kirsher 2106f7917c00SJeff Kirsher static void sge_tx_timer_cb(unsigned long data) 2107f7917c00SJeff Kirsher { 2108f7917c00SJeff Kirsher unsigned long m; 2109f7917c00SJeff Kirsher unsigned int i, budget; 2110f7917c00SJeff Kirsher struct adapter *adap = (struct adapter *)data; 2111f7917c00SJeff Kirsher struct sge *s = &adap->sge; 2112f7917c00SJeff Kirsher 2113f7917c00SJeff Kirsher for (i = 0; i < ARRAY_SIZE(s->txq_maperr); i++) 2114f7917c00SJeff Kirsher for (m = s->txq_maperr[i]; m; m &= m - 1) { 2115f7917c00SJeff Kirsher unsigned long id = __ffs(m) + i * BITS_PER_LONG; 2116f7917c00SJeff Kirsher struct sge_ofld_txq *txq = s->egr_map[id]; 2117f7917c00SJeff Kirsher 2118f7917c00SJeff Kirsher clear_bit(id, s->txq_maperr); 2119f7917c00SJeff Kirsher tasklet_schedule(&txq->qresume_tsk); 2120f7917c00SJeff Kirsher } 2121f7917c00SJeff Kirsher 2122f7917c00SJeff Kirsher budget = MAX_TIMER_TX_RECLAIM; 2123f7917c00SJeff Kirsher i = s->ethtxq_rover; 2124f7917c00SJeff Kirsher do { 2125f7917c00SJeff Kirsher struct sge_eth_txq *q = &s->ethtxq[i]; 2126f7917c00SJeff Kirsher 2127f7917c00SJeff Kirsher if (q->q.in_use && 2128f7917c00SJeff Kirsher time_after_eq(jiffies, q->txq->trans_start + HZ / 100) && 2129f7917c00SJeff Kirsher __netif_tx_trylock(q->txq)) { 2130f7917c00SJeff Kirsher int avail = reclaimable(&q->q); 2131f7917c00SJeff Kirsher 2132f7917c00SJeff Kirsher if (avail) { 2133f7917c00SJeff Kirsher if (avail > budget) 2134f7917c00SJeff Kirsher avail = budget; 2135f7917c00SJeff Kirsher 2136f7917c00SJeff Kirsher free_tx_desc(adap, &q->q, avail, true); 2137f7917c00SJeff Kirsher q->q.in_use -= avail; 2138f7917c00SJeff Kirsher budget -= avail; 2139f7917c00SJeff Kirsher } 2140f7917c00SJeff Kirsher __netif_tx_unlock(q->txq); 2141f7917c00SJeff Kirsher } 2142f7917c00SJeff Kirsher 2143f7917c00SJeff Kirsher if (++i >= s->ethqsets) 2144f7917c00SJeff Kirsher i = 0; 2145f7917c00SJeff Kirsher } while (budget && i != s->ethtxq_rover); 2146f7917c00SJeff Kirsher s->ethtxq_rover = i; 2147f7917c00SJeff Kirsher mod_timer(&s->tx_timer, jiffies + (budget ? 
TX_QCHECK_PERIOD : 2)); 2148f7917c00SJeff Kirsher } 2149f7917c00SJeff Kirsher 2150f7917c00SJeff Kirsher int t4_sge_alloc_rxq(struct adapter *adap, struct sge_rspq *iq, bool fwevtq, 2151f7917c00SJeff Kirsher struct net_device *dev, int intr_idx, 2152f7917c00SJeff Kirsher struct sge_fl *fl, rspq_handler_t hnd) 2153f7917c00SJeff Kirsher { 2154f7917c00SJeff Kirsher int ret, flsz = 0; 2155f7917c00SJeff Kirsher struct fw_iq_cmd c; 215652367a76SVipul Pandya struct sge *s = &adap->sge; 2157f7917c00SJeff Kirsher struct port_info *pi = netdev_priv(dev); 2158f7917c00SJeff Kirsher 2159f7917c00SJeff Kirsher /* Size needs to be multiple of 16, including status entry. */ 2160f7917c00SJeff Kirsher iq->size = roundup(iq->size, 16); 2161f7917c00SJeff Kirsher 2162f7917c00SJeff Kirsher iq->desc = alloc_ring(adap->pdev_dev, iq->size, iq->iqe_len, 0, 2163f7917c00SJeff Kirsher &iq->phys_addr, NULL, 0, NUMA_NO_NODE); 2164f7917c00SJeff Kirsher if (!iq->desc) 2165f7917c00SJeff Kirsher return -ENOMEM; 2166f7917c00SJeff Kirsher 2167f7917c00SJeff Kirsher memset(&c, 0, sizeof(c)); 2168f7917c00SJeff Kirsher c.op_to_vfn = htonl(FW_CMD_OP(FW_IQ_CMD) | FW_CMD_REQUEST | 2169f7917c00SJeff Kirsher FW_CMD_WRITE | FW_CMD_EXEC | 2170f7917c00SJeff Kirsher FW_IQ_CMD_PFN(adap->fn) | FW_IQ_CMD_VFN(0)); 2171f7917c00SJeff Kirsher c.alloc_to_len16 = htonl(FW_IQ_CMD_ALLOC | FW_IQ_CMD_IQSTART(1) | 2172f7917c00SJeff Kirsher FW_LEN16(c)); 2173f7917c00SJeff Kirsher c.type_to_iqandstindex = htonl(FW_IQ_CMD_TYPE(FW_IQ_TYPE_FL_INT_CAP) | 2174f7917c00SJeff Kirsher FW_IQ_CMD_IQASYNCH(fwevtq) | FW_IQ_CMD_VIID(pi->viid) | 2175f7917c00SJeff Kirsher FW_IQ_CMD_IQANDST(intr_idx < 0) | FW_IQ_CMD_IQANUD(1) | 2176f7917c00SJeff Kirsher FW_IQ_CMD_IQANDSTINDEX(intr_idx >= 0 ? intr_idx : 2177f7917c00SJeff Kirsher -intr_idx - 1)); 2178f7917c00SJeff Kirsher c.iqdroprss_to_iqesize = htons(FW_IQ_CMD_IQPCIECH(pi->tx_chan) | 2179f7917c00SJeff Kirsher FW_IQ_CMD_IQGTSMODE | 2180f7917c00SJeff Kirsher FW_IQ_CMD_IQINTCNTTHRESH(iq->pktcnt_idx) | 2181f7917c00SJeff Kirsher FW_IQ_CMD_IQESIZE(ilog2(iq->iqe_len) - 4)); 2182f7917c00SJeff Kirsher c.iqsize = htons(iq->size); 2183f7917c00SJeff Kirsher c.iqaddr = cpu_to_be64(iq->phys_addr); 2184f7917c00SJeff Kirsher 2185f7917c00SJeff Kirsher if (fl) { 2186f7917c00SJeff Kirsher fl->size = roundup(fl->size, 8); 2187f7917c00SJeff Kirsher fl->desc = alloc_ring(adap->pdev_dev, fl->size, sizeof(__be64), 2188f7917c00SJeff Kirsher sizeof(struct rx_sw_desc), &fl->addr, 218952367a76SVipul Pandya &fl->sdesc, s->stat_len, NUMA_NO_NODE); 2190f7917c00SJeff Kirsher if (!fl->desc) 2191f7917c00SJeff Kirsher goto fl_nomem; 2192f7917c00SJeff Kirsher 219352367a76SVipul Pandya flsz = fl->size / 8 + s->stat_len / sizeof(struct tx_desc); 2194ce91a923SNaresh Kumar Inna c.iqns_to_fl0congen = htonl(FW_IQ_CMD_FL0PACKEN(1) | 2195f7917c00SJeff Kirsher FW_IQ_CMD_FL0FETCHRO(1) | 2196f7917c00SJeff Kirsher FW_IQ_CMD_FL0DATARO(1) | 2197ce91a923SNaresh Kumar Inna FW_IQ_CMD_FL0PADEN(1)); 2198f7917c00SJeff Kirsher c.fl0dcaen_to_fl0cidxfthresh = htons(FW_IQ_CMD_FL0FBMIN(2) | 2199f7917c00SJeff Kirsher FW_IQ_CMD_FL0FBMAX(3)); 2200f7917c00SJeff Kirsher c.fl0size = htons(flsz); 2201f7917c00SJeff Kirsher c.fl0addr = cpu_to_be64(fl->addr); 2202f7917c00SJeff Kirsher } 2203f7917c00SJeff Kirsher 2204f7917c00SJeff Kirsher ret = t4_wr_mbox(adap, adap->fn, &c, sizeof(c), &c); 2205f7917c00SJeff Kirsher if (ret) 2206f7917c00SJeff Kirsher goto err; 2207f7917c00SJeff Kirsher 2208f7917c00SJeff Kirsher netif_napi_add(dev, &iq->napi, napi_rx_handler, 64); 2209f7917c00SJeff Kirsher 
iq->cur_desc = iq->desc; 2210f7917c00SJeff Kirsher iq->cidx = 0; 2211f7917c00SJeff Kirsher iq->gen = 1; 2212f7917c00SJeff Kirsher iq->next_intr_params = iq->intr_params; 2213f7917c00SJeff Kirsher iq->cntxt_id = ntohs(c.iqid); 2214f7917c00SJeff Kirsher iq->abs_id = ntohs(c.physiqid); 2215f7917c00SJeff Kirsher iq->size--; /* subtract status entry */ 2216f7917c00SJeff Kirsher iq->adap = adap; 2217f7917c00SJeff Kirsher iq->netdev = dev; 2218f7917c00SJeff Kirsher iq->handler = hnd; 2219f7917c00SJeff Kirsher 2220f7917c00SJeff Kirsher /* set offset to -1 to distinguish ingress queues without FL */ 2221f7917c00SJeff Kirsher iq->offset = fl ? 0 : -1; 2222f7917c00SJeff Kirsher 2223f7917c00SJeff Kirsher adap->sge.ingr_map[iq->cntxt_id - adap->sge.ingr_start] = iq; 2224f7917c00SJeff Kirsher 2225f7917c00SJeff Kirsher if (fl) { 2226f7917c00SJeff Kirsher fl->cntxt_id = ntohs(c.fl0id); 2227f7917c00SJeff Kirsher fl->avail = fl->pend_cred = 0; 2228f7917c00SJeff Kirsher fl->pidx = fl->cidx = 0; 2229f7917c00SJeff Kirsher fl->alloc_failed = fl->large_alloc_failed = fl->starving = 0; 2230f7917c00SJeff Kirsher adap->sge.egr_map[fl->cntxt_id - adap->sge.egr_start] = fl; 2231f7917c00SJeff Kirsher refill_fl(adap, fl, fl_cap(fl), GFP_KERNEL); 2232f7917c00SJeff Kirsher } 2233f7917c00SJeff Kirsher return 0; 2234f7917c00SJeff Kirsher 2235f7917c00SJeff Kirsher fl_nomem: 2236f7917c00SJeff Kirsher ret = -ENOMEM; 2237f7917c00SJeff Kirsher err: 2238f7917c00SJeff Kirsher if (iq->desc) { 2239f7917c00SJeff Kirsher dma_free_coherent(adap->pdev_dev, iq->size * iq->iqe_len, 2240f7917c00SJeff Kirsher iq->desc, iq->phys_addr); 2241f7917c00SJeff Kirsher iq->desc = NULL; 2242f7917c00SJeff Kirsher } 2243f7917c00SJeff Kirsher if (fl && fl->desc) { 2244f7917c00SJeff Kirsher kfree(fl->sdesc); 2245f7917c00SJeff Kirsher fl->sdesc = NULL; 2246f7917c00SJeff Kirsher dma_free_coherent(adap->pdev_dev, flsz * sizeof(struct tx_desc), 2247f7917c00SJeff Kirsher fl->desc, fl->addr); 2248f7917c00SJeff Kirsher fl->desc = NULL; 2249f7917c00SJeff Kirsher } 2250f7917c00SJeff Kirsher return ret; 2251f7917c00SJeff Kirsher } 2252f7917c00SJeff Kirsher 2253f7917c00SJeff Kirsher static void init_txq(struct adapter *adap, struct sge_txq *q, unsigned int id) 2254f7917c00SJeff Kirsher { 225522adfe0aSSantosh Rastapur q->cntxt_id = id; 2256d14807ddSHariprasad Shenai if (!is_t4(adap->params.chip)) { 225722adfe0aSSantosh Rastapur unsigned int s_qpp; 225822adfe0aSSantosh Rastapur unsigned short udb_density; 225922adfe0aSSantosh Rastapur unsigned long qpshift; 226022adfe0aSSantosh Rastapur int page; 226122adfe0aSSantosh Rastapur 226222adfe0aSSantosh Rastapur s_qpp = QUEUESPERPAGEPF1 * adap->fn; 226322adfe0aSSantosh Rastapur udb_density = 1 << QUEUESPERPAGEPF0_GET((t4_read_reg(adap, 226422adfe0aSSantosh Rastapur SGE_EGRESS_QUEUES_PER_PAGE_PF) >> s_qpp)); 226522adfe0aSSantosh Rastapur qpshift = PAGE_SHIFT - ilog2(udb_density); 226622adfe0aSSantosh Rastapur q->udb = q->cntxt_id << qpshift; 226722adfe0aSSantosh Rastapur q->udb &= PAGE_MASK; 226822adfe0aSSantosh Rastapur page = q->udb / PAGE_SIZE; 226922adfe0aSSantosh Rastapur q->udb += (q->cntxt_id - (page * udb_density)) * 128; 227022adfe0aSSantosh Rastapur } 227122adfe0aSSantosh Rastapur 2272f7917c00SJeff Kirsher q->in_use = 0; 2273f7917c00SJeff Kirsher q->cidx = q->pidx = 0; 2274f7917c00SJeff Kirsher q->stops = q->restarts = 0; 2275f7917c00SJeff Kirsher q->stat = (void *)&q->desc[q->size]; 22763069ee9bSVipul Pandya spin_lock_init(&q->db_lock); 2277f7917c00SJeff Kirsher adap->sge.egr_map[id - adap->sge.egr_start] = q; 
2278f7917c00SJeff Kirsher } 2279f7917c00SJeff Kirsher 2280f7917c00SJeff Kirsher int t4_sge_alloc_eth_txq(struct adapter *adap, struct sge_eth_txq *txq, 2281f7917c00SJeff Kirsher struct net_device *dev, struct netdev_queue *netdevq, 2282f7917c00SJeff Kirsher unsigned int iqid) 2283f7917c00SJeff Kirsher { 2284f7917c00SJeff Kirsher int ret, nentries; 2285f7917c00SJeff Kirsher struct fw_eq_eth_cmd c; 228652367a76SVipul Pandya struct sge *s = &adap->sge; 2287f7917c00SJeff Kirsher struct port_info *pi = netdev_priv(dev); 2288f7917c00SJeff Kirsher 2289f7917c00SJeff Kirsher /* Add status entries */ 229052367a76SVipul Pandya nentries = txq->q.size + s->stat_len / sizeof(struct tx_desc); 2291f7917c00SJeff Kirsher 2292f7917c00SJeff Kirsher txq->q.desc = alloc_ring(adap->pdev_dev, txq->q.size, 2293f7917c00SJeff Kirsher sizeof(struct tx_desc), sizeof(struct tx_sw_desc), 229452367a76SVipul Pandya &txq->q.phys_addr, &txq->q.sdesc, s->stat_len, 2295f7917c00SJeff Kirsher netdev_queue_numa_node_read(netdevq)); 2296f7917c00SJeff Kirsher if (!txq->q.desc) 2297f7917c00SJeff Kirsher return -ENOMEM; 2298f7917c00SJeff Kirsher 2299f7917c00SJeff Kirsher memset(&c, 0, sizeof(c)); 2300f7917c00SJeff Kirsher c.op_to_vfn = htonl(FW_CMD_OP(FW_EQ_ETH_CMD) | FW_CMD_REQUEST | 2301f7917c00SJeff Kirsher FW_CMD_WRITE | FW_CMD_EXEC | 2302f7917c00SJeff Kirsher FW_EQ_ETH_CMD_PFN(adap->fn) | FW_EQ_ETH_CMD_VFN(0)); 2303f7917c00SJeff Kirsher c.alloc_to_len16 = htonl(FW_EQ_ETH_CMD_ALLOC | 2304f7917c00SJeff Kirsher FW_EQ_ETH_CMD_EQSTART | FW_LEN16(c)); 2305f7917c00SJeff Kirsher c.viid_pkd = htonl(FW_EQ_ETH_CMD_VIID(pi->viid)); 2306f7917c00SJeff Kirsher c.fetchszm_to_iqid = htonl(FW_EQ_ETH_CMD_HOSTFCMODE(2) | 2307f7917c00SJeff Kirsher FW_EQ_ETH_CMD_PCIECHN(pi->tx_chan) | 2308f7917c00SJeff Kirsher FW_EQ_ETH_CMD_FETCHRO(1) | 2309f7917c00SJeff Kirsher FW_EQ_ETH_CMD_IQID(iqid)); 2310f7917c00SJeff Kirsher c.dcaen_to_eqsize = htonl(FW_EQ_ETH_CMD_FBMIN(2) | 2311f7917c00SJeff Kirsher FW_EQ_ETH_CMD_FBMAX(3) | 2312f7917c00SJeff Kirsher FW_EQ_ETH_CMD_CIDXFTHRESH(5) | 2313f7917c00SJeff Kirsher FW_EQ_ETH_CMD_EQSIZE(nentries)); 2314f7917c00SJeff Kirsher c.eqaddr = cpu_to_be64(txq->q.phys_addr); 2315f7917c00SJeff Kirsher 2316f7917c00SJeff Kirsher ret = t4_wr_mbox(adap, adap->fn, &c, sizeof(c), &c); 2317f7917c00SJeff Kirsher if (ret) { 2318f7917c00SJeff Kirsher kfree(txq->q.sdesc); 2319f7917c00SJeff Kirsher txq->q.sdesc = NULL; 2320f7917c00SJeff Kirsher dma_free_coherent(adap->pdev_dev, 2321f7917c00SJeff Kirsher nentries * sizeof(struct tx_desc), 2322f7917c00SJeff Kirsher txq->q.desc, txq->q.phys_addr); 2323f7917c00SJeff Kirsher txq->q.desc = NULL; 2324f7917c00SJeff Kirsher return ret; 2325f7917c00SJeff Kirsher } 2326f7917c00SJeff Kirsher 2327f7917c00SJeff Kirsher init_txq(adap, &txq->q, FW_EQ_ETH_CMD_EQID_GET(ntohl(c.eqid_pkd))); 2328f7917c00SJeff Kirsher txq->txq = netdevq; 2329f7917c00SJeff Kirsher txq->tso = txq->tx_cso = txq->vlan_ins = 0; 2330f7917c00SJeff Kirsher txq->mapping_err = 0; 2331f7917c00SJeff Kirsher return 0; 2332f7917c00SJeff Kirsher } 2333f7917c00SJeff Kirsher 2334f7917c00SJeff Kirsher int t4_sge_alloc_ctrl_txq(struct adapter *adap, struct sge_ctrl_txq *txq, 2335f7917c00SJeff Kirsher struct net_device *dev, unsigned int iqid, 2336f7917c00SJeff Kirsher unsigned int cmplqid) 2337f7917c00SJeff Kirsher { 2338f7917c00SJeff Kirsher int ret, nentries; 2339f7917c00SJeff Kirsher struct fw_eq_ctrl_cmd c; 234052367a76SVipul Pandya struct sge *s = &adap->sge; 2341f7917c00SJeff Kirsher struct port_info *pi = netdev_priv(dev); 2342f7917c00SJeff 
Kirsher 2343f7917c00SJeff Kirsher /* Add status entries */ 234452367a76SVipul Pandya nentries = txq->q.size + s->stat_len / sizeof(struct tx_desc); 2345f7917c00SJeff Kirsher 2346f7917c00SJeff Kirsher txq->q.desc = alloc_ring(adap->pdev_dev, nentries, 2347f7917c00SJeff Kirsher sizeof(struct tx_desc), 0, &txq->q.phys_addr, 2348f7917c00SJeff Kirsher NULL, 0, NUMA_NO_NODE); 2349f7917c00SJeff Kirsher if (!txq->q.desc) 2350f7917c00SJeff Kirsher return -ENOMEM; 2351f7917c00SJeff Kirsher 2352f7917c00SJeff Kirsher c.op_to_vfn = htonl(FW_CMD_OP(FW_EQ_CTRL_CMD) | FW_CMD_REQUEST | 2353f7917c00SJeff Kirsher FW_CMD_WRITE | FW_CMD_EXEC | 2354f7917c00SJeff Kirsher FW_EQ_CTRL_CMD_PFN(adap->fn) | 2355f7917c00SJeff Kirsher FW_EQ_CTRL_CMD_VFN(0)); 2356f7917c00SJeff Kirsher c.alloc_to_len16 = htonl(FW_EQ_CTRL_CMD_ALLOC | 2357f7917c00SJeff Kirsher FW_EQ_CTRL_CMD_EQSTART | FW_LEN16(c)); 2358f7917c00SJeff Kirsher c.cmpliqid_eqid = htonl(FW_EQ_CTRL_CMD_CMPLIQID(cmplqid)); 2359f7917c00SJeff Kirsher c.physeqid_pkd = htonl(0); 2360f7917c00SJeff Kirsher c.fetchszm_to_iqid = htonl(FW_EQ_CTRL_CMD_HOSTFCMODE(2) | 2361f7917c00SJeff Kirsher FW_EQ_CTRL_CMD_PCIECHN(pi->tx_chan) | 2362f7917c00SJeff Kirsher FW_EQ_CTRL_CMD_FETCHRO | 2363f7917c00SJeff Kirsher FW_EQ_CTRL_CMD_IQID(iqid)); 2364f7917c00SJeff Kirsher c.dcaen_to_eqsize = htonl(FW_EQ_CTRL_CMD_FBMIN(2) | 2365f7917c00SJeff Kirsher FW_EQ_CTRL_CMD_FBMAX(3) | 2366f7917c00SJeff Kirsher FW_EQ_CTRL_CMD_CIDXFTHRESH(5) | 2367f7917c00SJeff Kirsher FW_EQ_CTRL_CMD_EQSIZE(nentries)); 2368f7917c00SJeff Kirsher c.eqaddr = cpu_to_be64(txq->q.phys_addr); 2369f7917c00SJeff Kirsher 2370f7917c00SJeff Kirsher ret = t4_wr_mbox(adap, adap->fn, &c, sizeof(c), &c); 2371f7917c00SJeff Kirsher if (ret) { 2372f7917c00SJeff Kirsher dma_free_coherent(adap->pdev_dev, 2373f7917c00SJeff Kirsher nentries * sizeof(struct tx_desc), 2374f7917c00SJeff Kirsher txq->q.desc, txq->q.phys_addr); 2375f7917c00SJeff Kirsher txq->q.desc = NULL; 2376f7917c00SJeff Kirsher return ret; 2377f7917c00SJeff Kirsher } 2378f7917c00SJeff Kirsher 2379f7917c00SJeff Kirsher init_txq(adap, &txq->q, FW_EQ_CTRL_CMD_EQID_GET(ntohl(c.cmpliqid_eqid))); 2380f7917c00SJeff Kirsher txq->adap = adap; 2381f7917c00SJeff Kirsher skb_queue_head_init(&txq->sendq); 2382f7917c00SJeff Kirsher tasklet_init(&txq->qresume_tsk, restart_ctrlq, (unsigned long)txq); 2383f7917c00SJeff Kirsher txq->full = 0; 2384f7917c00SJeff Kirsher return 0; 2385f7917c00SJeff Kirsher } 2386f7917c00SJeff Kirsher 2387f7917c00SJeff Kirsher int t4_sge_alloc_ofld_txq(struct adapter *adap, struct sge_ofld_txq *txq, 2388f7917c00SJeff Kirsher struct net_device *dev, unsigned int iqid) 2389f7917c00SJeff Kirsher { 2390f7917c00SJeff Kirsher int ret, nentries; 2391f7917c00SJeff Kirsher struct fw_eq_ofld_cmd c; 239252367a76SVipul Pandya struct sge *s = &adap->sge; 2393f7917c00SJeff Kirsher struct port_info *pi = netdev_priv(dev); 2394f7917c00SJeff Kirsher 2395f7917c00SJeff Kirsher /* Add status entries */ 239652367a76SVipul Pandya nentries = txq->q.size + s->stat_len / sizeof(struct tx_desc); 2397f7917c00SJeff Kirsher 2398f7917c00SJeff Kirsher txq->q.desc = alloc_ring(adap->pdev_dev, txq->q.size, 2399f7917c00SJeff Kirsher sizeof(struct tx_desc), sizeof(struct tx_sw_desc), 240052367a76SVipul Pandya &txq->q.phys_addr, &txq->q.sdesc, s->stat_len, 2401f7917c00SJeff Kirsher NUMA_NO_NODE); 2402f7917c00SJeff Kirsher if (!txq->q.desc) 2403f7917c00SJeff Kirsher return -ENOMEM; 2404f7917c00SJeff Kirsher 2405f7917c00SJeff Kirsher memset(&c, 0, sizeof(c)); 2406f7917c00SJeff Kirsher c.op_to_vfn = 
htonl(FW_CMD_OP(FW_EQ_OFLD_CMD) | FW_CMD_REQUEST | 2407f7917c00SJeff Kirsher FW_CMD_WRITE | FW_CMD_EXEC | 2408f7917c00SJeff Kirsher FW_EQ_OFLD_CMD_PFN(adap->fn) | 2409f7917c00SJeff Kirsher FW_EQ_OFLD_CMD_VFN(0)); 2410f7917c00SJeff Kirsher c.alloc_to_len16 = htonl(FW_EQ_OFLD_CMD_ALLOC | 2411f7917c00SJeff Kirsher FW_EQ_OFLD_CMD_EQSTART | FW_LEN16(c)); 2412f7917c00SJeff Kirsher c.fetchszm_to_iqid = htonl(FW_EQ_OFLD_CMD_HOSTFCMODE(2) | 2413f7917c00SJeff Kirsher FW_EQ_OFLD_CMD_PCIECHN(pi->tx_chan) | 2414f7917c00SJeff Kirsher FW_EQ_OFLD_CMD_FETCHRO(1) | 2415f7917c00SJeff Kirsher FW_EQ_OFLD_CMD_IQID(iqid)); 2416f7917c00SJeff Kirsher c.dcaen_to_eqsize = htonl(FW_EQ_OFLD_CMD_FBMIN(2) | 2417f7917c00SJeff Kirsher FW_EQ_OFLD_CMD_FBMAX(3) | 2418f7917c00SJeff Kirsher FW_EQ_OFLD_CMD_CIDXFTHRESH(5) | 2419f7917c00SJeff Kirsher FW_EQ_OFLD_CMD_EQSIZE(nentries)); 2420f7917c00SJeff Kirsher c.eqaddr = cpu_to_be64(txq->q.phys_addr); 2421f7917c00SJeff Kirsher 2422f7917c00SJeff Kirsher ret = t4_wr_mbox(adap, adap->fn, &c, sizeof(c), &c); 2423f7917c00SJeff Kirsher if (ret) { 2424f7917c00SJeff Kirsher kfree(txq->q.sdesc); 2425f7917c00SJeff Kirsher txq->q.sdesc = NULL; 2426f7917c00SJeff Kirsher dma_free_coherent(adap->pdev_dev, 2427f7917c00SJeff Kirsher nentries * sizeof(struct tx_desc), 2428f7917c00SJeff Kirsher txq->q.desc, txq->q.phys_addr); 2429f7917c00SJeff Kirsher txq->q.desc = NULL; 2430f7917c00SJeff Kirsher return ret; 2431f7917c00SJeff Kirsher } 2432f7917c00SJeff Kirsher 2433f7917c00SJeff Kirsher init_txq(adap, &txq->q, FW_EQ_OFLD_CMD_EQID_GET(ntohl(c.eqid_pkd))); 2434f7917c00SJeff Kirsher txq->adap = adap; 2435f7917c00SJeff Kirsher skb_queue_head_init(&txq->sendq); 2436f7917c00SJeff Kirsher tasklet_init(&txq->qresume_tsk, restart_ofldq, (unsigned long)txq); 2437f7917c00SJeff Kirsher txq->full = 0; 2438f7917c00SJeff Kirsher txq->mapping_err = 0; 2439f7917c00SJeff Kirsher return 0; 2440f7917c00SJeff Kirsher } 2441f7917c00SJeff Kirsher 2442f7917c00SJeff Kirsher static void free_txq(struct adapter *adap, struct sge_txq *q) 2443f7917c00SJeff Kirsher { 244452367a76SVipul Pandya struct sge *s = &adap->sge; 244552367a76SVipul Pandya 2446f7917c00SJeff Kirsher dma_free_coherent(adap->pdev_dev, 244752367a76SVipul Pandya q->size * sizeof(struct tx_desc) + s->stat_len, 2448f7917c00SJeff Kirsher q->desc, q->phys_addr); 2449f7917c00SJeff Kirsher q->cntxt_id = 0; 2450f7917c00SJeff Kirsher q->sdesc = NULL; 2451f7917c00SJeff Kirsher q->desc = NULL; 2452f7917c00SJeff Kirsher } 2453f7917c00SJeff Kirsher 2454f7917c00SJeff Kirsher static void free_rspq_fl(struct adapter *adap, struct sge_rspq *rq, 2455f7917c00SJeff Kirsher struct sge_fl *fl) 2456f7917c00SJeff Kirsher { 245752367a76SVipul Pandya struct sge *s = &adap->sge; 2458f7917c00SJeff Kirsher unsigned int fl_id = fl ? 
fl->cntxt_id : 0xffff; 2459f7917c00SJeff Kirsher 2460f7917c00SJeff Kirsher adap->sge.ingr_map[rq->cntxt_id - adap->sge.ingr_start] = NULL; 2461f7917c00SJeff Kirsher t4_iq_free(adap, adap->fn, adap->fn, 0, FW_IQ_TYPE_FL_INT_CAP, 2462f7917c00SJeff Kirsher rq->cntxt_id, fl_id, 0xffff); 2463f7917c00SJeff Kirsher dma_free_coherent(adap->pdev_dev, (rq->size + 1) * rq->iqe_len, 2464f7917c00SJeff Kirsher rq->desc, rq->phys_addr); 2465f7917c00SJeff Kirsher netif_napi_del(&rq->napi); 2466f7917c00SJeff Kirsher rq->netdev = NULL; 2467f7917c00SJeff Kirsher rq->cntxt_id = rq->abs_id = 0; 2468f7917c00SJeff Kirsher rq->desc = NULL; 2469f7917c00SJeff Kirsher 2470f7917c00SJeff Kirsher if (fl) { 2471f7917c00SJeff Kirsher free_rx_bufs(adap, fl, fl->avail); 247252367a76SVipul Pandya dma_free_coherent(adap->pdev_dev, fl->size * 8 + s->stat_len, 2473f7917c00SJeff Kirsher fl->desc, fl->addr); 2474f7917c00SJeff Kirsher kfree(fl->sdesc); 2475f7917c00SJeff Kirsher fl->sdesc = NULL; 2476f7917c00SJeff Kirsher fl->cntxt_id = 0; 2477f7917c00SJeff Kirsher fl->desc = NULL; 2478f7917c00SJeff Kirsher } 2479f7917c00SJeff Kirsher } 2480f7917c00SJeff Kirsher 2481f7917c00SJeff Kirsher /** 2482f7917c00SJeff Kirsher * t4_free_sge_resources - free SGE resources 2483f7917c00SJeff Kirsher * @adap: the adapter 2484f7917c00SJeff Kirsher * 2485f7917c00SJeff Kirsher * Frees resources used by the SGE queue sets. 2486f7917c00SJeff Kirsher */ 2487f7917c00SJeff Kirsher void t4_free_sge_resources(struct adapter *adap) 2488f7917c00SJeff Kirsher { 2489f7917c00SJeff Kirsher int i; 2490f7917c00SJeff Kirsher struct sge_eth_rxq *eq = adap->sge.ethrxq; 2491f7917c00SJeff Kirsher struct sge_eth_txq *etq = adap->sge.ethtxq; 2492f7917c00SJeff Kirsher struct sge_ofld_rxq *oq = adap->sge.ofldrxq; 2493f7917c00SJeff Kirsher 2494f7917c00SJeff Kirsher /* clean up Ethernet Tx/Rx queues */ 2495f7917c00SJeff Kirsher for (i = 0; i < adap->sge.ethqsets; i++, eq++, etq++) { 2496f7917c00SJeff Kirsher if (eq->rspq.desc) 2497f7917c00SJeff Kirsher free_rspq_fl(adap, &eq->rspq, &eq->fl); 2498f7917c00SJeff Kirsher if (etq->q.desc) { 2499f7917c00SJeff Kirsher t4_eth_eq_free(adap, adap->fn, adap->fn, 0, 2500f7917c00SJeff Kirsher etq->q.cntxt_id); 2501f7917c00SJeff Kirsher free_tx_desc(adap, &etq->q, etq->q.in_use, true); 2502f7917c00SJeff Kirsher kfree(etq->q.sdesc); 2503f7917c00SJeff Kirsher free_txq(adap, &etq->q); 2504f7917c00SJeff Kirsher } 2505f7917c00SJeff Kirsher } 2506f7917c00SJeff Kirsher 2507f7917c00SJeff Kirsher /* clean up RDMA and iSCSI Rx queues */ 2508f7917c00SJeff Kirsher for (i = 0; i < adap->sge.ofldqsets; i++, oq++) { 2509f7917c00SJeff Kirsher if (oq->rspq.desc) 2510f7917c00SJeff Kirsher free_rspq_fl(adap, &oq->rspq, &oq->fl); 2511f7917c00SJeff Kirsher } 2512f7917c00SJeff Kirsher for (i = 0, oq = adap->sge.rdmarxq; i < adap->sge.rdmaqs; i++, oq++) { 2513f7917c00SJeff Kirsher if (oq->rspq.desc) 2514f7917c00SJeff Kirsher free_rspq_fl(adap, &oq->rspq, &oq->fl); 2515f7917c00SJeff Kirsher } 2516f7917c00SJeff Kirsher 2517f7917c00SJeff Kirsher /* clean up offload Tx queues */ 2518f7917c00SJeff Kirsher for (i = 0; i < ARRAY_SIZE(adap->sge.ofldtxq); i++) { 2519f7917c00SJeff Kirsher struct sge_ofld_txq *q = &adap->sge.ofldtxq[i]; 2520f7917c00SJeff Kirsher 2521f7917c00SJeff Kirsher if (q->q.desc) { 2522f7917c00SJeff Kirsher tasklet_kill(&q->qresume_tsk); 2523f7917c00SJeff Kirsher t4_ofld_eq_free(adap, adap->fn, adap->fn, 0, 2524f7917c00SJeff Kirsher q->q.cntxt_id); 2525f7917c00SJeff Kirsher free_tx_desc(adap, &q->q, q->q.in_use, false); 2526f7917c00SJeff Kirsher 
kfree(q->q.sdesc); 2527f7917c00SJeff Kirsher __skb_queue_purge(&q->sendq); 2528f7917c00SJeff Kirsher free_txq(adap, &q->q); 2529f7917c00SJeff Kirsher } 2530f7917c00SJeff Kirsher } 2531f7917c00SJeff Kirsher 2532f7917c00SJeff Kirsher /* clean up control Tx queues */ 2533f7917c00SJeff Kirsher for (i = 0; i < ARRAY_SIZE(adap->sge.ctrlq); i++) { 2534f7917c00SJeff Kirsher struct sge_ctrl_txq *cq = &adap->sge.ctrlq[i]; 2535f7917c00SJeff Kirsher 2536f7917c00SJeff Kirsher if (cq->q.desc) { 2537f7917c00SJeff Kirsher tasklet_kill(&cq->qresume_tsk); 2538f7917c00SJeff Kirsher t4_ctrl_eq_free(adap, adap->fn, adap->fn, 0, 2539f7917c00SJeff Kirsher cq->q.cntxt_id); 2540f7917c00SJeff Kirsher __skb_queue_purge(&cq->sendq); 2541f7917c00SJeff Kirsher free_txq(adap, &cq->q); 2542f7917c00SJeff Kirsher } 2543f7917c00SJeff Kirsher } 2544f7917c00SJeff Kirsher 2545f7917c00SJeff Kirsher if (adap->sge.fw_evtq.desc) 2546f7917c00SJeff Kirsher free_rspq_fl(adap, &adap->sge.fw_evtq, NULL); 2547f7917c00SJeff Kirsher 2548f7917c00SJeff Kirsher if (adap->sge.intrq.desc) 2549f7917c00SJeff Kirsher free_rspq_fl(adap, &adap->sge.intrq, NULL); 2550f7917c00SJeff Kirsher 2551f7917c00SJeff Kirsher /* clear the reverse egress queue map */ 2552f7917c00SJeff Kirsher memset(adap->sge.egr_map, 0, sizeof(adap->sge.egr_map)); 2553f7917c00SJeff Kirsher } 2554f7917c00SJeff Kirsher 2555f7917c00SJeff Kirsher void t4_sge_start(struct adapter *adap) 2556f7917c00SJeff Kirsher { 2557f7917c00SJeff Kirsher adap->sge.ethtxq_rover = 0; 2558f7917c00SJeff Kirsher mod_timer(&adap->sge.rx_timer, jiffies + RX_QCHECK_PERIOD); 2559f7917c00SJeff Kirsher mod_timer(&adap->sge.tx_timer, jiffies + TX_QCHECK_PERIOD); 2560f7917c00SJeff Kirsher } 2561f7917c00SJeff Kirsher 2562f7917c00SJeff Kirsher /** 2563f7917c00SJeff Kirsher * t4_sge_stop - disable SGE operation 2564f7917c00SJeff Kirsher * @adap: the adapter 2565f7917c00SJeff Kirsher * 2566f7917c00SJeff Kirsher * Stop tasklets and timers associated with the DMA engine. Note that 2567f7917c00SJeff Kirsher * this is effective only if measures have been taken to disable any HW 2568f7917c00SJeff Kirsher * events that may restart them. 
2569f7917c00SJeff Kirsher */ 2570f7917c00SJeff Kirsher void t4_sge_stop(struct adapter *adap) 2571f7917c00SJeff Kirsher { 2572f7917c00SJeff Kirsher int i; 2573f7917c00SJeff Kirsher struct sge *s = &adap->sge; 2574f7917c00SJeff Kirsher 2575f7917c00SJeff Kirsher if (in_interrupt()) /* actions below require waiting */ 2576f7917c00SJeff Kirsher return; 2577f7917c00SJeff Kirsher 2578f7917c00SJeff Kirsher if (s->rx_timer.function) 2579f7917c00SJeff Kirsher del_timer_sync(&s->rx_timer); 2580f7917c00SJeff Kirsher if (s->tx_timer.function) 2581f7917c00SJeff Kirsher del_timer_sync(&s->tx_timer); 2582f7917c00SJeff Kirsher 2583f7917c00SJeff Kirsher for (i = 0; i < ARRAY_SIZE(s->ofldtxq); i++) { 2584f7917c00SJeff Kirsher struct sge_ofld_txq *q = &s->ofldtxq[i]; 2585f7917c00SJeff Kirsher 2586f7917c00SJeff Kirsher if (q->q.desc) 2587f7917c00SJeff Kirsher tasklet_kill(&q->qresume_tsk); 2588f7917c00SJeff Kirsher } 2589f7917c00SJeff Kirsher for (i = 0; i < ARRAY_SIZE(s->ctrlq); i++) { 2590f7917c00SJeff Kirsher struct sge_ctrl_txq *cq = &s->ctrlq[i]; 2591f7917c00SJeff Kirsher 2592f7917c00SJeff Kirsher if (cq->q.desc) 2593f7917c00SJeff Kirsher tasklet_kill(&cq->qresume_tsk); 2594f7917c00SJeff Kirsher } 2595f7917c00SJeff Kirsher } 2596f7917c00SJeff Kirsher 2597f7917c00SJeff Kirsher /** 2598f7917c00SJeff Kirsher * t4_sge_init - initialize SGE 2599f7917c00SJeff Kirsher * @adap: the adapter 2600f7917c00SJeff Kirsher * 2601f7917c00SJeff Kirsher * Performs SGE initialization needed every time after a chip reset. 2602f7917c00SJeff Kirsher * We do not initialize any of the queues here, instead the driver 2603f7917c00SJeff Kirsher * top-level must request them individually. 260452367a76SVipul Pandya * 260552367a76SVipul Pandya * Called in two different modes: 260652367a76SVipul Pandya * 260752367a76SVipul Pandya * 1. Perform actual hardware initialization and record hard-coded 260852367a76SVipul Pandya * parameters which were used. This gets used when we're the 260952367a76SVipul Pandya * Master PF and the Firmware Configuration File support didn't 261052367a76SVipul Pandya * work for some reason. 261152367a76SVipul Pandya * 261252367a76SVipul Pandya * 2. We're not the Master PF or initialization was performed with 261352367a76SVipul Pandya * a Firmware Configuration File. In this case we need to grab 261452367a76SVipul Pandya * any of the SGE operating parameters that we need to have in 261552367a76SVipul Pandya * order to do our job and make sure we can live with them ... 2616f7917c00SJeff Kirsher */ 2617f7917c00SJeff Kirsher 261852367a76SVipul Pandya static int t4_sge_init_soft(struct adapter *adap) 261952367a76SVipul Pandya { 262052367a76SVipul Pandya struct sge *s = &adap->sge; 262152367a76SVipul Pandya u32 fl_small_pg, fl_large_pg, fl_small_mtu, fl_large_mtu; 262252367a76SVipul Pandya u32 timer_value_0_and_1, timer_value_2_and_3, timer_value_4_and_5; 262352367a76SVipul Pandya u32 ingress_rx_threshold; 262452367a76SVipul Pandya 262552367a76SVipul Pandya /* 262652367a76SVipul Pandya * Verify that CPL messages are going to the Ingress Queue for 262752367a76SVipul Pandya * process_responses() and that only packet data is going to the 262852367a76SVipul Pandya * Free Lists. 
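 * If the hardware is not in this "split" RXPKTCPLMODE we cannot operate,
 * so the check below fails the initialization with -EINVAL.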
262952367a76SVipul Pandya */ 263052367a76SVipul Pandya if ((t4_read_reg(adap, SGE_CONTROL) & RXPKTCPLMODE_MASK) != 263152367a76SVipul Pandya RXPKTCPLMODE(X_RXPKTCPLMODE_SPLIT)) { 263252367a76SVipul Pandya dev_err(adap->pdev_dev, "bad SGE CPL MODE\n"); 263352367a76SVipul Pandya return -EINVAL; 263452367a76SVipul Pandya } 263552367a76SVipul Pandya 263652367a76SVipul Pandya /* 263752367a76SVipul Pandya * Validate the Host Buffer Register Array indices that we want to 263852367a76SVipul Pandya * use ... 263952367a76SVipul Pandya * 264052367a76SVipul Pandya * XXX Note that we should really read through the Host Buffer Size 264152367a76SVipul Pandya * XXX register array and find the indices of the Buffer Sizes which 264252367a76SVipul Pandya * XXX meet our needs! 264352367a76SVipul Pandya */ 264452367a76SVipul Pandya #define READ_FL_BUF(x) \ 264552367a76SVipul Pandya t4_read_reg(adap, SGE_FL_BUFFER_SIZE0+(x)*sizeof(u32)) 264652367a76SVipul Pandya 264752367a76SVipul Pandya fl_small_pg = READ_FL_BUF(RX_SMALL_PG_BUF); 264852367a76SVipul Pandya fl_large_pg = READ_FL_BUF(RX_LARGE_PG_BUF); 264952367a76SVipul Pandya fl_small_mtu = READ_FL_BUF(RX_SMALL_MTU_BUF); 265052367a76SVipul Pandya fl_large_mtu = READ_FL_BUF(RX_LARGE_MTU_BUF); 265152367a76SVipul Pandya 265292ddcc7bSKumar Sanghvi /* We only bother using the Large Page logic if the Large Page Buffer 265392ddcc7bSKumar Sanghvi * is larger than our Page Size Buffer. 265492ddcc7bSKumar Sanghvi */ 265592ddcc7bSKumar Sanghvi if (fl_large_pg <= fl_small_pg) 265692ddcc7bSKumar Sanghvi fl_large_pg = 0; 265792ddcc7bSKumar Sanghvi 265852367a76SVipul Pandya #undef READ_FL_BUF 265952367a76SVipul Pandya 266092ddcc7bSKumar Sanghvi /* The Page Size Buffer must be exactly equal to our Page Size and the 266192ddcc7bSKumar Sanghvi * Large Page Size Buffer should be 0 (per above) or a power of 2. 266292ddcc7bSKumar Sanghvi */ 266352367a76SVipul Pandya if (fl_small_pg != PAGE_SIZE || 266492ddcc7bSKumar Sanghvi (fl_large_pg & (fl_large_pg-1)) != 0) { 266552367a76SVipul Pandya dev_err(adap->pdev_dev, "bad SGE FL page buffer sizes [%d, %d]\n", 266652367a76SVipul Pandya fl_small_pg, fl_large_pg); 266752367a76SVipul Pandya return -EINVAL; 266852367a76SVipul Pandya } 266952367a76SVipul Pandya if (fl_large_pg) 267052367a76SVipul Pandya s->fl_pg_order = ilog2(fl_large_pg) - PAGE_SHIFT; 267152367a76SVipul Pandya 267252367a76SVipul Pandya if (fl_small_mtu < FL_MTU_SMALL_BUFSIZE(adap) || 267352367a76SVipul Pandya fl_large_mtu < FL_MTU_LARGE_BUFSIZE(adap)) { 267452367a76SVipul Pandya dev_err(adap->pdev_dev, "bad SGE FL MTU sizes [%d, %d]\n", 267552367a76SVipul Pandya fl_small_mtu, fl_large_mtu); 267652367a76SVipul Pandya return -EINVAL; 267752367a76SVipul Pandya } 267852367a76SVipul Pandya 267952367a76SVipul Pandya /* 268052367a76SVipul Pandya * Retrieve our RX interrupt holdoff timer values and counter 268152367a76SVipul Pandya * threshold values from the SGE parameters. 
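 * The hardware keeps the holdoff timers in core clock ticks, so they are
 * converted to microseconds with core_ticks_to_us() below; the interrupt
 * packet-count thresholds are used exactly as read.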
268252367a76SVipul Pandya */
268352367a76SVipul Pandya timer_value_0_and_1 = t4_read_reg(adap, SGE_TIMER_VALUE_0_AND_1);
268452367a76SVipul Pandya timer_value_2_and_3 = t4_read_reg(adap, SGE_TIMER_VALUE_2_AND_3);
268552367a76SVipul Pandya timer_value_4_and_5 = t4_read_reg(adap, SGE_TIMER_VALUE_4_AND_5);
268652367a76SVipul Pandya s->timer_val[0] = core_ticks_to_us(adap,
268752367a76SVipul Pandya TIMERVALUE0_GET(timer_value_0_and_1));
268852367a76SVipul Pandya s->timer_val[1] = core_ticks_to_us(adap,
268952367a76SVipul Pandya TIMERVALUE1_GET(timer_value_0_and_1));
269052367a76SVipul Pandya s->timer_val[2] = core_ticks_to_us(adap,
269152367a76SVipul Pandya TIMERVALUE2_GET(timer_value_2_and_3));
269252367a76SVipul Pandya s->timer_val[3] = core_ticks_to_us(adap,
269352367a76SVipul Pandya TIMERVALUE3_GET(timer_value_2_and_3));
269452367a76SVipul Pandya s->timer_val[4] = core_ticks_to_us(adap,
269552367a76SVipul Pandya TIMERVALUE4_GET(timer_value_4_and_5));
269652367a76SVipul Pandya s->timer_val[5] = core_ticks_to_us(adap,
269752367a76SVipul Pandya TIMERVALUE5_GET(timer_value_4_and_5));
269852367a76SVipul Pandya 
269952367a76SVipul Pandya ingress_rx_threshold = t4_read_reg(adap, SGE_INGRESS_RX_THRESHOLD);
270052367a76SVipul Pandya s->counter_val[0] = THRESHOLD_0_GET(ingress_rx_threshold);
270152367a76SVipul Pandya s->counter_val[1] = THRESHOLD_1_GET(ingress_rx_threshold);
270252367a76SVipul Pandya s->counter_val[2] = THRESHOLD_2_GET(ingress_rx_threshold);
270352367a76SVipul Pandya s->counter_val[3] = THRESHOLD_3_GET(ingress_rx_threshold);
270452367a76SVipul Pandya 
270552367a76SVipul Pandya return 0;
270652367a76SVipul Pandya }
270752367a76SVipul Pandya 
270852367a76SVipul Pandya static int t4_sge_init_hard(struct adapter *adap)
270952367a76SVipul Pandya {
271052367a76SVipul Pandya struct sge *s = &adap->sge;
271152367a76SVipul Pandya 
271252367a76SVipul Pandya /*
271352367a76SVipul Pandya * Set up our basic SGE mode to deliver CPL messages to our Ingress
271452367a76SVipul Pandya * Queue and Packet Data to the Free List.
271552367a76SVipul Pandya */
271652367a76SVipul Pandya t4_set_reg_field(adap, SGE_CONTROL, RXPKTCPLMODE_MASK,
271752367a76SVipul Pandya RXPKTCPLMODE_MASK);
2718f7917c00SJeff Kirsher 
27193069ee9bSVipul Pandya /*
27203069ee9bSVipul Pandya * Set up to drop DOORBELL writes when the DOORBELL FIFO overflows
27213069ee9bSVipul Pandya * and generate an interrupt when this occurs so we can recover.
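 * T4 carries both the high- and low-priority thresholds in
 * SGE_DBFIFO_STATUS, while T5 moved the high-priority threshold into
 * SGE_DBFIFO_STATUS2, which is why the chip type is checked below.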
27223069ee9bSVipul Pandya */ 2723d14807ddSHariprasad Shenai if (is_t4(adap->params.chip)) { 2724881806bcSVipul Pandya t4_set_reg_field(adap, A_SGE_DBFIFO_STATUS, 27253069ee9bSVipul Pandya V_HP_INT_THRESH(M_HP_INT_THRESH) | 27263069ee9bSVipul Pandya V_LP_INT_THRESH(M_LP_INT_THRESH), 27273069ee9bSVipul Pandya V_HP_INT_THRESH(dbfifo_int_thresh) | 27283069ee9bSVipul Pandya V_LP_INT_THRESH(dbfifo_int_thresh)); 27290a57a536SSantosh Rastapur } else { 27300a57a536SSantosh Rastapur t4_set_reg_field(adap, A_SGE_DBFIFO_STATUS, 27310a57a536SSantosh Rastapur V_LP_INT_THRESH_T5(M_LP_INT_THRESH_T5), 27320a57a536SSantosh Rastapur V_LP_INT_THRESH_T5(dbfifo_int_thresh)); 27330a57a536SSantosh Rastapur t4_set_reg_field(adap, SGE_DBFIFO_STATUS2, 27340a57a536SSantosh Rastapur V_HP_INT_THRESH_T5(M_HP_INT_THRESH_T5), 27350a57a536SSantosh Rastapur V_HP_INT_THRESH_T5(dbfifo_int_thresh)); 27360a57a536SSantosh Rastapur } 2737881806bcSVipul Pandya t4_set_reg_field(adap, A_SGE_DOORBELL_CONTROL, F_ENABLE_DROP, 2738881806bcSVipul Pandya F_ENABLE_DROP); 2739881806bcSVipul Pandya 274052367a76SVipul Pandya /* 274152367a76SVipul Pandya * SGE_FL_BUFFER_SIZE0 (RX_SMALL_PG_BUF) is set up by 274252367a76SVipul Pandya * t4_fixup_host_params(). 274352367a76SVipul Pandya */ 274452367a76SVipul Pandya s->fl_pg_order = FL_PG_ORDER; 274552367a76SVipul Pandya if (s->fl_pg_order) 274652367a76SVipul Pandya t4_write_reg(adap, 274752367a76SVipul Pandya SGE_FL_BUFFER_SIZE0+RX_LARGE_PG_BUF*sizeof(u32), 274852367a76SVipul Pandya PAGE_SIZE << FL_PG_ORDER); 274952367a76SVipul Pandya t4_write_reg(adap, SGE_FL_BUFFER_SIZE0+RX_SMALL_MTU_BUF*sizeof(u32), 275052367a76SVipul Pandya FL_MTU_SMALL_BUFSIZE(adap)); 275152367a76SVipul Pandya t4_write_reg(adap, SGE_FL_BUFFER_SIZE0+RX_LARGE_MTU_BUF*sizeof(u32), 275252367a76SVipul Pandya FL_MTU_LARGE_BUFSIZE(adap)); 275352367a76SVipul Pandya 275452367a76SVipul Pandya /* 275552367a76SVipul Pandya * Note that the SGE Ingress Packet Count Interrupt Threshold and 275652367a76SVipul Pandya * Timer Holdoff values must be supplied by our caller. 
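 * They are programmed below from s->counter_val[] and s->timer_val[],
 * with the timer values converted from microseconds back into core
 * clock ticks by us_to_core_ticks().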
275752367a76SVipul Pandya */ 2758f7917c00SJeff Kirsher t4_write_reg(adap, SGE_INGRESS_RX_THRESHOLD, 2759f7917c00SJeff Kirsher THRESHOLD_0(s->counter_val[0]) | 2760f7917c00SJeff Kirsher THRESHOLD_1(s->counter_val[1]) | 2761f7917c00SJeff Kirsher THRESHOLD_2(s->counter_val[2]) | 2762f7917c00SJeff Kirsher THRESHOLD_3(s->counter_val[3])); 2763f7917c00SJeff Kirsher t4_write_reg(adap, SGE_TIMER_VALUE_0_AND_1, 2764f7917c00SJeff Kirsher TIMERVALUE0(us_to_core_ticks(adap, s->timer_val[0])) | 2765f7917c00SJeff Kirsher TIMERVALUE1(us_to_core_ticks(adap, s->timer_val[1]))); 2766f7917c00SJeff Kirsher t4_write_reg(adap, SGE_TIMER_VALUE_2_AND_3, 276752367a76SVipul Pandya TIMERVALUE2(us_to_core_ticks(adap, s->timer_val[2])) | 276852367a76SVipul Pandya TIMERVALUE3(us_to_core_ticks(adap, s->timer_val[3]))); 2769f7917c00SJeff Kirsher t4_write_reg(adap, SGE_TIMER_VALUE_4_AND_5, 277052367a76SVipul Pandya TIMERVALUE4(us_to_core_ticks(adap, s->timer_val[4])) | 277152367a76SVipul Pandya TIMERVALUE5(us_to_core_ticks(adap, s->timer_val[5]))); 277252367a76SVipul Pandya 277352367a76SVipul Pandya return 0; 277452367a76SVipul Pandya } 277552367a76SVipul Pandya 277652367a76SVipul Pandya int t4_sge_init(struct adapter *adap) 277752367a76SVipul Pandya { 277852367a76SVipul Pandya struct sge *s = &adap->sge; 2779c2b955e0SKumar Sanghvi u32 sge_control, sge_conm_ctrl; 2780c2b955e0SKumar Sanghvi int ret, egress_threshold; 278152367a76SVipul Pandya 278252367a76SVipul Pandya /* 278352367a76SVipul Pandya * Ingress Padding Boundary and Egress Status Page Size are set up by 278452367a76SVipul Pandya * t4_fixup_host_params(). 278552367a76SVipul Pandya */ 278652367a76SVipul Pandya sge_control = t4_read_reg(adap, SGE_CONTROL); 278752367a76SVipul Pandya s->pktshift = PKTSHIFT_GET(sge_control); 278852367a76SVipul Pandya s->stat_len = (sge_control & EGRSTATUSPAGESIZE_MASK) ? 128 : 64; 278952367a76SVipul Pandya s->fl_align = 1 << (INGPADBOUNDARY_GET(sge_control) + 279052367a76SVipul Pandya X_INGPADBOUNDARY_SHIFT); 279152367a76SVipul Pandya 279252367a76SVipul Pandya if (adap->flags & USING_SOFT_PARAMS) 279352367a76SVipul Pandya ret = t4_sge_init_soft(adap); 279452367a76SVipul Pandya else 279552367a76SVipul Pandya ret = t4_sge_init_hard(adap); 279652367a76SVipul Pandya if (ret < 0) 279752367a76SVipul Pandya return ret; 279852367a76SVipul Pandya 279952367a76SVipul Pandya /* 280052367a76SVipul Pandya * A FL with <= fl_starve_thres buffers is starving and a periodic 280152367a76SVipul Pandya * timer will attempt to refill it. This needs to be larger than the 280252367a76SVipul Pandya * SGE's Egress Congestion Threshold. If it isn't, then we can get 280352367a76SVipul Pandya * stuck waiting for new packets while the SGE is waiting for us to 280452367a76SVipul Pandya * give it more Free List entries. (Note that the SGE's Egress 2805c2b955e0SKumar Sanghvi * Congestion Threshold is in units of 2 Free List pointers.) For T4, 2806c2b955e0SKumar Sanghvi * there was only a single field to control this. For T5 there's the 2807c2b955e0SKumar Sanghvi * original field which now only applies to Unpacked Mode Free List 2808c2b955e0SKumar Sanghvi * buffers and a new field which only applies to Packed Mode Free List 2809c2b955e0SKumar Sanghvi * buffers. 
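 * As a concrete example: if the threshold field read back below is N,
 * a Free List is treated as starving once it is down to 2*N + 1
 * buffers, which is exactly the value fl_starve_thres is set to.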
281052367a76SVipul Pandya */ 2811c2b955e0SKumar Sanghvi sge_conm_ctrl = t4_read_reg(adap, SGE_CONM_CTRL); 2812c2b955e0SKumar Sanghvi if (is_t4(adap->params.chip)) 2813c2b955e0SKumar Sanghvi egress_threshold = EGRTHRESHOLD_GET(sge_conm_ctrl); 2814c2b955e0SKumar Sanghvi else 2815c2b955e0SKumar Sanghvi egress_threshold = EGRTHRESHOLDPACKING_GET(sge_conm_ctrl); 2816c2b955e0SKumar Sanghvi s->fl_starve_thres = 2*egress_threshold + 1; 281752367a76SVipul Pandya 2818f7917c00SJeff Kirsher setup_timer(&s->rx_timer, sge_rx_timer_cb, (unsigned long)adap); 2819f7917c00SJeff Kirsher setup_timer(&s->tx_timer, sge_tx_timer_cb, (unsigned long)adap); 28200f4d201fSKumar Sanghvi s->idma_1s_thresh = core_ticks_per_usec(adap) * 1000000; /* 1 s */ 28210f4d201fSKumar Sanghvi s->idma_stalled[0] = 0; 28220f4d201fSKumar Sanghvi s->idma_stalled[1] = 0; 2823f7917c00SJeff Kirsher spin_lock_init(&s->intrq_lock); 282452367a76SVipul Pandya 282552367a76SVipul Pandya return 0; 2826f7917c00SJeff Kirsher } 2827
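/*
 * Rough usage sketch (illustrative only, not code from this driver): the
 * SGE entry points above are meant to be exercised by the higher-level
 * driver code in roughly the order shown below.  The names "rxq", "txq",
 * "msix_idx", "netdevq" and "my_handler" are hypothetical placeholders,
 * and error handling is omitted for brevity.
 *
 *	err = t4_sge_init(adap);
 *	err = t4_sge_alloc_rxq(adap, &rxq.rspq, false, dev, msix_idx,
 *			       &rxq.fl, my_handler);
 *	err = t4_sge_alloc_eth_txq(adap, &txq, dev, netdevq,
 *				   rxq.rspq.cntxt_id);
 *	t4_sge_start(adap);
 *
 *	...
 *
 *	t4_sge_stop(adap);
 *	t4_free_sge_resources(adap);
 */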