1 /* bnx2x_cmn.c: Broadcom Everest network driver.
2 *
3 * Copyright (c) 2007-2013 Broadcom Corporation
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation.
8 *
9 * Maintained by: Eilon Greenstein <eilong@broadcom.com>
10 * Written by: Eliezer Tamir
11 * Based on code from Michael Chan's bnx2 driver
12 * UDP CSUM errata workaround by Arik Gendelman
13 * Slowpath and fastpath rework by Vladislav Zolotarov
14 * Statistics and Link management by Yitchak Gertner
15 *
16 */
17
18 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19
20 #include <linux/etherdevice.h>
21 #include <linux/if_vlan.h>
22 #include <linux/interrupt.h>
23 #include <linux/ip.h>
24 #include <net/tcp.h>
25 #include <net/ipv6.h>
26 #include <net/ip6_checksum.h>
27 #include <linux/prefetch.h>
28 #include "bnx2x_cmn.h"
29 #include "bnx2x_init.h"
30 #include "bnx2x_sp.h"
31
32 /**
33 * bnx2x_move_fp - move content of the fastpath structure.
34 *
35 * @bp: driver handle
36 * @from: source FP index
37 * @to: destination FP index
38 *
39  * Makes sure the contents of bp->fp[to].napi are kept
40  * intact. This is done by first copying the napi struct from
41  * the target to the source, and then memcpy'ing the entire
42 * source onto the target. Update txdata pointers and related
43 * content.
44 */
45 static inline void bnx2x_move_fp(struct bnx2x *bp, int from, int to)
46 {
47 struct bnx2x_fastpath *from_fp = &bp->fp[from];
48 struct bnx2x_fastpath *to_fp = &bp->fp[to];
49 struct bnx2x_sp_objs *from_sp_objs = &bp->sp_objs[from];
50 struct bnx2x_sp_objs *to_sp_objs = &bp->sp_objs[to];
51 struct bnx2x_fp_stats *from_fp_stats = &bp->fp_stats[from];
52 struct bnx2x_fp_stats *to_fp_stats = &bp->fp_stats[to];
53 int old_max_eth_txqs, new_max_eth_txqs;
54 int old_txdata_index = 0, new_txdata_index = 0;
55
56 /* Copy the NAPI object as it has been already initialized */
57 from_fp->napi = to_fp->napi;
58
59 /* Move bnx2x_fastpath contents */
60 memcpy(to_fp, from_fp, sizeof(*to_fp));
61 to_fp->index = to;
62
63 /* move sp_objs contents as well, as their indices match fp ones */
64 memcpy(to_sp_objs, from_sp_objs, sizeof(*to_sp_objs));
65
66 /* move fp_stats contents as well, as their indices match fp ones */
67 memcpy(to_fp_stats, from_fp_stats, sizeof(*to_fp_stats));
68
69 /* Update txdata pointers in fp and move txdata content accordingly:
70 * Each fp consumes 'max_cos' txdata structures, so the index should be
71 * decremented by max_cos x delta.
72 */
73
74 old_max_eth_txqs = BNX2X_NUM_ETH_QUEUES(bp) * (bp)->max_cos;
75 new_max_eth_txqs = (BNX2X_NUM_ETH_QUEUES(bp) - from + to) *
76 (bp)->max_cos;
77 if (from == FCOE_IDX(bp)) {
78 old_txdata_index = old_max_eth_txqs + FCOE_TXQ_IDX_OFFSET;
79 new_txdata_index = new_max_eth_txqs + FCOE_TXQ_IDX_OFFSET;
80 }
81
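/* With both indices left at zero (the non-FCoE case) the memcpy below is
 * effectively a self-copy; only the FCoE txdata slot actually changes place.
 */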
82 memcpy(&bp->bnx2x_txq[new_txdata_index],
83 &bp->bnx2x_txq[old_txdata_index],
84 sizeof(struct bnx2x_fp_txdata));
85 to_fp->txdata_ptr[0] = &bp->bnx2x_txq[new_txdata_index];
86 }
87
88 /**
89 * bnx2x_fill_fw_str - Fill buffer with FW version string.
90 *
91 * @bp: driver handle
92 * @buf: character buffer to fill with the fw name
93 * @buf_len: length of the above buffer
94 *
95 */
96 void bnx2x_fill_fw_str(struct bnx2x *bp, char *buf, size_t buf_len)
97 {
98 if (IS_PF(bp)) {
99 u8 phy_fw_ver[PHY_FW_VER_LEN];
100
101 phy_fw_ver[0] = '\0';
102 bnx2x_get_ext_phy_fw_version(&bp->link_params,
103 phy_fw_ver, PHY_FW_VER_LEN);
104 strlcpy(buf, bp->fw_ver, buf_len);
105 snprintf(buf + strlen(bp->fw_ver), 32 - strlen(bp->fw_ver),
106 "bc %d.%d.%d%s%s",
107 (bp->common.bc_ver & 0xff0000) >> 16,
108 (bp->common.bc_ver & 0xff00) >> 8,
109 (bp->common.bc_ver & 0xff),
110 ((phy_fw_ver[0] != '\0') ? " phy " : ""), phy_fw_ver);
111 } else {
112 bnx2x_vf_fill_fw_str(bp, buf, buf_len);
113 }
114 }
115
116 /**
117 * bnx2x_shrink_eth_fp - guarantees fastpath structures stay intact
118 *
119 * @bp: driver handle
120 * @delta: number of eth queues which were not allocated
121 */
122 static void bnx2x_shrink_eth_fp(struct bnx2x *bp, int delta)
123 {
124 int i, cos, old_eth_num = BNX2X_NUM_ETH_QUEUES(bp);
125
126 /* Queue pointer cannot be re-set on an fp-basis, as moving pointer
127 * backward along the array could cause memory to be overwritten
128 */
129 for (cos = 1; cos < bp->max_cos; cos++) {
130 for (i = 0; i < old_eth_num - delta; i++) {
131 struct bnx2x_fastpath *fp = &bp->fp[i];
132 int new_idx = cos * (old_eth_num - delta) + i;
133
134 memcpy(&bp->bnx2x_txq[new_idx], fp->txdata_ptr[cos],
135 sizeof(struct bnx2x_fp_txdata));
136 fp->txdata_ptr[cos] = &bp->bnx2x_txq[new_idx];
137 }
138 }
139 }
140
141 int load_count[2][3] = { {0} }; /* per-path: 0-common, 1-port0, 2-port1 */
142
143 /* free skb in the packet ring at pos idx
144 * return idx of last bd freed
145 */
146 static u16 bnx2x_free_tx_pkt(struct bnx2x *bp, struct bnx2x_fp_txdata *txdata,
147 u16 idx, unsigned int *pkts_compl,
148 unsigned int *bytes_compl)
149 {
150 struct sw_tx_bd *tx_buf = &txdata->tx_buf_ring[idx];
151 struct eth_tx_start_bd *tx_start_bd;
152 struct eth_tx_bd *tx_data_bd;
153 struct sk_buff *skb = tx_buf->skb;
154 u16 bd_idx = TX_BD(tx_buf->first_bd), new_cons;
155 int nbd;
156
157 /* prefetch skb end pointer to speedup dev_kfree_skb() */
158 prefetch(&skb->end);
159
160 DP(NETIF_MSG_TX_DONE, "fp[%d]: pkt_idx %d buff @(%p)->skb %p\n",
161 txdata->txq_index, idx, tx_buf, skb);
162
163 /* unmap first bd */
164 tx_start_bd = &txdata->tx_desc_ring[bd_idx].start_bd;
165 dma_unmap_single(&bp->pdev->dev, BD_UNMAP_ADDR(tx_start_bd),
166 BD_UNMAP_LEN(tx_start_bd), DMA_TO_DEVICE);
167
168
169 nbd = le16_to_cpu(tx_start_bd->nbd) - 1;
170 #ifdef BNX2X_STOP_ON_ERROR
171 if ((nbd - 1) > (MAX_SKB_FRAGS + 2)) {
172 BNX2X_ERR("BAD nbd!\n");
173 bnx2x_panic();
174 }
175 #endif
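/* new_cons is the BD consumer index that follows this packet; the caller
 * uses the returned value as the new tx_bd_cons.
 */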
176 new_cons = nbd + tx_buf->first_bd;
177
178 /* Get the next bd */
179 bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
180
181 /* Skip a parse bd... */
182 --nbd;
183 bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
184
185 /* ...and the TSO split header bd since they have no mapping */
186 if (tx_buf->flags & BNX2X_TSO_SPLIT_BD) {
187 --nbd;
188 bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
189 }
190
191 /* now free frags */
192 while (nbd > 0) {
193
194 tx_data_bd = &txdata->tx_desc_ring[bd_idx].reg_bd;
195 dma_unmap_page(&bp->pdev->dev, BD_UNMAP_ADDR(tx_data_bd),
196 BD_UNMAP_LEN(tx_data_bd), DMA_TO_DEVICE);
197 if (--nbd)
198 bd_idx = TX_BD(NEXT_TX_IDX(bd_idx));
199 }
200
201 /* release skb */
202 WARN_ON(!skb);
203 if (likely(skb)) {
204 (*pkts_compl)++;
205 (*bytes_compl) += skb->len;
206 }
207
208 dev_kfree_skb_any(skb);
209 tx_buf->first_bd = 0;
210 tx_buf->skb = NULL;
211
212 return new_cons;
213 }
214
215 int bnx2x_tx_int(struct bnx2x *bp, struct bnx2x_fp_txdata *txdata)
216 {
217 struct netdev_queue *txq;
218 u16 hw_cons, sw_cons, bd_cons = txdata->tx_bd_cons;
219 unsigned int pkts_compl = 0, bytes_compl = 0;
220
221 #ifdef BNX2X_STOP_ON_ERROR
222 if (unlikely(bp->panic))
223 return -1;
224 #endif
225
226 txq = netdev_get_tx_queue(bp->dev, txdata->txq_index);
227 hw_cons = le16_to_cpu(*txdata->tx_cons_sb);
228 sw_cons = txdata->tx_pkt_cons;
229
230 while (sw_cons != hw_cons) {
231 u16 pkt_cons;
232
233 pkt_cons = TX_BD(sw_cons);
234
235 DP(NETIF_MSG_TX_DONE,
236 "queue[%d]: hw_cons %u sw_cons %u pkt_cons %u\n",
237 txdata->txq_index, hw_cons, sw_cons, pkt_cons);
238
239 bd_cons = bnx2x_free_tx_pkt(bp, txdata, pkt_cons,
240 &pkts_compl, &bytes_compl);
241
242 sw_cons++;
243 }
244
245 netdev_tx_completed_queue(txq, pkts_compl, bytes_compl);
246
247 txdata->tx_pkt_cons = sw_cons;
248 txdata->tx_bd_cons = bd_cons;
249
250 /* Need to make the tx_bd_cons update visible to start_xmit()
251 * before checking for netif_tx_queue_stopped(). Without the
252 * memory barrier, there is a small possibility that
253 * start_xmit() will miss it and cause the queue to be stopped
254 * forever.
255 * On the other hand we need an rmb() here to ensure the proper
256 * ordering of bit testing in the following
257 * netif_tx_queue_stopped(txq) call.
258 */
259 smp_mb();
260
261 if (unlikely(netif_tx_queue_stopped(txq))) {
262 /* Taking tx_lock() is needed to prevent reenabling the queue
263 * while it's empty. This could happen if rx_action() gets
264 * suspended in bnx2x_tx_int() after the condition before
265 * netif_tx_wake_queue(), while tx_action (bnx2x_start_xmit()):
266 *
267 * stops the queue->sees fresh tx_bd_cons->releases the queue->
268 * sends some packets consuming the whole queue again->
269 * stops the queue
270 */
271
272 __netif_tx_lock(txq, smp_processor_id());
273
274 if ((netif_tx_queue_stopped(txq)) &&
275 (bp->state == BNX2X_STATE_OPEN) &&
276 (bnx2x_tx_avail(bp, txdata) >= MAX_DESC_PER_TX_PKT))
277 netif_tx_wake_queue(txq);
278
279 __netif_tx_unlock(txq);
280 }
281 return 0;
282 }
283
284 static inline void bnx2x_update_last_max_sge(struct bnx2x_fastpath *fp,
285 u16 idx)
286 {
287 u16 last_max = fp->last_max_sge;
288
289 if (SUB_S16(idx, last_max) > 0)
290 fp->last_max_sge = idx;
291 }
292
293 static inline void bnx2x_update_sge_prod(struct bnx2x_fastpath *fp,
294 u16 sge_len,
295 struct eth_end_agg_rx_cqe *cqe)
296 {
297 struct bnx2x *bp = fp->bp;
298 u16 last_max, last_elem, first_elem;
299 u16 delta = 0;
300 u16 i;
301
302 if (!sge_len)
303 return;
304
305 /* First mark all used pages */
306 for (i = 0; i < sge_len; i++)
307 BIT_VEC64_CLEAR_BIT(fp->sge_mask,
308 RX_SGE(le16_to_cpu(cqe->sgl_or_raw_data.sgl[i])));
309
310 DP(NETIF_MSG_RX_STATUS, "fp_cqe->sgl[%d] = %d\n",
311 sge_len - 1, le16_to_cpu(cqe->sgl_or_raw_data.sgl[sge_len - 1]));
312
313 /* Here we assume that the last SGE index is the biggest */
314 prefetch((void *)(fp->sge_mask));
315 bnx2x_update_last_max_sge(fp,
316 le16_to_cpu(cqe->sgl_or_raw_data.sgl[sge_len - 1]));
317
318 last_max = RX_SGE(fp->last_max_sge);
319 last_elem = last_max >> BIT_VEC64_ELEM_SHIFT;
320 first_elem = RX_SGE(fp->rx_sge_prod) >> BIT_VEC64_ELEM_SHIFT;
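/* last_elem/first_elem index 64-bit words of the sge_mask bit vector. The
 * producer below only advances over words that are fully cleared (all of
 * their SGEs consumed); those words are then re-armed to all ones.
 */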
321
322 /* If ring is not full */
323 if (last_elem + 1 != first_elem)
324 last_elem++;
325
326 /* Now update the prod */
327 for (i = first_elem; i != last_elem; i = NEXT_SGE_MASK_ELEM(i)) {
328 if (likely(fp->sge_mask[i]))
329 break;
330
331 fp->sge_mask[i] = BIT_VEC64_ELEM_ONE_MASK;
332 delta += BIT_VEC64_ELEM_SZ;
333 }
334
335 if (delta > 0) {
336 fp->rx_sge_prod += delta;
337 /* clear page-end entries */
338 bnx2x_clear_sge_mask_next_elems(fp);
339 }
340
341 DP(NETIF_MSG_RX_STATUS,
342 "fp->last_max_sge = %d fp->rx_sge_prod = %d\n",
343 fp->last_max_sge, fp->rx_sge_prod);
344 }
345
346 /* Get Toeplitz hash value in the skb using the value from the
347 * CQE (calculated by HW).
348 */
349 static u32 bnx2x_get_rxhash(const struct bnx2x *bp,
350 const struct eth_fast_path_rx_cqe *cqe,
351 bool *l4_rxhash)
352 {
353 /* Get Toeplitz hash from CQE */
354 if ((bp->dev->features & NETIF_F_RXHASH) &&
355 (cqe->status_flags & ETH_FAST_PATH_RX_CQE_RSS_HASH_FLG)) {
356 enum eth_rss_hash_type htype;
357
358 htype = cqe->status_flags & ETH_FAST_PATH_RX_CQE_RSS_HASH_TYPE;
359 *l4_rxhash = (htype == TCP_IPV4_HASH_TYPE) ||
360 (htype == TCP_IPV6_HASH_TYPE);
361 return le32_to_cpu(cqe->rss_hash_result);
362 }
363 *l4_rxhash = false;
364 return 0;
365 }
366
367 static void bnx2x_tpa_start(struct bnx2x_fastpath *fp, u16 queue,
368 u16 cons, u16 prod,
369 struct eth_fast_path_rx_cqe *cqe)
370 {
371 struct bnx2x *bp = fp->bp;
372 struct sw_rx_bd *cons_rx_buf = &fp->rx_buf_ring[cons];
373 struct sw_rx_bd *prod_rx_buf = &fp->rx_buf_ring[prod];
374 struct eth_rx_bd *prod_bd = &fp->rx_desc_ring[prod];
375 dma_addr_t mapping;
376 struct bnx2x_agg_info *tpa_info = &fp->tpa_info[queue];
377 struct sw_rx_bd *first_buf = &tpa_info->first_buf;
378
379 /* print error if current state != stop */
380 if (tpa_info->tpa_state != BNX2X_TPA_STOP)
381 BNX2X_ERR("start of bin not in stop [%d]\n", queue);
382
383 /* Try to map an empty data buffer from the aggregation info */
384 mapping = dma_map_single(&bp->pdev->dev,
385 first_buf->data + NET_SKB_PAD,
386 fp->rx_buf_size, DMA_FROM_DEVICE);
387 /*
388 * ...if it fails - move the skb from the consumer to the producer
389 * and set the current aggregation state as ERROR to drop it
390 * when TPA_STOP arrives.
391 */
392
393 if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
394 /* Move the BD from the consumer to the producer */
395 bnx2x_reuse_rx_data(fp, cons, prod);
396 tpa_info->tpa_state = BNX2X_TPA_ERROR;
397 return;
398 }
399
400 /* move empty data from pool to prod */
401 prod_rx_buf->data = first_buf->data;
402 dma_unmap_addr_set(prod_rx_buf, mapping, mapping);
403 /* point prod_bd to new data */
404 prod_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
405 prod_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
406
407 /* move partial skb from cons to pool (don't unmap yet) */
408 *first_buf = *cons_rx_buf;
409
410 /* mark bin state as START */
411 tpa_info->parsing_flags =
412 le16_to_cpu(cqe->pars_flags.flags);
413 tpa_info->vlan_tag = le16_to_cpu(cqe->vlan_tag);
414 tpa_info->tpa_state = BNX2X_TPA_START;
415 tpa_info->len_on_bd = le16_to_cpu(cqe->len_on_bd);
416 tpa_info->placement_offset = cqe->placement_offset;
417 tpa_info->rxhash = bnx2x_get_rxhash(bp, cqe, &tpa_info->l4_rxhash);
418 if (fp->mode == TPA_MODE_GRO) {
419 u16 gro_size = le16_to_cpu(cqe->pkt_len_or_gro_seg_len);
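/* full_page is the largest multiple of the MSS (gro_size) that fits in one
 * SGE buffer, so each SGE can be split on MSS boundaries.
 */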
420 tpa_info->full_page = SGE_PAGES / gro_size * gro_size;
421 tpa_info->gro_size = gro_size;
422 }
423
424 #ifdef BNX2X_STOP_ON_ERROR
425 fp->tpa_queue_used |= (1 << queue);
426 #ifdef _ASM_GENERIC_INT_L64_H
427 DP(NETIF_MSG_RX_STATUS, "fp->tpa_queue_used = 0x%lx\n",
428 #else
429 DP(NETIF_MSG_RX_STATUS, "fp->tpa_queue_used = 0x%llx\n",
430 #endif
431 fp->tpa_queue_used);
432 #endif
433 }
434
435 /* Timestamp option length allowed for TPA aggregation:
436 *
437 * nop nop kind length echo val
438 */
439 #define TPA_TSTAMP_OPT_LEN 12
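/* 1 (nop) + 1 (nop) + 1 (kind) + 1 (length) + 4 (TS value) + 4 (TS echo reply) = 12 bytes */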
440 /**
441 * bnx2x_set_gro_params - compute GRO values
442 *
443 * @skb: packet skb
444 * @parsing_flags: parsing flags from the START CQE
445 * @len_on_bd: total length of the first packet for the
446 * aggregation.
447 * @pkt_len: length of all segments
448 *
449 * Approximate value of the MSS for this aggregation, calculated using
450 * its first packet.
451 * Compute the number of aggregated segments and the gso_type.
452 */
453 static void bnx2x_set_gro_params(struct sk_buff *skb, u16 parsing_flags,
454 u16 len_on_bd, unsigned int pkt_len,
455 u16 num_of_coalesced_segs)
456 {
457 /* TPA aggregation won't have either IP options or TCP options
458 * other than timestamp or IPv6 extension headers.
459 */
460 u16 hdrs_len = ETH_HLEN + sizeof(struct tcphdr);
461
462 if (GET_FLAG(parsing_flags, PARSING_FLAGS_OVER_ETHERNET_PROTOCOL) ==
463 PRS_FLAG_OVERETH_IPV6) {
464 hdrs_len += sizeof(struct ipv6hdr);
465 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6;
466 } else {
467 hdrs_len += sizeof(struct iphdr);
468 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4;
469 }
470
471 /* Check if there was a TCP timestamp; if there is one, it will
472 * always be 12 bytes long: nop nop kind length echo val.
473 *
474 * Otherwise FW would close the aggregation.
475 */
476 if (parsing_flags & PARSING_FLAGS_TIME_STAMP_EXIST_FLAG)
477 hdrs_len += TPA_TSTAMP_OPT_LEN;
478
479 skb_shinfo(skb)->gso_size = len_on_bd - hdrs_len;
480
481 /* tcp_gro_complete() will copy NAPI_GRO_CB(skb)->count
482 * to skb_shinfo(skb)->gso_segs
483 */
484 NAPI_GRO_CB(skb)->count = num_of_coalesced_segs;
485 }
486
487 static int bnx2x_alloc_rx_sge(struct bnx2x *bp,
488 struct bnx2x_fastpath *fp, u16 index)
489 {
490 struct page *page = alloc_pages(GFP_ATOMIC, PAGES_PER_SGE_SHIFT);
491 struct sw_rx_page *sw_buf = &fp->rx_page_ring[index];
492 struct eth_rx_sge *sge = &fp->rx_sge_ring[index];
493 dma_addr_t mapping;
494
495 if (unlikely(page == NULL)) {
496 BNX2X_ERR("Can't alloc sge\n");
497 return -ENOMEM;
498 }
499
500 mapping = dma_map_page(&bp->pdev->dev, page, 0,
501 SGE_PAGES, DMA_FROM_DEVICE);
502 if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
503 __free_pages(page, PAGES_PER_SGE_SHIFT);
504 BNX2X_ERR("Can't map sge\n");
505 return -ENOMEM;
506 }
507
508 sw_buf->page = page;
509 dma_unmap_addr_set(sw_buf, mapping, mapping);
510
511 sge->addr_hi = cpu_to_le32(U64_HI(mapping));
512 sge->addr_lo = cpu_to_le32(U64_LO(mapping));
513
514 return 0;
515 }
516
517 static int bnx2x_fill_frag_skb(struct bnx2x *bp, struct bnx2x_fastpath *fp,
518 struct bnx2x_agg_info *tpa_info,
519 u16 pages,
520 struct sk_buff *skb,
521 struct eth_end_agg_rx_cqe *cqe,
522 u16 cqe_idx)
523 {
524 struct sw_rx_page *rx_pg, old_rx_pg;
525 u32 i, frag_len, frag_size;
526 int err, j, frag_id = 0;
527 u16 len_on_bd = tpa_info->len_on_bd;
528 u16 full_page = 0, gro_size = 0;
529
530 frag_size = le16_to_cpu(cqe->pkt_len) - len_on_bd;
531
532 if (fp->mode == TPA_MODE_GRO) {
533 gro_size = tpa_info->gro_size;
534 full_page = tpa_info->full_page;
535 }
536
537 /* This is needed in order to enable forwarding support */
538 if (frag_size)
539 bnx2x_set_gro_params(skb, tpa_info->parsing_flags, len_on_bd,
540 le16_to_cpu(cqe->pkt_len),
541 le16_to_cpu(cqe->num_of_coalesced_segs));
542
543 #ifdef BNX2X_STOP_ON_ERROR
544 if (pages > min_t(u32, 8, MAX_SKB_FRAGS) * SGE_PAGES) {
545 BNX2X_ERR("SGL length is too long: %d. CQE index is %d\n",
546 pages, cqe_idx);
547 BNX2X_ERR("cqe->pkt_len = %d\n", cqe->pkt_len);
548 bnx2x_panic();
549 return -EINVAL;
550 }
551 #endif
552
553 /* Run through the SGL and compose the fragmented skb */
554 for (i = 0, j = 0; i < pages; i += PAGES_PER_SGE, j++) {
555 u16 sge_idx = RX_SGE(le16_to_cpu(cqe->sgl_or_raw_data.sgl[j]));
556
557 /* FW gives the indices of the SGE as if the ring is an array
558 (meaning that "next" element will consume 2 indices) */
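/* In GRO mode each SGE contributes at most full_page bytes (a whole number
 * of MSS-sized chunks); in LRO mode it may hold up to SGE_PAGES bytes.
 */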
559 if (fp->mode == TPA_MODE_GRO)
560 frag_len = min_t(u32, frag_size, (u32)full_page);
561 else /* LRO */
562 frag_len = min_t(u32, frag_size, (u32)SGE_PAGES);
563
564 rx_pg = &fp->rx_page_ring[sge_idx];
565 old_rx_pg = *rx_pg;
566
567 /* If we fail to allocate a substitute page, we simply stop
568 where we are and drop the whole packet */
569 err = bnx2x_alloc_rx_sge(bp, fp, sge_idx);
570 if (unlikely(err)) {
571 bnx2x_fp_qstats(bp, fp)->rx_skb_alloc_failed++;
572 return err;
573 }
574
575 /* Unmap the page as we are going to pass it to the stack */
576 dma_unmap_page(&bp->pdev->dev,
577 dma_unmap_addr(&old_rx_pg, mapping),
578 SGE_PAGES, DMA_FROM_DEVICE);
579 /* Add one frag and update the appropriate fields in the skb */
580 if (fp->mode == TPA_MODE_LRO)
581 skb_fill_page_desc(skb, j, old_rx_pg.page, 0, frag_len);
582 else { /* GRO */
583 int rem;
584 int offset = 0;
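/* Split this SGE into MSS-sized frags. Each additional frag pointing into
 * the same page needs its own page reference, since the stack releases one
 * reference per frag.
 */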
585 for (rem = frag_len; rem > 0; rem -= gro_size) {
586 int len = rem > gro_size ? gro_size : rem;
587 skb_fill_page_desc(skb, frag_id++,
588 old_rx_pg.page, offset, len);
589 if (offset)
590 get_page(old_rx_pg.page);
591 offset += len;
592 }
593 }
594
595 skb->data_len += frag_len;
596 skb->truesize += SGE_PAGES;
597 skb->len += frag_len;
598
599 frag_size -= frag_len;
600 }
601
602 return 0;
603 }
604
605 static void bnx2x_frag_free(const struct bnx2x_fastpath *fp, void *data)
606 {
607 if (fp->rx_frag_size)
608 put_page(virt_to_head_page(data));
609 else
610 kfree(data);
611 }
612
613 static void *bnx2x_frag_alloc(const struct bnx2x_fastpath *fp)
614 {
615 if (fp->rx_frag_size)
616 return netdev_alloc_frag(fp->rx_frag_size);
617
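/* rx_frag_size == 0 means the buffer is too big for a page fragment
 * (see bnx2x_set_rx_buf_size()), so fall back to kmalloc().
 */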
618 return kmalloc(fp->rx_buf_size + NET_SKB_PAD, GFP_ATOMIC);
619 }
620
621 #ifdef CONFIG_INET
622 static void bnx2x_gro_ip_csum(struct bnx2x *bp, struct sk_buff *skb)
623 {
624 const struct iphdr *iph = ip_hdr(skb);
625 struct tcphdr *th;
626
627 skb_set_transport_header(skb, sizeof(struct iphdr));
628 th = tcp_hdr(skb);
629
630 th->check = ~tcp_v4_check(skb->len - skb_transport_offset(skb),
631 iph->saddr, iph->daddr, 0);
632 }
633
634 static void bnx2x_gro_ipv6_csum(struct bnx2x *bp, struct sk_buff *skb)
635 {
636 struct ipv6hdr *iph = ipv6_hdr(skb);
637 struct tcphdr *th;
638
639 skb_set_transport_header(skb, sizeof(struct ipv6hdr));
640 th = tcp_hdr(skb);
641
642 th->check = ~tcp_v6_check(skb->len - skb_transport_offset(skb),
643 &iph->saddr, &iph->daddr, 0);
644 }
645
646 static void bnx2x_gro_csum(struct bnx2x *bp, struct sk_buff *skb,
647 void (*gro_func)(struct bnx2x*, struct sk_buff*))
648 {
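/* The FW-aggregated frame carries no valid TCP checksum; seeding th->check
 * with the pseudo-header checksum lets tcp_gro_complete() hand the skb up
 * as a regular GSO packet.
 */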
649 skb_set_network_header(skb, 0);
650 gro_func(bp, skb);
651 tcp_gro_complete(skb);
652 }
653 #endif
654
655 static void bnx2x_gro_receive(struct bnx2x *bp, struct bnx2x_fastpath *fp,
656 struct sk_buff *skb)
657 {
658 #ifdef CONFIG_INET
659 if (skb_shinfo(skb)->gso_size) {
660 switch (be16_to_cpu(skb->protocol)) {
661 case ETH_P_IP:
662 bnx2x_gro_csum(bp, skb, bnx2x_gro_ip_csum);
663 break;
664 case ETH_P_IPV6:
665 bnx2x_gro_csum(bp, skb, bnx2x_gro_ipv6_csum);
666 break;
667 default:
668 BNX2X_ERR("Error: FW GRO supports only IPv4/IPv6, not 0x%04x\n",
669 be16_to_cpu(skb->protocol));
670 }
671 }
672 #endif
673 napi_gro_receive(&fp->napi, skb);
674 }
675
676 static void bnx2x_tpa_stop(struct bnx2x *bp, struct bnx2x_fastpath *fp,
677 struct bnx2x_agg_info *tpa_info,
678 u16 pages,
679 struct eth_end_agg_rx_cqe *cqe,
680 u16 cqe_idx)
681 {
682 struct sw_rx_bd *rx_buf = &tpa_info->first_buf;
683 u8 pad = tpa_info->placement_offset;
684 u16 len = tpa_info->len_on_bd;
685 struct sk_buff *skb = NULL;
686 u8 *new_data, *data = rx_buf->data;
687 u8 old_tpa_state = tpa_info->tpa_state;
688
689 tpa_info->tpa_state = BNX2X_TPA_STOP;
690
691 /* If there was an error during the handling of the TPA_START -
692 * drop this aggregation.
693 */
694 if (old_tpa_state == BNX2X_TPA_ERROR)
695 goto drop;
696
697 /* Try to allocate the new data */
698 new_data = bnx2x_frag_alloc(fp);
699 /* Unmap skb in the pool anyway, as we are going to change
700 pool entry status to BNX2X_TPA_STOP even if new skb allocation
701 fails. */
702 dma_unmap_single(&bp->pdev->dev, dma_unmap_addr(rx_buf, mapping),
703 fp->rx_buf_size, DMA_FROM_DEVICE);
704 if (likely(new_data))
705 skb = build_skb(data, fp->rx_frag_size);
706
707 if (likely(skb)) {
708 #ifdef BNX2X_STOP_ON_ERROR
709 if (pad + len > fp->rx_buf_size) {
710 BNX2X_ERR("skb_put is about to fail... pad %d len %d rx_buf_size %d\n",
711 pad, len, fp->rx_buf_size);
712 bnx2x_panic();
713 return;
714 }
715 #endif
716
717 skb_reserve(skb, pad + NET_SKB_PAD);
718 skb_put(skb, len);
719 skb->rxhash = tpa_info->rxhash;
720 skb->l4_rxhash = tpa_info->l4_rxhash;
721
722 skb->protocol = eth_type_trans(skb, bp->dev);
723 skb->ip_summed = CHECKSUM_UNNECESSARY;
724
725 if (!bnx2x_fill_frag_skb(bp, fp, tpa_info, pages,
726 skb, cqe, cqe_idx)) {
727 if (tpa_info->parsing_flags & PARSING_FLAGS_VLAN)
728 __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q), tpa_info->vlan_tag);
729 bnx2x_gro_receive(bp, fp, skb);
730 } else {
731 DP(NETIF_MSG_RX_STATUS,
732 "Failed to allocate new pages - dropping packet!\n");
733 dev_kfree_skb_any(skb);
734 }
735
736
737 /* put new data in bin */
738 rx_buf->data = new_data;
739
740 return;
741 }
742 bnx2x_frag_free(fp, new_data);
743 drop:
744 /* drop the packet and keep the buffer in the bin */
745 DP(NETIF_MSG_RX_STATUS,
746 "Failed to allocate or map a new skb - dropping packet!\n");
747 bnx2x_fp_stats(bp, fp)->eth_q_stats.rx_skb_alloc_failed++;
748 }
749
750 static int bnx2x_alloc_rx_data(struct bnx2x *bp,
751 struct bnx2x_fastpath *fp, u16 index)
752 {
753 u8 *data;
754 struct sw_rx_bd *rx_buf = &fp->rx_buf_ring[index];
755 struct eth_rx_bd *rx_bd = &fp->rx_desc_ring[index];
756 dma_addr_t mapping;
757
758 data = bnx2x_frag_alloc(fp);
759 if (unlikely(data == NULL))
760 return -ENOMEM;
761
762 mapping = dma_map_single(&bp->pdev->dev, data + NET_SKB_PAD,
763 fp->rx_buf_size,
764 DMA_FROM_DEVICE);
765 if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
766 bnx2x_frag_free(fp, data);
767 BNX2X_ERR("Can't map rx data\n");
768 return -ENOMEM;
769 }
770
771 rx_buf->data = data;
772 dma_unmap_addr_set(rx_buf, mapping, mapping);
773
774 rx_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
775 rx_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
776
777 return 0;
778 }
779
780 static
781 void bnx2x_csum_validate(struct sk_buff *skb, union eth_rx_cqe *cqe,
782 struct bnx2x_fastpath *fp,
783 struct bnx2x_eth_q_stats *qstats)
784 {
785 /* Do nothing if no L4 csum validation was done.
786 * We do not check whether IP csum was validated. For IPv4 we assume
787 * that if the card got as far as validating the L4 csum, it also
788 * validated the IP csum. IPv6 has no IP csum.
789 */
790 if (cqe->fast_path_cqe.status_flags &
791 ETH_FAST_PATH_RX_CQE_L4_XSUM_NO_VALIDATION_FLG)
792 return;
793
794 /* If L4 validation was done, check if an error was found. */
795
796 if (cqe->fast_path_cqe.type_error_flags &
797 (ETH_FAST_PATH_RX_CQE_IP_BAD_XSUM_FLG |
798 ETH_FAST_PATH_RX_CQE_L4_BAD_XSUM_FLG))
799 qstats->hw_csum_err++;
800 else
801 skb->ip_summed = CHECKSUM_UNNECESSARY;
802 }
803
804 int bnx2x_rx_int(struct bnx2x_fastpath *fp, int budget)
805 {
806 struct bnx2x *bp = fp->bp;
807 u16 bd_cons, bd_prod, bd_prod_fw, comp_ring_cons;
808 u16 hw_comp_cons, sw_comp_cons, sw_comp_prod;
809 int rx_pkt = 0;
810
811 #ifdef BNX2X_STOP_ON_ERROR
812 if (unlikely(bp->panic))
813 return 0;
814 #endif
815
816 /* CQ "next element" is of the size of the regular element,
817 that's why it's ok here */
818 hw_comp_cons = le16_to_cpu(*fp->rx_cons_sb);
819 if ((hw_comp_cons & MAX_RCQ_DESC_CNT) == MAX_RCQ_DESC_CNT)
820 hw_comp_cons++;
821
822 bd_cons = fp->rx_bd_cons;
823 bd_prod = fp->rx_bd_prod;
824 bd_prod_fw = bd_prod;
825 sw_comp_cons = fp->rx_comp_cons;
826 sw_comp_prod = fp->rx_comp_prod;
827
828 /* Memory barrier necessary as speculative reads of the rx
829 * buffer can be ahead of the index in the status block
830 */
831 rmb();
832
833 DP(NETIF_MSG_RX_STATUS,
834 "queue[%d]: hw_comp_cons %u sw_comp_cons %u\n",
835 fp->index, hw_comp_cons, sw_comp_cons);
836
837 while (sw_comp_cons != hw_comp_cons) {
838 struct sw_rx_bd *rx_buf = NULL;
839 struct sk_buff *skb;
840 union eth_rx_cqe *cqe;
841 struct eth_fast_path_rx_cqe *cqe_fp;
842 u8 cqe_fp_flags;
843 enum eth_rx_cqe_type cqe_fp_type;
844 u16 len, pad, queue;
845 u8 *data;
846 bool l4_rxhash;
847
848 #ifdef BNX2X_STOP_ON_ERROR
849 if (unlikely(bp->panic))
850 return 0;
851 #endif
852
853 comp_ring_cons = RCQ_BD(sw_comp_cons);
854 bd_prod = RX_BD(bd_prod);
855 bd_cons = RX_BD(bd_cons);
856
857 cqe = &fp->rx_comp_ring[comp_ring_cons];
858 cqe_fp = &cqe->fast_path_cqe;
859 cqe_fp_flags = cqe_fp->type_error_flags;
860 cqe_fp_type = cqe_fp_flags & ETH_FAST_PATH_RX_CQE_TYPE;
861
862 DP(NETIF_MSG_RX_STATUS,
863 "CQE type %x err %x status %x queue %x vlan %x len %u\n",
864 CQE_TYPE(cqe_fp_flags),
865 cqe_fp_flags, cqe_fp->status_flags,
866 le32_to_cpu(cqe_fp->rss_hash_result),
867 le16_to_cpu(cqe_fp->vlan_tag),
868 le16_to_cpu(cqe_fp->pkt_len_or_gro_seg_len));
869
870 /* is this a slowpath msg? */
871 if (unlikely(CQE_TYPE_SLOW(cqe_fp_type))) {
872 bnx2x_sp_event(fp, cqe);
873 goto next_cqe;
874 }
875
876 rx_buf = &fp->rx_buf_ring[bd_cons];
877 data = rx_buf->data;
878
879 if (!CQE_TYPE_FAST(cqe_fp_type)) {
880 struct bnx2x_agg_info *tpa_info;
881 u16 frag_size, pages;
882 #ifdef BNX2X_STOP_ON_ERROR
883 /* sanity check */
884 if (fp->disable_tpa &&
885 (CQE_TYPE_START(cqe_fp_type) ||
886 CQE_TYPE_STOP(cqe_fp_type)))
887 BNX2X_ERR("START/STOP packet while disable_tpa type %x\n",
888 CQE_TYPE(cqe_fp_type));
889 #endif
890
891 if (CQE_TYPE_START(cqe_fp_type)) {
892 u16 queue = cqe_fp->queue_index;
893 DP(NETIF_MSG_RX_STATUS,
894 "calling tpa_start on queue %d\n",
895 queue);
896
897 bnx2x_tpa_start(fp, queue,
898 bd_cons, bd_prod,
899 cqe_fp);
900
901 goto next_rx;
902
903 }
904 queue = cqe->end_agg_cqe.queue_index;
905 tpa_info = &fp->tpa_info[queue];
906 DP(NETIF_MSG_RX_STATUS,
907 "calling tpa_stop on queue %d\n",
908 queue);
909
910 frag_size = le16_to_cpu(cqe->end_agg_cqe.pkt_len) -
911 tpa_info->len_on_bd;
912
913 if (fp->mode == TPA_MODE_GRO)
914 pages = (frag_size + tpa_info->full_page - 1) /
915 tpa_info->full_page;
916 else
917 pages = SGE_PAGE_ALIGN(frag_size) >>
918 SGE_PAGE_SHIFT;
919
920 bnx2x_tpa_stop(bp, fp, tpa_info, pages,
921 &cqe->end_agg_cqe, comp_ring_cons);
922 #ifdef BNX2X_STOP_ON_ERROR
923 if (bp->panic)
924 return 0;
925 #endif
926
927 bnx2x_update_sge_prod(fp, pages, &cqe->end_agg_cqe);
928 goto next_cqe;
929 }
930 /* non TPA */
931 len = le16_to_cpu(cqe_fp->pkt_len_or_gro_seg_len);
932 pad = cqe_fp->placement_offset;
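/* Sync only the header area for the CPU - enough for the copy-break path
 * below; larger packets are fully unmapped (and thus synced) before being
 * passed up the stack.
 */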
933 dma_sync_single_for_cpu(&bp->pdev->dev,
934 dma_unmap_addr(rx_buf, mapping),
935 pad + RX_COPY_THRESH,
936 DMA_FROM_DEVICE);
937 pad += NET_SKB_PAD;
938 prefetch(data + pad); /* speedup eth_type_trans() */
939 /* is this an error packet? */
940 if (unlikely(cqe_fp_flags & ETH_RX_ERROR_FALGS)) {
941 DP(NETIF_MSG_RX_ERR | NETIF_MSG_RX_STATUS,
942 "ERROR flags %x rx packet %u\n",
943 cqe_fp_flags, sw_comp_cons);
944 bnx2x_fp_qstats(bp, fp)->rx_err_discard_pkt++;
945 goto reuse_rx;
946 }
947
948 /* Since we don't have a jumbo ring
949 * copy small packets if mtu > 1500
950 */
951 if ((bp->dev->mtu > ETH_MAX_PACKET_SIZE) &&
952 (len <= RX_COPY_THRESH)) {
953 skb = netdev_alloc_skb_ip_align(bp->dev, len);
954 if (skb == NULL) {
955 DP(NETIF_MSG_RX_ERR | NETIF_MSG_RX_STATUS,
956 "ERROR packet dropped because of alloc failure\n");
957 bnx2x_fp_qstats(bp, fp)->rx_skb_alloc_failed++;
958 goto reuse_rx;
959 }
960 memcpy(skb->data, data + pad, len);
961 bnx2x_reuse_rx_data(fp, bd_cons, bd_prod);
962 } else {
963 if (likely(bnx2x_alloc_rx_data(bp, fp, bd_prod) == 0)) {
964 dma_unmap_single(&bp->pdev->dev,
965 dma_unmap_addr(rx_buf, mapping),
966 fp->rx_buf_size,
967 DMA_FROM_DEVICE);
968 skb = build_skb(data, fp->rx_frag_size);
969 if (unlikely(!skb)) {
970 bnx2x_frag_free(fp, data);
971 bnx2x_fp_qstats(bp, fp)->
972 rx_skb_alloc_failed++;
973 goto next_rx;
974 }
975 skb_reserve(skb, pad);
976 } else {
977 DP(NETIF_MSG_RX_ERR | NETIF_MSG_RX_STATUS,
978 "ERROR packet dropped because of alloc failure\n");
979 bnx2x_fp_qstats(bp, fp)->rx_skb_alloc_failed++;
980 reuse_rx:
981 bnx2x_reuse_rx_data(fp, bd_cons, bd_prod);
982 goto next_rx;
983 }
984 }
985
986 skb_put(skb, len);
987 skb->protocol = eth_type_trans(skb, bp->dev);
988
989 /* Set Toeplitz hash for a non-LRO skb */
990 skb->rxhash = bnx2x_get_rxhash(bp, cqe_fp, &l4_rxhash);
991 skb->l4_rxhash = l4_rxhash;
992
993 skb_checksum_none_assert(skb);
994
995 if (bp->dev->features & NETIF_F_RXCSUM)
996 bnx2x_csum_validate(skb, cqe, fp,
997 bnx2x_fp_qstats(bp, fp));
998
999 skb_record_rx_queue(skb, fp->rx_queue);
1000
1001 if (le16_to_cpu(cqe_fp->pars_flags.flags) &
1002 PARSING_FLAGS_VLAN)
1003 __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
1004 le16_to_cpu(cqe_fp->vlan_tag));
1005 napi_gro_receive(&fp->napi, skb);
1006
1007
1008 next_rx:
1009 rx_buf->data = NULL;
1010
1011 bd_cons = NEXT_RX_IDX(bd_cons);
1012 bd_prod = NEXT_RX_IDX(bd_prod);
1013 bd_prod_fw = NEXT_RX_IDX(bd_prod_fw);
1014 rx_pkt++;
1015 next_cqe:
1016 sw_comp_prod = NEXT_RCQ_IDX(sw_comp_prod);
1017 sw_comp_cons = NEXT_RCQ_IDX(sw_comp_cons);
1018
1019 if (rx_pkt == budget)
1020 break;
1021 } /* while */
1022
1023 fp->rx_bd_cons = bd_cons;
1024 fp->rx_bd_prod = bd_prod_fw;
1025 fp->rx_comp_cons = sw_comp_cons;
1026 fp->rx_comp_prod = sw_comp_prod;
1027
1028 /* Update producers */
1029 bnx2x_update_rx_prod(bp, fp, bd_prod_fw, sw_comp_prod,
1030 fp->rx_sge_prod);
1031
1032 fp->rx_pkt += rx_pkt;
1033 fp->rx_calls++;
1034
1035 return rx_pkt;
1036 }
1037
1038 static irqreturn_t bnx2x_msix_fp_int(int irq, void *fp_cookie)
1039 {
1040 struct bnx2x_fastpath *fp = fp_cookie;
1041 struct bnx2x *bp = fp->bp;
1042 u8 cos;
1043
1044 DP(NETIF_MSG_INTR,
1045 "got an MSI-X interrupt on IDX:SB [fp %d fw_sd %d igusb %d]\n",
1046 fp->index, fp->fw_sb_id, fp->igu_sb_id);
1047
1048 bnx2x_ack_sb(bp, fp->igu_sb_id, USTORM_ID, 0, IGU_INT_DISABLE, 0);
1049
1050 #ifdef BNX2X_STOP_ON_ERROR
1051 if (unlikely(bp->panic))
1052 return IRQ_HANDLED;
1053 #endif
1054
1055 /* Handle Rx and Tx according to MSI-X vector */
1056 prefetch(fp->rx_cons_sb);
1057
1058 for_each_cos_in_tx_queue(fp, cos)
1059 prefetch(fp->txdata_ptr[cos]->tx_cons_sb);
1060
1061 prefetch(&fp->sb_running_index[SM_RX_ID]);
1062 napi_schedule(&bnx2x_fp(bp, fp->index, napi));
1063
1064 return IRQ_HANDLED;
1065 }
1066
1067 /* HW Lock for shared dual port PHYs */
1068 void bnx2x_acquire_phy_lock(struct bnx2x *bp)
1069 {
1070 mutex_lock(&bp->port.phy_mutex);
1071
1072 bnx2x_acquire_hw_lock(bp, HW_LOCK_RESOURCE_MDIO);
1073 }
1074
1075 void bnx2x_release_phy_lock(struct bnx2x *bp)
1076 {
1077 bnx2x_release_hw_lock(bp, HW_LOCK_RESOURCE_MDIO);
1078
1079 mutex_unlock(&bp->port.phy_mutex);
1080 }
1081
1082 /* calculates MF speed according to current linespeed and MF configuration */
1083 u16 bnx2x_get_mf_speed(struct bnx2x *bp)
1084 {
1085 u16 line_speed = bp->link_vars.line_speed;
1086 if (IS_MF(bp)) {
1087 u16 maxCfg = bnx2x_extract_max_cfg(bp,
1088 bp->mf_config[BP_VN(bp)]);
1089
1090 /* Calculate the current MAX line speed limit for the MF
1091 * devices
1092 */
1093 if (IS_MF_SI(bp))
1094 line_speed = (line_speed * maxCfg) / 100;
1095 else { /* SD mode */
1096 u16 vn_max_rate = maxCfg * 100;
1097
1098 if (vn_max_rate < line_speed)
1099 line_speed = vn_max_rate;
1100 }
1101 }
1102
1103 return line_speed;
1104 }
1105
1106 /**
1107 * bnx2x_fill_report_data - fill link report data to report
1108 *
1109 * @bp: driver handle
1110 * @data: link state to update
1111 *
1112 * It uses non-atomic bit operations because it is called under the mutex.
1113 */
1114 static void bnx2x_fill_report_data(struct bnx2x *bp,
1115 struct bnx2x_link_report_data *data)
1116 {
1117 u16 line_speed = bnx2x_get_mf_speed(bp);
1118
1119 memset(data, 0, sizeof(*data));
1120
1121 /* Fill the report data: effective line speed */
1122 data->line_speed = line_speed;
1123
1124 /* Link is down */
1125 if (!bp->link_vars.link_up || (bp->flags & MF_FUNC_DIS))
1126 __set_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1127 &data->link_report_flags);
1128
1129 /* Full DUPLEX */
1130 if (bp->link_vars.duplex == DUPLEX_FULL)
1131 __set_bit(BNX2X_LINK_REPORT_FD, &data->link_report_flags);
1132
1133 /* Rx Flow Control is ON */
1134 if (bp->link_vars.flow_ctrl & BNX2X_FLOW_CTRL_RX)
1135 __set_bit(BNX2X_LINK_REPORT_RX_FC_ON, &data->link_report_flags);
1136
1137 /* Tx Flow Control is ON */
1138 if (bp->link_vars.flow_ctrl & BNX2X_FLOW_CTRL_TX)
1139 __set_bit(BNX2X_LINK_REPORT_TX_FC_ON, &data->link_report_flags);
1140 }
1141
1142 /**
1143 * bnx2x_link_report - report link status to OS.
1144 *
1145 * @bp: driver handle
1146 *
1147 * Calls the __bnx2x_link_report() under the same locking scheme
1148 * as a link/PHY state managing code to ensure a consistent link
1149 * reporting.
1150 */
1151
1152 void bnx2x_link_report(struct bnx2x *bp)
1153 {
1154 bnx2x_acquire_phy_lock(bp);
1155 __bnx2x_link_report(bp);
1156 bnx2x_release_phy_lock(bp);
1157 }
1158
1159 /**
1160 * __bnx2x_link_report - report link status to OS.
1161 *
1162 * @bp: driver handle
1163 *
1164 * Non-atomic implementation.
1165 * Should be called under the phy_lock.
1166 */
1167 void __bnx2x_link_report(struct bnx2x *bp)
1168 {
1169 struct bnx2x_link_report_data cur_data;
1170
1171 /* reread mf_cfg */
1172 if (IS_PF(bp) && !CHIP_IS_E1(bp))
1173 bnx2x_read_mf_cfg(bp);
1174
1175 /* Read the current link report info */
1176 bnx2x_fill_report_data(bp, &cur_data);
1177
1178 /* Don't report link down or exactly the same link status twice */
1179 if (!memcmp(&cur_data, &bp->last_reported_link, sizeof(cur_data)) ||
1180 (test_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1181 &bp->last_reported_link.link_report_flags) &&
1182 test_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1183 &cur_data.link_report_flags)))
1184 return;
1185
1186 bp->link_cnt++;
1187
1188 /* We are going to report new link parameters now -
1189 * remember the current data for the next time.
1190 */
1191 memcpy(&bp->last_reported_link, &cur_data, sizeof(cur_data));
1192
1193 if (test_bit(BNX2X_LINK_REPORT_LINK_DOWN,
1194 &cur_data.link_report_flags)) {
1195 netif_carrier_off(bp->dev);
1196 netdev_err(bp->dev, "NIC Link is Down\n");
1197 return;
1198 } else {
1199 const char *duplex;
1200 const char *flow;
1201
1202 netif_carrier_on(bp->dev);
1203
1204 if (test_and_clear_bit(BNX2X_LINK_REPORT_FD,
1205 &cur_data.link_report_flags))
1206 duplex = "full";
1207 else
1208 duplex = "half";
1209
1210 /* Handle the FC at the end so that only these flags would be
1211 * possibly set. This way we may easily check if there is no FC
1212 * enabled.
1213 */
1214 if (cur_data.link_report_flags) {
1215 if (test_bit(BNX2X_LINK_REPORT_RX_FC_ON,
1216 &cur_data.link_report_flags)) {
1217 if (test_bit(BNX2X_LINK_REPORT_TX_FC_ON,
1218 &cur_data.link_report_flags))
1219 flow = "ON - receive & transmit";
1220 else
1221 flow = "ON - receive";
1222 } else {
1223 flow = "ON - transmit";
1224 }
1225 } else {
1226 flow = "none";
1227 }
1228 netdev_info(bp->dev, "NIC Link is Up, %d Mbps %s duplex, Flow control: %s\n",
1229 cur_data.line_speed, duplex, flow);
1230 }
1231 }
1232
1233 static void bnx2x_set_next_page_sgl(struct bnx2x_fastpath *fp)
1234 {
1235 int i;
1236
1237 for (i = 1; i <= NUM_RX_SGE_PAGES; i++) {
1238 struct eth_rx_sge *sge;
1239
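/* The trailing descriptors of each SGE page are reserved as a "next page"
 * link rather than real SGEs; point each page at the one after it,
 * wrapping back to the first page at the end of the ring.
 */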
1240 sge = &fp->rx_sge_ring[RX_SGE_CNT * i - 2];
1241 sge->addr_hi =
1242 cpu_to_le32(U64_HI(fp->rx_sge_mapping +
1243 BCM_PAGE_SIZE*(i % NUM_RX_SGE_PAGES)));
1244
1245 sge->addr_lo =
1246 cpu_to_le32(U64_LO(fp->rx_sge_mapping +
1247 BCM_PAGE_SIZE*(i % NUM_RX_SGE_PAGES)));
1248 }
1249 }
1250
1251 static void bnx2x_free_tpa_pool(struct bnx2x *bp,
1252 struct bnx2x_fastpath *fp, int last)
1253 {
1254 int i;
1255
1256 for (i = 0; i < last; i++) {
1257 struct bnx2x_agg_info *tpa_info = &fp->tpa_info[i];
1258 struct sw_rx_bd *first_buf = &tpa_info->first_buf;
1259 u8 *data = first_buf->data;
1260
1261 if (data == NULL) {
1262 DP(NETIF_MSG_IFDOWN, "tpa bin %d empty on free\n", i);
1263 continue;
1264 }
1265 if (tpa_info->tpa_state == BNX2X_TPA_START)
1266 dma_unmap_single(&bp->pdev->dev,
1267 dma_unmap_addr(first_buf, mapping),
1268 fp->rx_buf_size, DMA_FROM_DEVICE);
1269 bnx2x_frag_free(fp, data);
1270 first_buf->data = NULL;
1271 }
1272 }
1273
1274 void bnx2x_init_rx_rings_cnic(struct bnx2x *bp)
1275 {
1276 int j;
1277
1278 for_each_rx_queue_cnic(bp, j) {
1279 struct bnx2x_fastpath *fp = &bp->fp[j];
1280
1281 fp->rx_bd_cons = 0;
1282
1283 /* Activate BD ring */
1284 /* Warning!
1285 * this will generate an interrupt (to the TSTORM)
1286 * must only be done after chip is initialized
1287 */
1288 bnx2x_update_rx_prod(bp, fp, fp->rx_bd_prod, fp->rx_comp_prod,
1289 fp->rx_sge_prod);
1290 }
1291 }
1292
1293 void bnx2x_init_rx_rings(struct bnx2x *bp)
1294 {
1295 int func = BP_FUNC(bp);
1296 u16 ring_prod;
1297 int i, j;
1298
1299 /* Allocate TPA resources */
1300 for_each_eth_queue(bp, j) {
1301 struct bnx2x_fastpath *fp = &bp->fp[j];
1302
1303 DP(NETIF_MSG_IFUP,
1304 "mtu %d rx_buf_size %d\n", bp->dev->mtu, fp->rx_buf_size);
1305
1306 if (!fp->disable_tpa) {
1307 /* Fill the per-aggregation pool */
1308 for (i = 0; i < MAX_AGG_QS(bp); i++) {
1309 struct bnx2x_agg_info *tpa_info =
1310 &fp->tpa_info[i];
1311 struct sw_rx_bd *first_buf =
1312 &tpa_info->first_buf;
1313
1314 first_buf->data = bnx2x_frag_alloc(fp);
1315 if (!first_buf->data) {
1316 BNX2X_ERR("Failed to allocate TPA skb pool for queue[%d] - disabling TPA on this queue!\n",
1317 j);
1318 bnx2x_free_tpa_pool(bp, fp, i);
1319 fp->disable_tpa = 1;
1320 break;
1321 }
1322 dma_unmap_addr_set(first_buf, mapping, 0);
1323 tpa_info->tpa_state = BNX2X_TPA_STOP;
1324 }
1325
1326 /* "next page" elements initialization */
1327 bnx2x_set_next_page_sgl(fp);
1328
1329 /* set SGEs bit mask */
1330 bnx2x_init_sge_ring_bit_mask(fp);
1331
1332 /* Allocate SGEs and initialize the ring elements */
1333 for (i = 0, ring_prod = 0;
1334 i < MAX_RX_SGE_CNT*NUM_RX_SGE_PAGES; i++) {
1335
1336 if (bnx2x_alloc_rx_sge(bp, fp, ring_prod) < 0) {
1337 BNX2X_ERR("was only able to allocate %d rx sges\n",
1338 i);
1339 BNX2X_ERR("disabling TPA for queue[%d]\n",
1340 j);
1341 /* Cleanup already allocated elements */
1342 bnx2x_free_rx_sge_range(bp, fp,
1343 ring_prod);
1344 bnx2x_free_tpa_pool(bp, fp,
1345 MAX_AGG_QS(bp));
1346 fp->disable_tpa = 1;
1347 ring_prod = 0;
1348 break;
1349 }
1350 ring_prod = NEXT_SGE_IDX(ring_prod);
1351 }
1352
1353 fp->rx_sge_prod = ring_prod;
1354 }
1355 }
1356
1357 for_each_eth_queue(bp, j) {
1358 struct bnx2x_fastpath *fp = &bp->fp[j];
1359
1360 fp->rx_bd_cons = 0;
1361
1362 /* Activate BD ring */
1363 /* Warning!
1364 * this will generate an interrupt (to the TSTORM)
1365 * must only be done after chip is initialized
1366 */
1367 bnx2x_update_rx_prod(bp, fp, fp->rx_bd_prod, fp->rx_comp_prod,
1368 fp->rx_sge_prod);
1369
1370 if (j != 0)
1371 continue;
1372
1373 if (CHIP_IS_E1(bp)) {
1374 REG_WR(bp, BAR_USTRORM_INTMEM +
1375 USTORM_MEM_WORKAROUND_ADDRESS_OFFSET(func),
1376 U64_LO(fp->rx_comp_mapping));
1377 REG_WR(bp, BAR_USTRORM_INTMEM +
1378 USTORM_MEM_WORKAROUND_ADDRESS_OFFSET(func) + 4,
1379 U64_HI(fp->rx_comp_mapping));
1380 }
1381 }
1382 }
1383
1384 static void bnx2x_free_tx_skbs_queue(struct bnx2x_fastpath *fp)
1385 {
1386 u8 cos;
1387 struct bnx2x *bp = fp->bp;
1388
1389 for_each_cos_in_tx_queue(fp, cos) {
1390 struct bnx2x_fp_txdata *txdata = fp->txdata_ptr[cos];
1391 unsigned pkts_compl = 0, bytes_compl = 0;
1392
1393 u16 sw_prod = txdata->tx_pkt_prod;
1394 u16 sw_cons = txdata->tx_pkt_cons;
1395
1396 while (sw_cons != sw_prod) {
1397 bnx2x_free_tx_pkt(bp, txdata, TX_BD(sw_cons),
1398 &pkts_compl, &bytes_compl);
1399 sw_cons++;
1400 }
1401
1402 netdev_tx_reset_queue(
1403 netdev_get_tx_queue(bp->dev,
1404 txdata->txq_index));
1405 }
1406 }
1407
1408 static void bnx2x_free_tx_skbs_cnic(struct bnx2x *bp)
1409 {
1410 int i;
1411
1412 for_each_tx_queue_cnic(bp, i) {
1413 bnx2x_free_tx_skbs_queue(&bp->fp[i]);
1414 }
1415 }
1416
1417 static void bnx2x_free_tx_skbs(struct bnx2x *bp)
1418 {
1419 int i;
1420
1421 for_each_eth_queue(bp, i) {
1422 bnx2x_free_tx_skbs_queue(&bp->fp[i]);
1423 }
1424 }
1425
1426 static void bnx2x_free_rx_bds(struct bnx2x_fastpath *fp)
1427 {
1428 struct bnx2x *bp = fp->bp;
1429 int i;
1430
1431 /* ring wasn't allocated */
1432 if (fp->rx_buf_ring == NULL)
1433 return;
1434
1435 for (i = 0; i < NUM_RX_BD; i++) {
1436 struct sw_rx_bd *rx_buf = &fp->rx_buf_ring[i];
1437 u8 *data = rx_buf->data;
1438
1439 if (data == NULL)
1440 continue;
1441 dma_unmap_single(&bp->pdev->dev,
1442 dma_unmap_addr(rx_buf, mapping),
1443 fp->rx_buf_size, DMA_FROM_DEVICE);
1444
1445 rx_buf->data = NULL;
1446 bnx2x_frag_free(fp, data);
1447 }
1448 }
1449
1450 static void bnx2x_free_rx_skbs_cnic(struct bnx2x *bp)
1451 {
1452 int j;
1453
1454 for_each_rx_queue_cnic(bp, j) {
1455 bnx2x_free_rx_bds(&bp->fp[j]);
1456 }
1457 }
1458
1459 static void bnx2x_free_rx_skbs(struct bnx2x *bp)
1460 {
1461 int j;
1462
1463 for_each_eth_queue(bp, j) {
1464 struct bnx2x_fastpath *fp = &bp->fp[j];
1465
1466 bnx2x_free_rx_bds(fp);
1467
1468 if (!fp->disable_tpa)
1469 bnx2x_free_tpa_pool(bp, fp, MAX_AGG_QS(bp));
1470 }
1471 }
1472
1473 void bnx2x_free_skbs_cnic(struct bnx2x *bp)
1474 {
1475 bnx2x_free_tx_skbs_cnic(bp);
1476 bnx2x_free_rx_skbs_cnic(bp);
1477 }
1478
1479 void bnx2x_free_skbs(struct bnx2x *bp)
1480 {
1481 bnx2x_free_tx_skbs(bp);
1482 bnx2x_free_rx_skbs(bp);
1483 }
1484
1485 void bnx2x_update_max_mf_config(struct bnx2x *bp, u32 value)
1486 {
1487 /* load old values */
1488 u32 mf_cfg = bp->mf_config[BP_VN(bp)];
1489
1490 if (value != bnx2x_extract_max_cfg(bp, mf_cfg)) {
1491 /* leave all but MAX value */
1492 mf_cfg &= ~FUNC_MF_CFG_MAX_BW_MASK;
1493
1494 /* set new MAX value */
1495 mf_cfg |= (value << FUNC_MF_CFG_MAX_BW_SHIFT)
1496 & FUNC_MF_CFG_MAX_BW_MASK;
1497
1498 bnx2x_fw_command(bp, DRV_MSG_CODE_SET_MF_BW, mf_cfg);
1499 }
1500 }
1501
1502 /**
1503 * bnx2x_free_msix_irqs - free previously requested MSI-X IRQ vectors
1504 *
1505 * @bp: driver handle
1506 * @nvecs: number of vectors to be released
1507 */
1508 static void bnx2x_free_msix_irqs(struct bnx2x *bp, int nvecs)
1509 {
1510 int i, offset = 0;
1511
1512 if (nvecs == offset)
1513 return;
1514
1515 /* VFs don't have a default SB */
1516 if (IS_PF(bp)) {
1517 free_irq(bp->msix_table[offset].vector, bp->dev);
1518 DP(NETIF_MSG_IFDOWN, "released sp irq (%d)\n",
1519 bp->msix_table[offset].vector);
1520 offset++;
1521 }
1522
1523 if (CNIC_SUPPORT(bp)) {
1524 if (nvecs == offset)
1525 return;
1526 offset++;
1527 }
1528
1529 for_each_eth_queue(bp, i) {
1530 if (nvecs == offset)
1531 return;
1532 DP(NETIF_MSG_IFDOWN, "about to release fp #%d->%d irq\n",
1533 i, bp->msix_table[offset].vector);
1534
1535 free_irq(bp->msix_table[offset++].vector, &bp->fp[i]);
1536 }
1537 }
1538
1539 void bnx2x_free_irq(struct bnx2x *bp)
1540 {
1541 if (bp->flags & USING_MSIX_FLAG &&
1542 !(bp->flags & USING_SINGLE_MSIX_FLAG)) {
1543 int nvecs = BNX2X_NUM_ETH_QUEUES(bp) + CNIC_SUPPORT(bp);
1544
1545 /* vfs don't have a default status block */
1546 if (IS_PF(bp))
1547 nvecs++;
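/* MSI-X vector layout: [0] slowpath/default SB (PF only), then one vector
 * for CNIC if supported, then one vector per ETH queue - this mirrors the
 * table built in bnx2x_enable_msix().
 */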
1548
1549 bnx2x_free_msix_irqs(bp, nvecs);
1550 } else {
1551 free_irq(bp->dev->irq, bp->dev);
1552 }
1553 }
1554
1555 int bnx2x_enable_msix(struct bnx2x *bp)
1556 {
1557 int msix_vec = 0, i, rc;
1558
1559 /* VFs don't have a default status block */
1560 if (IS_PF(bp)) {
1561 bp->msix_table[msix_vec].entry = msix_vec;
1562 BNX2X_DEV_INFO("msix_table[0].entry = %d (slowpath)\n",
1563 bp->msix_table[0].entry);
1564 msix_vec++;
1565 }
1566
1567 /* Cnic requires an msix vector for itself */
1568 if (CNIC_SUPPORT(bp)) {
1569 bp->msix_table[msix_vec].entry = msix_vec;
1570 BNX2X_DEV_INFO("msix_table[%d].entry = %d (CNIC)\n",
1571 msix_vec, bp->msix_table[msix_vec].entry);
1572 msix_vec++;
1573 }
1574
1575 /* We need separate vectors for ETH queues only (not FCoE) */
1576 for_each_eth_queue(bp, i) {
1577 bp->msix_table[msix_vec].entry = msix_vec;
1578 BNX2X_DEV_INFO("msix_table[%d].entry = %d (fastpath #%u)\n",
1579 msix_vec, msix_vec, i);
1580 msix_vec++;
1581 }
1582
1583 DP(BNX2X_MSG_SP, "about to request enable msix with %d vectors\n",
1584 msix_vec);
1585
1586 rc = pci_enable_msix(bp->pdev, &bp->msix_table[0], msix_vec);
1587
1588 /*
1589 * reconfigure number of tx/rx queues according to available
1590 * MSI-X vectors
1591 */
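/* With the legacy pci_enable_msix() API, 0 means success, a negative value
 * is an error, and a positive value is the number of vectors that could
 * have been allocated - so retry with that smaller count.
 */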
1592 if (rc >= BNX2X_MIN_MSIX_VEC_CNT(bp)) {
1593 /* how many fewer vectors do we have? */
1594 int diff = msix_vec - rc;
1595
1596 BNX2X_DEV_INFO("Trying to use less MSI-X vectors: %d\n", rc);
1597
1598 rc = pci_enable_msix(bp->pdev, &bp->msix_table[0], rc);
1599
1600 if (rc) {
1601 BNX2X_DEV_INFO("MSI-X is not attainable rc %d\n", rc);
1602 goto no_msix;
1603 }
1604 /*
1605 * decrease number of queues by number of unallocated entries
1606 */
1607 bp->num_ethernet_queues -= diff;
1608 bp->num_queues = bp->num_ethernet_queues + bp->num_cnic_queues;
1609
1610 BNX2X_DEV_INFO("New queue configuration set: %d\n",
1611 bp->num_queues);
1612 } else if (rc > 0) {
1613 /* Get by with single vector */
1614 rc = pci_enable_msix(bp->pdev, &bp->msix_table[0], 1);
1615 if (rc) {
1616 BNX2X_DEV_INFO("Single MSI-X is not attainable rc %d\n",
1617 rc);
1618 goto no_msix;
1619 }
1620
1621 BNX2X_DEV_INFO("Using single MSI-X vector\n");
1622 bp->flags |= USING_SINGLE_MSIX_FLAG;
1623
1624 BNX2X_DEV_INFO("set number of queues to 1\n");
1625 bp->num_ethernet_queues = 1;
1626 bp->num_queues = bp->num_ethernet_queues + bp->num_cnic_queues;
1627 } else if (rc < 0) {
1628 BNX2X_DEV_INFO("MSI-X is not attainable rc %d\n", rc);
1629 goto no_msix;
1630 }
1631
1632 bp->flags |= USING_MSIX_FLAG;
1633
1634 return 0;
1635
1636 no_msix:
1637 /* fall back to INTx if not enough memory */
1638 if (rc == -ENOMEM)
1639 bp->flags |= DISABLE_MSI_FLAG;
1640
1641 return rc;
1642 }
1643
1644 static int bnx2x_req_msix_irqs(struct bnx2x *bp)
1645 {
1646 int i, rc, offset = 0;
1647
1648 /* no default status block for vf */
1649 if (IS_PF(bp)) {
1650 rc = request_irq(bp->msix_table[offset++].vector,
1651 bnx2x_msix_sp_int, 0,
1652 bp->dev->name, bp->dev);
1653 if (rc) {
1654 BNX2X_ERR("request sp irq failed\n");
1655 return -EBUSY;
1656 }
1657 }
1658
1659 if (CNIC_SUPPORT(bp))
1660 offset++;
1661
1662 for_each_eth_queue(bp, i) {
1663 struct bnx2x_fastpath *fp = &bp->fp[i];
1664 snprintf(fp->name, sizeof(fp->name), "%s-fp-%d",
1665 bp->dev->name, i);
1666
1667 rc = request_irq(bp->msix_table[offset].vector,
1668 bnx2x_msix_fp_int, 0, fp->name, fp);
1669 if (rc) {
1670 BNX2X_ERR("request fp #%d irq (%d) failed rc %d\n", i,
1671 bp->msix_table[offset].vector, rc);
1672 bnx2x_free_msix_irqs(bp, offset);
1673 return -EBUSY;
1674 }
1675
1676 offset++;
1677 }
1678
1679 i = BNX2X_NUM_ETH_QUEUES(bp);
1680 if (IS_PF(bp)) {
1681 offset = 1 + CNIC_SUPPORT(bp);
1682 netdev_info(bp->dev,
1683 "using MSI-X IRQs: sp %d fp[%d] %d ... fp[%d] %d\n",
1684 bp->msix_table[0].vector,
1685 0, bp->msix_table[offset].vector,
1686 i - 1, bp->msix_table[offset + i - 1].vector);
1687 } else {
1688 offset = CNIC_SUPPORT(bp);
1689 netdev_info(bp->dev,
1690 "using MSI-X IRQs: fp[%d] %d ... fp[%d] %d\n",
1691 0, bp->msix_table[offset].vector,
1692 i - 1, bp->msix_table[offset + i - 1].vector);
1693 }
1694 return 0;
1695 }
1696
1697 int bnx2x_enable_msi(struct bnx2x *bp)
1698 {
1699 int rc;
1700
1701 rc = pci_enable_msi(bp->pdev);
1702 if (rc) {
1703 BNX2X_DEV_INFO("MSI is not attainable\n");
1704 return -1;
1705 }
1706 bp->flags |= USING_MSI_FLAG;
1707
1708 return 0;
1709 }
1710
1711 static int bnx2x_req_irq(struct bnx2x *bp)
1712 {
1713 unsigned long flags;
1714 unsigned int irq;
1715
1716 if (bp->flags & (USING_MSI_FLAG | USING_MSIX_FLAG))
1717 flags = 0;
1718 else
1719 flags = IRQF_SHARED;
1720
1721 if (bp->flags & USING_MSIX_FLAG)
1722 irq = bp->msix_table[0].vector;
1723 else
1724 irq = bp->pdev->irq;
1725
1726 return request_irq(irq, bnx2x_interrupt, flags, bp->dev->name, bp->dev);
1727 }
1728
1729 int bnx2x_setup_irqs(struct bnx2x *bp)
1730 {
1731 int rc = 0;
1732 if (bp->flags & USING_MSIX_FLAG &&
1733 !(bp->flags & USING_SINGLE_MSIX_FLAG)) {
1734 rc = bnx2x_req_msix_irqs(bp);
1735 if (rc)
1736 return rc;
1737 } else {
1738 rc = bnx2x_req_irq(bp);
1739 if (rc) {
1740 BNX2X_ERR("IRQ request failed rc %d, aborting\n", rc);
1741 return rc;
1742 }
1743 if (bp->flags & USING_MSI_FLAG) {
1744 bp->dev->irq = bp->pdev->irq;
1745 netdev_info(bp->dev, "using MSI IRQ %d\n",
1746 bp->dev->irq);
1747 }
1748 if (bp->flags & USING_MSIX_FLAG) {
1749 bp->dev->irq = bp->msix_table[0].vector;
1750 netdev_info(bp->dev, "using MSIX IRQ %d\n",
1751 bp->dev->irq);
1752 }
1753 }
1754
1755 return 0;
1756 }
1757
1758 static void bnx2x_napi_enable_cnic(struct bnx2x *bp)
1759 {
1760 int i;
1761
1762 for_each_rx_queue_cnic(bp, i)
1763 napi_enable(&bnx2x_fp(bp, i, napi));
1764 }
1765
1766 static void bnx2x_napi_enable(struct bnx2x *bp)
1767 {
1768 int i;
1769
1770 for_each_eth_queue(bp, i)
1771 napi_enable(&bnx2x_fp(bp, i, napi));
1772 }
1773
1774 static void bnx2x_napi_disable_cnic(struct bnx2x *bp)
1775 {
1776 int i;
1777
1778 for_each_rx_queue_cnic(bp, i)
1779 napi_disable(&bnx2x_fp(bp, i, napi));
1780 }
1781
1782 static void bnx2x_napi_disable(struct bnx2x *bp)
1783 {
1784 int i;
1785
1786 for_each_eth_queue(bp, i)
1787 napi_disable(&bnx2x_fp(bp, i, napi));
1788 }
1789
1790 void bnx2x_netif_start(struct bnx2x *bp)
1791 {
1792 if (netif_running(bp->dev)) {
1793 bnx2x_napi_enable(bp);
1794 if (CNIC_LOADED(bp))
1795 bnx2x_napi_enable_cnic(bp);
1796 bnx2x_int_enable(bp);
1797 if (bp->state == BNX2X_STATE_OPEN)
1798 netif_tx_wake_all_queues(bp->dev);
1799 }
1800 }
1801
1802 void bnx2x_netif_stop(struct bnx2x *bp, int disable_hw)
1803 {
1804 bnx2x_int_disable_sync(bp, disable_hw);
1805 bnx2x_napi_disable(bp);
1806 if (CNIC_LOADED(bp))
1807 bnx2x_napi_disable_cnic(bp);
1808 }
1809
1810 u16 bnx2x_select_queue(struct net_device *dev, struct sk_buff *skb)
1811 {
1812 struct bnx2x *bp = netdev_priv(dev);
1813
1814 if (CNIC_LOADED(bp) && !NO_FCOE(bp)) {
1815 struct ethhdr *hdr = (struct ethhdr *)skb->data;
1816 u16 ether_type = ntohs(hdr->h_proto);
1817
1818 /* Skip VLAN tag if present */
1819 if (ether_type == ETH_P_8021Q) {
1820 struct vlan_ethhdr *vhdr =
1821 (struct vlan_ethhdr *)skb->data;
1822
1823 ether_type = ntohs(vhdr->h_vlan_encapsulated_proto);
1824 }
1825
1826 /* If ethertype is FCoE or FIP - use FCoE ring */
1827 if ((ether_type == ETH_P_FCOE) || (ether_type == ETH_P_FIP))
1828 return bnx2x_fcoe_tx(bp, txq_index);
1829 }
1830
1831 /* select a non-FCoE queue */
1832 return __skb_tx_hash(dev, skb, BNX2X_NUM_ETH_QUEUES(bp));
1833 }
1834
1835 void bnx2x_set_num_queues(struct bnx2x *bp)
1836 {
1837 /* RSS queues */
1838 bp->num_ethernet_queues = bnx2x_calc_num_queues(bp);
1839
1840 /* override in STORAGE SD modes */
1841 if (IS_MF_STORAGE_SD(bp) || IS_MF_FCOE_AFEX(bp))
1842 bp->num_ethernet_queues = 1;
1843
1844 /* Add special queues */
1845 bp->num_cnic_queues = CNIC_SUPPORT(bp); /* For FCOE */
1846 bp->num_queues = bp->num_ethernet_queues + bp->num_cnic_queues;
1847
1848 BNX2X_DEV_INFO("set number of queues to %d\n", bp->num_queues);
1849 }
1850
1851 /**
1852 * bnx2x_set_real_num_queues - configure netdev->real_num_[tx,rx]_queues
1853 *
1854 * @bp: Driver handle
1855 *
1856 * We currently support at most 16 Tx queues for each CoS, thus we will
1857 * allocate a multiple of 16 for ETH L2 rings, according to the value of
1858 * bp->max_cos.
1859 *
1860 * If there is an FCoE L2 queue the appropriate Tx queue will have the next
1861 * index after all ETH L2 indices.
1862 *
1863 * If the actual number of Tx queues (for each CoS) is less than 16 then there
1864 * will be holes at the end of each group of 16 ETH L2 indices (0..15,
1865 * 16..31,...) with indices that are not coupled with any real Tx queue.
1866 *
1867 * The proper configuration of skb->queue_mapping is handled by
1868 * bnx2x_select_queue() and __skb_tx_hash().
1869 *
1870 * bnx2x_setup_tc() takes care of the proper TC mappings so that __skb_tx_hash()
1871 * will return a proper Tx index if TC is enabled (netdev->num_tc > 0).
1872 */
1873 static int bnx2x_set_real_num_queues(struct bnx2x *bp, int include_cnic)
1874 {
1875 int rc, tx, rx;
1876
1877 tx = BNX2X_NUM_ETH_QUEUES(bp) * bp->max_cos;
1878 rx = BNX2X_NUM_ETH_QUEUES(bp);
1879
1880 /* account for fcoe queue */
1881 if (include_cnic && !NO_FCOE(bp)) {
1882 rx++;
1883 tx++;
1884 }
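/* A minimal worked example (hypothetical numbers, just to illustrate the
 * arithmetic above): with 4 ETH queues and max_cos == 3, tx is 4 * 3 = 12
 * and rx is 4; if the FCoE L2 queue is included, they become 13 and 5.
 */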
1885
1886 rc = netif_set_real_num_tx_queues(bp->dev, tx);
1887 if (rc) {
1888 BNX2X_ERR("Failed to set real number of Tx queues: %d\n", rc);
1889 return rc;
1890 }
1891 rc = netif_set_real_num_rx_queues(bp->dev, rx);
1892 if (rc) {
1893 BNX2X_ERR("Failed to set real number of Rx queues: %d\n", rc);
1894 return rc;
1895 }
1896
1897 DP(NETIF_MSG_IFUP, "Setting real num queues to (tx, rx) (%d, %d)\n",
1898 tx, rx);
1899
1900 return rc;
1901 }
1902
1903 static void bnx2x_set_rx_buf_size(struct bnx2x *bp)
1904 {
1905 int i;
1906
1907 for_each_queue(bp, i) {
1908 struct bnx2x_fastpath *fp = &bp->fp[i];
1909 u32 mtu;
1910
1911 /* Always use a mini-jumbo MTU for the FCoE L2 ring */
1912 if (IS_FCOE_IDX(i))
1913 /*
1914 * Although no IP frames are expected to arrive on
1915 * this ring, we still want to add an
1916 * IP_HEADER_ALIGNMENT_PADDING to prevent a buffer
1917 * overrun attack.
1918 */
1919 mtu = BNX2X_FCOE_MINI_JUMBO_MTU;
1920 else
1921 mtu = bp->dev->mtu;
1922 fp->rx_buf_size = BNX2X_FW_RX_ALIGN_START +
1923 IP_HEADER_ALIGNMENT_PADDING +
1924 ETH_OVREHEAD +
1925 mtu +
1926 BNX2X_FW_RX_ALIGN_END;
1927 /* Note: rx_buf_size doesn't take into account NET_SKB_PAD */
1928 if (fp->rx_buf_size + NET_SKB_PAD <= PAGE_SIZE)
1929 fp->rx_frag_size = fp->rx_buf_size + NET_SKB_PAD;
1930 else
1931 fp->rx_frag_size = 0;
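/* rx_frag_size == 0 signals that the buffer (plus NET_SKB_PAD) no longer
 * fits in a single page; the Rx allocation path elsewhere in the driver is
 * then expected to fall back from page fragments to plain kmalloc'ed
 * buffers (an assumption based on how rx_frag_size is consumed, not on
 * anything in this function).
 */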
1932 }
1933 }
1934
1935 static int bnx2x_init_rss_pf(struct bnx2x *bp)
1936 {
1937 int i;
1938 u8 num_eth_queues = BNX2X_NUM_ETH_QUEUES(bp);
1939
1940 /* Prepare the initial contents of the indirection table if RSS is
1941 * enabled
1942 */
1943 for (i = 0; i < sizeof(bp->rss_conf_obj.ind_table); i++)
1944 bp->rss_conf_obj.ind_table[i] =
1945 bp->fp->cl_id +
1946 ethtool_rxfh_indir_default(i, num_eth_queues);
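/* ethtool_rxfh_indir_default() spreads table entries evenly across the ETH
 * queues (effectively i % num_eth_queues), and adding the first fastpath's
 * cl_id turns that queue index into the client ID the indirection table
 * actually stores.
 */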
1947
1948 /*
1949 * For 57710 and 57711 SEARCHER configuration (rss_keys) is
1950 * per-port, so if explicit configuration is needed, do it only
1951 * for a PMF.
1952 *
1953 * For 57712 and newer on the other hand it's a per-function
1954 * configuration.
1955 */
1956 return bnx2x_config_rss_eth(bp, bp->port.pmf || !CHIP_IS_E1x(bp));
1957 }
1958
1959 int bnx2x_config_rss_pf(struct bnx2x *bp, struct bnx2x_rss_config_obj *rss_obj,
1960 bool config_hash)
1961 {
1962 struct bnx2x_config_rss_params params = {NULL};
1963
1964 /* Although RSS is meaningless when there is a single HW queue we
1965 * still need it enabled in order to have HW Rx hash generated.
1966 *
1967 * if (!is_eth_multi(bp))
1968 * bp->multi_mode = ETH_RSS_MODE_DISABLED;
1969 */
1970
1971 params.rss_obj = rss_obj;
1972
1973 __set_bit(RAMROD_COMP_WAIT, &params.ramrod_flags);
1974
1975 __set_bit(BNX2X_RSS_MODE_REGULAR, &params.rss_flags);
1976
1977 /* RSS configuration */
1978 __set_bit(BNX2X_RSS_IPV4, &params.rss_flags);
1979 __set_bit(BNX2X_RSS_IPV4_TCP, &params.rss_flags);
1980 __set_bit(BNX2X_RSS_IPV6, &params.rss_flags);
1981 __set_bit(BNX2X_RSS_IPV6_TCP, &params.rss_flags);
1982 if (rss_obj->udp_rss_v4)
1983 __set_bit(BNX2X_RSS_IPV4_UDP, &params.rss_flags);
1984 if (rss_obj->udp_rss_v6)
1985 __set_bit(BNX2X_RSS_IPV6_UDP, &params.rss_flags);
1986
1987 /* Hash bits */
1988 params.rss_result_mask = MULTI_MASK;
1989
1990 memcpy(params.ind_table, rss_obj->ind_table, sizeof(params.ind_table));
1991
1992 if (config_hash) {
1993 /* RSS keys */
1994 prandom_bytes(params.rss_key, sizeof(params.rss_key));
1995 __set_bit(BNX2X_RSS_SET_SRCH, &params.rss_flags);
1996 }
1997
1998 return bnx2x_config_rss(bp, &params);
1999 }
2000
2001 static int bnx2x_init_hw(struct bnx2x *bp, u32 load_code)
2002 {
2003 struct bnx2x_func_state_params func_params = {NULL};
2004
2005 /* Prepare parameters for function state transitions */
2006 __set_bit(RAMROD_COMP_WAIT, &func_params.ramrod_flags);
2007
2008 func_params.f_obj = &bp->func_obj;
2009 func_params.cmd = BNX2X_F_CMD_HW_INIT;
2010
2011 func_params.params.hw_init.load_phase = load_code;
2012
2013 return bnx2x_func_state_change(bp, &func_params);
2014 }
2015
2016 /*
2017 * Cleans the objects that have internal lists without sending
2018 * ramrods. Should be run when interrupts are disabled.
2019 */
2020 void bnx2x_squeeze_objects(struct bnx2x *bp)
2021 {
2022 int rc;
2023 unsigned long ramrod_flags = 0, vlan_mac_flags = 0;
2024 struct bnx2x_mcast_ramrod_params rparam = {NULL};
2025 struct bnx2x_vlan_mac_obj *mac_obj = &bp->sp_objs->mac_obj;
2026
2027 /***************** Cleanup MACs' object first *************************/
2028
2029 /* Wait for completion of requested commands */
2030 __set_bit(RAMROD_COMP_WAIT, &ramrod_flags);
2031 /* Perform a dry cleanup */
2032 __set_bit(RAMROD_DRV_CLR_ONLY, &ramrod_flags);
2033
2034 /* Clean ETH primary MAC */
2035 __set_bit(BNX2X_ETH_MAC, &vlan_mac_flags);
2036 rc = mac_obj->delete_all(bp, &bp->sp_objs->mac_obj, &vlan_mac_flags,
2037 &ramrod_flags);
2038 if (rc != 0)
2039 BNX2X_ERR("Failed to clean ETH MACs: %d\n", rc);
2040
2041 /* Cleanup UC list */
2042 vlan_mac_flags = 0;
2043 __set_bit(BNX2X_UC_LIST_MAC, &vlan_mac_flags);
2044 rc = mac_obj->delete_all(bp, mac_obj, &vlan_mac_flags,
2045 &ramrod_flags);
2046 if (rc != 0)
2047 BNX2X_ERR("Failed to clean UC list MACs: %d\n", rc);
2048
2049 /***************** Now clean mcast object *****************************/
2050 rparam.mcast_obj = &bp->mcast_obj;
2051 __set_bit(RAMROD_DRV_CLR_ONLY, &rparam.ramrod_flags);
2052
2053 /* Add a DEL command... */
2054 rc = bnx2x_config_mcast(bp, &rparam, BNX2X_MCAST_CMD_DEL);
2055 if (rc < 0)
2056 BNX2X_ERR("Failed to add a new DEL command to a multi-cast object: %d\n",
2057 rc);
2058
2059 /* ...and wait until all pending commands are cleared */
2060 rc = bnx2x_config_mcast(bp, &rparam, BNX2X_MCAST_CMD_CONT);
2061 while (rc != 0) {
2062 if (rc < 0) {
2063 BNX2X_ERR("Failed to clean multi-cast object: %d\n",
2064 rc);
2065 return;
2066 }
2067
2068 rc = bnx2x_config_mcast(bp, &rparam, BNX2X_MCAST_CMD_CONT);
2069 }
2070 }
2071
2072 #ifndef BNX2X_STOP_ON_ERROR
2073 #define LOAD_ERROR_EXIT(bp, label) \
2074 do { \
2075 (bp)->state = BNX2X_STATE_ERROR; \
2076 goto label; \
2077 } while (0)
2078
2079 #define LOAD_ERROR_EXIT_CNIC(bp, label) \
2080 do { \
2081 bp->cnic_loaded = false; \
2082 goto label; \
2083 } while (0)
2084 #else /*BNX2X_STOP_ON_ERROR*/
2085 #define LOAD_ERROR_EXIT(bp, label) \
2086 do { \
2087 (bp)->state = BNX2X_STATE_ERROR; \
2088 (bp)->panic = 1; \
2089 return -EBUSY; \
2090 } while (0)
2091 #define LOAD_ERROR_EXIT_CNIC(bp, label) \
2092 do { \
2093 bp->cnic_loaded = false; \
2094 (bp)->panic = 1; \
2095 return -EBUSY; \
2096 } while (0)
2097 #endif /*BNX2X_STOP_ON_ERROR*/
2098
2099 static void bnx2x_free_fw_stats_mem(struct bnx2x *bp)
2100 {
2101 BNX2X_PCI_FREE(bp->fw_stats, bp->fw_stats_mapping,
2102 bp->fw_stats_data_sz + bp->fw_stats_req_sz);
2103 return;
2104 }
2105
2106 static int bnx2x_alloc_fw_stats_mem(struct bnx2x *bp)
2107 {
2108 int num_groups, vf_headroom = 0;
2109 int is_fcoe_stats = NO_FCOE(bp) ? 0 : 1;
2110
2111 /* number of queues for statistics is number of eth queues + FCoE */
2112 u8 num_queue_stats = BNX2X_NUM_ETH_QUEUES(bp) + is_fcoe_stats;
2113
2114 /* Total number of FW statistics requests =
2115 * 1 for port stats + 1 for PF stats + potential 2 for FCoE (fcoe proper
2116 * and fcoe l2 queue) stats + num of queues (which includes another 1
2117 * for fcoe l2 queue if applicable)
2118 */
2119 bp->fw_stats_num = 2 + is_fcoe_stats + num_queue_stats;
2120
2121 /* vf stats appear in the request list, but their data is allocated by
2122 * the VFs themselves. We don't include them in the bp->fw_stats_num as
2123 * it is used to determine where to place the vf stats queries in the
2124 * request struct
2125 */
2126 if (IS_SRIOV(bp))
2127 vf_headroom = bnx2x_vf_headroom(bp);
2128
2129 /* Request is built from stats_query_header and an array of
2130 * stats_query_cmd_group each of which contains
2131 * STATS_QUERY_CMD_COUNT rules. The real number of requests is
2132 * configured in the stats_query_header.
2133 */
2134 num_groups =
2135 (((bp->fw_stats_num + vf_headroom) / STATS_QUERY_CMD_COUNT) +
2136 (((bp->fw_stats_num + vf_headroom) % STATS_QUERY_CMD_COUNT) ?
2137 1 : 0));
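/* The expression above is just a ceiling division, i.e. equivalent to
 * DIV_ROUND_UP(bp->fw_stats_num + vf_headroom, STATS_QUERY_CMD_COUNT):
 * for example, 10 requests with a group size of 4 need 3 command groups.
 */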
2138
2139 DP(BNX2X_MSG_SP, "stats fw_stats_num %d, vf headroom %d, num_groups %d\n",
2140 bp->fw_stats_num, vf_headroom, num_groups);
2141 bp->fw_stats_req_sz = sizeof(struct stats_query_header) +
2142 num_groups * sizeof(struct stats_query_cmd_group);
2143
2144 /* Data for statistics requests + stats_counter
2145 * stats_counter holds per-STORM counters that are incremented
2146 * when STORM has finished with the current request.
2147 * memory for FCoE offloaded statistics is counted anyway,
2148 * even if they will not be sent.
2149 * VF stats are not accounted for here as the data of VF stats is stored
2150 * in memory allocated by the VF, not here.
2151 */
2152 bp->fw_stats_data_sz = sizeof(struct per_port_stats) +
2153 sizeof(struct per_pf_stats) +
2154 sizeof(struct fcoe_statistics_params) +
2155 sizeof(struct per_queue_stats) * num_queue_stats +
2156 sizeof(struct stats_counter);
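/* The request and data areas are carved out of a single BNX2X_PCI_ALLOC()
 * block, roughly laid out as:
 *
 *   [ stats_query_header | cmd group 0 .. N-1 ]              <- fw_stats_req_sz
 *   [ port | pf | fcoe | per-queue stats | stats_counter ]   <- fw_stats_data_sz
 *
 * The shortcut pointers set up below simply point into this one block.
 */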
2157
2158 BNX2X_PCI_ALLOC(bp->fw_stats, &bp->fw_stats_mapping,
2159 bp->fw_stats_data_sz + bp->fw_stats_req_sz);
2160
2161 /* Set shortcuts */
2162 bp->fw_stats_req = (struct bnx2x_fw_stats_req *)bp->fw_stats;
2163 bp->fw_stats_req_mapping = bp->fw_stats_mapping;
2164 bp->fw_stats_data = (struct bnx2x_fw_stats_data *)
2165 ((u8 *)bp->fw_stats + bp->fw_stats_req_sz);
2166 bp->fw_stats_data_mapping = bp->fw_stats_mapping +
2167 bp->fw_stats_req_sz;
2168
2169 DP(BNX2X_MSG_SP, "statistics request base address set to %x %x",
2170 U64_HI(bp->fw_stats_req_mapping),
2171 U64_LO(bp->fw_stats_req_mapping));
2172 DP(BNX2X_MSG_SP, "statistics data base address set to %x %x",
2173 U64_HI(bp->fw_stats_data_mapping),
2174 U64_LO(bp->fw_stats_data_mapping));
2175 return 0;
2176
2177 alloc_mem_err:
2178 bnx2x_free_fw_stats_mem(bp);
2179 BNX2X_ERR("Can't allocate FW stats memory\n");
2180 return -ENOMEM;
2181 }
2182
2183 /* send load request to mcp and analyze response */
2184 static int bnx2x_nic_load_request(struct bnx2x *bp, u32 *load_code)
2185 {
2186 /* init fw_seq */
2187 bp->fw_seq =
2188 (SHMEM_RD(bp, func_mb[BP_FW_MB_IDX(bp)].drv_mb_header) &
2189 DRV_MSG_SEQ_NUMBER_MASK);
2190 BNX2X_DEV_INFO("fw_seq 0x%08x\n", bp->fw_seq);
2191
2192 /* Get current FW pulse sequence */
2193 bp->fw_drv_pulse_wr_seq =
2194 (SHMEM_RD(bp, func_mb[BP_FW_MB_IDX(bp)].drv_pulse_mb) &
2195 DRV_PULSE_SEQ_MASK);
2196 BNX2X_DEV_INFO("drv_pulse 0x%x\n", bp->fw_drv_pulse_wr_seq);
2197
2198 /* load request */
2199 (*load_code) = bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_REQ,
2200 DRV_MSG_CODE_LOAD_REQ_WITH_LFA);
2201
2202 /* if mcp fails to respond we must abort */
2203 if (!(*load_code)) {
2204 BNX2X_ERR("MCP response failure, aborting\n");
2205 return -EBUSY;
2206 }
2207
2208 /* If mcp refused (e.g. other port is in diagnostic mode) we
2209 * must abort
2210 */
2211 if ((*load_code) == FW_MSG_CODE_DRV_LOAD_REFUSED) {
2212 BNX2X_ERR("MCP refused load request, aborting\n");
2213 return -EBUSY;
2214 }
2215 return 0;
2216 }
2217
2218 /* check whether another PF has already loaded FW to chip. In
2219 * virtualized environments a pf from another VM may have already
2220 * initialized the device including loading FW
2221 */
2222 int bnx2x_nic_load_analyze_req(struct bnx2x *bp, u32 load_code)
2223 {
2224 /* is another pf loaded on this engine? */
2225 if (load_code != FW_MSG_CODE_DRV_LOAD_COMMON_CHIP &&
2226 load_code != FW_MSG_CODE_DRV_LOAD_COMMON) {
2227 /* build my FW version dword */
2228 u32 my_fw = (BCM_5710_FW_MAJOR_VERSION) +
2229 (BCM_5710_FW_MINOR_VERSION << 8) +
2230 (BCM_5710_FW_REVISION_VERSION << 16) +
2231 (BCM_5710_FW_ENGINEERING_VERSION << 24);
2232
2233 /* read loaded FW from chip */
2234 u32 loaded_fw = REG_RD(bp, XSEM_REG_PRAM);
2235
2236 DP(BNX2X_MSG_SP, "loaded fw %x, my fw %x\n",
2237 loaded_fw, my_fw);
2238
2239 /* abort nic load if version mismatch */
2240 if (my_fw != loaded_fw) {
2241 BNX2X_ERR("bnx2x with FW %x was already loaded which mismatches my %x FW. aborting\n",
2242 loaded_fw, my_fw);
2243 return -EBUSY;
2244 }
2245 }
2246 return 0;
2247 }
2248
2249 /* returns the "mcp load_code" according to global load_count array */
2250 static int bnx2x_nic_load_no_mcp(struct bnx2x *bp, int port)
2251 {
2252 int path = BP_PATH(bp);
2253
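/* load_count[path][0] tracks how many functions are loaded on this path
 * (engine) in total, while load_count[path][1 + port] tracks the per-port
 * count; the first function on the path/port gets the COMMON/PORT load code
 * respectively, and everyone else gets FUNCTION.
 */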
2254 DP(NETIF_MSG_IFUP, "NO MCP - load counts[%d] %d, %d, %d\n",
2255 path, load_count[path][0], load_count[path][1],
2256 load_count[path][2]);
2257 load_count[path][0]++;
2258 load_count[path][1 + port]++;
2259 DP(NETIF_MSG_IFUP, "NO MCP - new load counts[%d] %d, %d, %d\n",
2260 path, load_count[path][0], load_count[path][1],
2261 load_count[path][2]);
2262 if (load_count[path][0] == 1)
2263 return FW_MSG_CODE_DRV_LOAD_COMMON;
2264 else if (load_count[path][1 + port] == 1)
2265 return FW_MSG_CODE_DRV_LOAD_PORT;
2266 else
2267 return FW_MSG_CODE_DRV_LOAD_FUNCTION;
2268 }
2269
2270 /* mark PMF if applicable */
2271 static void bnx2x_nic_load_pmf(struct bnx2x *bp, u32 load_code)
2272 {
2273 if ((load_code == FW_MSG_CODE_DRV_LOAD_COMMON) ||
2274 (load_code == FW_MSG_CODE_DRV_LOAD_COMMON_CHIP) ||
2275 (load_code == FW_MSG_CODE_DRV_LOAD_PORT)) {
2276 bp->port.pmf = 1;
2277 /* We need the barrier to ensure the ordering between the
2278 * writing to bp->port.pmf here and reading it from the
2279 * bnx2x_periodic_task().
2280 */
2281 smp_mb();
2282 } else {
2283 bp->port.pmf = 0;
2284 }
2285
2286 DP(NETIF_MSG_LINK, "pmf %d\n", bp->port.pmf);
2287 }
2288
2289 static void bnx2x_nic_load_afex_dcc(struct bnx2x *bp, int load_code)
2290 {
2291 if (((load_code == FW_MSG_CODE_DRV_LOAD_COMMON) ||
2292 (load_code == FW_MSG_CODE_DRV_LOAD_COMMON_CHIP)) &&
2293 (bp->common.shmem2_base)) {
2294 if (SHMEM2_HAS(bp, dcc_support))
2295 SHMEM2_WR(bp, dcc_support,
2296 (SHMEM_DCC_SUPPORT_DISABLE_ENABLE_PF_TLV |
2297 SHMEM_DCC_SUPPORT_BANDWIDTH_ALLOCATION_TLV));
2298 if (SHMEM2_HAS(bp, afex_driver_support))
2299 SHMEM2_WR(bp, afex_driver_support,
2300 SHMEM_AFEX_SUPPORTED_VERSION_ONE);
2301 }
2302
2303 /* Set AFEX default VLAN tag to an invalid value */
2304 bp->afex_def_vlan_tag = -1;
2305 }
2306
2307 /**
2308 * bnx2x_bz_fp - zero content of the fastpath structure.
2309 *
2310 * @bp: driver handle
2311 * @index: fastpath index to be zeroed
2312 *
2313 * Makes sure the contents of the bp->fp[index].napi is kept
2314 * intact.
2315 */
2316 static void bnx2x_bz_fp(struct bnx2x *bp, int index)
2317 {
2318 struct bnx2x_fastpath *fp = &bp->fp[index];
2319
2320 int cos;
2321 struct napi_struct orig_napi = fp->napi;
2322 struct bnx2x_agg_info *orig_tpa_info = fp->tpa_info;
2323 /* bzero bnx2x_fastpath contents */
2324 if (fp->tpa_info)
2325 memset(fp->tpa_info, 0, ETH_MAX_AGGREGATION_QUEUES_E1H_E2 *
2326 sizeof(struct bnx2x_agg_info));
2327 memset(fp, 0, sizeof(*fp));
2328
2329 /* Restore the NAPI object as it has been already initialized */
2330 fp->napi = orig_napi;
2331 fp->tpa_info = orig_tpa_info;
2332 fp->bp = bp;
2333 fp->index = index;
2334 if (IS_ETH_FP(fp))
2335 fp->max_cos = bp->max_cos;
2336 else
2337 /* Special queues support only one CoS */
2338 fp->max_cos = 1;
2339
2340 /* Init txdata pointers */
2341 if (IS_FCOE_FP(fp))
2342 fp->txdata_ptr[0] = &bp->bnx2x_txq[FCOE_TXQ_IDX(bp)];
2343 if (IS_ETH_FP(fp))
2344 for_each_cos_in_tx_queue(fp, cos)
2345 fp->txdata_ptr[cos] = &bp->bnx2x_txq[cos *
2346 BNX2X_NUM_ETH_QUEUES(bp) + index];
2347
2348 /*
2349 * set the tpa flag for each queue. The tpa flag determines the queue
2350 * minimal size so it must be set prior to queue memory allocation
2351 */
2352 fp->disable_tpa = !(bp->flags & TPA_ENABLE_FLAG ||
2353 (bp->flags & GRO_ENABLE_FLAG &&
2354 bnx2x_mtu_allows_gro(bp->dev->mtu)));
2355 if (bp->flags & TPA_ENABLE_FLAG)
2356 fp->mode = TPA_MODE_LRO;
2357 else if (bp->flags & GRO_ENABLE_FLAG)
2358 fp->mode = TPA_MODE_GRO;
2359
2360 /* We don't want TPA on an FCoE L2 ring */
2361 if (IS_FCOE_FP(fp))
2362 fp->disable_tpa = 1;
2363 }
2364
2365 int bnx2x_load_cnic(struct bnx2x *bp)
2366 {
2367 int i, rc, port = BP_PORT(bp);
2368
2369 DP(NETIF_MSG_IFUP, "Starting CNIC-related load\n");
2370
2371 mutex_init(&bp->cnic_mutex);
2372
2373 if (IS_PF(bp)) {
2374 rc = bnx2x_alloc_mem_cnic(bp);
2375 if (rc) {
2376 BNX2X_ERR("Unable to allocate bp memory for cnic\n");
2377 LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic0);
2378 }
2379 }
2380
2381 rc = bnx2x_alloc_fp_mem_cnic(bp);
2382 if (rc) {
2383 BNX2X_ERR("Unable to allocate memory for cnic fps\n");
2384 LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic0);
2385 }
2386
2387 /* Update the number of queues with the cnic queues */
2388 rc = bnx2x_set_real_num_queues(bp, 1);
2389 if (rc) {
2390 BNX2X_ERR("Unable to set real_num_queues including cnic\n");
2391 LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic0);
2392 }
2393
2394 /* Add all CNIC NAPI objects */
2395 bnx2x_add_all_napi_cnic(bp);
2396 DP(NETIF_MSG_IFUP, "cnic napi added\n");
2397 bnx2x_napi_enable_cnic(bp);
2398
2399 rc = bnx2x_init_hw_func_cnic(bp);
2400 if (rc)
2401 LOAD_ERROR_EXIT_CNIC(bp, load_error_cnic1);
2402
2403 bnx2x_nic_init_cnic(bp);
2404
2405 if (IS_PF(bp)) {
2406 /* Enable Timer scan */
2407 REG_WR(bp, TM_REG_EN_LINEAR0_TIMER + port*4, 1);
2408
2409 /* setup cnic queues */
2410 for_each_cnic_queue(bp, i) {
2411 rc = bnx2x_setup_queue(bp, &bp->fp[i], 0);
2412 if (rc) {
2413 BNX2X_ERR("Queue setup failed\n");
2414 LOAD_ERROR_EXIT(bp, load_error_cnic2);
2415 }
2416 }
2417 }
2418
2419 /* Initialize Rx filter. */
2420 netif_addr_lock_bh(bp->dev);
2421 bnx2x_set_rx_mode(bp->dev);
2422 netif_addr_unlock_bh(bp->dev);
2423
2424 /* re-read iscsi info */
2425 bnx2x_get_iscsi_info(bp);
2426 bnx2x_setup_cnic_irq_info(bp);
2427 bnx2x_setup_cnic_info(bp);
2428 bp->cnic_loaded = true;
2429 if (bp->state == BNX2X_STATE_OPEN)
2430 bnx2x_cnic_notify(bp, CNIC_CTL_START_CMD);
2431
2432
2433 DP(NETIF_MSG_IFUP, "Ending successfully CNIC-related load\n");
2434
2435 return 0;
2436
2437 #ifndef BNX2X_STOP_ON_ERROR
2438 load_error_cnic2:
2439 /* Disable Timer scan */
2440 REG_WR(bp, TM_REG_EN_LINEAR0_TIMER + port*4, 0);
2441
2442 load_error_cnic1:
2443 bnx2x_napi_disable_cnic(bp);
2444 /* Update the number of queues without the cnic queues */
2445 rc = bnx2x_set_real_num_queues(bp, 0);
2446 if (rc)
2447 BNX2X_ERR("Unable to set real_num_queues not including cnic\n");
2448 load_error_cnic0:
2449 BNX2X_ERR("CNIC-related load failed\n");
2450 bnx2x_free_fp_mem_cnic(bp);
2451 bnx2x_free_mem_cnic(bp);
2452 return rc;
2453 #endif /* ! BNX2X_STOP_ON_ERROR */
2454 }
2455
2456 /* must be called with rtnl_lock */
2457 int bnx2x_nic_load(struct bnx2x *bp, int load_mode)
2458 {
2459 int port = BP_PORT(bp);
2460 int i, rc = 0, load_code = 0;
2461
2462 DP(NETIF_MSG_IFUP, "Starting NIC load\n");
2463 DP(NETIF_MSG_IFUP,
2464 "CNIC is %s\n", CNIC_ENABLED(bp) ? "enabled" : "disabled");
2465
2466 #ifdef BNX2X_STOP_ON_ERROR
2467 if (unlikely(bp->panic)) {
2468 BNX2X_ERR("Can't load NIC when there is panic\n");
2469 return -EPERM;
2470 }
2471 #endif
2472
2473 bp->state = BNX2X_STATE_OPENING_WAIT4_LOAD;
2474
2475 memset(&bp->last_reported_link, 0, sizeof(bp->last_reported_link));
2476 __set_bit(BNX2X_LINK_REPORT_LINK_DOWN,
2477 &bp->last_reported_link.link_report_flags);
2478
2479 if (IS_PF(bp))
2480 /* must be called before memory allocation and HW init */
2481 bnx2x_ilt_set_info(bp);
2482
2483 /*
2484 * Zero fastpath structures preserving invariants like napi (which is
2485 * allocated only once), fp index, max_cos and the bp pointer.
2486 * Also set fp->disable_tpa and txdata_ptr.
2487 */
2488 DP(NETIF_MSG_IFUP, "num queues: %d", bp->num_queues);
2489 for_each_queue(bp, i)
2490 bnx2x_bz_fp(bp, i);
2491 memset(bp->bnx2x_txq, 0, (BNX2X_MAX_RSS_COUNT(bp) * BNX2X_MULTI_TX_COS +
2492 bp->num_cnic_queues) *
2493 sizeof(struct bnx2x_fp_txdata));
2494
2495 bp->fcoe_init = false;
2496
2497 /* Set the receive queues buffer size */
2498 bnx2x_set_rx_buf_size(bp);
2499
2500 if (IS_PF(bp)) {
2501 rc = bnx2x_alloc_mem(bp);
2502 if (rc) {
2503 BNX2X_ERR("Unable to allocate bp memory\n");
2504 return rc;
2505 }
2506 }
2507
2508 /* Allocate memory for FW statistics */
2509 if (bnx2x_alloc_fw_stats_mem(bp))
2510 LOAD_ERROR_EXIT(bp, load_error0);
2511
2512 /* needs to be done after alloc mem, since it's self-adjusting to the
2513 * amount of memory available for RSS queues
2514 */
2515 rc = bnx2x_alloc_fp_mem(bp);
2516 if (rc) {
2517 BNX2X_ERR("Unable to allocate memory for fps\n");
2518 LOAD_ERROR_EXIT(bp, load_error0);
2519 }
2520
2521 /* request pf to initialize status blocks */
2522 if (IS_VF(bp)) {
2523 rc = bnx2x_vfpf_init(bp);
2524 if (rc)
2525 LOAD_ERROR_EXIT(bp, load_error0);
2526 }
2527
2528 /* Since bnx2x_alloc_mem() may update
2529 * bp->num_queues, bnx2x_set_real_num_queues() should always
2530 * come after it. At this stage cnic queues are not counted.
2531 */
2532 rc = bnx2x_set_real_num_queues(bp, 0);
2533 if (rc) {
2534 BNX2X_ERR("Unable to set real_num_queues\n");
2535 LOAD_ERROR_EXIT(bp, load_error0);
2536 }
2537
2538 /* configure multi cos mappings in kernel.
2539 * This configuration may be overridden by a multi class queue discipline
2540 * or by a dcbx negotiation result.
2541 */
2542 bnx2x_setup_tc(bp->dev, bp->max_cos);
2543
2544 /* Add all NAPI objects */
2545 bnx2x_add_all_napi(bp);
2546 DP(NETIF_MSG_IFUP, "napi added\n");
2547 bnx2x_napi_enable(bp);
2548
2549 if (IS_PF(bp)) {
2550 /* set pf load just before approaching the MCP */
2551 bnx2x_set_pf_load(bp);
2552
2553 /* if mcp exists send load request and analyze response */
2554 if (!BP_NOMCP(bp)) {
2555 /* attempt to load pf */
2556 rc = bnx2x_nic_load_request(bp, &load_code);
2557 if (rc)
2558 LOAD_ERROR_EXIT(bp, load_error1);
2559
2560 /* what did mcp say? */
2561 rc = bnx2x_nic_load_analyze_req(bp, load_code);
2562 if (rc) {
2563 bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2564 LOAD_ERROR_EXIT(bp, load_error2);
2565 }
2566 } else {
2567 load_code = bnx2x_nic_load_no_mcp(bp, port);
2568 }
2569
2570 /* mark pmf if applicable */
2571 bnx2x_nic_load_pmf(bp, load_code);
2572
2573 /* Init Function state controlling object */
2574 bnx2x__init_func_obj(bp);
2575
2576 /* Initialize HW */
2577 rc = bnx2x_init_hw(bp, load_code);
2578 if (rc) {
2579 BNX2X_ERR("HW init failed, aborting\n");
2580 bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2581 LOAD_ERROR_EXIT(bp, load_error2);
2582 }
2583 }
2584
2585 bnx2x_pre_irq_nic_init(bp);
2586
2587 /* Connect to IRQs */
2588 rc = bnx2x_setup_irqs(bp);
2589 if (rc) {
2590 BNX2X_ERR("setup irqs failed\n");
2591 if (IS_PF(bp))
2592 bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2593 LOAD_ERROR_EXIT(bp, load_error2);
2594 }
2595
2596 /* Init per-function objects */
2597 if (IS_PF(bp)) {
2598 /* Setup NIC internals and enable interrupts */
2599 bnx2x_post_irq_nic_init(bp, load_code);
2600
2601 bnx2x_init_bp_objs(bp);
2602 bnx2x_iov_nic_init(bp);
2603
2604 /* Set AFEX default VLAN tag to an invalid value */
2605 bp->afex_def_vlan_tag = -1;
2606 bnx2x_nic_load_afex_dcc(bp, load_code);
2607 bp->state = BNX2X_STATE_OPENING_WAIT4_PORT;
2608 rc = bnx2x_func_start(bp);
2609 if (rc) {
2610 BNX2X_ERR("Function start failed!\n");
2611 bnx2x_fw_command(bp, DRV_MSG_CODE_LOAD_DONE, 0);
2612
2613 LOAD_ERROR_EXIT(bp, load_error3);
2614 }
2615
2616 /* Send LOAD_DONE command to MCP */
2617 if (!BP_NOMCP(bp)) {
2618 load_code = bnx2x_fw_command(bp,
2619 DRV_MSG_CODE_LOAD_DONE, 0);
2620 if (!load_code) {
2621 BNX2X_ERR("MCP response failure, aborting\n");
2622 rc = -EBUSY;
2623 LOAD_ERROR_EXIT(bp, load_error3);
2624 }
2625 }
2626
2627 /* initialize FW coalescing state machines in RAM */
2628 bnx2x_update_coalesce(bp);
2629
2630 /* setup the leading queue */
2631 rc = bnx2x_setup_leading(bp);
2632 if (rc) {
2633 BNX2X_ERR("Setup leading failed!\n");
2634 LOAD_ERROR_EXIT(bp, load_error3);
2635 }
2636
2637 /* set up the rest of the queues */
2638 for_each_nondefault_eth_queue(bp, i) {
2639 rc = bnx2x_setup_queue(bp, &bp->fp[i], 0);
2640 if (rc) {
2641 BNX2X_ERR("Queue setup failed\n");
2642 LOAD_ERROR_EXIT(bp, load_error3);
2643 }
2644 }
2645
2646 /* setup rss */
2647 rc = bnx2x_init_rss_pf(bp);
2648 if (rc) {
2649 BNX2X_ERR("PF RSS init failed\n");
2650 LOAD_ERROR_EXIT(bp, load_error3);
2651 }
2652
2653 } else { /* vf */
2654 for_each_eth_queue(bp, i) {
2655 rc = bnx2x_vfpf_setup_q(bp, i);
2656 if (rc) {
2657 BNX2X_ERR("Queue setup failed\n");
2658 LOAD_ERROR_EXIT(bp, load_error3);
2659 }
2660 }
2661 }
2662
2663 /* Now when Clients are configured we are ready to work */
2664 bp->state = BNX2X_STATE_OPEN;
2665
2666 /* Configure a ucast MAC */
2667 if (IS_PF(bp))
2668 rc = bnx2x_set_eth_mac(bp, true);
2669 else /* vf */
2670 rc = bnx2x_vfpf_config_mac(bp, bp->dev->dev_addr, bp->fp->index,
2671 true);
2672 if (rc) {
2673 BNX2X_ERR("Setting Ethernet MAC failed\n");
2674 LOAD_ERROR_EXIT(bp, load_error3);
2675 }
2676
2677 if (IS_PF(bp) && bp->pending_max) {
2678 bnx2x_update_max_mf_config(bp, bp->pending_max);
2679 bp->pending_max = 0;
2680 }
2681
2682 if (bp->port.pmf) {
2683 rc = bnx2x_initial_phy_init(bp, load_mode);
2684 if (rc)
2685 LOAD_ERROR_EXIT(bp, load_error3);
2686 }
2687 bp->link_params.feature_config_flags &= ~FEATURE_CONFIG_BOOT_FROM_SAN;
2688
2689 /* Start fast path */
2690
2691 /* Initialize Rx filter. */
2692 netif_addr_lock_bh(bp->dev);
2693 bnx2x_set_rx_mode(bp->dev);
2694 netif_addr_unlock_bh(bp->dev);
2695
2696 /* Start the Tx */
2697 switch (load_mode) {
2698 case LOAD_NORMAL:
2699 /* Tx queues should only be re-enabled */
2700 netif_tx_wake_all_queues(bp->dev);
2701 break;
2702
2703 case LOAD_OPEN:
2704 netif_tx_start_all_queues(bp->dev);
2705 smp_mb__after_clear_bit();
2706 break;
2707
2708 case LOAD_DIAG:
2709 case LOAD_LOOPBACK_EXT:
2710 bp->state = BNX2X_STATE_DIAG;
2711 break;
2712
2713 default:
2714 break;
2715 }
2716
2717 if (bp->port.pmf)
2718 bnx2x_update_drv_flags(bp, 1 << DRV_FLAGS_PORT_MASK, 0);
2719 else
2720 bnx2x__link_status_update(bp);
2721
2722 /* start the timer */
2723 mod_timer(&bp->timer, jiffies + bp->current_interval);
2724
2725 if (CNIC_ENABLED(bp))
2726 bnx2x_load_cnic(bp);
2727
2728 if (IS_PF(bp) && SHMEM2_HAS(bp, drv_capabilities_flag)) {
2729 /* mark driver is loaded in shmem2 */
2730 u32 val;
2731 val = SHMEM2_RD(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)]);
2732 SHMEM2_WR(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)],
2733 val | DRV_FLAGS_CAPABILITIES_LOADED_SUPPORTED |
2734 DRV_FLAGS_CAPABILITIES_LOADED_L2);
2735 }
2736
2737 /* Wait for all pending SP commands to complete */
2738 if (IS_PF(bp) && !bnx2x_wait_sp_comp(bp, ~0x0UL)) {
2739 BNX2X_ERR("Timeout waiting for SP elements to complete\n");
2740 bnx2x_nic_unload(bp, UNLOAD_CLOSE, false);
2741 return -EBUSY;
2742 }
2743
2744 /* If PMF - send ADMIN DCBX msg to MFW to initiate DCBX FSM */
2745 if (bp->port.pmf && (bp->state != BNX2X_STATE_DIAG))
2746 bnx2x_dcbx_init(bp, false);
2747
2748 DP(NETIF_MSG_IFUP, "Ending successfully NIC load\n");
2749
2750 return 0;
2751
2752 #ifndef BNX2X_STOP_ON_ERROR
2753 load_error3:
2754 if (IS_PF(bp)) {
2755 bnx2x_int_disable_sync(bp, 1);
2756
2757 /* Clean queueable objects */
2758 bnx2x_squeeze_objects(bp);
2759 }
2760
2761 /* Free SKBs, SGEs, TPA pool and driver internals */
2762 bnx2x_free_skbs(bp);
2763 for_each_rx_queue(bp, i)
2764 bnx2x_free_rx_sge_range(bp, bp->fp + i, NUM_RX_SGE);
2765
2766 /* Release IRQs */
2767 bnx2x_free_irq(bp);
2768 load_error2:
2769 if (IS_PF(bp) && !BP_NOMCP(bp)) {
2770 bnx2x_fw_command(bp, DRV_MSG_CODE_UNLOAD_REQ_WOL_MCP, 0);
2771 bnx2x_fw_command(bp, DRV_MSG_CODE_UNLOAD_DONE, 0);
2772 }
2773
2774 bp->port.pmf = 0;
2775 load_error1:
2776 bnx2x_napi_disable(bp);
2777 bnx2x_del_all_napi(bp);
2778
2779 /* clear pf_load status, as it was already set */
2780 if (IS_PF(bp))
2781 bnx2x_clear_pf_load(bp);
2782 load_error0:
2783 bnx2x_free_fp_mem(bp);
2784 bnx2x_free_fw_stats_mem(bp);
2785 bnx2x_free_mem(bp);
2786
2787 return rc;
2788 #endif /* ! BNX2X_STOP_ON_ERROR */
2789 }
2790
2791 int bnx2x_drain_tx_queues(struct bnx2x *bp)
2792 {
2793 u8 rc = 0, cos, i;
2794
2795 /* Wait until tx fastpath tasks complete */
2796 for_each_tx_queue(bp, i) {
2797 struct bnx2x_fastpath *fp = &bp->fp[i];
2798
2799 for_each_cos_in_tx_queue(fp, cos)
2800 rc = bnx2x_clean_tx_queue(bp, fp->txdata_ptr[cos]);
2801 if (rc)
2802 return rc;
2803 }
2804 return 0;
2805 }
2806
2807 /* must be called with rtnl_lock */
2808 int bnx2x_nic_unload(struct bnx2x *bp, int unload_mode, bool keep_link)
2809 {
2810 int i;
2811 bool global = false;
2812
2813 DP(NETIF_MSG_IFUP, "Starting NIC unload\n");
2814
2815 /* mark driver is unloaded in shmem2 */
2816 if (IS_PF(bp) && SHMEM2_HAS(bp, drv_capabilities_flag)) {
2817 u32 val;
2818 val = SHMEM2_RD(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)]);
2819 SHMEM2_WR(bp, drv_capabilities_flag[BP_FW_MB_IDX(bp)],
2820 val & ~DRV_FLAGS_CAPABILITIES_LOADED_L2);
2821 }
2822
2823 if (IS_PF(bp) && bp->recovery_state != BNX2X_RECOVERY_DONE &&
2824 (bp->state == BNX2X_STATE_CLOSED ||
2825 bp->state == BNX2X_STATE_ERROR)) {
2826 /* We can get here if the driver has been unloaded
2827 * during parity error recovery and is either waiting for a
2828 * leader to complete or for other functions to unload and
2829 * then ifdown has been issued. In this case we want to
2830 * unload and let other functions to complete a recovery
2831 * process.
2832 */
2833 bp->recovery_state = BNX2X_RECOVERY_DONE;
2834 bp->is_leader = 0;
2835 bnx2x_release_leader_lock(bp);
2836 smp_mb();
2837
2838 DP(NETIF_MSG_IFDOWN, "Releasing a leadership...\n");
2839 BNX2X_ERR("Can't unload in closed or error state\n");
2840 return -EINVAL;
2841 }
2842
2843 /* Nothing to do during unload if the previous bnx2x_nic_load()
2844 * has not completed successfully - all resources are released.
2845 *
2846 * We can get here only after an unsuccessful ndo_* callback, during
2847 * which the dev->IFF_UP flag is still on.
2848 */
2849 if (bp->state == BNX2X_STATE_CLOSED || bp->state == BNX2X_STATE_ERROR)
2850 return 0;
2851
2852 /* It's important to set the bp->state to the value different from
2853 * BNX2X_STATE_OPEN and only then stop the Tx. Otherwise bnx2x_tx_int()
2854 * may restart the Tx from the NAPI context (see bnx2x_tx_int()).
2855 */
2856 bp->state = BNX2X_STATE_CLOSING_WAIT4_HALT;
2857 smp_mb();
2858
2859 if (CNIC_LOADED(bp))
2860 bnx2x_cnic_notify(bp, CNIC_CTL_STOP_CMD);
2861
2862 /* Stop Tx */
2863 bnx2x_tx_disable(bp);
2864 netdev_reset_tc(bp->dev);
2865
2866 bp->rx_mode = BNX2X_RX_MODE_NONE;
2867
2868 del_timer_sync(&bp->timer);
2869
2870 if (IS_PF(bp)) {
2871 /* Set ALWAYS_ALIVE bit in shmem */
2872 bp->fw_drv_pulse_wr_seq |= DRV_PULSE_ALWAYS_ALIVE;
2873 bnx2x_drv_pulse(bp);
2874 bnx2x_stats_handle(bp, STATS_EVENT_STOP);
2875 bnx2x_save_statistics(bp);
2876 }
2877
2878 /* wait till consumers catch up with producers in all queues */
2879 bnx2x_drain_tx_queues(bp);
2880
2881 /* if VF, indicate to the PF that this function is going down
2882 * (the PF will delete sp elements and clear initializations)
2883 */
2884 if (IS_VF(bp))
2885 bnx2x_vfpf_close_vf(bp);
2886 else if (unload_mode != UNLOAD_RECOVERY)
2887 /* if this is a normal/close unload need to clean up chip*/
2888 bnx2x_chip_cleanup(bp, unload_mode, keep_link);
2889 else {
2890 /* Send the UNLOAD_REQUEST to the MCP */
2891 bnx2x_send_unload_req(bp, unload_mode);
2892
2893 /*
2894 * Prevent transactions to the host from the functions on the
2895 * engine that doesn't reset global blocks in case of global
2896 * attention once global blocks are reset and gates are opened
2897 * (the engine whose leader will perform the recovery
2898 * last).
2899 */
2900 if (!CHIP_IS_E1x(bp))
2901 bnx2x_pf_disable(bp);
2902
2903 /* Disable HW interrupts, NAPI */
2904 bnx2x_netif_stop(bp, 1);
2905 /* Delete all NAPI objects */
2906 bnx2x_del_all_napi(bp);
2907 if (CNIC_LOADED(bp))
2908 bnx2x_del_all_napi_cnic(bp);
2909 /* Release IRQs */
2910 bnx2x_free_irq(bp);
2911
2912 /* Report UNLOAD_DONE to MCP */
2913 bnx2x_send_unload_done(bp, false);
2914 }
2915
2916 /*
2917 * At this stage no more interrupts will arrive so we may safely clean
2918 * the queueable objects here in case they failed to get cleaned so far.
2919 */
2920 if (IS_PF(bp))
2921 bnx2x_squeeze_objects(bp);
2922
2923 /* There should be no more pending SP commands at this stage */
2924 bp->sp_state = 0;
2925
2926 bp->port.pmf = 0;
2927
2928 /* Free SKBs, SGEs, TPA pool and driver internals */
2929 bnx2x_free_skbs(bp);
2930 if (CNIC_LOADED(bp))
2931 bnx2x_free_skbs_cnic(bp);
2932 for_each_rx_queue(bp, i)
2933 bnx2x_free_rx_sge_range(bp, bp->fp + i, NUM_RX_SGE);
2934
2935 bnx2x_free_fp_mem(bp);
2936 if (CNIC_LOADED(bp))
2937 bnx2x_free_fp_mem_cnic(bp);
2938
2939 if (IS_PF(bp)) {
2940 if (CNIC_LOADED(bp))
2941 bnx2x_free_mem_cnic(bp);
2942 bnx2x_free_mem(bp);
2943 }
2944 bp->state = BNX2X_STATE_CLOSED;
2945 bp->cnic_loaded = false;
2946
2947 /* Check if there are pending parity attentions. If there are - set
2948 * RECOVERY_IN_PROGRESS.
2949 */
2950 if (IS_PF(bp) && bnx2x_chk_parity_attn(bp, &global, false)) {
2951 bnx2x_set_reset_in_progress(bp);
2952
2953 /* Set RESET_IS_GLOBAL if needed */
2954 if (global)
2955 bnx2x_set_reset_global(bp);
2956 }
2957
2958
2959 /* The last driver must disable the "close the gate" functionality if
2960 * there is no parity attention or "process kill" pending.
2961 */
2962 if (IS_PF(bp) &&
2963 !bnx2x_clear_pf_load(bp) &&
2964 bnx2x_reset_is_done(bp, BP_PATH(bp)))
2965 bnx2x_disable_close_the_gate(bp);
2966
2967 DP(NETIF_MSG_IFUP, "Ending NIC unload\n");
2968
2969 return 0;
2970 }
2971
2972 int bnx2x_set_power_state(struct bnx2x *bp, pci_power_t state)
2973 {
2974 u16 pmcsr;
2975
2976 /* If there is no power capability, silently succeed */
2977 if (!bp->pm_cap) {
2978 BNX2X_DEV_INFO("No power capability. Breaking.\n");
2979 return 0;
2980 }
2981
2982 pci_read_config_word(bp->pdev, bp->pm_cap + PCI_PM_CTRL, &pmcsr);
2983
2984 switch (state) {
2985 case PCI_D0:
2986 pci_write_config_word(bp->pdev, bp->pm_cap + PCI_PM_CTRL,
2987 ((pmcsr & ~PCI_PM_CTRL_STATE_MASK) |
2988 PCI_PM_CTRL_PME_STATUS));
2989
2990 if (pmcsr & PCI_PM_CTRL_STATE_MASK)
2991 /* delay required during transition out of D3hot */
2992 msleep(20);
2993 break;
2994
2995 case PCI_D3hot:
2996 /* If there are other clients above don't
2997 shut down the power */
2998 if (atomic_read(&bp->pdev->enable_cnt) != 1)
2999 return 0;
3000 /* Don't shut down the power for emulation and FPGA */
3001 if (CHIP_REV_IS_SLOW(bp))
3002 return 0;
3003
3004 pmcsr &= ~PCI_PM_CTRL_STATE_MASK;
3005 pmcsr |= 3;
3006
3007 if (bp->wol)
3008 pmcsr |= PCI_PM_CTRL_PME_ENABLE;
3009
3010 pci_write_config_word(bp->pdev, bp->pm_cap + PCI_PM_CTRL,
3011 pmcsr);
3012
3013 /* No more memory access after this point until
3014 * device is brought back to D0.
3015 */
3016 break;
3017
3018 default:
3019 dev_err(&bp->pdev->dev, "Can't support state = %d\n", state);
3020 return -EINVAL;
3021 }
3022 return 0;
3023 }
3024
3025 /*
3026 * net_device service functions
3027 */
3028 int bnx2x_poll(struct napi_struct *napi, int budget)
3029 {
3030 int work_done = 0;
3031 u8 cos;
3032 struct bnx2x_fastpath *fp = container_of(napi, struct bnx2x_fastpath,
3033 napi);
3034 struct bnx2x *bp = fp->bp;
3035
3036 while (1) {
3037 #ifdef BNX2X_STOP_ON_ERROR
3038 if (unlikely(bp->panic)) {
3039 napi_complete(napi);
3040 return 0;
3041 }
3042 #endif
3043
3044 for_each_cos_in_tx_queue(fp, cos)
3045 if (bnx2x_tx_queue_has_work(fp->txdata_ptr[cos]))
3046 bnx2x_tx_int(bp, fp->txdata_ptr[cos]);
3047
3048 if (bnx2x_has_rx_work(fp)) {
3049 work_done += bnx2x_rx_int(fp, budget - work_done);
3050
3051 /* must not complete if we consumed full budget */
3052 if (work_done >= budget)
3053 break;
3054 }
3055
3056 /* Fall out from the NAPI loop if needed */
3057 if (!(bnx2x_has_rx_work(fp) || bnx2x_has_tx_work(fp))) {
3058
3059 /* No need to update SB for FCoE L2 ring as long as
3060 * it's connected to the default SB and the SB
3061 * has been updated when NAPI was scheduled.
3062 */
3063 if (IS_FCOE_FP(fp)) {
3064 napi_complete(napi);
3065 break;
3066 }
3067 bnx2x_update_fpsb_idx(fp);
3068 /* bnx2x_has_rx_work() reads the status block,
3069 * thus we need to ensure that status block indices
3070 * have been actually read (bnx2x_update_fpsb_idx)
3071 * prior to this check (bnx2x_has_rx_work) so that
3072 * we won't write the "newer" value of the status block
3073 * to IGU (if there was a DMA right after
3074 * bnx2x_has_rx_work and if there is no rmb, the memory
3075 * reading (bnx2x_update_fpsb_idx) may be postponed
3076 * to right before bnx2x_ack_sb). In this case there
3077 * will never be another interrupt until there is
3078 * another update of the status block, while there
3079 * is still unhandled work.
3080 */
3081 rmb();
3082
3083 if (!(bnx2x_has_rx_work(fp) || bnx2x_has_tx_work(fp))) {
3084 napi_complete(napi);
3085 /* Re-enable interrupts */
3086 DP(NETIF_MSG_RX_STATUS,
3087 "Update index to %d\n", fp->fp_hc_idx);
3088 bnx2x_ack_sb(bp, fp->igu_sb_id, USTORM_ID,
3089 le16_to_cpu(fp->fp_hc_idx),
3090 IGU_INT_ENABLE, 1);
3091 break;
3092 }
3093 }
3094 }
3095
3096 return work_done;
3097 }
3098
3099 /* we split the first BD into headers and data BDs
3100 * to ease the pain of our fellow microcode engineers;
3101 * we use one mapping for both BDs
3102 */
3103 static u16 bnx2x_tx_split(struct bnx2x *bp,
3104 struct bnx2x_fp_txdata *txdata,
3105 struct sw_tx_bd *tx_buf,
3106 struct eth_tx_start_bd **tx_bd, u16 hlen,
3107 u16 bd_prod)
3108 {
3109 struct eth_tx_start_bd *h_tx_bd = *tx_bd;
3110 struct eth_tx_bd *d_tx_bd;
3111 dma_addr_t mapping;
3112 int old_len = le16_to_cpu(h_tx_bd->nbytes);
3113
3114 /* first fix first BD */
3115 h_tx_bd->nbytes = cpu_to_le16(hlen);
3116
3117 DP(NETIF_MSG_TX_QUEUED, "TSO split header size is %d (%x:%x)\n",
3118 h_tx_bd->nbytes, h_tx_bd->addr_hi, h_tx_bd->addr_lo);
3119
3120 /* now get a new data BD
3121 * (after the pbd) and fill it */
3122 bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3123 d_tx_bd = &txdata->tx_desc_ring[bd_prod].reg_bd;
3124
3125 mapping = HILO_U64(le32_to_cpu(h_tx_bd->addr_hi),
3126 le32_to_cpu(h_tx_bd->addr_lo)) + hlen;
3127
3128 d_tx_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
3129 d_tx_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
3130 d_tx_bd->nbytes = cpu_to_le16(old_len - hlen);
3131
3132 /* this marks the BD as one that has no individual mapping */
3133 tx_buf->flags |= BNX2X_TSO_SPLIT_BD;
3134
3135 DP(NETIF_MSG_TX_QUEUED,
3136 "TSO split data size is %d (%x:%x)\n",
3137 d_tx_bd->nbytes, d_tx_bd->addr_hi, d_tx_bd->addr_lo);
3138
3139 /* update tx_bd */
3140 *tx_bd = (struct eth_tx_start_bd *)d_tx_bd;
3141
3142 return bd_prod;
3143 }
3144
3145 #define bswab32(b32) ((__force __le32) swab32((__force __u32) (b32)))
3146 #define bswab16(b16) ((__force __le16) swab16((__force __u16) (b16)))
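/* bnx2x_csum_fix() below folds the one's-complement checksum of the |fix|
 * bytes just before t_header out of 'csum' (fix > 0), or adds the checksum
 * of the bytes starting at t_header back in (fix < 0), then byte-swaps the
 * result into the __le16 form the parse BD expects. The intent, compensating
 * for where the stack started checksumming, is inferred from the callers
 * rather than documented here.
 */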
3147 static __le16 bnx2x_csum_fix(unsigned char *t_header, u16 csum, s8 fix)
3148 {
3149 __sum16 tsum = (__force __sum16) csum;
3150
3151 if (fix > 0)
3152 tsum = ~csum_fold(csum_sub((__force __wsum) csum,
3153 csum_partial(t_header - fix, fix, 0)));
3154
3155 else if (fix < 0)
3156 tsum = ~csum_fold(csum_add((__force __wsum) csum,
3157 csum_partial(t_header, -fix, 0)));
3158
3159 return bswab16(tsum);
3160 }
3161
3162 static u32 bnx2x_xmit_type(struct bnx2x *bp, struct sk_buff *skb)
3163 {
3164 u32 rc;
3165 __u8 prot = 0;
3166 __be16 protocol;
3167
3168 if (skb->ip_summed != CHECKSUM_PARTIAL)
3169 return XMIT_PLAIN;
3170
3171 protocol = vlan_get_protocol(skb);
3172 if (protocol == htons(ETH_P_IPV6)) {
3173 rc = XMIT_CSUM_V6;
3174 prot = ipv6_hdr(skb)->nexthdr;
3175 } else {
3176 rc = XMIT_CSUM_V4;
3177 prot = ip_hdr(skb)->protocol;
3178 }
3179
3180 if (!CHIP_IS_E1x(bp) && skb->encapsulation) {
3181 if (inner_ip_hdr(skb)->version == 6) {
3182 rc |= XMIT_CSUM_ENC_V6;
3183 if (inner_ipv6_hdr(skb)->nexthdr == IPPROTO_TCP)
3184 rc |= XMIT_CSUM_TCP;
3185 } else {
3186 rc |= XMIT_CSUM_ENC_V4;
3187 if (inner_ip_hdr(skb)->protocol == IPPROTO_TCP)
3188 rc |= XMIT_CSUM_TCP;
3189 }
3190 }
3191 if (prot == IPPROTO_TCP)
3192 rc |= XMIT_CSUM_TCP;
3193
3194 if (skb_is_gso_v6(skb)) {
3195 rc |= (XMIT_GSO_V6 | XMIT_CSUM_TCP);
3196 if (rc & XMIT_CSUM_ENC)
3197 rc |= XMIT_GSO_ENC_V6;
3198 } else if (skb_is_gso(skb)) {
3199 rc |= (XMIT_GSO_V4 | XMIT_CSUM_TCP);
3200 if (rc & XMIT_CSUM_ENC)
3201 rc |= XMIT_GSO_ENC_V4;
3202 }
3203
3204 return rc;
3205 }
3206
3207 #if (MAX_SKB_FRAGS >= MAX_FETCH_BD - 3)
3208 /* check if packet requires linearization (packet is too fragmented)
3209 no need to check fragmentation if page size > 8K (there will be no
3210 violation of FW restrictions) */
3211 static int bnx2x_pkt_req_lin(struct bnx2x *bp, struct sk_buff *skb,
3212 u32 xmit_type)
3213 {
3214 int to_copy = 0;
3215 int hlen = 0;
3216 int first_bd_sz = 0;
3217
3218 /* 3 = 1 (for linear data BD) + 2 (for PBD and last BD) */
3219 if (skb_shinfo(skb)->nr_frags >= (MAX_FETCH_BD - 3)) {
3220
3221 if (xmit_type & XMIT_GSO) {
3222 unsigned short lso_mss = skb_shinfo(skb)->gso_size;
3223 /* Check if LSO packet needs to be copied:
3224 3 = 1 (for headers BD) + 2 (for PBD and last BD) */
3225 int wnd_size = MAX_FETCH_BD - 3;
3226 /* Number of windows to check */
3227 int num_wnds = skb_shinfo(skb)->nr_frags - wnd_size;
3228 int wnd_idx = 0;
3229 int frag_idx = 0;
3230 u32 wnd_sum = 0;
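/* The loop below slides a window of wnd_size consecutive BDs (linear part
 * plus frags) over the packet and flags the skb for linearization if any
 * window carries less than one MSS of payload, since the FW restriction
 * mentioned above appears to require an MSS worth of data within every
 * such window.
 */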
3231
3232 /* Headers length */
3233 hlen = (int)(skb_transport_header(skb) - skb->data) +
3234 tcp_hdrlen(skb);
3235
3236 /* Amount of data (w/o headers) on linear part of SKB*/
3237 first_bd_sz = skb_headlen(skb) - hlen;
3238
3239 wnd_sum = first_bd_sz;
3240
3241 /* Calculate the first sum - it's special */
3242 for (frag_idx = 0; frag_idx < wnd_size - 1; frag_idx++)
3243 wnd_sum +=
3244 skb_frag_size(&skb_shinfo(skb)->frags[frag_idx]);
3245
3246 /* If there was data on linear skb data - check it */
3247 if (first_bd_sz > 0) {
3248 if (unlikely(wnd_sum < lso_mss)) {
3249 to_copy = 1;
3250 goto exit_lbl;
3251 }
3252
3253 wnd_sum -= first_bd_sz;
3254 }
3255
3256 /* Others are easier: run through the frag list and
3257 check all windows */
3258 for (wnd_idx = 0; wnd_idx <= num_wnds; wnd_idx++) {
3259 wnd_sum +=
3260 skb_frag_size(&skb_shinfo(skb)->frags[wnd_idx + wnd_size - 1]);
3261
3262 if (unlikely(wnd_sum < lso_mss)) {
3263 to_copy = 1;
3264 break;
3265 }
3266 wnd_sum -=
3267 skb_frag_size(&skb_shinfo(skb)->frags[wnd_idx]);
3268 }
3269 } else {
3270 /* in the non-LSO case, a too-fragmented packet should
3271 always be linearized */
3272 to_copy = 1;
3273 }
3274 }
3275
3276 exit_lbl:
3277 if (unlikely(to_copy))
3278 DP(NETIF_MSG_TX_QUEUED,
3279 "Linearization IS REQUIRED for %s packet. num_frags %d hlen %d first_bd_sz %d\n",
3280 (xmit_type & XMIT_GSO) ? "LSO" : "non-LSO",
3281 skb_shinfo(skb)->nr_frags, hlen, first_bd_sz);
3282
3283 return to_copy;
3284 }
3285 #endif
3286
3287 static void bnx2x_set_pbd_gso_e2(struct sk_buff *skb, u32 *parsing_data,
3288 u32 xmit_type)
3289 {
3290 struct ipv6hdr *ipv6;
3291
3292 *parsing_data |= (skb_shinfo(skb)->gso_size <<
3293 ETH_TX_PARSE_BD_E2_LSO_MSS_SHIFT) &
3294 ETH_TX_PARSE_BD_E2_LSO_MSS;
3295
3296 if (xmit_type & XMIT_GSO_ENC_V6)
3297 ipv6 = inner_ipv6_hdr(skb);
3298 else if (xmit_type & XMIT_GSO_V6)
3299 ipv6 = ipv6_hdr(skb);
3300 else
3301 ipv6 = NULL;
3302
3303 if (ipv6 && ipv6->nexthdr == NEXTHDR_IPV6)
3304 *parsing_data |= ETH_TX_PARSE_BD_E2_IPV6_WITH_EXT_HDR;
3305 }
3306
3307 /**
3308 * bnx2x_set_pbd_gso - update PBD in GSO case.
3309 *
3310 * @skb: packet skb
3311 * @pbd: parse BD
3312 * @xmit_type: xmit flags
3313 */
3314 static void bnx2x_set_pbd_gso(struct sk_buff *skb,
3315 struct eth_tx_parse_bd_e1x *pbd,
3316 struct eth_tx_start_bd *tx_start_bd,
3317 u32 xmit_type)
3318 {
3319 pbd->lso_mss = cpu_to_le16(skb_shinfo(skb)->gso_size);
3320 pbd->tcp_send_seq = bswab32(tcp_hdr(skb)->seq);
3321 pbd->tcp_flags = pbd_tcp_flags(tcp_hdr(skb));
3322
3323 if (xmit_type & XMIT_GSO_V4) {
3324 pbd->ip_id = bswab16(ip_hdr(skb)->id);
3325 pbd->tcp_pseudo_csum =
3326 bswab16(~csum_tcpudp_magic(ip_hdr(skb)->saddr,
3327 ip_hdr(skb)->daddr,
3328 0, IPPROTO_TCP, 0));
3329
3330 /* GSO on 57710/57711 needs FW to calculate IP checksum */
3331 tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_IP_CSUM;
3332 } else {
3333 pbd->tcp_pseudo_csum =
3334 bswab16(~csum_ipv6_magic(&ipv6_hdr(skb)->saddr,
3335 &ipv6_hdr(skb)->daddr,
3336 0, IPPROTO_TCP, 0));
3337 }
3338
3339 pbd->global_data |=
3340 cpu_to_le16(ETH_TX_PARSE_BD_E1X_PSEUDO_CS_WITHOUT_LEN);
3341 }
3342
3343 /**
3344 * bnx2x_set_pbd_csum_enc - update PBD with checksum and return header length
3345 *
3346 * @bp: driver handle
3347 * @skb: packet skb
3348 * @parsing_data: data to be updated
3349 * @xmit_type: xmit flags
3350 *
3351 * 57712/578xx related, when skb has encapsulation
3352 */
3353 static u8 bnx2x_set_pbd_csum_enc(struct bnx2x *bp, struct sk_buff *skb,
3354 u32 *parsing_data, u32 xmit_type)
3355 {
3356 *parsing_data |=
3357 ((((u8 *)skb_inner_transport_header(skb) - skb->data) >> 1) <<
3358 ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W_SHIFT) &
3359 ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W;
3360
3361 if (xmit_type & XMIT_CSUM_TCP) {
3362 *parsing_data |= ((inner_tcp_hdrlen(skb) / 4) <<
3363 ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW_SHIFT) &
3364 ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW;
3365
3366 return skb_inner_transport_header(skb) +
3367 inner_tcp_hdrlen(skb) - skb->data;
3368 }
3369
3370 /* We support checksum offload for TCP and UDP only.
3371 * No need to pass the UDP header length - it's a constant.
3372 */
3373 return skb_inner_transport_header(skb) +
3374 sizeof(struct udphdr) - skb->data;
3375 }
3376
3377 /**
3378 * bnx2x_set_pbd_csum_e2 - update PBD with checksum and return header length
3379 *
3380 * @bp: driver handle
3381 * @skb: packet skb
3382 * @parsing_data: data to be updated
3383 * @xmit_type: xmit flags
3384 *
3385 * 57712/578xx related
3386 */
3387 static u8 bnx2x_set_pbd_csum_e2(struct bnx2x *bp, struct sk_buff *skb,
3388 u32 *parsing_data, u32 xmit_type)
3389 {
3390 *parsing_data |=
3391 ((((u8 *)skb_transport_header(skb) - skb->data) >> 1) <<
3392 ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W_SHIFT) &
3393 ETH_TX_PARSE_BD_E2_L4_HDR_START_OFFSET_W;
3394
3395 if (xmit_type & XMIT_CSUM_TCP) {
3396 *parsing_data |= ((tcp_hdrlen(skb) / 4) <<
3397 ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW_SHIFT) &
3398 ETH_TX_PARSE_BD_E2_TCP_HDR_LENGTH_DW;
3399
3400 return skb_transport_header(skb) + tcp_hdrlen(skb) - skb->data;
3401 }
3402 /* We support checksum offload for TCP and UDP only.
3403 * No need to pass the UDP header length - it's a constant.
3404 */
3405 return skb_transport_header(skb) + sizeof(struct udphdr) - skb->data;
3406 }
3407
3408 /* set FW indication according to inner or outer protocols if tunneled */
3409 static void bnx2x_set_sbd_csum(struct bnx2x *bp, struct sk_buff *skb,
3410 struct eth_tx_start_bd *tx_start_bd,
3411 u32 xmit_type)
3412 {
3413 tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_L4_CSUM;
3414
3415 if (xmit_type & (XMIT_CSUM_ENC_V6 | XMIT_CSUM_V6))
3416 tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_IPV6;
3417
3418 if (!(xmit_type & XMIT_CSUM_TCP))
3419 tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_IS_UDP;
3420 }
3421
3422 /**
3423 * bnx2x_set_pbd_csum - update PBD with checksum and return header length
3424 *
3425 * @bp: driver handle
3426 * @skb: packet skb
3427 * @pbd: parse BD to be updated
3428 * @xmit_type: xmit flags
3429 */
3430 static u8 bnx2x_set_pbd_csum(struct bnx2x *bp, struct sk_buff *skb,
3431 struct eth_tx_parse_bd_e1x *pbd,
3432 u32 xmit_type)
3433 {
3434 u8 hlen = (skb_network_header(skb) - skb->data) >> 1;
3435
3436 /* for now NS flag is not used in Linux */
3437 pbd->global_data =
3438 cpu_to_le16(hlen |
3439 ((skb->protocol == cpu_to_be16(ETH_P_8021Q)) <<
3440 ETH_TX_PARSE_BD_E1X_LLC_SNAP_EN_SHIFT));
3441
3442 pbd->ip_hlen_w = (skb_transport_header(skb) -
3443 skb_network_header(skb)) >> 1;
3444
3445 hlen += pbd->ip_hlen_w;
3446
3447 /* We support checksum offload for TCP and UDP only */
3448 if (xmit_type & XMIT_CSUM_TCP)
3449 hlen += tcp_hdrlen(skb) / 2;
3450 else
3451 hlen += sizeof(struct udphdr) / 2;
3452
3453 pbd->total_hlen_w = cpu_to_le16(hlen);
3454 hlen = hlen*2;
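/* Header lengths handed to the parse BD are expressed in 16-bit words
 * (hence the >> 1 conversions above), while the value returned to the
 * caller is converted back to a byte count here.
 */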
3455
3456 if (xmit_type & XMIT_CSUM_TCP) {
3457 pbd->tcp_pseudo_csum = bswab16(tcp_hdr(skb)->check);
3458
3459 } else {
3460 s8 fix = SKB_CS_OFF(skb); /* signed! */
3461
3462 DP(NETIF_MSG_TX_QUEUED,
3463 "hlen %d fix %d csum before fix %x\n",
3464 le16_to_cpu(pbd->total_hlen_w), fix, SKB_CS(skb));
3465
3466 /* HW bug: fixup the CSUM */
3467 pbd->tcp_pseudo_csum =
3468 bnx2x_csum_fix(skb_transport_header(skb),
3469 SKB_CS(skb), fix);
3470
3471 DP(NETIF_MSG_TX_QUEUED, "csum after fix %x\n",
3472 pbd->tcp_pseudo_csum);
3473 }
3474
3475 return hlen;
3476 }
3477
3478 static void bnx2x_update_pbds_gso_enc(struct sk_buff *skb,
3479 struct eth_tx_parse_bd_e2 *pbd_e2,
3480 struct eth_tx_parse_2nd_bd *pbd2,
3481 u16 *global_data,
3482 u32 xmit_type)
3483 {
3484 u16 hlen_w = 0;
3485 u8 outerip_off, outerip_len = 0;
3486
3487 /* from outer IP to transport */
3488 hlen_w = (skb_inner_transport_header(skb) -
3489 skb_network_header(skb)) >> 1;
3490
3491 /* transport len */
3492 hlen_w += inner_tcp_hdrlen(skb) >> 1;
3493
3494 pbd2->fw_ip_hdr_to_payload_w = hlen_w;
3495
3496 /* outer IP header info */
3497 if (xmit_type & XMIT_CSUM_V4) {
3498 struct iphdr *iph = ip_hdr(skb);
3499 pbd2->fw_ip_csum_wo_len_flags_frag =
3500 bswab16(csum_fold((~iph->check) -
3501 iph->tot_len - iph->frag_off));
3502 } else {
3503 pbd2->fw_ip_hdr_to_payload_w =
3504 hlen_w - ((sizeof(struct ipv6hdr)) >> 1);
3505 }
3506
3507 pbd2->tcp_send_seq = bswab32(inner_tcp_hdr(skb)->seq);
3508
3509 pbd2->tcp_flags = pbd_tcp_flags(inner_tcp_hdr(skb));
3510
3511 if (xmit_type & XMIT_GSO_V4) {
3512 pbd2->hw_ip_id = bswab16(inner_ip_hdr(skb)->id);
3513
3514 pbd_e2->data.tunnel_data.pseudo_csum =
3515 bswab16(~csum_tcpudp_magic(
3516 inner_ip_hdr(skb)->saddr,
3517 inner_ip_hdr(skb)->daddr,
3518 0, IPPROTO_TCP, 0));
3519
3520 outerip_len = ip_hdr(skb)->ihl << 1;
3521 } else {
3522 pbd_e2->data.tunnel_data.pseudo_csum =
3523 bswab16(~csum_ipv6_magic(
3524 &inner_ipv6_hdr(skb)->saddr,
3525 &inner_ipv6_hdr(skb)->daddr,
3526 0, IPPROTO_TCP, 0));
3527 }
3528
3529 outerip_off = (skb_network_header(skb) - skb->data) >> 1;
3530
3531 *global_data |=
3532 outerip_off |
3533 (!!(xmit_type & XMIT_CSUM_V6) <<
3534 ETH_TX_PARSE_2ND_BD_IP_HDR_TYPE_OUTER_SHIFT) |
3535 (outerip_len <<
3536 ETH_TX_PARSE_2ND_BD_IP_HDR_LEN_OUTER_W_SHIFT) |
3537 ((skb->protocol == cpu_to_be16(ETH_P_8021Q)) <<
3538 ETH_TX_PARSE_2ND_BD_LLC_SNAP_EN_SHIFT);
3539
3540 if (ip_hdr(skb)->protocol == IPPROTO_UDP) {
3541 SET_FLAG(*global_data, ETH_TX_PARSE_2ND_BD_TUNNEL_UDP_EXIST, 1);
3542 pbd2->tunnel_udp_hdr_start_w = skb_transport_offset(skb) >> 1;
3543 }
3544 }
3545
3546 /* called with netif_tx_lock
3547 * bnx2x_tx_int() runs without netif_tx_lock unless it needs to call
3548 * netif_wake_queue()
3549 */
3550 netdev_tx_t bnx2x_start_xmit(struct sk_buff *skb, struct net_device *dev)
3551 {
3552 struct bnx2x *bp = netdev_priv(dev);
3553
3554 struct netdev_queue *txq;
3555 struct bnx2x_fp_txdata *txdata;
3556 struct sw_tx_bd *tx_buf;
3557 struct eth_tx_start_bd *tx_start_bd, *first_bd;
3558 struct eth_tx_bd *tx_data_bd, *total_pkt_bd = NULL;
3559 struct eth_tx_parse_bd_e1x *pbd_e1x = NULL;
3560 struct eth_tx_parse_bd_e2 *pbd_e2 = NULL;
3561 struct eth_tx_parse_2nd_bd *pbd2 = NULL;
3562 u32 pbd_e2_parsing_data = 0;
3563 u16 pkt_prod, bd_prod;
3564 int nbd, txq_index;
3565 dma_addr_t mapping;
3566 u32 xmit_type = bnx2x_xmit_type(bp, skb);
3567 int i;
3568 u8 hlen = 0;
3569 __le16 pkt_size = 0;
3570 struct ethhdr *eth;
3571 u8 mac_type = UNICAST_ADDRESS;
3572
3573 #ifdef BNX2X_STOP_ON_ERROR
3574 if (unlikely(bp->panic))
3575 return NETDEV_TX_BUSY;
3576 #endif
3577
3578 txq_index = skb_get_queue_mapping(skb);
3579 txq = netdev_get_tx_queue(dev, txq_index);
3580
3581 BUG_ON(txq_index >= MAX_ETH_TXQ_IDX(bp) + (CNIC_LOADED(bp) ? 1 : 0));
3582
3583 txdata = &bp->bnx2x_txq[txq_index];
3584
3585 /* enable this debug print to view the transmission queue being used
3586 DP(NETIF_MSG_TX_QUEUED, "indices: txq %d, fp %d, txdata %d\n",
3587 txq_index, fp_index, txdata_index); */
3588
3589 /* enable this debug print to view the transmission details
3590 DP(NETIF_MSG_TX_QUEUED,
3591 "transmitting packet cid %d fp index %d txdata_index %d tx_data ptr %p fp pointer %p\n",
3592 txdata->cid, fp_index, txdata_index, txdata, fp); */
3593
3594 if (unlikely(bnx2x_tx_avail(bp, txdata) <
3595 skb_shinfo(skb)->nr_frags +
3596 BDS_PER_TX_PKT +
3597 NEXT_CNT_PER_TX_PKT(MAX_BDS_PER_TX_PKT))) {
3598 /* Handle special storage cases separately */
3599 if (txdata->tx_ring_size == 0) {
3600 struct bnx2x_eth_q_stats *q_stats =
3601 bnx2x_fp_qstats(bp, txdata->parent_fp);
3602 q_stats->driver_filtered_tx_pkt++;
3603 dev_kfree_skb(skb);
3604 return NETDEV_TX_OK;
3605 }
3606 bnx2x_fp_qstats(bp, txdata->parent_fp)->driver_xoff++;
3607 netif_tx_stop_queue(txq);
3608 BNX2X_ERR("BUG! Tx ring full when queue awake!\n");
3609
3610 return NETDEV_TX_BUSY;
3611 }
3612
3613 DP(NETIF_MSG_TX_QUEUED,
3614 "queue[%d]: SKB: summed %x protocol %x protocol(%x,%x) gso type %x xmit_type %x len %d\n",
3615 txq_index, skb->ip_summed, skb->protocol, ipv6_hdr(skb)->nexthdr,
3616 ip_hdr(skb)->protocol, skb_shinfo(skb)->gso_type, xmit_type,
3617 skb->len);
3618
3619 eth = (struct ethhdr *)skb->data;
3620
3621 /* set flag according to packet type (UNICAST_ADDRESS is default)*/
3622 if (unlikely(is_multicast_ether_addr(eth->h_dest))) {
3623 if (is_broadcast_ether_addr(eth->h_dest))
3624 mac_type = BROADCAST_ADDRESS;
3625 else
3626 mac_type = MULTICAST_ADDRESS;
3627 }
3628
3629 #if (MAX_SKB_FRAGS >= MAX_FETCH_BD - BDS_PER_TX_PKT)
3630 /* First, check if we need to linearize the skb (due to FW
3631 restrictions). No need to check fragmentation if page size > 8K
3632 (there will be no violation of FW restrictions) */
3633 if (bnx2x_pkt_req_lin(bp, skb, xmit_type)) {
3634 /* Statistics of linearization */
3635 bp->lin_cnt++;
3636 if (skb_linearize(skb) != 0) {
3637 DP(NETIF_MSG_TX_QUEUED,
3638 "SKB linearization failed - silently dropping this SKB\n");
3639 dev_kfree_skb_any(skb);
3640 return NETDEV_TX_OK;
3641 }
3642 }
3643 #endif
3644 /* Map skb linear data for DMA */
3645 mapping = dma_map_single(&bp->pdev->dev, skb->data,
3646 skb_headlen(skb), DMA_TO_DEVICE);
3647 if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
3648 DP(NETIF_MSG_TX_QUEUED,
3649 "SKB mapping failed - silently dropping this SKB\n");
3650 dev_kfree_skb_any(skb);
3651 return NETDEV_TX_OK;
3652 }
3653 /*
3654 Please read carefully. First we use one BD which we mark as start,
3655 then we have a parsing info BD (used for TSO or xsum),
3656 and only then we have the rest of the TSO BDs.
3657 (don't forget to mark the last one as last,
3658 and to unmap only AFTER you write to the BD ...)
3659 And above all, all pbd sizes are in words - NOT DWORDS!
3660 */
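/* A rough sketch of the resulting BD chain for a typical offloaded packet
 * (illustrative only - the exact chain depends on the chip family, on
 * tunneling and on whether the header is split out for TSO):
 *
 *	start BD (headers) -> parse BD (e1x or e2) ->
 *	[2nd parse BD - tunneled traffic only] ->
 *	[extra header BD - TSO with headlen > hlen only] ->
 *	one data BD per frag, the last one marked as last
 */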
3661
3662 /* get current pkt produced now - advance it just before sending packet
3663 * since mapping of pages may fail and cause packet to be dropped
3664 */
3665 pkt_prod = txdata->tx_pkt_prod;
3666 bd_prod = TX_BD(txdata->tx_bd_prod);
3667
3668 /* get a tx_buf and first BD
3669 * tx_start_bd may be changed during SPLIT,
3670 * but first_bd will always stay first
3671 */
3672 tx_buf = &txdata->tx_buf_ring[TX_BD(pkt_prod)];
3673 tx_start_bd = &txdata->tx_desc_ring[bd_prod].start_bd;
3674 first_bd = tx_start_bd;
3675
3676 tx_start_bd->bd_flags.as_bitfield = ETH_TX_BD_FLAGS_START_BD;
3677
3678 /* header nbd: indirectly zero other flags! */
3679 tx_start_bd->general_data = 1 << ETH_TX_START_BD_HDR_NBDS_SHIFT;
3680
3681 /* remember the first BD of the packet */
3682 tx_buf->first_bd = txdata->tx_bd_prod;
3683 tx_buf->skb = skb;
3684 tx_buf->flags = 0;
3685
3686 DP(NETIF_MSG_TX_QUEUED,
3687 "sending pkt %u @%p next_idx %u bd %u @%p\n",
3688 pkt_prod, tx_buf, txdata->tx_pkt_prod, bd_prod, tx_start_bd);
3689
3690 if (vlan_tx_tag_present(skb)) {
3691 tx_start_bd->vlan_or_ethertype =
3692 cpu_to_le16(vlan_tx_tag_get(skb));
3693 tx_start_bd->bd_flags.as_bitfield |=
3694 (X_ETH_OUTBAND_VLAN << ETH_TX_BD_FLAGS_VLAN_MODE_SHIFT);
3695 } else {
3696 /* when transmitting in a vf, start bd must hold the ethertype
3697 * for fw to enforce it
3698 */
3699 if (IS_VF(bp))
3700 tx_start_bd->vlan_or_ethertype =
3701 cpu_to_le16(ntohs(eth->h_proto));
3702 else
3703 /* used by FW for packet accounting */
3704 tx_start_bd->vlan_or_ethertype = cpu_to_le16(pkt_prod);
3705 }
3706
3707 nbd = 2; /* start_bd + pbd + frags (updated when pages are mapped) */
3708
3709 /* turn on parsing and get a BD */
3710 bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3711
3712 if (xmit_type & XMIT_CSUM)
3713 bnx2x_set_sbd_csum(bp, skb, tx_start_bd, xmit_type);
3714
3715 if (!CHIP_IS_E1x(bp)) {
3716 pbd_e2 = &txdata->tx_desc_ring[bd_prod].parse_bd_e2;
3717 memset(pbd_e2, 0, sizeof(struct eth_tx_parse_bd_e2));
3718
3719 if (xmit_type & XMIT_CSUM_ENC) {
3720 u16 global_data = 0;
3721
3722 /* Set PBD in enc checksum offload case */
3723 hlen = bnx2x_set_pbd_csum_enc(bp, skb,
3724 &pbd_e2_parsing_data,
3725 xmit_type);
3726
3727 /* turn on 2nd parsing and get a BD */
3728 bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3729
3730 pbd2 = &txdata->tx_desc_ring[bd_prod].parse_2nd_bd;
3731
3732 memset(pbd2, 0, sizeof(*pbd2));
3733
3734 pbd_e2->data.tunnel_data.ip_hdr_start_inner_w =
3735 (skb_inner_network_header(skb) -
3736 skb->data) >> 1;
3737
3738 if (xmit_type & XMIT_GSO_ENC)
3739 bnx2x_update_pbds_gso_enc(skb, pbd_e2, pbd2,
3740 &global_data,
3741 xmit_type);
3742
3743 pbd2->global_data = cpu_to_le16(global_data);
3744
3745 /* add additional parsing BD indication to the start BD */
3746 SET_FLAG(tx_start_bd->general_data,
3747 ETH_TX_START_BD_PARSE_NBDS, 1);
3748 /* set encapsulation flag in start BD */
3749 SET_FLAG(tx_start_bd->general_data,
3750 ETH_TX_START_BD_TUNNEL_EXIST, 1);
3751 nbd++;
3752 } else if (xmit_type & XMIT_CSUM) {
3753 /* Set PBD in checksum offload case w/o encapsulation */
3754 hlen = bnx2x_set_pbd_csum_e2(bp, skb,
3755 &pbd_e2_parsing_data,
3756 xmit_type);
3757 }
3758
3759 /* Add the MACs to the parsing BD if this is a VF */
3760 if (IS_VF(bp)) {
3761 /* override GRE parameters in BD */
3762 bnx2x_set_fw_mac_addr(&pbd_e2->data.mac_addr.src_hi,
3763 &pbd_e2->data.mac_addr.src_mid,
3764 &pbd_e2->data.mac_addr.src_lo,
3765 eth->h_source);
3766
3767 bnx2x_set_fw_mac_addr(&pbd_e2->data.mac_addr.dst_hi,
3768 &pbd_e2->data.mac_addr.dst_mid,
3769 &pbd_e2->data.mac_addr.dst_lo,
3770 eth->h_dest);
3771 }
3772
3773 SET_FLAG(pbd_e2_parsing_data,
3774 ETH_TX_PARSE_BD_E2_ETH_ADDR_TYPE, mac_type);
3775 } else {
3776 u16 global_data = 0;
3777 pbd_e1x = &txdata->tx_desc_ring[bd_prod].parse_bd_e1x;
3778 memset(pbd_e1x, 0, sizeof(struct eth_tx_parse_bd_e1x));
3779 /* Set PBD in checksum offload case */
3780 if (xmit_type & XMIT_CSUM)
3781 hlen = bnx2x_set_pbd_csum(bp, skb, pbd_e1x, xmit_type);
3782
3783 SET_FLAG(global_data,
3784 ETH_TX_PARSE_BD_E1X_ETH_ADDR_TYPE, mac_type);
3785 pbd_e1x->global_data |= cpu_to_le16(global_data);
3786 }
3787
3788 /* Setup the data pointer of the first BD of the packet */
3789 tx_start_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
3790 tx_start_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
3791 tx_start_bd->nbytes = cpu_to_le16(skb_headlen(skb));
3792 pkt_size = tx_start_bd->nbytes;
3793
3794 DP(NETIF_MSG_TX_QUEUED,
3795 "first bd @%p addr (%x:%x) nbytes %d flags %x vlan %x\n",
3796 tx_start_bd, tx_start_bd->addr_hi, tx_start_bd->addr_lo,
3797 le16_to_cpu(tx_start_bd->nbytes),
3798 tx_start_bd->bd_flags.as_bitfield,
3799 le16_to_cpu(tx_start_bd->vlan_or_ethertype));
3800
3801 if (xmit_type & XMIT_GSO) {
3802
3803 DP(NETIF_MSG_TX_QUEUED,
3804 "TSO packet len %d hlen %d total len %d tso size %d\n",
3805 skb->len, hlen, skb_headlen(skb),
3806 skb_shinfo(skb)->gso_size);
3807
3808 tx_start_bd->bd_flags.as_bitfield |= ETH_TX_BD_FLAGS_SW_LSO;
3809
3810 if (unlikely(skb_headlen(skb) > hlen)) {
3811 nbd++;
3812 bd_prod = bnx2x_tx_split(bp, txdata, tx_buf,
3813 &tx_start_bd, hlen,
3814 bd_prod);
3815 }
3816 if (!CHIP_IS_E1x(bp))
3817 bnx2x_set_pbd_gso_e2(skb, &pbd_e2_parsing_data,
3818 xmit_type);
3819 else
3820 bnx2x_set_pbd_gso(skb, pbd_e1x, first_bd, xmit_type);
3821 }
3822
3823 /* Set the PBD's parsing_data field if not zero
3824 * (for the chips newer than 57711).
3825 */
3826 if (pbd_e2_parsing_data)
3827 pbd_e2->parsing_data = cpu_to_le32(pbd_e2_parsing_data);
3828
3829 tx_data_bd = (struct eth_tx_bd *)tx_start_bd;
3830
3831 /* Handle fragmented skb */
3832 for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
3833 skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
3834
3835 mapping = skb_frag_dma_map(&bp->pdev->dev, frag, 0,
3836 skb_frag_size(frag), DMA_TO_DEVICE);
3837 if (unlikely(dma_mapping_error(&bp->pdev->dev, mapping))) {
3838 unsigned int pkts_compl = 0, bytes_compl = 0;
3839
3840 DP(NETIF_MSG_TX_QUEUED,
3841 "Unable to map page - dropping packet...\n");
3842
3843 /* we need to unmap all buffers already mapped
3844 * for this SKB;
3845 * first_bd->nbd needs to be properly updated
3846 * before the call to bnx2x_free_tx_pkt
3847 */
3848 first_bd->nbd = cpu_to_le16(nbd);
3849 bnx2x_free_tx_pkt(bp, txdata,
3850 TX_BD(txdata->tx_pkt_prod),
3851 &pkts_compl, &bytes_compl);
3852 return NETDEV_TX_OK;
3853 }
3854
3855 bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3856 tx_data_bd = &txdata->tx_desc_ring[bd_prod].reg_bd;
3857 if (total_pkt_bd == NULL)
3858 total_pkt_bd = &txdata->tx_desc_ring[bd_prod].reg_bd;
3859
3860 tx_data_bd->addr_hi = cpu_to_le32(U64_HI(mapping));
3861 tx_data_bd->addr_lo = cpu_to_le32(U64_LO(mapping));
3862 tx_data_bd->nbytes = cpu_to_le16(skb_frag_size(frag));
3863 le16_add_cpu(&pkt_size, skb_frag_size(frag));
3864 nbd++;
3865
3866 DP(NETIF_MSG_TX_QUEUED,
3867 "frag %d bd @%p addr (%x:%x) nbytes %d\n",
3868 i, tx_data_bd, tx_data_bd->addr_hi, tx_data_bd->addr_lo,
3869 le16_to_cpu(tx_data_bd->nbytes));
3870 }
3871
3872 DP(NETIF_MSG_TX_QUEUED, "last bd @%p\n", tx_data_bd);
3873
3874 /* update with actual num BDs */
3875 first_bd->nbd = cpu_to_le16(nbd);
3876
3877 bd_prod = TX_BD(NEXT_TX_IDX(bd_prod));
3878
3879 /* now send a tx doorbell, counting the next-page BD
3880 * if the packet chain contains or ends with it
3881 */
3882 if (TX_BD_POFF(bd_prod) < nbd)
3883 nbd++;
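/* Illustrative example, assuming TX_BD_POFF() yields a BD's offset within its
 * descriptor page: if a 4-BD packet starts near the end of a page, bd_prod
 * wraps so that its page offset after the packet is smaller than nbd; the
 * chain then also consumed the "next page" pointer BD, hence the increment.
 */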
3884
3885 /* total_pkt_bytes should be set on the first data BD if
3886 * it's not an LSO packet and there is more than one
3887 * data BD. In this case pkt_size is limited by the MTU value.
3888 * However we prefer to set it for an LSO packet as well (while we
3889 * don't have to) in order to save some CPU cycles in the non-LSO
3890 * case, where those cycles matter much more.
3891 */
3892 if (total_pkt_bd != NULL)
3893 total_pkt_bd->total_pkt_bytes = pkt_size;
3894
3895 if (pbd_e1x)
3896 DP(NETIF_MSG_TX_QUEUED,
3897 "PBD (E1X) @%p ip_data %x ip_hlen %u ip_id %u lso_mss %u tcp_flags %x xsum %x seq %u hlen %u\n",
3898 pbd_e1x, pbd_e1x->global_data, pbd_e1x->ip_hlen_w,
3899 pbd_e1x->ip_id, pbd_e1x->lso_mss, pbd_e1x->tcp_flags,
3900 pbd_e1x->tcp_pseudo_csum, pbd_e1x->tcp_send_seq,
3901 le16_to_cpu(pbd_e1x->total_hlen_w));
3902 if (pbd_e2)
3903 DP(NETIF_MSG_TX_QUEUED,
3904 "PBD (E2) @%p dst %x %x %x src %x %x %x parsing_data %x\n",
3905 pbd_e2,
3906 pbd_e2->data.mac_addr.dst_hi,
3907 pbd_e2->data.mac_addr.dst_mid,
3908 pbd_e2->data.mac_addr.dst_lo,
3909 pbd_e2->data.mac_addr.src_hi,
3910 pbd_e2->data.mac_addr.src_mid,
3911 pbd_e2->data.mac_addr.src_lo,
3912 pbd_e2->parsing_data);
3913 DP(NETIF_MSG_TX_QUEUED, "doorbell: nbd %d bd %u\n", nbd, bd_prod);
3914
3915 netdev_tx_sent_queue(txq, skb->len);
3916
3917 skb_tx_timestamp(skb);
3918
3919 txdata->tx_pkt_prod++;
3920 /*
3921 * Make sure that the BD data is updated before updating the producer
3922 * since FW might read the BD right after the producer is updated.
3923 * This is only applicable for weak-ordered memory model archs such
3924 * as IA-64. The following barrier is also mandatory since FW
3925 * assumes packets must have BDs.
3926 */
3927 wmb();
3928
3929 txdata->tx_db.data.prod += nbd;
3930 barrier();
3931
3932 DOORBELL(bp, txdata->cid, txdata->tx_db.raw);
3933
3934 mmiowb();
3935
3936 txdata->tx_bd_prod += nbd;
3937
3938 if (unlikely(bnx2x_tx_avail(bp, txdata) < MAX_DESC_PER_TX_PKT)) {
3939 netif_tx_stop_queue(txq);
3940
3941 /* paired memory barrier is in bnx2x_tx_int(); we have to keep
3942 * the ordering of set_bit() in netif_tx_stop_queue() and the read of
3943 * txdata->tx_bd_cons */
3944 smp_mb();
3945
3946 bnx2x_fp_qstats(bp, txdata->parent_fp)->driver_xoff++;
3947 if (bnx2x_tx_avail(bp, txdata) >= MAX_DESC_PER_TX_PKT)
3948 netif_tx_wake_queue(txq);
3949 }
3950 txdata->tx_pkt++;
3951
3952 return NETDEV_TX_OK;
3953 }
3954
3955 /**
3956 * bnx2x_setup_tc - routine to configure net_device for multi tc
3957 *
3958 * @dev: net device to configure
3959 * @num_tc: number of traffic classes to enable
3960 *
3961 * callback connected to the ndo_setup_tc function pointer
3962 */
3963 int bnx2x_setup_tc(struct net_device *dev, u8 num_tc)
3964 {
3965 int cos, prio, count, offset;
3966 struct bnx2x *bp = netdev_priv(dev);
3967
3968 /* setup tc must be called under rtnl lock */
3969 ASSERT_RTNL();
3970
3971 /* no traffic classes requested. aborting */
3972 if (!num_tc) {
3973 netdev_reset_tc(dev);
3974 return 0;
3975 }
3976
3977 /* requested to support too many traffic classes */
3978 if (num_tc > bp->max_cos) {
3979 BNX2X_ERR("support for too many traffic classes requested: %d. max supported is %d\n",
3980 num_tc, bp->max_cos);
3981 return -EINVAL;
3982 }
3983
3984 /* declare amount of supported traffic classes */
3985 if (netdev_set_num_tc(dev, num_tc)) {
3986 BNX2X_ERR("failed to declare %d traffic classes\n", num_tc);
3987 return -EINVAL;
3988 }
3989
3990 /* configure priority to traffic class mapping */
3991 for (prio = 0; prio < BNX2X_MAX_PRIORITY; prio++) {
3992 netdev_set_prio_tc_map(dev, prio, bp->prio_to_cos[prio]);
3993 DP(BNX2X_MSG_SP | NETIF_MSG_IFUP,
3994 "mapping priority %d to tc %d\n",
3995 prio, bp->prio_to_cos[prio]);
3996 }
3997
3998
3999 /* Use this configuration to differentiate tc0 from other COSes
4000 This can be used for ETS or PFC, and saves the effort of setting
4001 up a multi-class queueing discipline or negotiating DCBX with a switch
4002 netdev_set_prio_tc_map(dev, 0, 0);
4003 DP(BNX2X_MSG_SP, "mapping priority %d to tc %d\n", 0, 0);
4004 for (prio = 1; prio < 16; prio++) {
4005 netdev_set_prio_tc_map(dev, prio, 1);
4006 DP(BNX2X_MSG_SP, "mapping priority %d to tc %d\n", prio, 1);
4007 } */
4008
4009 /* configure traffic class to transmission queue mapping */
4010 for (cos = 0; cos < bp->max_cos; cos++) {
4011 count = BNX2X_NUM_ETH_QUEUES(bp);
4012 offset = cos * BNX2X_NUM_NON_CNIC_QUEUES(bp);
4013 netdev_set_tc_queue(dev, cos, count, offset);
4014 DP(BNX2X_MSG_SP | NETIF_MSG_IFUP,
4015 "mapping tc %d to offset %d count %d\n",
4016 cos, offset, count);
4017 }
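/* Worked example (queue counts are hypothetical): with 4 ETH queues,
 * num_tc == 2 and BNX2X_NUM_NON_CNIC_QUEUES(bp) also 4, the loop above
 * amounts to
 *	netdev_set_tc_queue(dev, 0, 4, 0);
 *	netdev_set_tc_queue(dev, 1, 4, 4);
 * i.e. each traffic class spans all ETH queues, shifted by one COS worth of
 * transmission queues.
 */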
4018
4019 return 0;
4020 }
4021
4022 /* called with rtnl_lock */
4023 int bnx2x_change_mac_addr(struct net_device *dev, void *p)
4024 {
4025 struct sockaddr *addr = p;
4026 struct bnx2x *bp = netdev_priv(dev);
4027 int rc = 0;
4028
4029 if (!bnx2x_is_valid_ether_addr(bp, addr->sa_data)) {
4030 BNX2X_ERR("Requested MAC address is not valid\n");
4031 return -EINVAL;
4032 }
4033
4034 if ((IS_MF_STORAGE_SD(bp) || IS_MF_FCOE_AFEX(bp)) &&
4035 !is_zero_ether_addr(addr->sa_data)) {
4036 BNX2X_ERR("Can't configure non-zero address on iSCSI or FCoE functions in MF-SD mode\n");
4037 return -EINVAL;
4038 }
4039
4040 if (netif_running(dev)) {
4041 rc = bnx2x_set_eth_mac(bp, false);
4042 if (rc)
4043 return rc;
4044 }
4045
4046 memcpy(dev->dev_addr, addr->sa_data, dev->addr_len);
4047
4048 if (netif_running(dev))
4049 rc = bnx2x_set_eth_mac(bp, true);
4050
4051 return rc;
4052 }
4053
4054 static void bnx2x_free_fp_mem_at(struct bnx2x *bp, int fp_index)
4055 {
4056 union host_hc_status_block *sb = &bnx2x_fp(bp, fp_index, status_blk);
4057 struct bnx2x_fastpath *fp = &bp->fp[fp_index];
4058 u8 cos;
4059
4060 /* Common */
4061
4062 if (IS_FCOE_IDX(fp_index)) {
4063 memset(sb, 0, sizeof(union host_hc_status_block));
4064 fp->status_blk_mapping = 0;
4065 } else {
4066 /* status blocks */
4067 if (!CHIP_IS_E1x(bp))
4068 BNX2X_PCI_FREE(sb->e2_sb,
4069 bnx2x_fp(bp, fp_index,
4070 status_blk_mapping),
4071 sizeof(struct host_hc_status_block_e2));
4072 else
4073 BNX2X_PCI_FREE(sb->e1x_sb,
4074 bnx2x_fp(bp, fp_index,
4075 status_blk_mapping),
4076 sizeof(struct host_hc_status_block_e1x));
4077 }
4078
4079 /* Rx */
4080 if (!skip_rx_queue(bp, fp_index)) {
4081 bnx2x_free_rx_bds(fp);
4082
4083 /* fastpath rx rings: rx_buf rx_desc rx_comp */
4084 BNX2X_FREE(bnx2x_fp(bp, fp_index, rx_buf_ring));
4085 BNX2X_PCI_FREE(bnx2x_fp(bp, fp_index, rx_desc_ring),
4086 bnx2x_fp(bp, fp_index, rx_desc_mapping),
4087 sizeof(struct eth_rx_bd) * NUM_RX_BD);
4088
4089 BNX2X_PCI_FREE(bnx2x_fp(bp, fp_index, rx_comp_ring),
4090 bnx2x_fp(bp, fp_index, rx_comp_mapping),
4091 sizeof(struct eth_fast_path_rx_cqe) *
4092 NUM_RCQ_BD);
4093
4094 /* SGE ring */
4095 BNX2X_FREE(bnx2x_fp(bp, fp_index, rx_page_ring));
4096 BNX2X_PCI_FREE(bnx2x_fp(bp, fp_index, rx_sge_ring),
4097 bnx2x_fp(bp, fp_index, rx_sge_mapping),
4098 BCM_PAGE_SIZE * NUM_RX_SGE_PAGES);
4099 }
4100
4101 /* Tx */
4102 if (!skip_tx_queue(bp, fp_index)) {
4103 /* fastpath tx rings: tx_buf tx_desc */
4104 for_each_cos_in_tx_queue(fp, cos) {
4105 struct bnx2x_fp_txdata *txdata = fp->txdata_ptr[cos];
4106
4107 DP(NETIF_MSG_IFDOWN,
4108 "freeing tx memory of fp %d cos %d cid %d\n",
4109 fp_index, cos, txdata->cid);
4110
4111 BNX2X_FREE(txdata->tx_buf_ring);
4112 BNX2X_PCI_FREE(txdata->tx_desc_ring,
4113 txdata->tx_desc_mapping,
4114 sizeof(union eth_tx_bd_types) * NUM_TX_BD);
4115 }
4116 }
4117 /* end of fastpath */
4118 }
4119
4120 void bnx2x_free_fp_mem_cnic(struct bnx2x *bp)
4121 {
4122 int i;
4123 for_each_cnic_queue(bp, i)
4124 bnx2x_free_fp_mem_at(bp, i);
4125 }
4126
4127 void bnx2x_free_fp_mem(struct bnx2x *bp)
4128 {
4129 int i;
4130 for_each_eth_queue(bp, i)
4131 bnx2x_free_fp_mem_at(bp, i);
4132 }
4133
4134 static void set_sb_shortcuts(struct bnx2x *bp, int index)
4135 {
4136 union host_hc_status_block status_blk = bnx2x_fp(bp, index, status_blk);
4137 if (!CHIP_IS_E1x(bp)) {
4138 bnx2x_fp(bp, index, sb_index_values) =
4139 (__le16 *)status_blk.e2_sb->sb.index_values;
4140 bnx2x_fp(bp, index, sb_running_index) =
4141 (__le16 *)status_blk.e2_sb->sb.running_index;
4142 } else {
4143 bnx2x_fp(bp, index, sb_index_values) =
4144 (__le16 *)status_blk.e1x_sb->sb.index_values;
4145 bnx2x_fp(bp, index, sb_running_index) =
4146 (__le16 *)status_blk.e1x_sb->sb.running_index;
4147 }
4148 }
4149
4150 /* Returns the number of actually allocated BDs */
4151 static int bnx2x_alloc_rx_bds(struct bnx2x_fastpath *fp,
4152 int rx_ring_size)
4153 {
4154 struct bnx2x *bp = fp->bp;
4155 u16 ring_prod, cqe_ring_prod;
4156 int i, failure_cnt = 0;
4157
4158 fp->rx_comp_cons = 0;
4159 cqe_ring_prod = ring_prod = 0;
4160
4161 /* This routine is called only during fp init so
4162 * fp->eth_q_stats.rx_skb_alloc_failed = 0
4163 */
4164 for (i = 0; i < rx_ring_size; i++) {
4165 if (bnx2x_alloc_rx_data(bp, fp, ring_prod) < 0) {
4166 failure_cnt++;
4167 continue;
4168 }
4169 ring_prod = NEXT_RX_IDX(ring_prod);
4170 cqe_ring_prod = NEXT_RCQ_IDX(cqe_ring_prod);
4171 WARN_ON(ring_prod <= (i - failure_cnt));
4172 }
4173
4174 if (failure_cnt)
4175 BNX2X_ERR("was only able to allocate %d rx skbs on queue[%d]\n",
4176 i - failure_cnt, fp->index);
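/* Example with illustrative numbers: for rx_ring_size == 512 and two failed
 * allocations, the ring is left with 510 BDs, rx_skb_alloc_failed is bumped
 * by 2 below and 510 is returned to the caller.
 */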
4177
4178 fp->rx_bd_prod = ring_prod;
4179 /* Limit the CQE producer by the CQE ring size */
4180 fp->rx_comp_prod = min_t(u16, NUM_RCQ_RINGS*RCQ_DESC_CNT,
4181 cqe_ring_prod);
4182 fp->rx_pkt = fp->rx_calls = 0;
4183
4184 bnx2x_fp_stats(bp, fp)->eth_q_stats.rx_skb_alloc_failed += failure_cnt;
4185
4186 return i - failure_cnt;
4187 }
4188
4189 static void bnx2x_set_next_page_rx_cq(struct bnx2x_fastpath *fp)
4190 {
4191 int i;
4192
4193 for (i = 1; i <= NUM_RCQ_RINGS; i++) {
4194 struct eth_rx_cqe_next_page *nextpg;
4195
4196 nextpg = (struct eth_rx_cqe_next_page *)
4197 &fp->rx_comp_ring[RCQ_DESC_CNT * i - 1];
4198 nextpg->addr_hi =
4199 cpu_to_le32(U64_HI(fp->rx_comp_mapping +
4200 BCM_PAGE_SIZE*(i % NUM_RCQ_RINGS)));
4201 nextpg->addr_lo =
4202 cpu_to_le32(U64_LO(fp->rx_comp_mapping +
4203 BCM_PAGE_SIZE*(i % NUM_RCQ_RINGS)));
4204 }
4205 }
4206
4207 static int bnx2x_alloc_fp_mem_at(struct bnx2x *bp, int index)
4208 {
4209 union host_hc_status_block *sb;
4210 struct bnx2x_fastpath *fp = &bp->fp[index];
4211 int ring_size = 0;
4212 u8 cos;
4213 int rx_ring_size = 0;
4214
4215 if (!bp->rx_ring_size &&
4216 (IS_MF_STORAGE_SD(bp) || IS_MF_FCOE_AFEX(bp))) {
4217 rx_ring_size = MIN_RX_SIZE_NONTPA;
4218 bp->rx_ring_size = rx_ring_size;
4219 } else if (!bp->rx_ring_size) {
4220 rx_ring_size = MAX_RX_AVAIL/BNX2X_NUM_RX_QUEUES(bp);
4221
4222 if (CHIP_IS_E3(bp)) {
4223 u32 cfg = SHMEM_RD(bp,
4224 dev_info.port_hw_config[BP_PORT(bp)].
4225 default_cfg);
4226
4227 /* Decrease ring size for 1G functions */
4228 if ((cfg & PORT_HW_CFG_NET_SERDES_IF_MASK) ==
4229 PORT_HW_CFG_NET_SERDES_IF_SGMII)
4230 rx_ring_size /= 10;
4231 }
4232
4233 /* allocate at least number of buffers required by FW */
4234 rx_ring_size = max_t(int, bp->disable_tpa ? MIN_RX_SIZE_NONTPA :
4235 MIN_RX_SIZE_TPA, rx_ring_size);
4236
4237 bp->rx_ring_size = rx_ring_size;
4238 } else /* if rx_ring_size specified - use it */
4239 rx_ring_size = bp->rx_ring_size;
4240
4241 DP(BNX2X_MSG_SP, "calculated rx_ring_size %d\n", rx_ring_size);
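/* Illustrative arithmetic with hypothetical values: if MAX_RX_AVAIL were 4096
 * and 8 RX queues were in use, rx_ring_size would start at 512; on an E3 1G
 * SGMII port it would be cut to 51 and then raised back to the FW minimum
 * (MIN_RX_SIZE_TPA, or MIN_RX_SIZE_NONTPA when TPA is disabled).
 */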
4242
4243 /* Common */
4244 sb = &bnx2x_fp(bp, index, status_blk);
4245
4246 if (!IS_FCOE_IDX(index)) {
4247 /* status blocks */
4248 if (!CHIP_IS_E1x(bp))
4249 BNX2X_PCI_ALLOC(sb->e2_sb,
4250 &bnx2x_fp(bp, index, status_blk_mapping),
4251 sizeof(struct host_hc_status_block_e2));
4252 else
4253 BNX2X_PCI_ALLOC(sb->e1x_sb,
4254 &bnx2x_fp(bp, index, status_blk_mapping),
4255 sizeof(struct host_hc_status_block_e1x));
4256 }
4257
4258 /* FCoE Queue uses Default SB and doesn't ACK the SB, thus no need to
4259 * set shortcuts for it.
4260 */
4261 if (!IS_FCOE_IDX(index))
4262 set_sb_shortcuts(bp, index);
4263
4264 /* Tx */
4265 if (!skip_tx_queue(bp, index)) {
4266 /* fastpath tx rings: tx_buf tx_desc */
4267 for_each_cos_in_tx_queue(fp, cos) {
4268 struct bnx2x_fp_txdata *txdata = fp->txdata_ptr[cos];
4269
4270 DP(NETIF_MSG_IFUP,
4271 "allocating tx memory of fp %d cos %d\n",
4272 index, cos);
4273
4274 BNX2X_ALLOC(txdata->tx_buf_ring,
4275 sizeof(struct sw_tx_bd) * NUM_TX_BD);
4276 BNX2X_PCI_ALLOC(txdata->tx_desc_ring,
4277 &txdata->tx_desc_mapping,
4278 sizeof(union eth_tx_bd_types) * NUM_TX_BD);
4279 }
4280 }
4281
4282 /* Rx */
4283 if (!skip_rx_queue(bp, index)) {
4284 /* fastpath rx rings: rx_buf rx_desc rx_comp */
4285 BNX2X_ALLOC(bnx2x_fp(bp, index, rx_buf_ring),
4286 sizeof(struct sw_rx_bd) * NUM_RX_BD);
4287 BNX2X_PCI_ALLOC(bnx2x_fp(bp, index, rx_desc_ring),
4288 &bnx2x_fp(bp, index, rx_desc_mapping),
4289 sizeof(struct eth_rx_bd) * NUM_RX_BD);
4290
4291 BNX2X_PCI_ALLOC(bnx2x_fp(bp, index, rx_comp_ring),
4292 &bnx2x_fp(bp, index, rx_comp_mapping),
4293 sizeof(struct eth_fast_path_rx_cqe) *
4294 NUM_RCQ_BD);
4295
4296 /* SGE ring */
4297 BNX2X_ALLOC(bnx2x_fp(bp, index, rx_page_ring),
4298 sizeof(struct sw_rx_page) * NUM_RX_SGE);
4299 BNX2X_PCI_ALLOC(bnx2x_fp(bp, index, rx_sge_ring),
4300 &bnx2x_fp(bp, index, rx_sge_mapping),
4301 BCM_PAGE_SIZE * NUM_RX_SGE_PAGES);
4302 /* RX BD ring */
4303 bnx2x_set_next_page_rx_bd(fp);
4304
4305 /* CQ ring */
4306 bnx2x_set_next_page_rx_cq(fp);
4307
4308 /* BDs */
4309 ring_size = bnx2x_alloc_rx_bds(fp, rx_ring_size);
4310 if (ring_size < rx_ring_size)
4311 goto alloc_mem_err;
4312 }
4313
4314 return 0;
4315
4316 /* handles low memory cases */
4317 alloc_mem_err:
4318 BNX2X_ERR("Unable to allocate full memory for queue %d (size %d)\n",
4319 index, ring_size);
4320 /* FW will drop all packets if the queue is not big enough;
4321 * in these cases we disable the queue.
4322 * The minimum size is different for OOO, TPA and non-TPA queues.
4323 */
4324 if (ring_size < (fp->disable_tpa ?
4325 MIN_RX_SIZE_NONTPA : MIN_RX_SIZE_TPA)) {
4326 /* release memory allocated for this queue */
4327 bnx2x_free_fp_mem_at(bp, index);
4328 return -ENOMEM;
4329 }
4330 return 0;
4331 }
4332
4333 int bnx2x_alloc_fp_mem_cnic(struct bnx2x *bp)
4334 {
4335 if (!NO_FCOE(bp))
4336 /* FCoE */
4337 if (bnx2x_alloc_fp_mem_at(bp, FCOE_IDX(bp)))
4338 /* we will fail the load process instead of marking
4339 * NO_FCOE_FLAG
4340 */
4341 return -ENOMEM;
4342
4343 return 0;
4344 }
4345
4346 int bnx2x_alloc_fp_mem(struct bnx2x *bp)
4347 {
4348 int i;
4349
4350 /* 1. Allocate FP for leading - fatal if error
4351 * 2. Allocate RSS - fix number of queues if error
4352 */
4353
4354 /* leading */
4355 if (bnx2x_alloc_fp_mem_at(bp, 0))
4356 return -ENOMEM;
4357
4358 /* RSS */
4359 for_each_nondefault_eth_queue(bp, i)
4360 if (bnx2x_alloc_fp_mem_at(bp, i))
4361 break;
4362
4363 /* handle memory failures */
4364 if (i != BNX2X_NUM_ETH_QUEUES(bp)) {
4365 int delta = BNX2X_NUM_ETH_QUEUES(bp) - i;
4366
4367 WARN_ON(delta < 0);
4368 bnx2x_shrink_eth_fp(bp, delta);
4369 if (CNIC_SUPPORT(bp))
4370 /* move non-eth FPs next to the last eth FP;
4371 * must be done in that order:
4372 * FCOE_IDX < FWD_IDX < OOO_IDX
4373 */
4374
4375 /* move the FCoE fp even if NO_FCOE_FLAG is on */
4376 bnx2x_move_fp(bp, FCOE_IDX(bp), FCOE_IDX(bp) - delta);
4377 bp->num_ethernet_queues -= delta;
4378 bp->num_queues = bp->num_ethernet_queues +
4379 bp->num_cnic_queues;
4380 BNX2X_ERR("Adjusted num of queues from %d to %d\n",
4381 bp->num_queues + delta, bp->num_queues);
4382 }
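/* Example with illustrative numbers: if 8 ETH queues were configured and the
 * first allocation failure happened at i == 5, delta would be 3 - queues 5..7
 * are shrunk away, the FCoE fp (when CNIC is supported) slides down by 3
 * slots and num_queues is reduced accordingly.
 */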
4383
4384 return 0;
4385 }
4386
4387 void bnx2x_free_mem_bp(struct bnx2x *bp)
4388 {
4389 int i;
4390
4391 for (i = 0; i < bp->fp_array_size; i++)
4392 kfree(bp->fp[i].tpa_info);
4393 kfree(bp->fp);
4394 kfree(bp->sp_objs);
4395 kfree(bp->fp_stats);
4396 kfree(bp->bnx2x_txq);
4397 kfree(bp->msix_table);
4398 kfree(bp->ilt);
4399 }
4400
4401 int bnx2x_alloc_mem_bp(struct bnx2x *bp)
4402 {
4403 struct bnx2x_fastpath *fp;
4404 struct msix_entry *tbl;
4405 struct bnx2x_ilt *ilt;
4406 int msix_table_size = 0;
4407 int fp_array_size, txq_array_size;
4408 int i;
4409
4410 /*
4411 * The biggest MSI-X table we might need is the maximum number of fast
4412 * path IGU SBs plus the default SB (for PF only).
4413 */
4414 msix_table_size = bp->igu_sb_cnt;
4415 if (IS_PF(bp))
4416 msix_table_size++;
4417 BNX2X_DEV_INFO("msix_table_size %d\n", msix_table_size);
4418
4419 /* fp array: RSS plus CNIC related L2 queues */
4420 fp_array_size = BNX2X_MAX_RSS_COUNT(bp) + CNIC_SUPPORT(bp);
4421 bp->fp_array_size = fp_array_size;
4422 BNX2X_DEV_INFO("fp_array_size %d\n", bp->fp_array_size);
4423
4424 fp = kcalloc(bp->fp_array_size, sizeof(*fp), GFP_KERNEL);
4425 if (!fp)
4426 goto alloc_err;
4427 for (i = 0; i < bp->fp_array_size; i++) {
4428 fp[i].tpa_info =
4429 kcalloc(ETH_MAX_AGGREGATION_QUEUES_E1H_E2,
4430 sizeof(struct bnx2x_agg_info), GFP_KERNEL);
4431 if (!(fp[i].tpa_info))
4432 goto alloc_err;
4433 }
4434
4435 bp->fp = fp;
4436
4437 /* allocate sp objs */
4438 bp->sp_objs = kcalloc(bp->fp_array_size, sizeof(struct bnx2x_sp_objs),
4439 GFP_KERNEL);
4440 if (!bp->sp_objs)
4441 goto alloc_err;
4442
4443 /* allocate fp_stats */
4444 bp->fp_stats = kcalloc(bp->fp_array_size, sizeof(struct bnx2x_fp_stats),
4445 GFP_KERNEL);
4446 if (!bp->fp_stats)
4447 goto alloc_err;
4448
4449 /* Allocate memory for the transmission queues array */
4450 txq_array_size =
4451 BNX2X_MAX_RSS_COUNT(bp) * BNX2X_MULTI_TX_COS + CNIC_SUPPORT(bp);
4452 BNX2X_DEV_INFO("txq_array_size %d\n", txq_array_size);
4453
4454 bp->bnx2x_txq = kcalloc(txq_array_size, sizeof(struct bnx2x_fp_txdata),
4455 GFP_KERNEL);
4456 if (!bp->bnx2x_txq)
4457 goto alloc_err;
4458
4459 /* msix table */
4460 tbl = kcalloc(msix_table_size, sizeof(*tbl), GFP_KERNEL);
4461 if (!tbl)
4462 goto alloc_err;
4463 bp->msix_table = tbl;
4464
4465 /* ilt */
4466 ilt = kzalloc(sizeof(*ilt), GFP_KERNEL);
4467 if (!ilt)
4468 goto alloc_err;
4469 bp->ilt = ilt;
4470
4471 return 0;
4472 alloc_err:
4473 bnx2x_free_mem_bp(bp);
4474 return -ENOMEM;
4475
4476 }
4477
4478 int bnx2x_reload_if_running(struct net_device *dev)
4479 {
4480 struct bnx2x *bp = netdev_priv(dev);
4481
4482 if (unlikely(!netif_running(dev)))
4483 return 0;
4484
4485 bnx2x_nic_unload(bp, UNLOAD_NORMAL, true);
4486 return bnx2x_nic_load(bp, LOAD_NORMAL);
4487 }
4488
4489 int bnx2x_get_cur_phy_idx(struct bnx2x *bp)
4490 {
4491 u32 sel_phy_idx = 0;
4492 if (bp->link_params.num_phys <= 1)
4493 return INT_PHY;
4494
4495 if (bp->link_vars.link_up) {
4496 sel_phy_idx = EXT_PHY1;
4497 /* In case link is SERDES, check if the EXT_PHY2 is the one */
4498 if ((bp->link_vars.link_status & LINK_STATUS_SERDES_LINK) &&
4499 (bp->link_params.phy[EXT_PHY2].supported & SUPPORTED_FIBRE))
4500 sel_phy_idx = EXT_PHY2;
4501 } else {
4502
4503 switch (bnx2x_phy_selection(&bp->link_params)) {
4504 case PORT_HW_CFG_PHY_SELECTION_HARDWARE_DEFAULT:
4505 case PORT_HW_CFG_PHY_SELECTION_FIRST_PHY:
4506 case PORT_HW_CFG_PHY_SELECTION_FIRST_PHY_PRIORITY:
4507 sel_phy_idx = EXT_PHY1;
4508 break;
4509 case PORT_HW_CFG_PHY_SELECTION_SECOND_PHY:
4510 case PORT_HW_CFG_PHY_SELECTION_SECOND_PHY_PRIORITY:
4511 sel_phy_idx = EXT_PHY2;
4512 break;
4513 }
4514 }
4515
4516 return sel_phy_idx;
4517
4518 }
4519 int bnx2x_get_link_cfg_idx(struct bnx2x *bp)
4520 {
4521 u32 sel_phy_idx = bnx2x_get_cur_phy_idx(bp);
4522 /*
4523 * The selected active PHY is always the one after swapping (in case PHY
4524 * swapping is enabled), so when swapping is enabled we need to reverse
4525 * the configuration.
4526 */
4527
4528 if (bp->link_params.multi_phy_config &
4529 PORT_HW_CFG_PHY_SWAPPED_ENABLED) {
4530 if (sel_phy_idx == EXT_PHY1)
4531 sel_phy_idx = EXT_PHY2;
4532 else if (sel_phy_idx == EXT_PHY2)
4533 sel_phy_idx = EXT_PHY1;
4534 }
4535 return LINK_CONFIG_IDX(sel_phy_idx);
4536 }
4537
4538 #ifdef NETDEV_FCOE_WWNN
4539 int bnx2x_fcoe_get_wwn(struct net_device *dev, u64 *wwn, int type)
4540 {
4541 struct bnx2x *bp = netdev_priv(dev);
4542 struct cnic_eth_dev *cp = &bp->cnic_eth_dev;
4543
4544 switch (type) {
4545 case NETDEV_FCOE_WWNN:
4546 *wwn = HILO_U64(cp->fcoe_wwn_node_name_hi,
4547 cp->fcoe_wwn_node_name_lo);
4548 break;
4549 case NETDEV_FCOE_WWPN:
4550 *wwn = HILO_U64(cp->fcoe_wwn_port_name_hi,
4551 cp->fcoe_wwn_port_name_lo);
4552 break;
4553 default:
4554 BNX2X_ERR("Wrong WWN type requested - %d\n", type);
4555 return -EINVAL;
4556 }
4557
4558 return 0;
4559 }
4560 #endif
4561
4562 /* called with rtnl_lock */
4563 int bnx2x_change_mtu(struct net_device *dev, int new_mtu)
4564 {
4565 struct bnx2x *bp = netdev_priv(dev);
4566
4567 if (bp->recovery_state != BNX2X_RECOVERY_DONE) {
4568 BNX2X_ERR("Can't perform change MTU during parity recovery\n");
4569 return -EAGAIN;
4570 }
4571
4572 if ((new_mtu > ETH_MAX_JUMBO_PACKET_SIZE) ||
4573 ((new_mtu + ETH_HLEN) < ETH_MIN_PACKET_SIZE)) {
4574 BNX2X_ERR("Can't support requested MTU size\n");
4575 return -EINVAL;
4576 }
4577
4578 /* This does not race with packet allocation
4579 * because the actual alloc size is
4580 * only updated as part of load
4581 */
4582 dev->mtu = new_mtu;
4583
4584 return bnx2x_reload_if_running(dev);
4585 }
4586
4587 netdev_features_t bnx2x_fix_features(struct net_device *dev,
4588 netdev_features_t features)
4589 {
4590 struct bnx2x *bp = netdev_priv(dev);
4591
4592 /* TPA requires Rx CSUM offloading */
4593 if (!(features & NETIF_F_RXCSUM) || bp->disable_tpa) {
4594 features &= ~NETIF_F_LRO;
4595 features &= ~NETIF_F_GRO;
4596 }
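/* e.g. turning Rx checksum offload off ("ethtool -K <dev> rx off") lands
 * here and implicitly clears LRO and GRO as well, since TPA cannot work
 * without Rx CSUM.
 */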
4597
4598 return features;
4599 }
4600
4601 int bnx2x_set_features(struct net_device *dev, netdev_features_t features)
4602 {
4603 struct bnx2x *bp = netdev_priv(dev);
4604 u32 flags = bp->flags;
4605 bool bnx2x_reload = false;
4606
4607 if (features & NETIF_F_LRO)
4608 flags |= TPA_ENABLE_FLAG;
4609 else
4610 flags &= ~TPA_ENABLE_FLAG;
4611
4612 if (features & NETIF_F_GRO)
4613 flags |= GRO_ENABLE_FLAG;
4614 else
4615 flags &= ~GRO_ENABLE_FLAG;
4616
4617 if (features & NETIF_F_LOOPBACK) {
4618 if (bp->link_params.loopback_mode != LOOPBACK_BMAC) {
4619 bp->link_params.loopback_mode = LOOPBACK_BMAC;
4620 bnx2x_reload = true;
4621 }
4622 } else {
4623 if (bp->link_params.loopback_mode != LOOPBACK_NONE) {
4624 bp->link_params.loopback_mode = LOOPBACK_NONE;
4625 bnx2x_reload = true;
4626 }
4627 }
4628
4629 if (flags ^ bp->flags) {
4630 bp->flags = flags;
4631 bnx2x_reload = true;
4632 }
4633
4634 if (bnx2x_reload) {
4635 if (bp->recovery_state == BNX2X_RECOVERY_DONE)
4636 return bnx2x_reload_if_running(dev);
4637 /* else: bnx2x_nic_load() will be called at end of recovery */
4638 }
4639
4640 return 0;
4641 }
4642
4643 void bnx2x_tx_timeout(struct net_device *dev)
4644 {
4645 struct bnx2x *bp = netdev_priv(dev);
4646
4647 #ifdef BNX2X_STOP_ON_ERROR
4648 if (!bp->panic)
4649 bnx2x_panic();
4650 #endif
4651
4652 smp_mb__before_clear_bit();
4653 set_bit(BNX2X_SP_RTNL_TX_TIMEOUT, &bp->sp_rtnl_state);
4654 smp_mb__after_clear_bit();
4655
4656 /* This allows the netif to be shut down gracefully before resetting */
4657 schedule_delayed_work(&bp->sp_rtnl_task, 0);
4658 }
4659
4660 int bnx2x_suspend(struct pci_dev *pdev, pm_message_t state)
4661 {
4662 struct net_device *dev = pci_get_drvdata(pdev);
4663 struct bnx2x *bp;
4664
4665 if (!dev) {
4666 dev_err(&pdev->dev, "BAD net device from bnx2x_init_one\n");
4667 return -ENODEV;
4668 }
4669 bp = netdev_priv(dev);
4670
4671 rtnl_lock();
4672
4673 pci_save_state(pdev);
4674
4675 if (!netif_running(dev)) {
4676 rtnl_unlock();
4677 return 0;
4678 }
4679
4680 netif_device_detach(dev);
4681
4682 bnx2x_nic_unload(bp, UNLOAD_CLOSE, false);
4683
4684 bnx2x_set_power_state(bp, pci_choose_state(pdev, state));
4685
4686 rtnl_unlock();
4687
4688 return 0;
4689 }
4690
4691 int bnx2x_resume(struct pci_dev *pdev)
4692 {
4693 struct net_device *dev = pci_get_drvdata(pdev);
4694 struct bnx2x *bp;
4695 int rc;
4696
4697 if (!dev) {
4698 dev_err(&pdev->dev, "BAD net device from bnx2x_init_one\n");
4699 return -ENODEV;
4700 }
4701 bp = netdev_priv(dev);
4702
4703 if (bp->recovery_state != BNX2X_RECOVERY_DONE) {
4704 BNX2X_ERR("Handling parity error recovery. Try again later\n");
4705 return -EAGAIN;
4706 }
4707
4708 rtnl_lock();
4709
4710 pci_restore_state(pdev);
4711
4712 if (!netif_running(dev)) {
4713 rtnl_unlock();
4714 return 0;
4715 }
4716
4717 bnx2x_set_power_state(bp, PCI_D0);
4718 netif_device_attach(dev);
4719
4720 rc = bnx2x_nic_load(bp, LOAD_OPEN);
4721
4722 rtnl_unlock();
4723
4724 return rc;
4725 }
4726
4727
4728 void bnx2x_set_ctx_validation(struct bnx2x *bp, struct eth_context *cxt,
4729 u32 cid)
4730 {
4731 /* ustorm cxt validation */
4732 cxt->ustorm_ag_context.cdu_usage =
4733 CDU_RSRVD_VALUE_TYPE_A(HW_CID(bp, cid),
4734 CDU_REGION_NUMBER_UCM_AG, ETH_CONNECTION_TYPE);
4735 /* xcontext validation */
4736 cxt->xstorm_ag_context.cdu_reserved =
4737 CDU_RSRVD_VALUE_TYPE_A(HW_CID(bp, cid),
4738 CDU_REGION_NUMBER_XCM_AG, ETH_CONNECTION_TYPE);
4739 }
4740
4741 static void storm_memset_hc_timeout(struct bnx2x *bp, u8 port,
4742 u8 fw_sb_id, u8 sb_index,
4743 u8 ticks)
4744 {
4745
4746 u32 addr = BAR_CSTRORM_INTMEM +
4747 CSTORM_STATUS_BLOCK_DATA_TIMEOUT_OFFSET(fw_sb_id, sb_index);
4748 REG_WR8(bp, addr, ticks);
4749 DP(NETIF_MSG_IFUP,
4750 "port %x fw_sb_id %d sb_index %d ticks %d\n",
4751 port, fw_sb_id, sb_index, ticks);
4752 }
4753
4754 static void storm_memset_hc_disable(struct bnx2x *bp, u8 port,
4755 u16 fw_sb_id, u8 sb_index,
4756 u8 disable)
4757 {
4758 u32 enable_flag = disable ? 0 : (1 << HC_INDEX_DATA_HC_ENABLED_SHIFT);
4759 u32 addr = BAR_CSTRORM_INTMEM +
4760 CSTORM_STATUS_BLOCK_DATA_FLAGS_OFFSET(fw_sb_id, sb_index);
4761 u8 flags = REG_RD8(bp, addr);
4762 /* clear and set */
4763 flags &= ~HC_INDEX_DATA_HC_ENABLED;
4764 flags |= enable_flag;
4765 REG_WR8(bp, addr, flags);
4766 DP(NETIF_MSG_IFUP,
4767 "port %x fw_sb_id %d sb_index %d disable %d\n",
4768 port, fw_sb_id, sb_index, disable);
4769 }
4770
4771 void bnx2x_update_coalesce_sb_index(struct bnx2x *bp, u8 fw_sb_id,
4772 u8 sb_index, u8 disable, u16 usec)
4773 {
4774 int port = BP_PORT(bp);
4775 u8 ticks = usec / BNX2X_BTR;
4776
4777 storm_memset_hc_timeout(bp, port, fw_sb_id, sb_index, ticks);
4778
4779 disable = disable ? 1 : (usec ? 0 : 1);
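/* e.g. usec == 3 * BNX2X_BTR programs 3 ticks above, while usec == 0 forces
 * the index to be disabled even when the caller passed disable == 0.
 */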
4780 storm_memset_hc_disable(bp, port, fw_sb_id, sb_index, disable);
4781 }
4782