be2net: receive asynchronous link status notifications from BE
[safe/jmp/linux-2.6] / drivers / net / benet / be_main.c
1 /*
2  * Copyright (C) 2005 - 2009 ServerEngines
3  * All rights reserved.
4  *
5  * This program is free software; you can redistribute it and/or
6  * modify it under the terms of the GNU General Public License version 2
7  * as published by the Free Software Foundation.  The full GNU General
8  * Public License is included in this distribution in the file called COPYING.
9  *
10  * Contact Information:
11  * linux-drivers@serverengines.com
12  *
13  * ServerEngines
14  * 209 N. Fair Oaks Ave
15  * Sunnyvale, CA 94085
16  */
17
18 #include "be.h"
19 #include <asm/div64.h>
20
21 MODULE_VERSION(DRV_VER);
22 MODULE_DEVICE_TABLE(pci, be_dev_ids);
23 MODULE_DESCRIPTION(DRV_DESC " " DRV_VER);
24 MODULE_AUTHOR("ServerEngines Corporation");
25 MODULE_LICENSE("GPL");
26
27 static unsigned int rx_frag_size = 2048;
28 module_param(rx_frag_size, uint, S_IRUGO);
29 MODULE_PARM_DESC(rx_frag_size, "Size of a fragment that holds rcvd data.");
30
31 static DEFINE_PCI_DEVICE_TABLE(be_dev_ids) = {
32         { PCI_DEVICE(BE_VENDOR_ID, BE_DEVICE_ID1) },
33         { PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID1) },
34         { PCI_DEVICE(BE_VENDOR_ID, OC_DEVICE_ID2) },
35         { 0 }
36 };
37 MODULE_DEVICE_TABLE(pci, be_dev_ids);
38
39 static void be_queue_free(struct be_adapter *adapter, struct be_queue_info *q)
40 {
41         struct be_dma_mem *mem = &q->dma_mem;
42         if (mem->va)
43                 pci_free_consistent(adapter->pdev, mem->size,
44                         mem->va, mem->dma);
45 }
46
47 static int be_queue_alloc(struct be_adapter *adapter, struct be_queue_info *q,
48                 u16 len, u16 entry_size)
49 {
50         struct be_dma_mem *mem = &q->dma_mem;
51
52         memset(q, 0, sizeof(*q));
53         q->len = len;
54         q->entry_size = entry_size;
55         mem->size = len * entry_size;
56         mem->va = pci_alloc_consistent(adapter->pdev, mem->size, &mem->dma);
57         if (!mem->va)
58                 return -1;
59         memset(mem->va, 0, mem->size);
60         return 0;
61 }
62
63 static void be_intr_set(struct be_ctrl_info *ctrl, bool enable)
64 {
65         u8 __iomem *addr = ctrl->pcicfg + PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET;
66         u32 reg = ioread32(addr);
67         u32 enabled = reg & MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
68         if (!enabled && enable) {
69                 reg |= MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
70         } else if (enabled && !enable) {
71                 reg &= ~MEMBAR_CTRL_INT_CTRL_HOSTINTR_MASK;
72         } else {
73                 printk(KERN_WARNING DRV_NAME
74                         ": bad value in membar_int_ctrl reg=0x%x\n", reg);
75                 return;
76         }
77         iowrite32(reg, addr);
78 }
79
80 static void be_rxq_notify(struct be_ctrl_info *ctrl, u16 qid, u16 posted)
81 {
82         u32 val = 0;
83         val |= qid & DB_RQ_RING_ID_MASK;
84         val |= posted << DB_RQ_NUM_POSTED_SHIFT;
85         iowrite32(val, ctrl->db + DB_RQ_OFFSET);
86 }
87
88 static void be_txq_notify(struct be_ctrl_info *ctrl, u16 qid, u16 posted)
89 {
90         u32 val = 0;
91         val |= qid & DB_TXULP_RING_ID_MASK;
92         val |= (posted & DB_TXULP_NUM_POSTED_MASK) << DB_TXULP_NUM_POSTED_SHIFT;
93         iowrite32(val, ctrl->db + DB_TXULP1_OFFSET);
94 }
95
96 static void be_eq_notify(struct be_ctrl_info *ctrl, u16 qid,
97                 bool arm, bool clear_int, u16 num_popped)
98 {
99         u32 val = 0;
100         val |= qid & DB_EQ_RING_ID_MASK;
101         if (arm)
102                 val |= 1 << DB_EQ_REARM_SHIFT;
103         if (clear_int)
104                 val |= 1 << DB_EQ_CLR_SHIFT;
105         val |= 1 << DB_EQ_EVNT_SHIFT;
106         val |= num_popped << DB_EQ_NUM_POPPED_SHIFT;
107         iowrite32(val, ctrl->db + DB_EQ_OFFSET);
108 }
109
110 void be_cq_notify(struct be_ctrl_info *ctrl, u16 qid,
111                 bool arm, u16 num_popped)
112 {
113         u32 val = 0;
114         val |= qid & DB_CQ_RING_ID_MASK;
115         if (arm)
116                 val |= 1 << DB_CQ_REARM_SHIFT;
117         val |= num_popped << DB_CQ_NUM_POPPED_SHIFT;
118         iowrite32(val, ctrl->db + DB_CQ_OFFSET);
119 }
120
121
122 static int be_mac_addr_set(struct net_device *netdev, void *p)
123 {
124         struct be_adapter *adapter = netdev_priv(netdev);
125         struct sockaddr *addr = p;
126         int status = 0;
127
128         if (netif_running(netdev)) {
129                 status = be_cmd_pmac_del(&adapter->ctrl, adapter->if_handle,
130                                 adapter->pmac_id);
131                 if (status)
132                         return status;
133
134                 status = be_cmd_pmac_add(&adapter->ctrl, (u8 *)addr->sa_data,
135                                 adapter->if_handle, &adapter->pmac_id);
136         }
137
138         if (!status)
139                 memcpy(netdev->dev_addr, addr->sa_data, netdev->addr_len);
140
141         return status;
142 }
143
144 static void netdev_stats_update(struct be_adapter *adapter)
145 {
146         struct be_hw_stats *hw_stats = hw_stats_from_cmd(adapter->stats.cmd.va);
147         struct be_rxf_stats *rxf_stats = &hw_stats->rxf;
148         struct be_port_rxf_stats *port_stats =
149                         &rxf_stats->port[adapter->port_num];
150         struct net_device_stats *dev_stats = &adapter->stats.net_stats;
151         struct be_erx_stats *erx_stats = &hw_stats->erx;
152
153         dev_stats->rx_packets = port_stats->rx_total_frames;
154         dev_stats->tx_packets = port_stats->tx_unicastframes +
155                 port_stats->tx_multicastframes + port_stats->tx_broadcastframes;
156         dev_stats->rx_bytes = (u64) port_stats->rx_bytes_msd << 32 |
157                                 (u64) port_stats->rx_bytes_lsd;
158         dev_stats->tx_bytes = (u64) port_stats->tx_bytes_msd << 32 |
159                                 (u64) port_stats->tx_bytes_lsd;
160
161         /* bad pkts received */
162         dev_stats->rx_errors = port_stats->rx_crc_errors +
163                 port_stats->rx_alignment_symbol_errors +
164                 port_stats->rx_in_range_errors +
165                 port_stats->rx_out_range_errors +
166                 port_stats->rx_frame_too_long +
167                 port_stats->rx_dropped_too_small +
168                 port_stats->rx_dropped_too_short +
169                 port_stats->rx_dropped_header_too_small +
170                 port_stats->rx_dropped_tcp_length +
171                 port_stats->rx_dropped_runt +
172                 port_stats->rx_tcp_checksum_errs +
173                 port_stats->rx_ip_checksum_errs +
174                 port_stats->rx_udp_checksum_errs;
175
176         /*  no space in linux buffers: best possible approximation */
177         dev_stats->rx_dropped = erx_stats->rx_drops_no_fragments[0];
178
179         /* detailed rx errors */
180         dev_stats->rx_length_errors = port_stats->rx_in_range_errors +
181                 port_stats->rx_out_range_errors +
182                 port_stats->rx_frame_too_long;
183
184         /* receive ring buffer overflow */
185         dev_stats->rx_over_errors = 0;
186
187         dev_stats->rx_crc_errors = port_stats->rx_crc_errors;
188
189         /* frame alignment errors */
190         dev_stats->rx_frame_errors = port_stats->rx_alignment_symbol_errors;
191
192         /* receiver fifo overrun */
193         /* drops_no_pbuf is no per i/f, it's per BE card */
194         dev_stats->rx_fifo_errors = port_stats->rx_fifo_overflow +
195                                         port_stats->rx_input_fifo_overflow +
196                                         rxf_stats->rx_drops_no_pbuf;
197         /* receiver missed packetd */
198         dev_stats->rx_missed_errors = 0;
199
200         /*  packet transmit problems */
201         dev_stats->tx_errors = 0;
202
203         /* no space available in linux */
204         dev_stats->tx_dropped = 0;
205
206         dev_stats->multicast = port_stats->tx_multicastframes;
207         dev_stats->collisions = 0;
208
209         /* detailed tx_errors */
210         dev_stats->tx_aborted_errors = 0;
211         dev_stats->tx_carrier_errors = 0;
212         dev_stats->tx_fifo_errors = 0;
213         dev_stats->tx_heartbeat_errors = 0;
214         dev_stats->tx_window_errors = 0;
215 }
216
217 void be_link_status_update(void *ctxt, bool link_up)
218 {
219         struct be_adapter *adapter = ctxt;
220         struct net_device *netdev = adapter->netdev;
221
222         /* If link came up or went down */
223         if (adapter->link_up != link_up) {
224                 if (link_up) {
225                         netif_start_queue(netdev);
226                         netif_carrier_on(netdev);
227                         printk(KERN_INFO "%s: Link up\n", netdev->name);
228                 } else {
229                         netif_stop_queue(netdev);
230                         netif_carrier_off(netdev);
231                         printk(KERN_INFO "%s: Link down\n", netdev->name);
232                 }
233                 adapter->link_up = link_up;
234         }
235 }
236
237 /* Update the EQ delay n BE based on the RX frags consumed / sec */
238 static void be_rx_eqd_update(struct be_adapter *adapter)
239 {
240         struct be_ctrl_info *ctrl = &adapter->ctrl;
241         struct be_eq_obj *rx_eq = &adapter->rx_eq;
242         struct be_drvr_stats *stats = &adapter->stats.drvr_stats;
243         ulong now = jiffies;
244         u32 eqd;
245
246         if (!rx_eq->enable_aic)
247                 return;
248
249         /* Wrapped around */
250         if (time_before(now, stats->rx_fps_jiffies)) {
251                 stats->rx_fps_jiffies = now;
252                 return;
253         }
254
255         /* Update once a second */
256         if ((now - stats->rx_fps_jiffies) < HZ)
257                 return;
258
259         stats->be_rx_fps = (stats->be_rx_frags - stats->be_prev_rx_frags) /
260                         ((now - stats->rx_fps_jiffies) / HZ);
261
262         stats->rx_fps_jiffies = now;
263         stats->be_prev_rx_frags = stats->be_rx_frags;
264         eqd = stats->be_rx_fps / 110000;
265         eqd = eqd << 3;
266         if (eqd > rx_eq->max_eqd)
267                 eqd = rx_eq->max_eqd;
268         if (eqd < rx_eq->min_eqd)
269                 eqd = rx_eq->min_eqd;
270         if (eqd < 10)
271                 eqd = 0;
272         if (eqd != rx_eq->cur_eqd)
273                 be_cmd_modify_eqd(ctrl, rx_eq->q.id, eqd);
274
275         rx_eq->cur_eqd = eqd;
276 }
277
278 static struct net_device_stats *be_get_stats(struct net_device *dev)
279 {
280         struct be_adapter *adapter = netdev_priv(dev);
281
282         return &adapter->stats.net_stats;
283 }
284
285 static u32 be_calc_rate(u64 bytes, unsigned long ticks)
286 {
287         u64 rate = bytes;
288
289         do_div(rate, ticks / HZ);
290         rate <<= 3;                     /* bytes/sec -> bits/sec */
291         do_div(rate, 1000000ul);        /* MB/Sec */
292
293         return rate;
294 }
295
296 static void be_tx_rate_update(struct be_adapter *adapter)
297 {
298         struct be_drvr_stats *stats = drvr_stats(adapter);
299         ulong now = jiffies;
300
301         /* Wrapped around? */
302         if (time_before(now, stats->be_tx_jiffies)) {
303                 stats->be_tx_jiffies = now;
304                 return;
305         }
306
307         /* Update tx rate once in two seconds */
308         if ((now - stats->be_tx_jiffies) > 2 * HZ) {
309                 stats->be_tx_rate = be_calc_rate(stats->be_tx_bytes
310                                                   - stats->be_tx_bytes_prev,
311                                                  now - stats->be_tx_jiffies);
312                 stats->be_tx_jiffies = now;
313                 stats->be_tx_bytes_prev = stats->be_tx_bytes;
314         }
315 }
316
317 static void be_tx_stats_update(struct be_adapter *adapter,
318                         u32 wrb_cnt, u32 copied, bool stopped)
319 {
320         struct be_drvr_stats *stats = drvr_stats(adapter);
321         stats->be_tx_reqs++;
322         stats->be_tx_wrbs += wrb_cnt;
323         stats->be_tx_bytes += copied;
324         if (stopped)
325                 stats->be_tx_stops++;
326 }
327
328 /* Determine number of WRB entries needed to xmit data in an skb */
329 static u32 wrb_cnt_for_skb(struct sk_buff *skb, bool *dummy)
330 {
331         int cnt = (skb->len > skb->data_len);
332
333         cnt += skb_shinfo(skb)->nr_frags;
334
335         /* to account for hdr wrb */
336         cnt++;
337         if (cnt & 1) {
338                 /* add a dummy to make it an even num */
339                 cnt++;
340                 *dummy = true;
341         } else
342                 *dummy = false;
343         BUG_ON(cnt > BE_MAX_TX_FRAG_COUNT);
344         return cnt;
345 }
346
347 static inline void wrb_fill(struct be_eth_wrb *wrb, u64 addr, int len)
348 {
349         wrb->frag_pa_hi = upper_32_bits(addr);
350         wrb->frag_pa_lo = addr & 0xFFFFFFFF;
351         wrb->frag_len = len & ETH_WRB_FRAG_LEN_MASK;
352 }
353
354 static void wrb_fill_hdr(struct be_eth_hdr_wrb *hdr, struct sk_buff *skb,
355                 bool vlan, u32 wrb_cnt, u32 len)
356 {
357         memset(hdr, 0, sizeof(*hdr));
358
359         AMAP_SET_BITS(struct amap_eth_hdr_wrb, crc, hdr, 1);
360
361         if (skb_shinfo(skb)->gso_segs > 1 && skb_shinfo(skb)->gso_size) {
362                 AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso, hdr, 1);
363                 AMAP_SET_BITS(struct amap_eth_hdr_wrb, lso_mss,
364                         hdr, skb_shinfo(skb)->gso_size);
365         } else if (skb->ip_summed == CHECKSUM_PARTIAL) {
366                 if (is_tcp_pkt(skb))
367                         AMAP_SET_BITS(struct amap_eth_hdr_wrb, tcpcs, hdr, 1);
368                 else if (is_udp_pkt(skb))
369                         AMAP_SET_BITS(struct amap_eth_hdr_wrb, udpcs, hdr, 1);
370         }
371
372         if (vlan && vlan_tx_tag_present(skb)) {
373                 AMAP_SET_BITS(struct amap_eth_hdr_wrb, vlan, hdr, 1);
374                 AMAP_SET_BITS(struct amap_eth_hdr_wrb, vlan_tag,
375                         hdr, vlan_tx_tag_get(skb));
376         }
377
378         AMAP_SET_BITS(struct amap_eth_hdr_wrb, event, hdr, 1);
379         AMAP_SET_BITS(struct amap_eth_hdr_wrb, complete, hdr, 1);
380         AMAP_SET_BITS(struct amap_eth_hdr_wrb, num_wrb, hdr, wrb_cnt);
381         AMAP_SET_BITS(struct amap_eth_hdr_wrb, len, hdr, len);
382 }
383
384
385 static int make_tx_wrbs(struct be_adapter *adapter,
386                 struct sk_buff *skb, u32 wrb_cnt, bool dummy_wrb)
387 {
388         u64 busaddr;
389         u32 i, copied = 0;
390         struct pci_dev *pdev = adapter->pdev;
391         struct sk_buff *first_skb = skb;
392         struct be_queue_info *txq = &adapter->tx_obj.q;
393         struct be_eth_wrb *wrb;
394         struct be_eth_hdr_wrb *hdr;
395
396         atomic_add(wrb_cnt, &txq->used);
397         hdr = queue_head_node(txq);
398         queue_head_inc(txq);
399
400         if (skb->len > skb->data_len) {
401                 int len = skb->len - skb->data_len;
402                 busaddr = pci_map_single(pdev, skb->data, len,
403                                          PCI_DMA_TODEVICE);
404                 wrb = queue_head_node(txq);
405                 wrb_fill(wrb, busaddr, len);
406                 be_dws_cpu_to_le(wrb, sizeof(*wrb));
407                 queue_head_inc(txq);
408                 copied += len;
409         }
410
411         for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
412                 struct skb_frag_struct *frag =
413                         &skb_shinfo(skb)->frags[i];
414                 busaddr = pci_map_page(pdev, frag->page,
415                                        frag->page_offset,
416                                        frag->size, PCI_DMA_TODEVICE);
417                 wrb = queue_head_node(txq);
418                 wrb_fill(wrb, busaddr, frag->size);
419                 be_dws_cpu_to_le(wrb, sizeof(*wrb));
420                 queue_head_inc(txq);
421                 copied += frag->size;
422         }
423
424         if (dummy_wrb) {
425                 wrb = queue_head_node(txq);
426                 wrb_fill(wrb, 0, 0);
427                 be_dws_cpu_to_le(wrb, sizeof(*wrb));
428                 queue_head_inc(txq);
429         }
430
431         wrb_fill_hdr(hdr, first_skb, adapter->vlan_grp ? true : false,
432                 wrb_cnt, copied);
433         be_dws_cpu_to_le(hdr, sizeof(*hdr));
434
435         return copied;
436 }
437
438 static int be_xmit(struct sk_buff *skb, struct net_device *netdev)
439 {
440         struct be_adapter *adapter = netdev_priv(netdev);
441         struct be_tx_obj *tx_obj = &adapter->tx_obj;
442         struct be_queue_info *txq = &tx_obj->q;
443         u32 wrb_cnt = 0, copied = 0;
444         u32 start = txq->head;
445         bool dummy_wrb, stopped = false;
446
447         wrb_cnt = wrb_cnt_for_skb(skb, &dummy_wrb);
448
449         copied = make_tx_wrbs(adapter, skb, wrb_cnt, dummy_wrb);
450
451         /* record the sent skb in the sent_skb table */
452         BUG_ON(tx_obj->sent_skb_list[start]);
453         tx_obj->sent_skb_list[start] = skb;
454
455         /* Ensure that txq has space for the next skb; Else stop the queue
456          * *BEFORE* ringing the tx doorbell, so that we serialze the
457          * tx compls of the current transmit which'll wake up the queue
458          */
459         if ((BE_MAX_TX_FRAG_COUNT + atomic_read(&txq->used)) >= txq->len) {
460                 netif_stop_queue(netdev);
461                 stopped = true;
462         }
463
464         be_txq_notify(&adapter->ctrl, txq->id, wrb_cnt);
465
466         be_tx_stats_update(adapter, wrb_cnt, copied, stopped);
467         return NETDEV_TX_OK;
468 }
469
470 static int be_change_mtu(struct net_device *netdev, int new_mtu)
471 {
472         struct be_adapter *adapter = netdev_priv(netdev);
473         if (new_mtu < BE_MIN_MTU ||
474                         new_mtu > BE_MAX_JUMBO_FRAME_SIZE) {
475                 dev_info(&adapter->pdev->dev,
476                         "MTU must be between %d and %d bytes\n",
477                         BE_MIN_MTU, BE_MAX_JUMBO_FRAME_SIZE);
478                 return -EINVAL;
479         }
480         dev_info(&adapter->pdev->dev, "MTU changed from %d to %d bytes\n",
481                         netdev->mtu, new_mtu);
482         netdev->mtu = new_mtu;
483         return 0;
484 }
485
486 /*
487  * if there are BE_NUM_VLANS_SUPPORTED or lesser number of VLANS configured,
488  * program them in BE.  If more than BE_NUM_VLANS_SUPPORTED are configured,
489  * set the BE in promiscuous VLAN mode.
490  */
491 static void be_vid_config(struct net_device *netdev)
492 {
493         struct be_adapter *adapter = netdev_priv(netdev);
494         u16 vtag[BE_NUM_VLANS_SUPPORTED];
495         u16 ntags = 0, i;
496
497         if (adapter->num_vlans <= BE_NUM_VLANS_SUPPORTED)  {
498                 /* Construct VLAN Table to give to HW */
499                 for (i = 0; i < VLAN_GROUP_ARRAY_LEN; i++) {
500                         if (adapter->vlan_tag[i]) {
501                                 vtag[ntags] = cpu_to_le16(i);
502                                 ntags++;
503                         }
504                 }
505                 be_cmd_vlan_config(&adapter->ctrl, adapter->if_handle,
506                         vtag, ntags, 1, 0);
507         } else {
508                 be_cmd_vlan_config(&adapter->ctrl, adapter->if_handle,
509                         NULL, 0, 1, 1);
510         }
511 }
512
513 static void be_vlan_register(struct net_device *netdev, struct vlan_group *grp)
514 {
515         struct be_adapter *adapter = netdev_priv(netdev);
516         struct be_eq_obj *rx_eq = &adapter->rx_eq;
517         struct be_eq_obj *tx_eq = &adapter->tx_eq;
518         struct be_ctrl_info *ctrl = &adapter->ctrl;
519
520         be_eq_notify(ctrl, rx_eq->q.id, false, false, 0);
521         be_eq_notify(ctrl, tx_eq->q.id, false, false, 0);
522         adapter->vlan_grp = grp;
523         be_eq_notify(ctrl, rx_eq->q.id, true, false, 0);
524         be_eq_notify(ctrl, tx_eq->q.id, true, false, 0);
525 }
526
527 static void be_vlan_add_vid(struct net_device *netdev, u16 vid)
528 {
529         struct be_adapter *adapter = netdev_priv(netdev);
530
531         adapter->num_vlans++;
532         adapter->vlan_tag[vid] = 1;
533
534         be_vid_config(netdev);
535 }
536
537 static void be_vlan_rem_vid(struct net_device *netdev, u16 vid)
538 {
539         struct be_adapter *adapter = netdev_priv(netdev);
540
541         adapter->num_vlans--;
542         adapter->vlan_tag[vid] = 0;
543
544         vlan_group_set_device(adapter->vlan_grp, vid, NULL);
545         be_vid_config(netdev);
546 }
547
548 static void be_set_multicast_list(struct net_device *netdev)
549 {
550         struct be_adapter *adapter = netdev_priv(netdev);
551         struct be_ctrl_info *ctrl = &adapter->ctrl;
552
553         if (netdev->flags & IFF_PROMISC) {
554                 be_cmd_promiscuous_config(ctrl, adapter->port_num, 1);
555                 adapter->promiscuous = true;
556                 goto done;
557         }
558
559         /* BE was previously in promiscous mode; disable it */
560         if (adapter->promiscuous) {
561                 adapter->promiscuous = false;
562                 be_cmd_promiscuous_config(ctrl, adapter->port_num, 0);
563         }
564
565         if (netdev->flags & IFF_ALLMULTI) {
566                 be_cmd_multicast_set(ctrl, adapter->if_handle, NULL, 0);
567                 goto done;
568         }
569
570         be_cmd_multicast_set(ctrl, adapter->if_handle, netdev->mc_list,
571                 netdev->mc_count);
572 done:
573         return;
574 }
575
576 static void be_rx_rate_update(struct be_adapter *adapter)
577 {
578         struct be_drvr_stats *stats = drvr_stats(adapter);
579         ulong now = jiffies;
580
581         /* Wrapped around */
582         if (time_before(now, stats->be_rx_jiffies)) {
583                 stats->be_rx_jiffies = now;
584                 return;
585         }
586
587         /* Update the rate once in two seconds */
588         if ((now - stats->be_rx_jiffies) < 2 * HZ)
589                 return;
590
591         stats->be_rx_rate = be_calc_rate(stats->be_rx_bytes
592                                           - stats->be_rx_bytes_prev,
593                                          now - stats->be_rx_jiffies);
594         stats->be_rx_jiffies = now;
595         stats->be_rx_bytes_prev = stats->be_rx_bytes;
596 }
597
598 static void be_rx_stats_update(struct be_adapter *adapter,
599                 u32 pktsize, u16 numfrags)
600 {
601         struct be_drvr_stats *stats = drvr_stats(adapter);
602
603         stats->be_rx_compl++;
604         stats->be_rx_frags += numfrags;
605         stats->be_rx_bytes += pktsize;
606 }
607
608 static inline bool do_pkt_csum(struct be_eth_rx_compl *rxcp, bool cso)
609 {
610         u8 l4_cksm, ip_version, ipcksm, tcpf = 0, udpf = 0, ipv6_chk;
611
612         l4_cksm = AMAP_GET_BITS(struct amap_eth_rx_compl, l4_cksm, rxcp);
613         ipcksm = AMAP_GET_BITS(struct amap_eth_rx_compl, ipcksm, rxcp);
614         ip_version = AMAP_GET_BITS(struct amap_eth_rx_compl, ip_version, rxcp);
615         if (ip_version) {
616                 tcpf = AMAP_GET_BITS(struct amap_eth_rx_compl, tcpf, rxcp);
617                 udpf = AMAP_GET_BITS(struct amap_eth_rx_compl, udpf, rxcp);
618         }
619         ipv6_chk = (ip_version && (tcpf || udpf));
620
621         return ((l4_cksm && ipv6_chk && ipcksm) && cso) ? false : true;
622 }
623
624 static struct be_rx_page_info *
625 get_rx_page_info(struct be_adapter *adapter, u16 frag_idx)
626 {
627         struct be_rx_page_info *rx_page_info;
628         struct be_queue_info *rxq = &adapter->rx_obj.q;
629
630         rx_page_info = &adapter->rx_obj.page_info_tbl[frag_idx];
631         BUG_ON(!rx_page_info->page);
632
633         if (rx_page_info->last_page_user)
634                 pci_unmap_page(adapter->pdev, pci_unmap_addr(rx_page_info, bus),
635                         adapter->big_page_size, PCI_DMA_FROMDEVICE);
636
637         atomic_dec(&rxq->used);
638         return rx_page_info;
639 }
640
641 /* Throwaway the data in the Rx completion */
642 static void be_rx_compl_discard(struct be_adapter *adapter,
643                         struct be_eth_rx_compl *rxcp)
644 {
645         struct be_queue_info *rxq = &adapter->rx_obj.q;
646         struct be_rx_page_info *page_info;
647         u16 rxq_idx, i, num_rcvd;
648
649         rxq_idx = AMAP_GET_BITS(struct amap_eth_rx_compl, fragndx, rxcp);
650         num_rcvd = AMAP_GET_BITS(struct amap_eth_rx_compl, numfrags, rxcp);
651
652         for (i = 0; i < num_rcvd; i++) {
653                 page_info = get_rx_page_info(adapter, rxq_idx);
654                 put_page(page_info->page);
655                 memset(page_info, 0, sizeof(*page_info));
656                 index_inc(&rxq_idx, rxq->len);
657         }
658 }
659
660 /*
661  * skb_fill_rx_data forms a complete skb for an ether frame
662  * indicated by rxcp.
663  */
664 static void skb_fill_rx_data(struct be_adapter *adapter,
665                         struct sk_buff *skb, struct be_eth_rx_compl *rxcp)
666 {
667         struct be_queue_info *rxq = &adapter->rx_obj.q;
668         struct be_rx_page_info *page_info;
669         u16 rxq_idx, i, num_rcvd;
670         u32 pktsize, hdr_len, curr_frag_len;
671         u8 *start;
672
673         rxq_idx = AMAP_GET_BITS(struct amap_eth_rx_compl, fragndx, rxcp);
674         pktsize = AMAP_GET_BITS(struct amap_eth_rx_compl, pktsize, rxcp);
675         num_rcvd = AMAP_GET_BITS(struct amap_eth_rx_compl, numfrags, rxcp);
676
677         page_info = get_rx_page_info(adapter, rxq_idx);
678
679         start = page_address(page_info->page) + page_info->page_offset;
680         prefetch(start);
681
682         /* Copy data in the first descriptor of this completion */
683         curr_frag_len = min(pktsize, rx_frag_size);
684
685         /* Copy the header portion into skb_data */
686         hdr_len = min((u32)BE_HDR_LEN, curr_frag_len);
687         memcpy(skb->data, start, hdr_len);
688         skb->len = curr_frag_len;
689         if (curr_frag_len <= BE_HDR_LEN) { /* tiny packet */
690                 /* Complete packet has now been moved to data */
691                 put_page(page_info->page);
692                 skb->data_len = 0;
693                 skb->tail += curr_frag_len;
694         } else {
695                 skb_shinfo(skb)->nr_frags = 1;
696                 skb_shinfo(skb)->frags[0].page = page_info->page;
697                 skb_shinfo(skb)->frags[0].page_offset =
698                                         page_info->page_offset + hdr_len;
699                 skb_shinfo(skb)->frags[0].size = curr_frag_len - hdr_len;
700                 skb->data_len = curr_frag_len - hdr_len;
701                 skb->tail += hdr_len;
702         }
703         memset(page_info, 0, sizeof(*page_info));
704
705         if (pktsize <= rx_frag_size) {
706                 BUG_ON(num_rcvd != 1);
707                 goto done;
708         }
709
710         /* More frags present for this completion */
711         pktsize -= curr_frag_len; /* account for above copied frag */
712         for (i = 1; i < num_rcvd; i++) {
713                 index_inc(&rxq_idx, rxq->len);
714                 page_info = get_rx_page_info(adapter, rxq_idx);
715
716                 curr_frag_len = min(pktsize, rx_frag_size);
717
718                 skb_shinfo(skb)->frags[i].page = page_info->page;
719                 skb_shinfo(skb)->frags[i].page_offset = page_info->page_offset;
720                 skb_shinfo(skb)->frags[i].size = curr_frag_len;
721                 skb->len += curr_frag_len;
722                 skb->data_len += curr_frag_len;
723                 skb_shinfo(skb)->nr_frags++;
724                 pktsize -= curr_frag_len;
725
726                 memset(page_info, 0, sizeof(*page_info));
727         }
728
729 done:
730         be_rx_stats_update(adapter, pktsize, num_rcvd);
731         return;
732 }
733
734 /* Process the RX completion indicated by rxcp when LRO is disabled */
735 static void be_rx_compl_process(struct be_adapter *adapter,
736                         struct be_eth_rx_compl *rxcp)
737 {
738         struct sk_buff *skb;
739         u32 vtp, vid;
740
741         vtp = AMAP_GET_BITS(struct amap_eth_rx_compl, vtp, rxcp);
742
743         skb = netdev_alloc_skb(adapter->netdev, BE_HDR_LEN + NET_IP_ALIGN);
744         if (!skb) {
745                 if (net_ratelimit())
746                         dev_warn(&adapter->pdev->dev, "skb alloc failed\n");
747                 be_rx_compl_discard(adapter, rxcp);
748                 return;
749         }
750
751         skb_reserve(skb, NET_IP_ALIGN);
752
753         skb_fill_rx_data(adapter, skb, rxcp);
754
755         if (do_pkt_csum(rxcp, adapter->rx_csum))
756                 skb->ip_summed = CHECKSUM_NONE;
757         else
758                 skb->ip_summed = CHECKSUM_UNNECESSARY;
759
760         skb->truesize = skb->len + sizeof(struct sk_buff);
761         skb->protocol = eth_type_trans(skb, adapter->netdev);
762         skb->dev = adapter->netdev;
763
764         if (vtp) {
765                 if (!adapter->vlan_grp || adapter->num_vlans == 0) {
766                         kfree_skb(skb);
767                         return;
768                 }
769                 vid = AMAP_GET_BITS(struct amap_eth_rx_compl, vlan_tag, rxcp);
770                 vid = be16_to_cpu(vid);
771                 vlan_hwaccel_receive_skb(skb, adapter->vlan_grp, vid);
772         } else {
773                 netif_receive_skb(skb);
774         }
775
776         adapter->netdev->last_rx = jiffies;
777
778         return;
779 }
780
781 /* Process the RX completion indicated by rxcp when LRO is enabled */
782 static void be_rx_compl_process_lro(struct be_adapter *adapter,
783                         struct be_eth_rx_compl *rxcp)
784 {
785         struct be_rx_page_info *page_info;
786         struct skb_frag_struct rx_frags[BE_MAX_FRAGS_PER_FRAME];
787         struct be_queue_info *rxq = &adapter->rx_obj.q;
788         u32 num_rcvd, pkt_size, remaining, vlanf, curr_frag_len;
789         u16 i, rxq_idx = 0, vid;
790
791         num_rcvd = AMAP_GET_BITS(struct amap_eth_rx_compl, numfrags, rxcp);
792         pkt_size = AMAP_GET_BITS(struct amap_eth_rx_compl, pktsize, rxcp);
793         vlanf = AMAP_GET_BITS(struct amap_eth_rx_compl, vtp, rxcp);
794         rxq_idx = AMAP_GET_BITS(struct amap_eth_rx_compl, fragndx, rxcp);
795
796         remaining = pkt_size;
797         for (i = 0; i < num_rcvd; i++) {
798                 page_info = get_rx_page_info(adapter, rxq_idx);
799
800                 curr_frag_len = min(remaining, rx_frag_size);
801
802                 rx_frags[i].page = page_info->page;
803                 rx_frags[i].page_offset = page_info->page_offset;
804                 rx_frags[i].size = curr_frag_len;
805                 remaining -= curr_frag_len;
806
807                 index_inc(&rxq_idx, rxq->len);
808
809                 memset(page_info, 0, sizeof(*page_info));
810         }
811
812         if (likely(!vlanf)) {
813                 lro_receive_frags(&adapter->rx_obj.lro_mgr, rx_frags, pkt_size,
814                                 pkt_size, NULL, 0);
815         } else {
816                 vid = AMAP_GET_BITS(struct amap_eth_rx_compl, vlan_tag, rxcp);
817                 vid = be16_to_cpu(vid);
818
819                 if (!adapter->vlan_grp || adapter->num_vlans == 0)
820                         return;
821
822                 lro_vlan_hwaccel_receive_frags(&adapter->rx_obj.lro_mgr,
823                         rx_frags, pkt_size, pkt_size, adapter->vlan_grp,
824                         vid, NULL, 0);
825         }
826
827         be_rx_stats_update(adapter, pkt_size, num_rcvd);
828         return;
829 }
830
831 static struct be_eth_rx_compl *be_rx_compl_get(struct be_adapter *adapter)
832 {
833         struct be_eth_rx_compl *rxcp = queue_tail_node(&adapter->rx_obj.cq);
834
835         if (rxcp->dw[offsetof(struct amap_eth_rx_compl, valid) / 32] == 0)
836                 return NULL;
837
838         be_dws_le_to_cpu(rxcp, sizeof(*rxcp));
839
840         queue_tail_inc(&adapter->rx_obj.cq);
841         return rxcp;
842 }
843
844 /* To reset the valid bit, we need to reset the whole word as
845  * when walking the queue the valid entries are little-endian
846  * and invalid entries are host endian
847  */
848 static inline void be_rx_compl_reset(struct be_eth_rx_compl *rxcp)
849 {
850         rxcp->dw[offsetof(struct amap_eth_rx_compl, valid) / 32] = 0;
851 }
852
853 static inline struct page *be_alloc_pages(u32 size)
854 {
855         gfp_t alloc_flags = GFP_ATOMIC;
856         u32 order = get_order(size);
857         if (order > 0)
858                 alloc_flags |= __GFP_COMP;
859         return  alloc_pages(alloc_flags, order);
860 }
861
862 /*
863  * Allocate a page, split it to fragments of size rx_frag_size and post as
864  * receive buffers to BE
865  */
866 static void be_post_rx_frags(struct be_adapter *adapter)
867 {
868         struct be_rx_page_info *page_info_tbl = adapter->rx_obj.page_info_tbl;
869         struct be_rx_page_info *page_info = NULL;
870         struct be_queue_info *rxq = &adapter->rx_obj.q;
871         struct page *pagep = NULL;
872         struct be_eth_rx_d *rxd;
873         u64 page_dmaaddr = 0, frag_dmaaddr;
874         u32 posted, page_offset = 0;
875
876         page_info = &page_info_tbl[rxq->head];
877         for (posted = 0; posted < MAX_RX_POST && !page_info->page; posted++) {
878                 if (!pagep) {
879                         pagep = be_alloc_pages(adapter->big_page_size);
880                         if (unlikely(!pagep)) {
881                                 drvr_stats(adapter)->be_ethrx_post_fail++;
882                                 break;
883                         }
884                         page_dmaaddr = pci_map_page(adapter->pdev, pagep, 0,
885                                                 adapter->big_page_size,
886                                                 PCI_DMA_FROMDEVICE);
887                         page_info->page_offset = 0;
888                 } else {
889                         get_page(pagep);
890                         page_info->page_offset = page_offset + rx_frag_size;
891                 }
892                 page_offset = page_info->page_offset;
893                 page_info->page = pagep;
894                 pci_unmap_addr_set(page_info, bus, page_dmaaddr);
895                 frag_dmaaddr = page_dmaaddr + page_info->page_offset;
896
897                 rxd = queue_head_node(rxq);
898                 rxd->fragpa_lo = cpu_to_le32(frag_dmaaddr & 0xFFFFFFFF);
899                 rxd->fragpa_hi = cpu_to_le32(upper_32_bits(frag_dmaaddr));
900                 queue_head_inc(rxq);
901
902                 /* Any space left in the current big page for another frag? */
903                 if ((page_offset + rx_frag_size + rx_frag_size) >
904                                         adapter->big_page_size) {
905                         pagep = NULL;
906                         page_info->last_page_user = true;
907                 }
908                 page_info = &page_info_tbl[rxq->head];
909         }
910         if (pagep)
911                 page_info->last_page_user = true;
912
913         if (posted) {
914                 atomic_add(posted, &rxq->used);
915                 be_rxq_notify(&adapter->ctrl, rxq->id, posted);
916         } else if (atomic_read(&rxq->used) == 0) {
917                 /* Let be_worker replenish when memory is available */
918                 adapter->rx_post_starved = true;
919         }
920
921         return;
922 }
923
924 static struct be_eth_tx_compl *be_tx_compl_get(struct be_queue_info *tx_cq)
925 {
926         struct be_eth_tx_compl *txcp = queue_tail_node(tx_cq);
927
928         if (txcp->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] == 0)
929                 return NULL;
930
931         be_dws_le_to_cpu(txcp, sizeof(*txcp));
932
933         txcp->dw[offsetof(struct amap_eth_tx_compl, valid) / 32] = 0;
934
935         queue_tail_inc(tx_cq);
936         return txcp;
937 }
938
939 static void be_tx_compl_process(struct be_adapter *adapter, u16 last_index)
940 {
941         struct be_queue_info *txq = &adapter->tx_obj.q;
942         struct be_eth_wrb *wrb;
943         struct sk_buff **sent_skbs = adapter->tx_obj.sent_skb_list;
944         struct sk_buff *sent_skb;
945         u64 busaddr;
946         u16 cur_index, num_wrbs = 0;
947
948         cur_index = txq->tail;
949         sent_skb = sent_skbs[cur_index];
950         BUG_ON(!sent_skb);
951         sent_skbs[cur_index] = NULL;
952
953         do {
954                 cur_index = txq->tail;
955                 wrb = queue_tail_node(txq);
956                 be_dws_le_to_cpu(wrb, sizeof(*wrb));
957                 busaddr = ((u64)wrb->frag_pa_hi << 32) | (u64)wrb->frag_pa_lo;
958                 if (busaddr != 0) {
959                         pci_unmap_single(adapter->pdev, busaddr,
960                                 wrb->frag_len, PCI_DMA_TODEVICE);
961                 }
962                 num_wrbs++;
963                 queue_tail_inc(txq);
964         } while (cur_index != last_index);
965
966         atomic_sub(num_wrbs, &txq->used);
967
968         kfree_skb(sent_skb);
969 }
970
971 static void be_rx_q_clean(struct be_adapter *adapter)
972 {
973         struct be_rx_page_info *page_info;
974         struct be_queue_info *rxq = &adapter->rx_obj.q;
975         struct be_queue_info *rx_cq = &adapter->rx_obj.cq;
976         struct be_eth_rx_compl *rxcp;
977         u16 tail;
978
979         /* First cleanup pending rx completions */
980         while ((rxcp = be_rx_compl_get(adapter)) != NULL) {
981                 be_rx_compl_discard(adapter, rxcp);
982                 be_rx_compl_reset(rxcp);
983                 be_cq_notify(&adapter->ctrl, rx_cq->id, true, 1);
984         }
985
986         /* Then free posted rx buffer that were not used */
987         tail = (rxq->head + rxq->len - atomic_read(&rxq->used)) % rxq->len;
988         for (; tail != rxq->head; index_inc(&tail, rxq->len)) {
989                 page_info = get_rx_page_info(adapter, tail);
990                 put_page(page_info->page);
991                 memset(page_info, 0, sizeof(*page_info));
992         }
993         BUG_ON(atomic_read(&rxq->used));
994 }
995
996 static void be_tx_q_clean(struct be_adapter *adapter)
997 {
998         struct sk_buff **sent_skbs = adapter->tx_obj.sent_skb_list;
999         struct sk_buff *sent_skb;
1000         struct be_queue_info *txq = &adapter->tx_obj.q;
1001         u16 last_index;
1002         bool dummy_wrb;
1003
1004         while (atomic_read(&txq->used)) {
1005                 sent_skb = sent_skbs[txq->tail];
1006                 last_index = txq->tail;
1007                 index_adv(&last_index,
1008                         wrb_cnt_for_skb(sent_skb, &dummy_wrb) - 1, txq->len);
1009                 be_tx_compl_process(adapter, last_index);
1010         }
1011 }
1012
1013 static void be_mcc_queues_destroy(struct be_adapter *adapter)
1014 {
1015         struct be_queue_info *q;
1016         struct be_ctrl_info *ctrl = &adapter->ctrl;
1017
1018         q = &ctrl->mcc_obj.q;
1019         if (q->created)
1020                 be_cmd_q_destroy(ctrl, q, QTYPE_MCCQ);
1021         be_queue_free(adapter, q);
1022
1023         q = &ctrl->mcc_obj.cq;
1024         if (q->created)
1025                 be_cmd_q_destroy(ctrl, q, QTYPE_CQ);
1026         be_queue_free(adapter, q);
1027 }
1028
1029 /* Must be called only after TX qs are created as MCC shares TX EQ */
1030 static int be_mcc_queues_create(struct be_adapter *adapter)
1031 {
1032         struct be_queue_info *q, *cq;
1033         struct be_ctrl_info *ctrl = &adapter->ctrl;
1034
1035         /* Alloc MCC compl queue */
1036         cq = &ctrl->mcc_obj.cq;
1037         if (be_queue_alloc(adapter, cq, MCC_CQ_LEN,
1038                         sizeof(struct be_mcc_cq_entry)))
1039                 goto err;
1040
1041         /* Ask BE to create MCC compl queue; share TX's eq */
1042         if (be_cmd_cq_create(ctrl, cq, &adapter->tx_eq.q, false, true, 0))
1043                 goto mcc_cq_free;
1044
1045         /* Alloc MCC queue */
1046         q = &ctrl->mcc_obj.q;
1047         if (be_queue_alloc(adapter, q, MCC_Q_LEN, sizeof(struct be_mcc_wrb)))
1048                 goto mcc_cq_destroy;
1049
1050         /* Ask BE to create MCC queue */
1051         if (be_cmd_mccq_create(ctrl, q, cq))
1052                 goto mcc_q_free;
1053
1054         return 0;
1055
1056 mcc_q_free:
1057         be_queue_free(adapter, q);
1058 mcc_cq_destroy:
1059         be_cmd_q_destroy(ctrl, cq, QTYPE_CQ);
1060 mcc_cq_free:
1061         be_queue_free(adapter, cq);
1062 err:
1063         return -1;
1064 }
1065
1066 static void be_tx_queues_destroy(struct be_adapter *adapter)
1067 {
1068         struct be_queue_info *q;
1069
1070         q = &adapter->tx_obj.q;
1071         if (q->created) {
1072                 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_TXQ);
1073
1074                 /* No more tx completions can be rcvd now; clean up if there
1075                  * are any pending completions or pending tx requests */
1076                 be_tx_q_clean(adapter);
1077         }
1078         be_queue_free(adapter, q);
1079
1080         q = &adapter->tx_obj.cq;
1081         if (q->created)
1082                 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_CQ);
1083         be_queue_free(adapter, q);
1084
1085         q = &adapter->tx_eq.q;
1086         if (q->created)
1087                 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_EQ);
1088         be_queue_free(adapter, q);
1089 }
1090
1091 static int be_tx_queues_create(struct be_adapter *adapter)
1092 {
1093         struct be_queue_info *eq, *q, *cq;
1094
1095         adapter->tx_eq.max_eqd = 0;
1096         adapter->tx_eq.min_eqd = 0;
1097         adapter->tx_eq.cur_eqd = 96;
1098         adapter->tx_eq.enable_aic = false;
1099         /* Alloc Tx Event queue */
1100         eq = &adapter->tx_eq.q;
1101         if (be_queue_alloc(adapter, eq, EVNT_Q_LEN, sizeof(struct be_eq_entry)))
1102                 return -1;
1103
1104         /* Ask BE to create Tx Event queue */
1105         if (be_cmd_eq_create(&adapter->ctrl, eq, adapter->tx_eq.cur_eqd))
1106                 goto tx_eq_free;
1107         /* Alloc TX eth compl queue */
1108         cq = &adapter->tx_obj.cq;
1109         if (be_queue_alloc(adapter, cq, TX_CQ_LEN,
1110                         sizeof(struct be_eth_tx_compl)))
1111                 goto tx_eq_destroy;
1112
1113         /* Ask BE to create Tx eth compl queue */
1114         if (be_cmd_cq_create(&adapter->ctrl, cq, eq, false, false, 3))
1115                 goto tx_cq_free;
1116
1117         /* Alloc TX eth queue */
1118         q = &adapter->tx_obj.q;
1119         if (be_queue_alloc(adapter, q, TX_Q_LEN, sizeof(struct be_eth_wrb)))
1120                 goto tx_cq_destroy;
1121
1122         /* Ask BE to create Tx eth queue */
1123         if (be_cmd_txq_create(&adapter->ctrl, q, cq))
1124                 goto tx_q_free;
1125         return 0;
1126
1127 tx_q_free:
1128         be_queue_free(adapter, q);
1129 tx_cq_destroy:
1130         be_cmd_q_destroy(&adapter->ctrl, cq, QTYPE_CQ);
1131 tx_cq_free:
1132         be_queue_free(adapter, cq);
1133 tx_eq_destroy:
1134         be_cmd_q_destroy(&adapter->ctrl, eq, QTYPE_EQ);
1135 tx_eq_free:
1136         be_queue_free(adapter, eq);
1137         return -1;
1138 }
1139
1140 static void be_rx_queues_destroy(struct be_adapter *adapter)
1141 {
1142         struct be_queue_info *q;
1143
1144         q = &adapter->rx_obj.q;
1145         if (q->created) {
1146                 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_RXQ);
1147                 be_rx_q_clean(adapter);
1148         }
1149         be_queue_free(adapter, q);
1150
1151         q = &adapter->rx_obj.cq;
1152         if (q->created)
1153                 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_CQ);
1154         be_queue_free(adapter, q);
1155
1156         q = &adapter->rx_eq.q;
1157         if (q->created)
1158                 be_cmd_q_destroy(&adapter->ctrl, q, QTYPE_EQ);
1159         be_queue_free(adapter, q);
1160 }
1161
1162 static int be_rx_queues_create(struct be_adapter *adapter)
1163 {
1164         struct be_queue_info *eq, *q, *cq;
1165         int rc;
1166
1167         adapter->max_rx_coal = BE_MAX_FRAGS_PER_FRAME;
1168         adapter->big_page_size = (1 << get_order(rx_frag_size)) * PAGE_SIZE;
1169         adapter->rx_eq.max_eqd = BE_MAX_EQD;
1170         adapter->rx_eq.min_eqd = 0;
1171         adapter->rx_eq.cur_eqd = 0;
1172         adapter->rx_eq.enable_aic = true;
1173
1174         /* Alloc Rx Event queue */
1175         eq = &adapter->rx_eq.q;
1176         rc = be_queue_alloc(adapter, eq, EVNT_Q_LEN,
1177                                 sizeof(struct be_eq_entry));
1178         if (rc)
1179                 return rc;
1180
1181         /* Ask BE to create Rx Event queue */
1182         rc = be_cmd_eq_create(&adapter->ctrl, eq, adapter->rx_eq.cur_eqd);
1183         if (rc)
1184                 goto rx_eq_free;
1185
1186         /* Alloc RX eth compl queue */
1187         cq = &adapter->rx_obj.cq;
1188         rc = be_queue_alloc(adapter, cq, RX_CQ_LEN,
1189                         sizeof(struct be_eth_rx_compl));
1190         if (rc)
1191                 goto rx_eq_destroy;
1192
1193         /* Ask BE to create Rx eth compl queue */
1194         rc = be_cmd_cq_create(&adapter->ctrl, cq, eq, false, false, 3);
1195         if (rc)
1196                 goto rx_cq_free;
1197
1198         /* Alloc RX eth queue */
1199         q = &adapter->rx_obj.q;
1200         rc = be_queue_alloc(adapter, q, RX_Q_LEN, sizeof(struct be_eth_rx_d));
1201         if (rc)
1202                 goto rx_cq_destroy;
1203
1204         /* Ask BE to create Rx eth queue */
1205         rc = be_cmd_rxq_create(&adapter->ctrl, q, cq->id, rx_frag_size,
1206                 BE_MAX_JUMBO_FRAME_SIZE, adapter->if_handle, false);
1207         if (rc)
1208                 goto rx_q_free;
1209
1210         return 0;
1211 rx_q_free:
1212         be_queue_free(adapter, q);
1213 rx_cq_destroy:
1214         be_cmd_q_destroy(&adapter->ctrl, cq, QTYPE_CQ);
1215 rx_cq_free:
1216         be_queue_free(adapter, cq);
1217 rx_eq_destroy:
1218         be_cmd_q_destroy(&adapter->ctrl, eq, QTYPE_EQ);
1219 rx_eq_free:
1220         be_queue_free(adapter, eq);
1221         return rc;
1222 }
1223 static bool event_get(struct be_eq_obj *eq_obj, u16 *rid)
1224 {
1225         struct be_eq_entry *entry = queue_tail_node(&eq_obj->q);
1226         u32 evt = entry->evt;
1227
1228         if (!evt)
1229                 return false;
1230
1231         evt = le32_to_cpu(evt);
1232         *rid = (evt >> EQ_ENTRY_RES_ID_SHIFT) & EQ_ENTRY_RES_ID_MASK;
1233         entry->evt = 0;
1234         queue_tail_inc(&eq_obj->q);
1235         return true;
1236 }
1237
1238 static int event_handle(struct be_ctrl_info *ctrl,
1239                         struct be_eq_obj *eq_obj)
1240 {
1241         u16 rid = 0, num = 0;
1242
1243         while (event_get(eq_obj, &rid))
1244                 num++;
1245
1246         /* We can see an interrupt and no event */
1247         be_eq_notify(ctrl, eq_obj->q.id, true, true, num);
1248         if (num)
1249                 napi_schedule(&eq_obj->napi);
1250
1251         return num;
1252 }
1253
1254 static irqreturn_t be_intx(int irq, void *dev)
1255 {
1256         struct be_adapter *adapter = dev;
1257         struct be_ctrl_info *ctrl = &adapter->ctrl;
1258         int rx, tx;
1259
1260         tx = event_handle(ctrl, &adapter->tx_eq);
1261         rx = event_handle(ctrl, &adapter->rx_eq);
1262
1263         if (rx || tx)
1264                 return IRQ_HANDLED;
1265         else
1266                 return IRQ_NONE;
1267 }
1268
1269 static irqreturn_t be_msix_rx(int irq, void *dev)
1270 {
1271         struct be_adapter *adapter = dev;
1272
1273         event_handle(&adapter->ctrl, &adapter->rx_eq);
1274
1275         return IRQ_HANDLED;
1276 }
1277
1278 static irqreturn_t be_msix_tx_mcc(int irq, void *dev)
1279 {
1280         struct be_adapter *adapter = dev;
1281
1282         event_handle(&adapter->ctrl, &adapter->tx_eq);
1283
1284         return IRQ_HANDLED;
1285 }
1286
1287 static inline bool do_lro(struct be_adapter *adapter,
1288                         struct be_eth_rx_compl *rxcp)
1289 {
1290         int err = AMAP_GET_BITS(struct amap_eth_rx_compl, err, rxcp);
1291         int tcp_frame = AMAP_GET_BITS(struct amap_eth_rx_compl, tcpf, rxcp);
1292
1293         if (err)
1294                 drvr_stats(adapter)->be_rxcp_err++;
1295
1296         return (!tcp_frame || err || (adapter->max_rx_coal <= 1)) ?
1297                 false : true;
1298 }
1299
1300 int be_poll_rx(struct napi_struct *napi, int budget)
1301 {
1302         struct be_eq_obj *rx_eq = container_of(napi, struct be_eq_obj, napi);
1303         struct be_adapter *adapter =
1304                 container_of(rx_eq, struct be_adapter, rx_eq);
1305         struct be_queue_info *rx_cq = &adapter->rx_obj.cq;
1306         struct be_eth_rx_compl *rxcp;
1307         u32 work_done;
1308
1309         for (work_done = 0; work_done < budget; work_done++) {
1310                 rxcp = be_rx_compl_get(adapter);
1311                 if (!rxcp)
1312                         break;
1313
1314                 if (do_lro(adapter, rxcp))
1315                         be_rx_compl_process_lro(adapter, rxcp);
1316                 else
1317                         be_rx_compl_process(adapter, rxcp);
1318
1319                 be_rx_compl_reset(rxcp);
1320         }
1321
1322         lro_flush_all(&adapter->rx_obj.lro_mgr);
1323
1324         /* Refill the queue */
1325         if (atomic_read(&adapter->rx_obj.q.used) < RX_FRAGS_REFILL_WM)
1326                 be_post_rx_frags(adapter);
1327
1328         /* All consumed */
1329         if (work_done < budget) {
1330                 napi_complete(napi);
1331                 be_cq_notify(&adapter->ctrl, rx_cq->id, true, work_done);
1332         } else {
1333                 /* More to be consumed; continue with interrupts disabled */
1334                 be_cq_notify(&adapter->ctrl, rx_cq->id, false, work_done);
1335         }
1336         return work_done;
1337 }
1338
1339 void be_process_tx(struct be_adapter *adapter)
1340 {
1341         struct be_queue_info *txq = &adapter->tx_obj.q;
1342         struct be_queue_info *tx_cq = &adapter->tx_obj.cq;
1343         struct be_eth_tx_compl *txcp;
1344         u32 num_cmpl = 0;
1345         u16 end_idx;
1346
1347         while ((txcp = be_tx_compl_get(tx_cq))) {
1348                 end_idx = AMAP_GET_BITS(struct amap_eth_tx_compl,
1349                                         wrb_index, txcp);
1350                 be_tx_compl_process(adapter, end_idx);
1351                 num_cmpl++;
1352         }
1353
1354         if (num_cmpl) {
1355                 be_cq_notify(&adapter->ctrl, tx_cq->id, true, num_cmpl);
1356
1357                 /* As Tx wrbs have been freed up, wake up netdev queue if
1358                  * it was stopped due to lack of tx wrbs.
1359                  */
1360                 if (netif_queue_stopped(adapter->netdev) &&
1361                         atomic_read(&txq->used) < txq->len / 2) {
1362                         netif_wake_queue(adapter->netdev);
1363                 }
1364
1365                 drvr_stats(adapter)->be_tx_events++;
1366                 drvr_stats(adapter)->be_tx_compl += num_cmpl;
1367         }
1368 }
1369
1370 /* As TX and MCC share the same EQ check for both TX and MCC completions.
1371  * For TX/MCC we don't honour budget; consume everything
1372  */
1373 static int be_poll_tx_mcc(struct napi_struct *napi, int budget)
1374 {
1375         struct be_eq_obj *tx_eq = container_of(napi, struct be_eq_obj, napi);
1376         struct be_adapter *adapter =
1377                 container_of(tx_eq, struct be_adapter, tx_eq);
1378
1379         napi_complete(napi);
1380
1381         be_process_tx(adapter);
1382
1383         be_process_mcc(&adapter->ctrl);
1384
1385         return 1;
1386 }
1387
1388 static void be_worker(struct work_struct *work)
1389 {
1390         struct be_adapter *adapter =
1391                 container_of(work, struct be_adapter, work.work);
1392         int status;
1393
1394         /* Get Stats */
1395         status = be_cmd_get_stats(&adapter->ctrl, &adapter->stats.cmd);
1396         if (!status)
1397                 netdev_stats_update(adapter);
1398
1399         /* Set EQ delay */
1400         be_rx_eqd_update(adapter);
1401
1402         be_tx_rate_update(adapter);
1403         be_rx_rate_update(adapter);
1404
1405         if (adapter->rx_post_starved) {
1406                 adapter->rx_post_starved = false;
1407                 be_post_rx_frags(adapter);
1408         }
1409
1410         schedule_delayed_work(&adapter->work, msecs_to_jiffies(1000));
1411 }
1412
1413 static void be_msix_enable(struct be_adapter *adapter)
1414 {
1415         int i, status;
1416
1417         for (i = 0; i < BE_NUM_MSIX_VECTORS; i++)
1418                 adapter->msix_entries[i].entry = i;
1419
1420         status = pci_enable_msix(adapter->pdev, adapter->msix_entries,
1421                 BE_NUM_MSIX_VECTORS);
1422         if (status == 0)
1423                 adapter->msix_enabled = true;
1424         return;
1425 }
1426
1427 static inline int be_msix_vec_get(struct be_adapter *adapter, u32 eq_id)
1428 {
1429         return adapter->msix_entries[eq_id -
1430                         8 * adapter->ctrl.pci_func].vector;
1431 }
1432
1433 static int be_msix_register(struct be_adapter *adapter)
1434 {
1435         struct net_device *netdev = adapter->netdev;
1436         struct be_eq_obj *tx_eq = &adapter->tx_eq;
1437         struct be_eq_obj *rx_eq = &adapter->rx_eq;
1438         int status, vec;
1439
1440         sprintf(tx_eq->desc, "%s-tx", netdev->name);
1441         vec = be_msix_vec_get(adapter, tx_eq->q.id);
1442         status = request_irq(vec, be_msix_tx_mcc, 0, tx_eq->desc, adapter);
1443         if (status)
1444                 goto err;
1445
1446         sprintf(rx_eq->desc, "%s-rx", netdev->name);
1447         vec = be_msix_vec_get(adapter, rx_eq->q.id);
1448         status = request_irq(vec, be_msix_rx, 0, rx_eq->desc, adapter);
1449         if (status) { /* Free TX IRQ */
1450                 vec = be_msix_vec_get(adapter, tx_eq->q.id);
1451                 free_irq(vec, adapter);
1452                 goto err;
1453         }
1454         return 0;
1455 err:
1456         dev_warn(&adapter->pdev->dev,
1457                 "MSIX Request IRQ failed - err %d\n", status);
1458         pci_disable_msix(adapter->pdev);
1459         adapter->msix_enabled = false;
1460         return status;
1461 }
1462
1463 static int be_irq_register(struct be_adapter *adapter)
1464 {
1465         struct net_device *netdev = adapter->netdev;
1466         int status;
1467
1468         if (adapter->msix_enabled) {
1469                 status = be_msix_register(adapter);
1470                 if (status == 0)
1471                         goto done;
1472         }
1473
1474         /* INTx */
1475         netdev->irq = adapter->pdev->irq;
1476         status = request_irq(netdev->irq, be_intx, IRQF_SHARED, netdev->name,
1477                         adapter);
1478         if (status) {
1479                 dev_err(&adapter->pdev->dev,
1480                         "INTx request IRQ failed - err %d\n", status);
1481                 return status;
1482         }
1483 done:
1484         adapter->isr_registered = true;
1485         return 0;
1486 }
1487
1488 static void be_irq_unregister(struct be_adapter *adapter)
1489 {
1490         struct net_device *netdev = adapter->netdev;
1491         int vec;
1492
1493         if (!adapter->isr_registered)
1494                 return;
1495
1496         /* INTx */
1497         if (!adapter->msix_enabled) {
1498                 free_irq(netdev->irq, adapter);
1499                 goto done;
1500         }
1501
1502         /* MSIx */
1503         vec = be_msix_vec_get(adapter, adapter->tx_eq.q.id);
1504         free_irq(vec, adapter);
1505         vec = be_msix_vec_get(adapter, adapter->rx_eq.q.id);
1506         free_irq(vec, adapter);
1507 done:
1508         adapter->isr_registered = false;
1509         return;
1510 }
1511
1512 static int be_open(struct net_device *netdev)
1513 {
1514         struct be_adapter *adapter = netdev_priv(netdev);
1515         struct be_ctrl_info *ctrl = &adapter->ctrl;
1516         struct be_eq_obj *rx_eq = &adapter->rx_eq;
1517         struct be_eq_obj *tx_eq = &adapter->tx_eq;
1518         bool link_up;
1519         int status;
1520
1521         /* First time posting */
1522         be_post_rx_frags(adapter);
1523
1524         napi_enable(&rx_eq->napi);
1525         napi_enable(&tx_eq->napi);
1526
1527         be_irq_register(adapter);
1528
1529         be_intr_set(ctrl, true);
1530
1531         /* The evt queues are created in unarmed state; arm them */
1532         be_eq_notify(ctrl, rx_eq->q.id, true, false, 0);
1533         be_eq_notify(ctrl, tx_eq->q.id, true, false, 0);
1534
1535         /* Rx compl queue may be in unarmed state; rearm it */
1536         be_cq_notify(ctrl, adapter->rx_obj.cq.id, true, 0);
1537
1538         status = be_cmd_link_status_query(ctrl, &link_up);
1539         if (status)
1540                 return status;
1541         be_link_status_update(adapter, link_up);
1542
1543         schedule_delayed_work(&adapter->work, msecs_to_jiffies(100));
1544         return 0;
1545 }
1546
1547 static int be_setup(struct be_adapter *adapter)
1548 {
1549         struct be_ctrl_info *ctrl = &adapter->ctrl;
1550         struct net_device *netdev = adapter->netdev;
1551         u32 if_flags;
1552         int status;
1553
1554         if_flags = BE_IF_FLAGS_BROADCAST | BE_IF_FLAGS_PROMISCUOUS |
1555                 BE_IF_FLAGS_MCAST_PROMISCUOUS | BE_IF_FLAGS_UNTAGGED |
1556                 BE_IF_FLAGS_PASS_L3L4_ERRORS;
1557         status = be_cmd_if_create(ctrl, if_flags, netdev->dev_addr,
1558                         false/* pmac_invalid */, &adapter->if_handle,
1559                         &adapter->pmac_id);
1560         if (status != 0)
1561                 goto do_none;
1562
1563         be_vid_config(netdev);
1564
1565         status = be_cmd_set_flow_control(ctrl, true, true);
1566         if (status != 0)
1567                 goto if_destroy;
1568
1569         status = be_tx_queues_create(adapter);
1570         if (status != 0)
1571                 goto if_destroy;
1572
1573         status = be_rx_queues_create(adapter);
1574         if (status != 0)
1575                 goto tx_qs_destroy;
1576
1577         status = be_mcc_queues_create(adapter);
1578         if (status != 0)
1579                 goto rx_qs_destroy;
1580
1581         return 0;
1582
1583 rx_qs_destroy:
1584         be_rx_queues_destroy(adapter);
1585 tx_qs_destroy:
1586         be_tx_queues_destroy(adapter);
1587 if_destroy:
1588         be_cmd_if_destroy(ctrl, adapter->if_handle);
1589 do_none:
1590         return status;
1591 }
1592
1593 static int be_clear(struct be_adapter *adapter)
1594 {
1595         struct be_ctrl_info *ctrl = &adapter->ctrl;
1596
1597         be_rx_queues_destroy(adapter);
1598         be_tx_queues_destroy(adapter);
1599
1600         be_cmd_if_destroy(ctrl, adapter->if_handle);
1601
1602         be_mcc_queues_destroy(adapter);
1603         return 0;
1604 }
1605
1606 static int be_close(struct net_device *netdev)
1607 {
1608         struct be_adapter *adapter = netdev_priv(netdev);
1609         struct be_ctrl_info *ctrl = &adapter->ctrl;
1610         struct be_eq_obj *rx_eq = &adapter->rx_eq;
1611         struct be_eq_obj *tx_eq = &adapter->tx_eq;
1612         int vec;
1613
1614         cancel_delayed_work_sync(&adapter->work);
1615
1616         netif_stop_queue(netdev);
1617         netif_carrier_off(netdev);
1618         adapter->link_up = false;
1619
1620         be_intr_set(ctrl, false);
1621
1622         if (adapter->msix_enabled) {
1623                 vec = be_msix_vec_get(adapter, tx_eq->q.id);
1624                 synchronize_irq(vec);
1625                 vec = be_msix_vec_get(adapter, rx_eq->q.id);
1626                 synchronize_irq(vec);
1627         } else {
1628                 synchronize_irq(netdev->irq);
1629         }
1630         be_irq_unregister(adapter);
1631
1632         napi_disable(&rx_eq->napi);
1633         napi_disable(&tx_eq->napi);
1634
1635         return 0;
1636 }
1637
1638 static int be_get_frag_header(struct skb_frag_struct *frag, void **mac_hdr,
1639                                 void **ip_hdr, void **tcpudp_hdr,
1640                                 u64 *hdr_flags, void *priv)
1641 {
1642         struct ethhdr *eh;
1643         struct vlan_ethhdr *veh;
1644         struct iphdr *iph;
1645         u8 *va = page_address(frag->page) + frag->page_offset;
1646         unsigned long ll_hlen;
1647
1648         prefetch(va);
1649         eh = (struct ethhdr *)va;
1650         *mac_hdr = eh;
1651         ll_hlen = ETH_HLEN;
1652         if (eh->h_proto != htons(ETH_P_IP)) {
1653                 if (eh->h_proto == htons(ETH_P_8021Q)) {
1654                         veh = (struct vlan_ethhdr *)va;
1655                         if (veh->h_vlan_encapsulated_proto != htons(ETH_P_IP))
1656                                 return -1;
1657
1658                         ll_hlen += VLAN_HLEN;
1659                 } else {
1660                         return -1;
1661                 }
1662         }
1663         *hdr_flags = LRO_IPV4;
1664         iph = (struct iphdr *)(va + ll_hlen);
1665         *ip_hdr = iph;
1666         if (iph->protocol != IPPROTO_TCP)
1667                 return -1;
1668         *hdr_flags |= LRO_TCP;
1669         *tcpudp_hdr = (u8 *) (*ip_hdr) + (iph->ihl << 2);
1670
1671         return 0;
1672 }
1673
1674 static void be_lro_init(struct be_adapter *adapter, struct net_device *netdev)
1675 {
1676         struct net_lro_mgr *lro_mgr;
1677
1678         lro_mgr = &adapter->rx_obj.lro_mgr;
1679         lro_mgr->dev = netdev;
1680         lro_mgr->features = LRO_F_NAPI;
1681         lro_mgr->ip_summed = CHECKSUM_UNNECESSARY;
1682         lro_mgr->ip_summed_aggr = CHECKSUM_UNNECESSARY;
1683         lro_mgr->max_desc = BE_MAX_LRO_DESCRIPTORS;
1684         lro_mgr->lro_arr = adapter->rx_obj.lro_desc;
1685         lro_mgr->get_frag_header = be_get_frag_header;
1686         lro_mgr->max_aggr = BE_MAX_FRAGS_PER_FRAME;
1687 }
1688
1689 static struct net_device_ops be_netdev_ops = {
1690         .ndo_open               = be_open,
1691         .ndo_stop               = be_close,
1692         .ndo_start_xmit         = be_xmit,
1693         .ndo_get_stats          = be_get_stats,
1694         .ndo_set_rx_mode        = be_set_multicast_list,
1695         .ndo_set_mac_address    = be_mac_addr_set,
1696         .ndo_change_mtu         = be_change_mtu,
1697         .ndo_validate_addr      = eth_validate_addr,
1698         .ndo_vlan_rx_register   = be_vlan_register,
1699         .ndo_vlan_rx_add_vid    = be_vlan_add_vid,
1700         .ndo_vlan_rx_kill_vid   = be_vlan_rem_vid,
1701 };
1702
1703 static void be_netdev_init(struct net_device *netdev)
1704 {
1705         struct be_adapter *adapter = netdev_priv(netdev);
1706
1707         netdev->features |= NETIF_F_SG | NETIF_F_HW_VLAN_RX | NETIF_F_TSO |
1708                 NETIF_F_HW_VLAN_TX | NETIF_F_HW_VLAN_FILTER | NETIF_F_IP_CSUM |
1709                 NETIF_F_IPV6_CSUM;
1710
1711         netdev->flags |= IFF_MULTICAST;
1712
1713         adapter->rx_csum = true;
1714
1715         BE_SET_NETDEV_OPS(netdev, &be_netdev_ops);
1716
1717         SET_ETHTOOL_OPS(netdev, &be_ethtool_ops);
1718
1719         be_lro_init(adapter, netdev);
1720
1721         netif_napi_add(netdev, &adapter->rx_eq.napi, be_poll_rx,
1722                 BE_NAPI_WEIGHT);
1723         netif_napi_add(netdev, &adapter->tx_eq.napi, be_poll_tx_mcc,
1724                 BE_NAPI_WEIGHT);
1725
1726         netif_carrier_off(netdev);
1727         netif_stop_queue(netdev);
1728 }
1729
1730 static void be_unmap_pci_bars(struct be_adapter *adapter)
1731 {
1732         struct be_ctrl_info *ctrl = &adapter->ctrl;
1733         if (ctrl->csr)
1734                 iounmap(ctrl->csr);
1735         if (ctrl->db)
1736                 iounmap(ctrl->db);
1737         if (ctrl->pcicfg)
1738                 iounmap(ctrl->pcicfg);
1739 }
1740
1741 static int be_map_pci_bars(struct be_adapter *adapter)
1742 {
1743         u8 __iomem *addr;
1744
1745         addr = ioremap_nocache(pci_resource_start(adapter->pdev, 2),
1746                         pci_resource_len(adapter->pdev, 2));
1747         if (addr == NULL)
1748                 return -ENOMEM;
1749         adapter->ctrl.csr = addr;
1750
1751         addr = ioremap_nocache(pci_resource_start(adapter->pdev, 4),
1752                         128 * 1024);
1753         if (addr == NULL)
1754                 goto pci_map_err;
1755         adapter->ctrl.db = addr;
1756
1757         addr = ioremap_nocache(pci_resource_start(adapter->pdev, 1),
1758                         pci_resource_len(adapter->pdev, 1));
1759         if (addr == NULL)
1760                 goto pci_map_err;
1761         adapter->ctrl.pcicfg = addr;
1762
1763         return 0;
1764 pci_map_err:
1765         be_unmap_pci_bars(adapter);
1766         return -ENOMEM;
1767 }
1768
1769
1770 static void be_ctrl_cleanup(struct be_adapter *adapter)
1771 {
1772         struct be_dma_mem *mem = &adapter->ctrl.mbox_mem_alloced;
1773
1774         be_unmap_pci_bars(adapter);
1775
1776         if (mem->va)
1777                 pci_free_consistent(adapter->pdev, mem->size,
1778                         mem->va, mem->dma);
1779 }
1780
1781 /* Initialize the mbox required to send cmds to BE */
1782 static int be_ctrl_init(struct be_adapter *adapter)
1783 {
1784         struct be_ctrl_info *ctrl = &adapter->ctrl;
1785         struct be_dma_mem *mbox_mem_alloc = &ctrl->mbox_mem_alloced;
1786         struct be_dma_mem *mbox_mem_align = &ctrl->mbox_mem;
1787         int status;
1788         u32 val;
1789
1790         status = be_map_pci_bars(adapter);
1791         if (status)
1792                 return status;
1793
1794         mbox_mem_alloc->size = sizeof(struct be_mcc_mailbox) + 16;
1795         mbox_mem_alloc->va = pci_alloc_consistent(adapter->pdev,
1796                                 mbox_mem_alloc->size, &mbox_mem_alloc->dma);
1797         if (!mbox_mem_alloc->va) {
1798                 be_unmap_pci_bars(adapter);
1799                 return -1;
1800         }
1801         mbox_mem_align->size = sizeof(struct be_mcc_mailbox);
1802         mbox_mem_align->va = PTR_ALIGN(mbox_mem_alloc->va, 16);
1803         mbox_mem_align->dma = PTR_ALIGN(mbox_mem_alloc->dma, 16);
1804         memset(mbox_mem_align->va, 0, sizeof(struct be_mcc_mailbox));
1805         spin_lock_init(&ctrl->mbox_lock);
1806         spin_lock_init(&ctrl->mcc_lock);
1807         spin_lock_init(&ctrl->mcc_cq_lock);
1808
1809         ctrl->async_cb = be_link_status_update;
1810         ctrl->adapter_ctxt = adapter;
1811
1812         val = ioread32(ctrl->pcicfg + PCICFG_MEMBAR_CTRL_INT_CTRL_OFFSET);
1813         ctrl->pci_func = (val >> MEMBAR_CTRL_INT_CTRL_PFUNC_SHIFT) &
1814                                         MEMBAR_CTRL_INT_CTRL_PFUNC_MASK;
1815         return 0;
1816 }
1817
1818 static void be_stats_cleanup(struct be_adapter *adapter)
1819 {
1820         struct be_stats_obj *stats = &adapter->stats;
1821         struct be_dma_mem *cmd = &stats->cmd;
1822
1823         if (cmd->va)
1824                 pci_free_consistent(adapter->pdev, cmd->size,
1825                         cmd->va, cmd->dma);
1826 }
1827
1828 static int be_stats_init(struct be_adapter *adapter)
1829 {
1830         struct be_stats_obj *stats = &adapter->stats;
1831         struct be_dma_mem *cmd = &stats->cmd;
1832
1833         cmd->size = sizeof(struct be_cmd_req_get_stats);
1834         cmd->va = pci_alloc_consistent(adapter->pdev, cmd->size, &cmd->dma);
1835         if (cmd->va == NULL)
1836                 return -1;
1837         return 0;
1838 }
1839
1840 static void __devexit be_remove(struct pci_dev *pdev)
1841 {
1842         struct be_adapter *adapter = pci_get_drvdata(pdev);
1843         if (!adapter)
1844                 return;
1845
1846         unregister_netdev(adapter->netdev);
1847
1848         be_clear(adapter);
1849
1850         be_stats_cleanup(adapter);
1851
1852         be_ctrl_cleanup(adapter);
1853
1854         if (adapter->msix_enabled) {
1855                 pci_disable_msix(adapter->pdev);
1856                 adapter->msix_enabled = false;
1857         }
1858
1859         pci_set_drvdata(pdev, NULL);
1860         pci_release_regions(pdev);
1861         pci_disable_device(pdev);
1862
1863         free_netdev(adapter->netdev);
1864 }
1865
1866 static int be_hw_up(struct be_adapter *adapter)
1867 {
1868         struct be_ctrl_info *ctrl = &adapter->ctrl;
1869         int status;
1870
1871         status = be_cmd_POST(ctrl);
1872         if (status)
1873                 return status;
1874
1875         status = be_cmd_get_fw_ver(ctrl, adapter->fw_ver);
1876         if (status)
1877                 return status;
1878
1879         status = be_cmd_query_fw_cfg(ctrl, &adapter->port_num);
1880         return status;
1881 }
1882
1883 static int __devinit be_probe(struct pci_dev *pdev,
1884                         const struct pci_device_id *pdev_id)
1885 {
1886         int status = 0;
1887         struct be_adapter *adapter;
1888         struct net_device *netdev;
1889         struct be_ctrl_info *ctrl;
1890         u8 mac[ETH_ALEN];
1891
1892         status = pci_enable_device(pdev);
1893         if (status)
1894                 goto do_none;
1895
1896         status = pci_request_regions(pdev, DRV_NAME);
1897         if (status)
1898                 goto disable_dev;
1899         pci_set_master(pdev);
1900
1901         netdev = alloc_etherdev(sizeof(struct be_adapter));
1902         if (netdev == NULL) {
1903                 status = -ENOMEM;
1904                 goto rel_reg;
1905         }
1906         adapter = netdev_priv(netdev);
1907         adapter->pdev = pdev;
1908         pci_set_drvdata(pdev, adapter);
1909         adapter->netdev = netdev;
1910
1911         be_msix_enable(adapter);
1912
1913         status = pci_set_dma_mask(pdev, DMA_BIT_MASK(64));
1914         if (!status) {
1915                 netdev->features |= NETIF_F_HIGHDMA;
1916         } else {
1917                 status = pci_set_dma_mask(pdev, DMA_BIT_MASK(32));
1918                 if (status) {
1919                         dev_err(&pdev->dev, "Could not set PCI DMA Mask\n");
1920                         goto free_netdev;
1921                 }
1922         }
1923
1924         ctrl = &adapter->ctrl;
1925         status = be_ctrl_init(adapter);
1926         if (status)
1927                 goto free_netdev;
1928
1929         status = be_stats_init(adapter);
1930         if (status)
1931                 goto ctrl_clean;
1932
1933         status = be_hw_up(adapter);
1934         if (status)
1935                 goto stats_clean;
1936
1937         status = be_cmd_mac_addr_query(ctrl, mac, MAC_ADDRESS_TYPE_NETWORK,
1938                         true /* permanent */, 0);
1939         if (status)
1940                 goto stats_clean;
1941         memcpy(netdev->dev_addr, mac, ETH_ALEN);
1942
1943         INIT_DELAYED_WORK(&adapter->work, be_worker);
1944         be_netdev_init(netdev);
1945         SET_NETDEV_DEV(netdev, &adapter->pdev->dev);
1946
1947         status = be_setup(adapter);
1948         if (status)
1949                 goto stats_clean;
1950         status = register_netdev(netdev);
1951         if (status != 0)
1952                 goto unsetup;
1953
1954         dev_info(&pdev->dev, "%s port %d\n", nic_name(pdev), adapter->port_num);
1955         return 0;
1956
1957 unsetup:
1958         be_clear(adapter);
1959 stats_clean:
1960         be_stats_cleanup(adapter);
1961 ctrl_clean:
1962         be_ctrl_cleanup(adapter);
1963 free_netdev:
1964         free_netdev(adapter->netdev);
1965 rel_reg:
1966         pci_release_regions(pdev);
1967 disable_dev:
1968         pci_disable_device(pdev);
1969 do_none:
1970         dev_err(&pdev->dev, "%s initialization failed\n", nic_name(pdev));
1971         return status;
1972 }
1973
1974 static int be_suspend(struct pci_dev *pdev, pm_message_t state)
1975 {
1976         struct be_adapter *adapter = pci_get_drvdata(pdev);
1977         struct net_device *netdev =  adapter->netdev;
1978
1979         netif_device_detach(netdev);
1980         if (netif_running(netdev)) {
1981                 rtnl_lock();
1982                 be_close(netdev);
1983                 be_clear(adapter);
1984                 rtnl_unlock();
1985         }
1986
1987         pci_save_state(pdev);
1988         pci_disable_device(pdev);
1989         pci_set_power_state(pdev, pci_choose_state(pdev, state));
1990         return 0;
1991 }
1992
1993 static int be_resume(struct pci_dev *pdev)
1994 {
1995         int status = 0;
1996         struct be_adapter *adapter = pci_get_drvdata(pdev);
1997         struct net_device *netdev =  adapter->netdev;
1998
1999         netif_device_detach(netdev);
2000
2001         status = pci_enable_device(pdev);
2002         if (status)
2003                 return status;
2004
2005         pci_set_power_state(pdev, 0);
2006         pci_restore_state(pdev);
2007
2008         if (netif_running(netdev)) {
2009                 rtnl_lock();
2010                 be_setup(adapter);
2011                 be_open(netdev);
2012                 rtnl_unlock();
2013         }
2014         netif_device_attach(netdev);
2015         return 0;
2016 }
2017
2018 static struct pci_driver be_driver = {
2019         .name = DRV_NAME,
2020         .id_table = be_dev_ids,
2021         .probe = be_probe,
2022         .remove = be_remove,
2023         .suspend = be_suspend,
2024         .resume = be_resume
2025 };
2026
2027 static int __init be_init_module(void)
2028 {
2029         if (rx_frag_size != 8192 && rx_frag_size != 4096
2030                 && rx_frag_size != 2048) {
2031                 printk(KERN_WARNING DRV_NAME
2032                         " : Module param rx_frag_size must be 2048/4096/8192."
2033                         " Using 2048\n");
2034                 rx_frag_size = 2048;
2035         }
2036         /* Ensure rx_frag_size is aligned to chache line */
2037         if (SKB_DATA_ALIGN(rx_frag_size) != rx_frag_size) {
2038                 printk(KERN_WARNING DRV_NAME
2039                         " : Bad module param rx_frag_size. Using 2048\n");
2040                 rx_frag_size = 2048;
2041         }
2042
2043         return pci_register_driver(&be_driver);
2044 }
2045 module_init(be_init_module);
2046
2047 static void __exit be_exit_module(void)
2048 {
2049         pci_unregister_driver(&be_driver);
2050 }
2051 module_exit(be_exit_module);