 1// SPDX-License-Identifier: GPL-2.0-or-later
2/**************************************************************************/
3/* */
4/* IBM System i and System p Virtual NIC Device Driver */
5/* Copyright (C) 2014 IBM Corp. */
6/* Santiago Leon (santi_leon@yahoo.com) */
7/* Thomas Falcon (tlfalcon@linux.vnet.ibm.com) */
8/* John Allen (jallen@linux.vnet.ibm.com) */
9/* */
10/* */
11/* This module contains the implementation of a virtual ethernet device */
12/* for use with IBM i/p Series LPAR Linux. It utilizes the logical LAN */
13/* option of the RS/6000 Platform Architecture to interface with virtual */
14/* ethernet NICs that are presented to the partition by the hypervisor. */
15/* */
16/* Messages are passed between the VNIC driver and the VNIC server using */
17/* Command/Response Queues (CRQs) and sub CRQs (sCRQs). CRQs are used to */
18/* issue and receive commands that initiate communication with the server */
19/* on driver initialization. Sub CRQs (sCRQs) are similar to CRQs, but */
20/* are used by the driver to notify the server that a packet is */
21/* ready for transmission or that a buffer has been added to receive a */
22/* packet. Subsequently, sCRQs are used by the server to notify the */
23/* driver that a packet transmission has been completed or that a packet */
24/* has been received and placed in a waiting buffer. */
25/* */
26/* In lieu of a more conventional "on-the-fly" DMA mapping strategy in */
27/* which skbs are DMA mapped and immediately unmapped when the transmit */
28/* or receive has been completed, the VNIC driver is required to use */
 29/* "long term mapping". This entails that large, contiguous DMA mapped   */
30/* buffers are allocated on driver initialization and these buffers are */
31/* then continuously reused to pass skbs to and from the VNIC server. */
32/* */
33/**************************************************************************/
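/*
 * Illustrative sketch, not driver code: the "long term mapping" scheme
 * described above boils down to the following buffer lifecycle, using the
 * helpers defined later in this file (error handling omitted):
 *
 *	struct ibmvnic_long_term_buff ltb = { 0 };
 *
 *	alloc_long_term_buff(adapter, &ltb, size);  // dma_alloc_coherent()
 *						    // + send_request_map()
 *	// copy skb data into ltb.buff at a per-buffer offset and pass
 *	// (ltb.addr + offset, ltb.map_id) to the VNIC server via
 *	// send_subcrq(); the same buffer is reused for many packets
 *	free_long_term_buff(adapter, &ltb);	    // send_request_unmap()
 *						    // + dma_free_coherent()
 */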
34
35#include <linux/module.h>
36#include <linux/moduleparam.h>
37#include <linux/types.h>
38#include <linux/errno.h>
39#include <linux/completion.h>
40#include <linux/ioport.h>
41#include <linux/dma-mapping.h>
42#include <linux/kernel.h>
43#include <linux/netdevice.h>
44#include <linux/etherdevice.h>
45#include <linux/skbuff.h>
46#include <linux/init.h>
47#include <linux/delay.h>
48#include <linux/mm.h>
49#include <linux/ethtool.h>
50#include <linux/proc_fs.h>
51#include <linux/if_arp.h>
52#include <linux/in.h>
53#include <linux/ip.h>
54#include <linux/ipv6.h>
55#include <linux/irq.h>
56#include <linux/kthread.h>
57#include <linux/seq_file.h>
58#include <linux/interrupt.h>
59#include <net/net_namespace.h>
60#include <asm/hvcall.h>
61#include <linux/atomic.h>
62#include <asm/vio.h>
63#include <asm/iommu.h>
64#include <linux/uaccess.h>
65#include <asm/firmware.h>
66#include <linux/workqueue.h>
67#include <linux/if_vlan.h>
68#include <linux/utsname.h>
69
70#include "ibmvnic.h"
71
72static const char ibmvnic_driver_name[] = "ibmvnic";
73static const char ibmvnic_driver_string[] = "IBM System i/p Virtual NIC Driver";
74
75MODULE_AUTHOR("Santiago Leon");
76MODULE_DESCRIPTION("IBM System i/p Virtual NIC Driver");
77MODULE_LICENSE("GPL");
78MODULE_VERSION(IBMVNIC_DRIVER_VERSION);
79
80static int ibmvnic_version = IBMVNIC_INITIAL_VERSION;
81static int ibmvnic_remove(struct vio_dev *);
82static void release_sub_crqs(struct ibmvnic_adapter *, bool);
83static int ibmvnic_reset_crq(struct ibmvnic_adapter *);
84static int ibmvnic_send_crq_init(struct ibmvnic_adapter *);
85static int ibmvnic_reenable_crq_queue(struct ibmvnic_adapter *);
86static int ibmvnic_send_crq(struct ibmvnic_adapter *, union ibmvnic_crq *);
87static int send_subcrq(struct ibmvnic_adapter *adapter, u64 remote_handle,
88 union sub_crq *sub_crq);
89static int send_subcrq_indirect(struct ibmvnic_adapter *, u64, u64, u64);
90static irqreturn_t ibmvnic_interrupt_rx(int irq, void *instance);
91static int enable_scrq_irq(struct ibmvnic_adapter *,
92 struct ibmvnic_sub_crq_queue *);
93static int disable_scrq_irq(struct ibmvnic_adapter *,
94 struct ibmvnic_sub_crq_queue *);
95static int pending_scrq(struct ibmvnic_adapter *,
96 struct ibmvnic_sub_crq_queue *);
97static union sub_crq *ibmvnic_next_scrq(struct ibmvnic_adapter *,
98 struct ibmvnic_sub_crq_queue *);
99static int ibmvnic_poll(struct napi_struct *napi, int data);
100static void send_map_query(struct ibmvnic_adapter *adapter);
101static int send_request_map(struct ibmvnic_adapter *, dma_addr_t, __be32, u8);
102static int send_request_unmap(struct ibmvnic_adapter *, u8);
103static int send_login(struct ibmvnic_adapter *adapter);
104static void send_cap_queries(struct ibmvnic_adapter *adapter);
105static int init_sub_crqs(struct ibmvnic_adapter *);
106static int init_sub_crq_irqs(struct ibmvnic_adapter *adapter);
107static int ibmvnic_init(struct ibmvnic_adapter *);
108static int ibmvnic_reset_init(struct ibmvnic_adapter *);
109static void release_crq_queue(struct ibmvnic_adapter *);
110static int __ibmvnic_set_mac(struct net_device *, u8 *);
111static int init_crq_queue(struct ibmvnic_adapter *adapter);
112static int send_query_phys_parms(struct ibmvnic_adapter *adapter);
113
114struct ibmvnic_stat {
115 char name[ETH_GSTRING_LEN];
116 int offset;
117};
118
119#define IBMVNIC_STAT_OFF(stat) (offsetof(struct ibmvnic_adapter, stats) + \
120 offsetof(struct ibmvnic_statistics, stat))
121#define IBMVNIC_GET_STAT(a, off) (*((u64 *)(((unsigned long)(a)) + off)))
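/* A quick worked example of how the two macros above combine: for the
 * "rx_packets" entry below, IBMVNIC_STAT_OFF(rx_packets) is the byte
 * offset of adapter->stats.rx_packets within struct ibmvnic_adapter,
 * and IBMVNIC_GET_STAT(adapter, that_offset) reads the counter back
 * out as a u64.
 */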
122
123static const struct ibmvnic_stat ibmvnic_stats[] = {
124 {"rx_packets", IBMVNIC_STAT_OFF(rx_packets)},
125 {"rx_bytes", IBMVNIC_STAT_OFF(rx_bytes)},
126 {"tx_packets", IBMVNIC_STAT_OFF(tx_packets)},
127 {"tx_bytes", IBMVNIC_STAT_OFF(tx_bytes)},
128 {"ucast_tx_packets", IBMVNIC_STAT_OFF(ucast_tx_packets)},
129 {"ucast_rx_packets", IBMVNIC_STAT_OFF(ucast_rx_packets)},
130 {"mcast_tx_packets", IBMVNIC_STAT_OFF(mcast_tx_packets)},
131 {"mcast_rx_packets", IBMVNIC_STAT_OFF(mcast_rx_packets)},
132 {"bcast_tx_packets", IBMVNIC_STAT_OFF(bcast_tx_packets)},
133 {"bcast_rx_packets", IBMVNIC_STAT_OFF(bcast_rx_packets)},
134 {"align_errors", IBMVNIC_STAT_OFF(align_errors)},
135 {"fcs_errors", IBMVNIC_STAT_OFF(fcs_errors)},
136 {"single_collision_frames", IBMVNIC_STAT_OFF(single_collision_frames)},
137 {"multi_collision_frames", IBMVNIC_STAT_OFF(multi_collision_frames)},
138 {"sqe_test_errors", IBMVNIC_STAT_OFF(sqe_test_errors)},
139 {"deferred_tx", IBMVNIC_STAT_OFF(deferred_tx)},
140 {"late_collisions", IBMVNIC_STAT_OFF(late_collisions)},
141 {"excess_collisions", IBMVNIC_STAT_OFF(excess_collisions)},
142 {"internal_mac_tx_errors", IBMVNIC_STAT_OFF(internal_mac_tx_errors)},
143 {"carrier_sense", IBMVNIC_STAT_OFF(carrier_sense)},
144 {"too_long_frames", IBMVNIC_STAT_OFF(too_long_frames)},
145 {"internal_mac_rx_errors", IBMVNIC_STAT_OFF(internal_mac_rx_errors)},
146};
147
148static long h_reg_sub_crq(unsigned long unit_address, unsigned long token,
149 unsigned long length, unsigned long *number,
150 unsigned long *irq)
151{
152 unsigned long retbuf[PLPAR_HCALL_BUFSIZE];
153 long rc;
154
155 rc = plpar_hcall(H_REG_SUB_CRQ, retbuf, unit_address, token, length);
156 *number = retbuf[0];
157 *irq = retbuf[1];
158
159 return rc;
160}
161
162static int alloc_long_term_buff(struct ibmvnic_adapter *adapter,
163 struct ibmvnic_long_term_buff *ltb, int size)
164{
165 struct device *dev = &adapter->vdev->dev;
166 int rc;
167
168 ltb->size = size;
169 ltb->buff = dma_alloc_coherent(dev, ltb->size, &ltb->addr,
170 GFP_KERNEL);
171
172 if (!ltb->buff) {
173 dev_err(dev, "Couldn't alloc long term buffer\n");
174 return -ENOMEM;
175 }
176 ltb->map_id = adapter->map_id;
177 adapter->map_id++;
178
179 reinit_completion(&adapter->fw_done);
180 rc = send_request_map(adapter, ltb->addr,
181 ltb->size, ltb->map_id);
182 if (rc) {
183 dma_free_coherent(dev, ltb->size, ltb->buff, ltb->addr);
184 return rc;
185 }
186 wait_for_completion(&adapter->fw_done);
187
188 if (adapter->fw_done_rc) {
 189		dev_err(dev, "Couldn't map long term buffer, rc = %d\n",
190 adapter->fw_done_rc);
191 dma_free_coherent(dev, ltb->size, ltb->buff, ltb->addr);
192 return -1;
193 }
194 return 0;
195}
196
197static void free_long_term_buff(struct ibmvnic_adapter *adapter,
198 struct ibmvnic_long_term_buff *ltb)
199{
200 struct device *dev = &adapter->vdev->dev;
201
202 if (!ltb->buff)
203 return;
204
205 /* VIOS automatically unmaps the long term buffer at remote
206 * end for the following resets:
207 * FAILOVER, MOBILITY, TIMEOUT.
208 */
209 if (adapter->reset_reason != VNIC_RESET_FAILOVER &&
210 adapter->reset_reason != VNIC_RESET_MOBILITY &&
211 adapter->reset_reason != VNIC_RESET_TIMEOUT)
212 send_request_unmap(adapter, ltb->map_id);
213 dma_free_coherent(dev, ltb->size, ltb->buff, ltb->addr);
214}
215
216static int reset_long_term_buff(struct ibmvnic_adapter *adapter,
217 struct ibmvnic_long_term_buff *ltb)
218{
219 int rc;
220
221 memset(ltb->buff, 0, ltb->size);
222
223 reinit_completion(&adapter->fw_done);
224 rc = send_request_map(adapter, ltb->addr, ltb->size, ltb->map_id);
225 if (rc)
226 return rc;
227 wait_for_completion(&adapter->fw_done);
228
229 if (adapter->fw_done_rc) {
230 dev_info(&adapter->vdev->dev,
231 "Reset failed, attempting to free and reallocate buffer\n");
232 free_long_term_buff(adapter, ltb);
233 return alloc_long_term_buff(adapter, ltb, ltb->size);
234 }
235 return 0;
236}
237
238static void deactivate_rx_pools(struct ibmvnic_adapter *adapter)
239{
240 int i;
241
242 for (i = 0; i < be32_to_cpu(adapter->login_rsp_buf->num_rxadd_subcrqs);
243 i++)
244 adapter->rx_pool[i].active = 0;
245}
246
247static void replenish_rx_pool(struct ibmvnic_adapter *adapter,
248 struct ibmvnic_rx_pool *pool)
249{
250 int count = pool->size - atomic_read(&pool->available);
251 struct device *dev = &adapter->vdev->dev;
252 int buffers_added = 0;
253 unsigned long lpar_rc;
254 union sub_crq sub_crq;
255 struct sk_buff *skb;
256 unsigned int offset;
257 dma_addr_t dma_addr;
258 unsigned char *dst;
259 u64 *handle_array;
260 int shift = 0;
261 int index;
262 int i;
263
264 if (!pool->active)
265 return;
266
267 handle_array = (u64 *)((u8 *)(adapter->login_rsp_buf) +
268 be32_to_cpu(adapter->login_rsp_buf->
269 off_rxadd_subcrqs));
270
271 for (i = 0; i < count; ++i) {
272 skb = alloc_skb(pool->buff_size, GFP_ATOMIC);
273 if (!skb) {
274 dev_err(dev, "Couldn't replenish rx buff\n");
275 adapter->replenish_no_mem++;
276 break;
277 }
278
279 index = pool->free_map[pool->next_free];
280
281 if (pool->rx_buff[index].skb)
282 dev_err(dev, "Inconsistent free_map!\n");
283
284 /* Copy the skb to the long term mapped DMA buffer */
285 offset = index * pool->buff_size;
286 dst = pool->long_term_buff.buff + offset;
287 memset(dst, 0, pool->buff_size);
288 dma_addr = pool->long_term_buff.addr + offset;
289 pool->rx_buff[index].data = dst;
290
291 pool->free_map[pool->next_free] = IBMVNIC_INVALID_MAP;
292 pool->rx_buff[index].dma = dma_addr;
293 pool->rx_buff[index].skb = skb;
294 pool->rx_buff[index].pool_index = pool->index;
295 pool->rx_buff[index].size = pool->buff_size;
296
297 memset(&sub_crq, 0, sizeof(sub_crq));
298 sub_crq.rx_add.first = IBMVNIC_CRQ_CMD;
299 sub_crq.rx_add.correlator =
300 cpu_to_be64((u64)&pool->rx_buff[index]);
301 sub_crq.rx_add.ioba = cpu_to_be32(dma_addr);
302 sub_crq.rx_add.map_id = pool->long_term_buff.map_id;
303
304 /* The length field of the sCRQ is defined to be 24 bits so the
305 * buffer size needs to be left shifted by a byte before it is
306 * converted to big endian to prevent the last byte from being
307 * truncated.
308 */
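		/* Worked example (the field layout here is inferred from the
		 * comment above, not from a spec): for a 4096 byte buffer on
		 * little endian, cpu_to_be32(4096 << 8) is stored as bytes
		 * 00 10 00 00, so the 24 bit length reads back as 4096;
		 * without the shift the bytes would be 00 00 10 00 and the
		 * last byte of the size would be truncated away.
		 */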
309#ifdef __LITTLE_ENDIAN__
310 shift = 8;
311#endif
312 sub_crq.rx_add.len = cpu_to_be32(pool->buff_size << shift);
313
314 lpar_rc = send_subcrq(adapter, handle_array[pool->index],
315 &sub_crq);
316 if (lpar_rc != H_SUCCESS)
317 goto failure;
318
319 buffers_added++;
320 adapter->replenish_add_buff_success++;
321 pool->next_free = (pool->next_free + 1) % pool->size;
322 }
323 atomic_add(buffers_added, &pool->available);
324 return;
325
326failure:
327 if (lpar_rc != H_PARAMETER && lpar_rc != H_CLOSED)
328 dev_err_ratelimited(dev, "rx: replenish packet buffer failed\n");
329 pool->free_map[pool->next_free] = index;
330 pool->rx_buff[index].skb = NULL;
331
332 dev_kfree_skb_any(skb);
333 adapter->replenish_add_buff_failure++;
334 atomic_add(buffers_added, &pool->available);
335
336 if (lpar_rc == H_CLOSED || adapter->failover_pending) {
337 /* Disable buffer pool replenishment and report carrier off if
338 * queue is closed or pending failover.
339 * Firmware guarantees that a signal will be sent to the
340 * driver, triggering a reset.
341 */
342 deactivate_rx_pools(adapter);
343 netif_carrier_off(adapter->netdev);
344 }
345}
346
347static void replenish_pools(struct ibmvnic_adapter *adapter)
348{
349 int i;
350
351 adapter->replenish_task_cycles++;
352 for (i = 0; i < be32_to_cpu(adapter->login_rsp_buf->num_rxadd_subcrqs);
353 i++) {
354 if (adapter->rx_pool[i].active)
355 replenish_rx_pool(adapter, &adapter->rx_pool[i]);
356 }
357}
358
359static void release_stats_buffers(struct ibmvnic_adapter *adapter)
360{
361 kfree(adapter->tx_stats_buffers);
362 kfree(adapter->rx_stats_buffers);
363 adapter->tx_stats_buffers = NULL;
364 adapter->rx_stats_buffers = NULL;
365}
366
367static int init_stats_buffers(struct ibmvnic_adapter *adapter)
368{
369 adapter->tx_stats_buffers =
370 kcalloc(IBMVNIC_MAX_QUEUES,
371 sizeof(struct ibmvnic_tx_queue_stats),
372 GFP_KERNEL);
373 if (!adapter->tx_stats_buffers)
374 return -ENOMEM;
375
376 adapter->rx_stats_buffers =
377 kcalloc(IBMVNIC_MAX_QUEUES,
378 sizeof(struct ibmvnic_rx_queue_stats),
379 GFP_KERNEL);
380 if (!adapter->rx_stats_buffers)
381 return -ENOMEM;
382
383 return 0;
384}
385
386static void release_stats_token(struct ibmvnic_adapter *adapter)
387{
388 struct device *dev = &adapter->vdev->dev;
389
390 if (!adapter->stats_token)
391 return;
392
393 dma_unmap_single(dev, adapter->stats_token,
394 sizeof(struct ibmvnic_statistics),
395 DMA_FROM_DEVICE);
396 adapter->stats_token = 0;
397}
398
399static int init_stats_token(struct ibmvnic_adapter *adapter)
400{
401 struct device *dev = &adapter->vdev->dev;
402 dma_addr_t stok;
403
404 stok = dma_map_single(dev, &adapter->stats,
405 sizeof(struct ibmvnic_statistics),
406 DMA_FROM_DEVICE);
407 if (dma_mapping_error(dev, stok)) {
408 dev_err(dev, "Couldn't map stats buffer\n");
409 return -1;
410 }
411
412 adapter->stats_token = stok;
413 netdev_dbg(adapter->netdev, "Stats token initialized (%llx)\n", stok);
414 return 0;
415}
416
417static int reset_rx_pools(struct ibmvnic_adapter *adapter)
418{
419 struct ibmvnic_rx_pool *rx_pool;
420 int rx_scrqs;
421 int i, j, rc;
422 u64 *size_array;
423
424 if (!adapter->rx_pool)
425 return -1;
426
427 size_array = (u64 *)((u8 *)(adapter->login_rsp_buf) +
428 be32_to_cpu(adapter->login_rsp_buf->off_rxadd_buff_size));
429
430 rx_scrqs = be32_to_cpu(adapter->login_rsp_buf->num_rxadd_subcrqs);
431 for (i = 0; i < rx_scrqs; i++) {
432 rx_pool = &adapter->rx_pool[i];
433
434 netdev_dbg(adapter->netdev, "Re-setting rx_pool[%d]\n", i);
435
436 if (rx_pool->buff_size != be64_to_cpu(size_array[i])) {
437 free_long_term_buff(adapter, &rx_pool->long_term_buff);
438 rx_pool->buff_size = be64_to_cpu(size_array[i]);
439 rc = alloc_long_term_buff(adapter,
440 &rx_pool->long_term_buff,
441 rx_pool->size *
442 rx_pool->buff_size);
443 } else {
444 rc = reset_long_term_buff(adapter,
445 &rx_pool->long_term_buff);
446 }
447
448 if (rc)
449 return rc;
450
451 for (j = 0; j < rx_pool->size; j++)
452 rx_pool->free_map[j] = j;
453
454 memset(rx_pool->rx_buff, 0,
455 rx_pool->size * sizeof(struct ibmvnic_rx_buff));
456
457 atomic_set(&rx_pool->available, 0);
458 rx_pool->next_alloc = 0;
459 rx_pool->next_free = 0;
460 rx_pool->active = 1;
461 }
462
463 return 0;
464}
465
466static void release_rx_pools(struct ibmvnic_adapter *adapter)
467{
468 struct ibmvnic_rx_pool *rx_pool;
469 int i, j;
470
471 if (!adapter->rx_pool)
472 return;
473
474 for (i = 0; i < adapter->num_active_rx_pools; i++) {
475 rx_pool = &adapter->rx_pool[i];
476
477 netdev_dbg(adapter->netdev, "Releasing rx_pool[%d]\n", i);
478
479 kfree(rx_pool->free_map);
480 free_long_term_buff(adapter, &rx_pool->long_term_buff);
481
482 if (!rx_pool->rx_buff)
483 continue;
484
485 for (j = 0; j < rx_pool->size; j++) {
486 if (rx_pool->rx_buff[j].skb) {
487 dev_kfree_skb_any(rx_pool->rx_buff[j].skb);
488 rx_pool->rx_buff[j].skb = NULL;
489 }
490 }
491
492 kfree(rx_pool->rx_buff);
493 }
494
495 kfree(adapter->rx_pool);
496 adapter->rx_pool = NULL;
497 adapter->num_active_rx_pools = 0;
498}
499
500static int init_rx_pools(struct net_device *netdev)
501{
502 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
503 struct device *dev = &adapter->vdev->dev;
504 struct ibmvnic_rx_pool *rx_pool;
505 int rxadd_subcrqs;
506 u64 *size_array;
507 int i, j;
508
509 rxadd_subcrqs =
510 be32_to_cpu(adapter->login_rsp_buf->num_rxadd_subcrqs);
511 size_array = (u64 *)((u8 *)(adapter->login_rsp_buf) +
512 be32_to_cpu(adapter->login_rsp_buf->off_rxadd_buff_size));
513
514 adapter->rx_pool = kcalloc(rxadd_subcrqs,
515 sizeof(struct ibmvnic_rx_pool),
516 GFP_KERNEL);
517 if (!adapter->rx_pool) {
518 dev_err(dev, "Failed to allocate rx pools\n");
519 return -1;
520 }
521
522 adapter->num_active_rx_pools = rxadd_subcrqs;
523
524 for (i = 0; i < rxadd_subcrqs; i++) {
525 rx_pool = &adapter->rx_pool[i];
526
527 netdev_dbg(adapter->netdev,
528 "Initializing rx_pool[%d], %lld buffs, %lld bytes each\n",
529 i, adapter->req_rx_add_entries_per_subcrq,
530 be64_to_cpu(size_array[i]));
531
532 rx_pool->size = adapter->req_rx_add_entries_per_subcrq;
533 rx_pool->index = i;
534 rx_pool->buff_size = be64_to_cpu(size_array[i]);
535 rx_pool->active = 1;
536
537 rx_pool->free_map = kcalloc(rx_pool->size, sizeof(int),
538 GFP_KERNEL);
539 if (!rx_pool->free_map) {
540 release_rx_pools(adapter);
541 return -1;
542 }
543
544 rx_pool->rx_buff = kcalloc(rx_pool->size,
545 sizeof(struct ibmvnic_rx_buff),
546 GFP_KERNEL);
547 if (!rx_pool->rx_buff) {
548 dev_err(dev, "Couldn't alloc rx buffers\n");
549 release_rx_pools(adapter);
550 return -1;
551 }
552
553 if (alloc_long_term_buff(adapter, &rx_pool->long_term_buff,
554 rx_pool->size * rx_pool->buff_size)) {
555 release_rx_pools(adapter);
556 return -1;
557 }
558
559 for (j = 0; j < rx_pool->size; ++j)
560 rx_pool->free_map[j] = j;
561
562 atomic_set(&rx_pool->available, 0);
563 rx_pool->next_alloc = 0;
564 rx_pool->next_free = 0;
565 }
566
567 return 0;
568}
569
570static int reset_one_tx_pool(struct ibmvnic_adapter *adapter,
571 struct ibmvnic_tx_pool *tx_pool)
572{
573 int rc, i;
574
575 rc = reset_long_term_buff(adapter, &tx_pool->long_term_buff);
576 if (rc)
577 return rc;
578
579 memset(tx_pool->tx_buff, 0,
580 tx_pool->num_buffers *
581 sizeof(struct ibmvnic_tx_buff));
582
583 for (i = 0; i < tx_pool->num_buffers; i++)
584 tx_pool->free_map[i] = i;
585
586 tx_pool->consumer_index = 0;
587 tx_pool->producer_index = 0;
588
589 return 0;
590}
591
592static int reset_tx_pools(struct ibmvnic_adapter *adapter)
593{
594 int tx_scrqs;
595 int i, rc;
596
597 if (!adapter->tx_pool)
598 return -1;
599
600 tx_scrqs = be32_to_cpu(adapter->login_rsp_buf->num_txsubm_subcrqs);
601 for (i = 0; i < tx_scrqs; i++) {
602 rc = reset_one_tx_pool(adapter, &adapter->tso_pool[i]);
603 if (rc)
604 return rc;
605 rc = reset_one_tx_pool(adapter, &adapter->tx_pool[i]);
606 if (rc)
607 return rc;
608 }
609
610 return 0;
611}
612
613static void release_vpd_data(struct ibmvnic_adapter *adapter)
614{
615 if (!adapter->vpd)
616 return;
617
618 kfree(adapter->vpd->buff);
619 kfree(adapter->vpd);
620
621 adapter->vpd = NULL;
622}
623
624static void release_one_tx_pool(struct ibmvnic_adapter *adapter,
625 struct ibmvnic_tx_pool *tx_pool)
626{
627 kfree(tx_pool->tx_buff);
628 kfree(tx_pool->free_map);
629 free_long_term_buff(adapter, &tx_pool->long_term_buff);
630}
631
632static void release_tx_pools(struct ibmvnic_adapter *adapter)
633{
634 int i;
635
636 if (!adapter->tx_pool)
637 return;
638
639 for (i = 0; i < adapter->num_active_tx_pools; i++) {
640 release_one_tx_pool(adapter, &adapter->tx_pool[i]);
641 release_one_tx_pool(adapter, &adapter->tso_pool[i]);
642 }
643
644 kfree(adapter->tx_pool);
645 adapter->tx_pool = NULL;
646 kfree(adapter->tso_pool);
647 adapter->tso_pool = NULL;
648 adapter->num_active_tx_pools = 0;
649}
650
651static int init_one_tx_pool(struct net_device *netdev,
652 struct ibmvnic_tx_pool *tx_pool,
653 int num_entries, int buf_size)
654{
655 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
656 int i;
657
658 tx_pool->tx_buff = kcalloc(num_entries,
659 sizeof(struct ibmvnic_tx_buff),
660 GFP_KERNEL);
661 if (!tx_pool->tx_buff)
662 return -1;
663
664 if (alloc_long_term_buff(adapter, &tx_pool->long_term_buff,
665 num_entries * buf_size))
666 return -1;
667
668 tx_pool->free_map = kcalloc(num_entries, sizeof(int), GFP_KERNEL);
669 if (!tx_pool->free_map)
670 return -1;
671
672 for (i = 0; i < num_entries; i++)
673 tx_pool->free_map[i] = i;
674
675 tx_pool->consumer_index = 0;
676 tx_pool->producer_index = 0;
677 tx_pool->num_buffers = num_entries;
678 tx_pool->buf_size = buf_size;
679
680 return 0;
681}
682
683static int init_tx_pools(struct net_device *netdev)
684{
685 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
686 int tx_subcrqs;
687 int i, rc;
688
689 tx_subcrqs = be32_to_cpu(adapter->login_rsp_buf->num_txsubm_subcrqs);
690 adapter->tx_pool = kcalloc(tx_subcrqs,
691 sizeof(struct ibmvnic_tx_pool), GFP_KERNEL);
692 if (!adapter->tx_pool)
693 return -1;
694
695 adapter->tso_pool = kcalloc(tx_subcrqs,
696 sizeof(struct ibmvnic_tx_pool), GFP_KERNEL);
697 if (!adapter->tso_pool) {
698 kfree(adapter->tx_pool);
699 adapter->tx_pool = NULL;
700 return -1;
701 }
702
703 adapter->num_active_tx_pools = tx_subcrqs;
704
705 for (i = 0; i < tx_subcrqs; i++) {
706 rc = init_one_tx_pool(netdev, &adapter->tx_pool[i],
707 adapter->req_tx_entries_per_subcrq,
708 adapter->req_mtu + VLAN_HLEN);
709 if (rc) {
710 release_tx_pools(adapter);
711 return rc;
712 }
713
714 rc = init_one_tx_pool(netdev, &adapter->tso_pool[i],
715 IBMVNIC_TSO_BUFS,
716 IBMVNIC_TSO_BUF_SZ);
717 if (rc) {
718 release_tx_pools(adapter);
719 return rc;
720 }
721 }
722
723 return 0;
724}
725
726static void ibmvnic_napi_enable(struct ibmvnic_adapter *adapter)
727{
728 int i;
729
730 if (adapter->napi_enabled)
731 return;
732
733 for (i = 0; i < adapter->req_rx_queues; i++)
734 napi_enable(&adapter->napi[i]);
735
736 adapter->napi_enabled = true;
737}
738
739static void ibmvnic_napi_disable(struct ibmvnic_adapter *adapter)
740{
741 int i;
742
743 if (!adapter->napi_enabled)
744 return;
745
746 for (i = 0; i < adapter->req_rx_queues; i++) {
747 netdev_dbg(adapter->netdev, "Disabling napi[%d]\n", i);
748 napi_disable(&adapter->napi[i]);
749 }
750
751 adapter->napi_enabled = false;
752}
753
754static int init_napi(struct ibmvnic_adapter *adapter)
755{
756 int i;
757
758 adapter->napi = kcalloc(adapter->req_rx_queues,
759 sizeof(struct napi_struct), GFP_KERNEL);
760 if (!adapter->napi)
761 return -ENOMEM;
762
763 for (i = 0; i < adapter->req_rx_queues; i++) {
764 netdev_dbg(adapter->netdev, "Adding napi[%d]\n", i);
765 netif_napi_add(adapter->netdev, &adapter->napi[i],
766 ibmvnic_poll, NAPI_POLL_WEIGHT);
767 }
768
769 adapter->num_active_rx_napi = adapter->req_rx_queues;
770 return 0;
771}
772
773static void release_napi(struct ibmvnic_adapter *adapter)
774{
775 int i;
776
777 if (!adapter->napi)
778 return;
779
780 for (i = 0; i < adapter->num_active_rx_napi; i++) {
781 netdev_dbg(adapter->netdev, "Releasing napi[%d]\n", i);
782 netif_napi_del(&adapter->napi[i]);
783 }
784
785 kfree(adapter->napi);
786 adapter->napi = NULL;
787 adapter->num_active_rx_napi = 0;
788 adapter->napi_enabled = false;
789}
790
791static int ibmvnic_login(struct net_device *netdev)
792{
793 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
794 unsigned long timeout = msecs_to_jiffies(30000);
795 int retry_count = 0;
796 int retries = 10;
797 bool retry;
798 int rc;
799
800 do {
801 retry = false;
802 if (retry_count > retries) {
803 netdev_warn(netdev, "Login attempts exceeded\n");
804 return -1;
805 }
806
807 adapter->init_done_rc = 0;
808 reinit_completion(&adapter->init_done);
809 rc = send_login(adapter);
810 if (rc) {
811 netdev_warn(netdev, "Unable to login\n");
812 return rc;
813 }
814
815 if (!wait_for_completion_timeout(&adapter->init_done,
816 timeout)) {
817 netdev_warn(netdev, "Login timed out, retrying...\n");
818 retry = true;
819 adapter->init_done_rc = 0;
820 retry_count++;
821 continue;
822 }
823
824 if (adapter->init_done_rc == ABORTED) {
825 netdev_warn(netdev, "Login aborted, retrying...\n");
826 retry = true;
827 adapter->init_done_rc = 0;
828 retry_count++;
829 /* FW or device may be busy, so
830 * wait a bit before retrying login
831 */
832 msleep(500);
833 } else if (adapter->init_done_rc == PARTIALSUCCESS) {
834 retry_count++;
835 release_sub_crqs(adapter, 1);
836
837 retry = true;
838 netdev_dbg(netdev,
839 "Received partial success, retrying...\n");
840 adapter->init_done_rc = 0;
841 reinit_completion(&adapter->init_done);
842 send_cap_queries(adapter);
843 if (!wait_for_completion_timeout(&adapter->init_done,
844 timeout)) {
845 netdev_warn(netdev,
846 "Capabilities query timed out\n");
847 return -1;
848 }
849
850 rc = init_sub_crqs(adapter);
851 if (rc) {
852 netdev_warn(netdev,
853 "SCRQ initialization failed\n");
854 return -1;
855 }
856
857 rc = init_sub_crq_irqs(adapter);
858 if (rc) {
859 netdev_warn(netdev,
860 "SCRQ irq initialization failed\n");
861 return -1;
862 }
863 } else if (adapter->init_done_rc) {
864 netdev_warn(netdev, "Adapter login failed\n");
865 return -1;
866 }
867 } while (retry);
868
869 __ibmvnic_set_mac(netdev, adapter->mac_addr);
870
871 return 0;
872}
873
874static void release_login_buffer(struct ibmvnic_adapter *adapter)
875{
876 if (!adapter->login_buf)
877 return;
878
879 dma_unmap_single(&adapter->vdev->dev, adapter->login_buf_token,
880 adapter->login_buf_sz, DMA_TO_DEVICE);
881 kfree(adapter->login_buf);
882 adapter->login_buf = NULL;
883}
884
885static void release_login_rsp_buffer(struct ibmvnic_adapter *adapter)
886{
887 if (!adapter->login_rsp_buf)
888 return;
889
890 dma_unmap_single(&adapter->vdev->dev, adapter->login_rsp_buf_token,
891 adapter->login_rsp_buf_sz, DMA_FROM_DEVICE);
892 kfree(adapter->login_rsp_buf);
893 adapter->login_rsp_buf = NULL;
894}
895
896static void release_resources(struct ibmvnic_adapter *adapter)
897{
898 release_vpd_data(adapter);
899
900 release_tx_pools(adapter);
901 release_rx_pools(adapter);
902
903 release_napi(adapter);
904 release_login_rsp_buffer(adapter);
905}
906
907static int set_link_state(struct ibmvnic_adapter *adapter, u8 link_state)
908{
909 struct net_device *netdev = adapter->netdev;
910 unsigned long timeout = msecs_to_jiffies(30000);
911 union ibmvnic_crq crq;
912 bool resend;
913 int rc;
914
915 netdev_dbg(netdev, "setting link state %d\n", link_state);
916
917 memset(&crq, 0, sizeof(crq));
918 crq.logical_link_state.first = IBMVNIC_CRQ_CMD;
919 crq.logical_link_state.cmd = LOGICAL_LINK_STATE;
920 crq.logical_link_state.link_state = link_state;
921
922 do {
923 resend = false;
924
925 reinit_completion(&adapter->init_done);
926 rc = ibmvnic_send_crq(adapter, &crq);
927 if (rc) {
928 netdev_err(netdev, "Failed to set link state\n");
929 return rc;
930 }
931
932 if (!wait_for_completion_timeout(&adapter->init_done,
933 timeout)) {
934 netdev_err(netdev, "timeout setting link state\n");
935 return -1;
936 }
937
938 if (adapter->init_done_rc == 1) {
 939			/* Partial success, delay and re-send */
940 mdelay(1000);
941 resend = true;
942 } else if (adapter->init_done_rc) {
943 netdev_warn(netdev, "Unable to set link state, rc=%d\n",
944 adapter->init_done_rc);
945 return adapter->init_done_rc;
946 }
947 } while (resend);
948
949 return 0;
950}
951
952static int set_real_num_queues(struct net_device *netdev)
953{
954 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
955 int rc;
956
957 netdev_dbg(netdev, "Setting real tx/rx queues (%llx/%llx)\n",
958 adapter->req_tx_queues, adapter->req_rx_queues);
959
960 rc = netif_set_real_num_tx_queues(netdev, adapter->req_tx_queues);
961 if (rc) {
962 netdev_err(netdev, "failed to set the number of tx queues\n");
963 return rc;
964 }
965
966 rc = netif_set_real_num_rx_queues(netdev, adapter->req_rx_queues);
967 if (rc)
968 netdev_err(netdev, "failed to set the number of rx queues\n");
969
970 return rc;
971}
972
973static int ibmvnic_get_vpd(struct ibmvnic_adapter *adapter)
974{
975 struct device *dev = &adapter->vdev->dev;
976 union ibmvnic_crq crq;
977 int len = 0;
978 int rc;
979
980 if (adapter->vpd->buff)
981 len = adapter->vpd->len;
982
983 reinit_completion(&adapter->fw_done);
984 crq.get_vpd_size.first = IBMVNIC_CRQ_CMD;
985 crq.get_vpd_size.cmd = GET_VPD_SIZE;
986 rc = ibmvnic_send_crq(adapter, &crq);
987 if (rc)
988 return rc;
989 wait_for_completion(&adapter->fw_done);
990
991 if (!adapter->vpd->len)
992 return -ENODATA;
993
994 if (!adapter->vpd->buff)
995 adapter->vpd->buff = kzalloc(adapter->vpd->len, GFP_KERNEL);
996 else if (adapter->vpd->len != len)
997 adapter->vpd->buff =
998 krealloc(adapter->vpd->buff,
999 adapter->vpd->len, GFP_KERNEL);
1000
1001 if (!adapter->vpd->buff) {
 1002		dev_err(dev, "Could not allocate VPD buffer\n");
1003 return -ENOMEM;
1004 }
1005
1006 adapter->vpd->dma_addr =
1007 dma_map_single(dev, adapter->vpd->buff, adapter->vpd->len,
1008 DMA_FROM_DEVICE);
1009 if (dma_mapping_error(dev, adapter->vpd->dma_addr)) {
1010 dev_err(dev, "Could not map VPD buffer\n");
1011 kfree(adapter->vpd->buff);
1012 adapter->vpd->buff = NULL;
1013 return -ENOMEM;
1014 }
1015
1016 reinit_completion(&adapter->fw_done);
1017 crq.get_vpd.first = IBMVNIC_CRQ_CMD;
1018 crq.get_vpd.cmd = GET_VPD;
1019 crq.get_vpd.ioba = cpu_to_be32(adapter->vpd->dma_addr);
1020 crq.get_vpd.len = cpu_to_be32((u32)adapter->vpd->len);
1021 rc = ibmvnic_send_crq(adapter, &crq);
1022 if (rc) {
1023 kfree(adapter->vpd->buff);
1024 adapter->vpd->buff = NULL;
1025 return rc;
1026 }
1027 wait_for_completion(&adapter->fw_done);
1028
1029 return 0;
1030}
1031
1032static int init_resources(struct ibmvnic_adapter *adapter)
1033{
1034 struct net_device *netdev = adapter->netdev;
1035 int rc;
1036
1037 rc = set_real_num_queues(netdev);
1038 if (rc)
1039 return rc;
1040
1041 adapter->vpd = kzalloc(sizeof(*adapter->vpd), GFP_KERNEL);
1042 if (!adapter->vpd)
1043 return -ENOMEM;
1044
1045 /* Vital Product Data (VPD) */
1046 rc = ibmvnic_get_vpd(adapter);
1047 if (rc) {
1048 netdev_err(netdev, "failed to initialize Vital Product Data (VPD)\n");
1049 return rc;
1050 }
1051
1052 adapter->map_id = 1;
1053
1054 rc = init_napi(adapter);
1055 if (rc)
1056 return rc;
1057
1058 send_map_query(adapter);
1059
1060 rc = init_rx_pools(netdev);
1061 if (rc)
1062 return rc;
1063
1064 rc = init_tx_pools(netdev);
1065 return rc;
1066}
1067
1068static int __ibmvnic_open(struct net_device *netdev)
1069{
1070 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
1071 enum vnic_state prev_state = adapter->state;
1072 int i, rc;
1073
1074 adapter->state = VNIC_OPENING;
1075 replenish_pools(adapter);
1076 ibmvnic_napi_enable(adapter);
1077
1078 /* We're ready to receive frames, enable the sub-crq interrupts and
1079 * set the logical link state to up
1080 */
1081 for (i = 0; i < adapter->req_rx_queues; i++) {
1082 netdev_dbg(netdev, "Enabling rx_scrq[%d] irq\n", i);
1083 if (prev_state == VNIC_CLOSED)
1084 enable_irq(adapter->rx_scrq[i]->irq);
1085 enable_scrq_irq(adapter, adapter->rx_scrq[i]);
1086 }
1087
1088 for (i = 0; i < adapter->req_tx_queues; i++) {
1089 netdev_dbg(netdev, "Enabling tx_scrq[%d] irq\n", i);
1090 if (prev_state == VNIC_CLOSED)
1091 enable_irq(adapter->tx_scrq[i]->irq);
1092 enable_scrq_irq(adapter, adapter->tx_scrq[i]);
1093 }
1094
1095 rc = set_link_state(adapter, IBMVNIC_LOGICAL_LNK_UP);
1096 if (rc) {
1097 ibmvnic_napi_disable(adapter);
1098 release_resources(adapter);
1099 return rc;
1100 }
1101
1102 netif_tx_start_all_queues(netdev);
1103
1104 if (prev_state == VNIC_CLOSED) {
1105 for (i = 0; i < adapter->req_rx_queues; i++)
1106 napi_schedule(&adapter->napi[i]);
1107 }
1108
1109 adapter->state = VNIC_OPEN;
1110 return rc;
1111}
1112
1113static int ibmvnic_open(struct net_device *netdev)
1114{
1115 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
1116 int rc;
1117
1118 /* If device failover is pending, just set device state and return.
1119 * Device operation will be handled by reset routine.
1120 */
1121 if (adapter->failover_pending) {
1122 adapter->state = VNIC_OPEN;
1123 return 0;
1124 }
1125
1126 if (adapter->state != VNIC_CLOSED) {
1127 rc = ibmvnic_login(netdev);
1128 if (rc)
1129 goto out;
1130
1131 rc = init_resources(adapter);
1132 if (rc) {
1133 netdev_err(netdev, "failed to initialize resources\n");
1134 release_resources(adapter);
1135 goto out;
1136 }
1137 }
1138
1139 rc = __ibmvnic_open(netdev);
1140
1141out:
1142 /*
1143 * If open fails due to a pending failover, set device state and
1144 * return. Device operation will be handled by reset routine.
1145 */
1146 if (rc && adapter->failover_pending) {
1147 adapter->state = VNIC_OPEN;
1148 rc = 0;
1149 }
1150 return rc;
1151}
1152
1153static void clean_rx_pools(struct ibmvnic_adapter *adapter)
1154{
1155 struct ibmvnic_rx_pool *rx_pool;
1156 struct ibmvnic_rx_buff *rx_buff;
1157 u64 rx_entries;
1158 int rx_scrqs;
1159 int i, j;
1160
1161 if (!adapter->rx_pool)
1162 return;
1163
1164 rx_scrqs = adapter->num_active_rx_pools;
1165 rx_entries = adapter->req_rx_add_entries_per_subcrq;
1166
1167 /* Free any remaining skbs in the rx buffer pools */
1168 for (i = 0; i < rx_scrqs; i++) {
1169 rx_pool = &adapter->rx_pool[i];
1170 if (!rx_pool || !rx_pool->rx_buff)
1171 continue;
1172
1173 netdev_dbg(adapter->netdev, "Cleaning rx_pool[%d]\n", i);
1174 for (j = 0; j < rx_entries; j++) {
1175 rx_buff = &rx_pool->rx_buff[j];
1176 if (rx_buff && rx_buff->skb) {
1177 dev_kfree_skb_any(rx_buff->skb);
1178 rx_buff->skb = NULL;
1179 }
1180 }
1181 }
1182}
1183
1184static void clean_one_tx_pool(struct ibmvnic_adapter *adapter,
1185 struct ibmvnic_tx_pool *tx_pool)
1186{
1187 struct ibmvnic_tx_buff *tx_buff;
1188 u64 tx_entries;
1189 int i;
1190
1191 if (!tx_pool || !tx_pool->tx_buff)
1192 return;
1193
1194 tx_entries = tx_pool->num_buffers;
1195
1196 for (i = 0; i < tx_entries; i++) {
1197 tx_buff = &tx_pool->tx_buff[i];
1198 if (tx_buff && tx_buff->skb) {
1199 dev_kfree_skb_any(tx_buff->skb);
1200 tx_buff->skb = NULL;
1201 }
1202 }
1203}
1204
1205static void clean_tx_pools(struct ibmvnic_adapter *adapter)
1206{
1207 int tx_scrqs;
1208 int i;
1209
1210 if (!adapter->tx_pool || !adapter->tso_pool)
1211 return;
1212
1213 tx_scrqs = adapter->num_active_tx_pools;
1214
1215 /* Free any remaining skbs in the tx buffer pools */
1216 for (i = 0; i < tx_scrqs; i++) {
1217 netdev_dbg(adapter->netdev, "Cleaning tx_pool[%d]\n", i);
1218 clean_one_tx_pool(adapter, &adapter->tx_pool[i]);
1219 clean_one_tx_pool(adapter, &adapter->tso_pool[i]);
1220 }
1221}
1222
1223static void ibmvnic_disable_irqs(struct ibmvnic_adapter *adapter)
1224{
1225 struct net_device *netdev = adapter->netdev;
1226 int i;
1227
1228 if (adapter->tx_scrq) {
1229 for (i = 0; i < adapter->req_tx_queues; i++)
1230 if (adapter->tx_scrq[i]->irq) {
1231 netdev_dbg(netdev,
1232 "Disabling tx_scrq[%d] irq\n", i);
1233 disable_scrq_irq(adapter, adapter->tx_scrq[i]);
1234 disable_irq(adapter->tx_scrq[i]->irq);
1235 }
1236 }
1237
1238 if (adapter->rx_scrq) {
1239 for (i = 0; i < adapter->req_rx_queues; i++) {
1240 if (adapter->rx_scrq[i]->irq) {
1241 netdev_dbg(netdev,
1242 "Disabling rx_scrq[%d] irq\n", i);
1243 disable_scrq_irq(adapter, adapter->rx_scrq[i]);
1244 disable_irq(adapter->rx_scrq[i]->irq);
1245 }
1246 }
1247 }
1248}
1249
1250static void ibmvnic_cleanup(struct net_device *netdev)
1251{
1252 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
1253
1254 /* ensure that transmissions are stopped if called by do_reset */
1255 if (test_bit(0, &adapter->resetting))
1256 netif_tx_disable(netdev);
1257 else
1258 netif_tx_stop_all_queues(netdev);
1259
1260 ibmvnic_napi_disable(adapter);
1261 ibmvnic_disable_irqs(adapter);
1262
1263 clean_rx_pools(adapter);
1264 clean_tx_pools(adapter);
1265}
1266
1267static int __ibmvnic_close(struct net_device *netdev)
1268{
1269 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
1270 int rc = 0;
1271
1272 adapter->state = VNIC_CLOSING;
1273 rc = set_link_state(adapter, IBMVNIC_LOGICAL_LNK_DN);
1274 adapter->state = VNIC_CLOSED;
1275 return rc;
1276}
1277
1278static int ibmvnic_close(struct net_device *netdev)
1279{
1280 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
1281 int rc;
1282
1283 /* If device failover is pending, just set device state and return.
1284 * Device operation will be handled by reset routine.
1285 */
1286 if (adapter->failover_pending) {
1287 adapter->state = VNIC_CLOSED;
1288 return 0;
1289 }
1290
1291 rc = __ibmvnic_close(netdev);
1292 ibmvnic_cleanup(netdev);
1293
1294 return rc;
1295}
1296
1297/**
1298 * build_hdr_data - creates L2/L3/L4 header data buffer
1299 * @hdr_field - bitfield determining needed headers
1300 * @skb - socket buffer
1301 * @hdr_len - array of header lengths
 1302 * @hdr_data - buffer to store the header data
1303 *
1304 * Reads hdr_field to determine which headers are needed by firmware.
1305 * Builds a buffer containing these headers. Saves individual header
1306 * lengths and total buffer length to be used to build descriptors.
1307 */
1308static int build_hdr_data(u8 hdr_field, struct sk_buff *skb,
1309 int *hdr_len, u8 *hdr_data)
1310{
1311 int len = 0;
1312 u8 *hdr;
1313
1314 if (skb_vlan_tagged(skb) && !skb_vlan_tag_present(skb))
1315 hdr_len[0] = sizeof(struct vlan_ethhdr);
1316 else
1317 hdr_len[0] = sizeof(struct ethhdr);
1318
1319 if (skb->protocol == htons(ETH_P_IP)) {
1320 hdr_len[1] = ip_hdr(skb)->ihl * 4;
1321 if (ip_hdr(skb)->protocol == IPPROTO_TCP)
1322 hdr_len[2] = tcp_hdrlen(skb);
1323 else if (ip_hdr(skb)->protocol == IPPROTO_UDP)
1324 hdr_len[2] = sizeof(struct udphdr);
1325 } else if (skb->protocol == htons(ETH_P_IPV6)) {
1326 hdr_len[1] = sizeof(struct ipv6hdr);
1327 if (ipv6_hdr(skb)->nexthdr == IPPROTO_TCP)
1328 hdr_len[2] = tcp_hdrlen(skb);
1329 else if (ipv6_hdr(skb)->nexthdr == IPPROTO_UDP)
1330 hdr_len[2] = sizeof(struct udphdr);
1331 } else if (skb->protocol == htons(ETH_P_ARP)) {
1332 hdr_len[1] = arp_hdr_len(skb->dev);
1333 hdr_len[2] = 0;
1334 }
1335
1336 memset(hdr_data, 0, 120);
1337 if ((hdr_field >> 6) & 1) {
1338 hdr = skb_mac_header(skb);
1339 memcpy(hdr_data, hdr, hdr_len[0]);
1340 len += hdr_len[0];
1341 }
1342
1343 if ((hdr_field >> 5) & 1) {
1344 hdr = skb_network_header(skb);
1345 memcpy(hdr_data + len, hdr, hdr_len[1]);
1346 len += hdr_len[1];
1347 }
1348
1349 if ((hdr_field >> 4) & 1) {
1350 hdr = skb_transport_header(skb);
1351 memcpy(hdr_data + len, hdr, hdr_len[2]);
1352 len += hdr_len[2];
1353 }
1354 return len;
1355}
1356
1357/**
1358 * create_hdr_descs - create header and header extension descriptors
1359 * @hdr_field - bitfield determining needed headers
 1360 * @hdr_data - buffer containing header data
1361 * @len - length of data buffer
1362 * @hdr_len - array of individual header lengths
1363 * @scrq_arr - descriptor array
1364 *
1365 * Creates header and, if needed, header extension descriptors and
1366 * places them in a descriptor array, scrq_arr
1367 */
1368
1369static int create_hdr_descs(u8 hdr_field, u8 *hdr_data, int len, int *hdr_len,
1370 union sub_crq *scrq_arr)
1371{
1372 union sub_crq hdr_desc;
1373 int tmp_len = len;
1374 int num_descs = 0;
1375 u8 *data, *cur;
1376 int tmp;
1377
1378 while (tmp_len > 0) {
1379 cur = hdr_data + len - tmp_len;
1380
1381 memset(&hdr_desc, 0, sizeof(hdr_desc));
1382 if (cur != hdr_data) {
1383 data = hdr_desc.hdr_ext.data;
1384 tmp = tmp_len > 29 ? 29 : tmp_len;
1385 hdr_desc.hdr_ext.first = IBMVNIC_CRQ_CMD;
1386 hdr_desc.hdr_ext.type = IBMVNIC_HDR_EXT_DESC;
1387 hdr_desc.hdr_ext.len = tmp;
1388 } else {
1389 data = hdr_desc.hdr.data;
1390 tmp = tmp_len > 24 ? 24 : tmp_len;
1391 hdr_desc.hdr.first = IBMVNIC_CRQ_CMD;
1392 hdr_desc.hdr.type = IBMVNIC_HDR_DESC;
1393 hdr_desc.hdr.len = tmp;
1394 hdr_desc.hdr.l2_len = (u8)hdr_len[0];
1395 hdr_desc.hdr.l3_len = cpu_to_be16((u16)hdr_len[1]);
1396 hdr_desc.hdr.l4_len = (u8)hdr_len[2];
1397 hdr_desc.hdr.flag = hdr_field << 1;
1398 }
1399 memcpy(data, cur, tmp);
1400 tmp_len -= tmp;
1401 *scrq_arr = hdr_desc;
1402 scrq_arr++;
1403 num_descs++;
1404 }
1405
1406 return num_descs;
1407}
1408
1409/**
1410 * build_hdr_descs_arr - build a header descriptor array
 1411 * @txbuff - tx buffer holding the skb and the indirect descriptor
 1412 *	      array to be populated
 1413 * @num_entries - number of descriptors to be sent
 1414 * @hdr_field - bit field determining which headers will be sent
1415 *
1416 * This function will build a TX descriptor array with applicable
1417 * L2/L3/L4 packet header descriptors to be sent by send_subcrq_indirect.
1418 */
1419
1420static void build_hdr_descs_arr(struct ibmvnic_tx_buff *txbuff,
1421 int *num_entries, u8 hdr_field)
1422{
1423 int hdr_len[3] = {0, 0, 0};
1424 int tot_len;
1425 u8 *hdr_data = txbuff->hdr_data;
1426
1427 tot_len = build_hdr_data(hdr_field, txbuff->skb, hdr_len,
1428 txbuff->hdr_data);
1429 *num_entries += create_hdr_descs(hdr_field, hdr_data, tot_len, hdr_len,
1430 txbuff->indir_arr + 1);
1431}
1432
1433static int ibmvnic_xmit_workarounds(struct sk_buff *skb,
1434 struct net_device *netdev)
1435{
1436 /* For some backing devices, mishandling of small packets
1437 * can result in a loss of connection or TX stall. Device
1438 * architects recommend that no packet should be smaller
1439 * than the minimum MTU value provided to the driver, so
1440 * pad any packets to that length
1441 */
1442 if (skb->len < netdev->min_mtu)
1443 return skb_put_padto(skb, netdev->min_mtu);
1444
1445 return 0;
1446}
1447
1448static netdev_tx_t ibmvnic_xmit(struct sk_buff *skb, struct net_device *netdev)
1449{
1450 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
1451 int queue_num = skb_get_queue_mapping(skb);
1452 u8 *hdrs = (u8 *)&adapter->tx_rx_desc_req;
1453 struct device *dev = &adapter->vdev->dev;
1454 struct ibmvnic_tx_buff *tx_buff = NULL;
1455 struct ibmvnic_sub_crq_queue *tx_scrq;
1456 struct ibmvnic_tx_pool *tx_pool;
1457 unsigned int tx_send_failed = 0;
1458 unsigned int tx_map_failed = 0;
1459 unsigned int tx_dropped = 0;
1460 unsigned int tx_packets = 0;
1461 unsigned int tx_bytes = 0;
1462 dma_addr_t data_dma_addr;
1463 struct netdev_queue *txq;
1464 unsigned long lpar_rc;
1465 union sub_crq tx_crq;
1466 unsigned int offset;
1467 int num_entries = 1;
1468 unsigned char *dst;
1469 u64 *handle_array;
1470 int index = 0;
1471 u8 proto = 0;
1472 netdev_tx_t ret = NETDEV_TX_OK;
1473
1474 if (test_bit(0, &adapter->resetting)) {
1475 dev_kfree_skb_any(skb);
1476
1477 tx_send_failed++;
1478 tx_dropped++;
1479 ret = NETDEV_TX_OK;
1480 goto out;
1481 }
1482
1483 if (ibmvnic_xmit_workarounds(skb, netdev)) {
1484 tx_dropped++;
1485 tx_send_failed++;
1486 ret = NETDEV_TX_OK;
1487 goto out;
1488 }
1489 if (skb_is_gso(skb))
1490 tx_pool = &adapter->tso_pool[queue_num];
1491 else
1492 tx_pool = &adapter->tx_pool[queue_num];
1493
1494 tx_scrq = adapter->tx_scrq[queue_num];
1495 txq = netdev_get_tx_queue(netdev, skb_get_queue_mapping(skb));
1496 handle_array = (u64 *)((u8 *)(adapter->login_rsp_buf) +
1497 be32_to_cpu(adapter->login_rsp_buf->off_txsubm_subcrqs));
1498
1499 index = tx_pool->free_map[tx_pool->consumer_index];
1500
1501 if (index == IBMVNIC_INVALID_MAP) {
1502 dev_kfree_skb_any(skb);
1503 tx_send_failed++;
1504 tx_dropped++;
1505 ret = NETDEV_TX_OK;
1506 goto out;
1507 }
1508
1509 tx_pool->free_map[tx_pool->consumer_index] = IBMVNIC_INVALID_MAP;
1510
1511 offset = index * tx_pool->buf_size;
1512 dst = tx_pool->long_term_buff.buff + offset;
1513 memset(dst, 0, tx_pool->buf_size);
1514 data_dma_addr = tx_pool->long_term_buff.addr + offset;
1515
1516 if (skb_shinfo(skb)->nr_frags) {
1517 int cur, i;
1518
1519 /* Copy the head */
1520 skb_copy_from_linear_data(skb, dst, skb_headlen(skb));
1521 cur = skb_headlen(skb);
1522
1523 /* Copy the frags */
1524 for (i = 0; i < skb_shinfo(skb)->nr_frags; i++) {
1525 const skb_frag_t *frag = &skb_shinfo(skb)->frags[i];
1526
1527 memcpy(dst + cur,
1528 page_address(skb_frag_page(frag)) +
1529 skb_frag_off(frag), skb_frag_size(frag));
1530 cur += skb_frag_size(frag);
1531 }
1532 } else {
1533 skb_copy_from_linear_data(skb, dst, skb->len);
1534 }
1535
 1536	/* post changes to long_term_buff *dst before VIOS accesses it */
1537 dma_wmb();
1538
1539 tx_pool->consumer_index =
1540 (tx_pool->consumer_index + 1) % tx_pool->num_buffers;
1541
1542 tx_buff = &tx_pool->tx_buff[index];
1543 tx_buff->skb = skb;
1544 tx_buff->data_dma[0] = data_dma_addr;
1545 tx_buff->data_len[0] = skb->len;
1546 tx_buff->index = index;
1547 tx_buff->pool_index = queue_num;
1548 tx_buff->last_frag = true;
1549
1550 memset(&tx_crq, 0, sizeof(tx_crq));
1551 tx_crq.v1.first = IBMVNIC_CRQ_CMD;
1552 tx_crq.v1.type = IBMVNIC_TX_DESC;
1553 tx_crq.v1.n_crq_elem = 1;
1554 tx_crq.v1.n_sge = 1;
1555 tx_crq.v1.flags1 = IBMVNIC_TX_COMP_NEEDED;
1556
1557 if (skb_is_gso(skb))
1558 tx_crq.v1.correlator =
1559 cpu_to_be32(index | IBMVNIC_TSO_POOL_MASK);
1560 else
1561 tx_crq.v1.correlator = cpu_to_be32(index);
1562 tx_crq.v1.dma_reg = cpu_to_be16(tx_pool->long_term_buff.map_id);
1563 tx_crq.v1.sge_len = cpu_to_be32(skb->len);
1564 tx_crq.v1.ioba = cpu_to_be64(data_dma_addr);
1565
1566 if (adapter->vlan_header_insertion && skb_vlan_tag_present(skb)) {
1567 tx_crq.v1.flags2 |= IBMVNIC_TX_VLAN_INSERT;
1568 tx_crq.v1.vlan_id = cpu_to_be16(skb->vlan_tci);
1569 }
1570
1571 if (skb->protocol == htons(ETH_P_IP)) {
1572 tx_crq.v1.flags1 |= IBMVNIC_TX_PROT_IPV4;
1573 proto = ip_hdr(skb)->protocol;
1574 } else if (skb->protocol == htons(ETH_P_IPV6)) {
1575 tx_crq.v1.flags1 |= IBMVNIC_TX_PROT_IPV6;
1576 proto = ipv6_hdr(skb)->nexthdr;
1577 }
1578
1579 if (proto == IPPROTO_TCP)
1580 tx_crq.v1.flags1 |= IBMVNIC_TX_PROT_TCP;
1581 else if (proto == IPPROTO_UDP)
1582 tx_crq.v1.flags1 |= IBMVNIC_TX_PROT_UDP;
1583
1584 if (skb->ip_summed == CHECKSUM_PARTIAL) {
1585 tx_crq.v1.flags1 |= IBMVNIC_TX_CHKSUM_OFFLOAD;
1586 hdrs += 2;
1587 }
1588 if (skb_is_gso(skb)) {
1589 tx_crq.v1.flags1 |= IBMVNIC_TX_LSO;
1590 tx_crq.v1.mss = cpu_to_be16(skb_shinfo(skb)->gso_size);
1591 hdrs += 2;
1592 }
1593 /* determine if l2/3/4 headers are sent to firmware */
1594 if ((*hdrs >> 7) & 1) {
1595 build_hdr_descs_arr(tx_buff, &num_entries, *hdrs);
1596 tx_crq.v1.n_crq_elem = num_entries;
1597 tx_buff->num_entries = num_entries;
1598 tx_buff->indir_arr[0] = tx_crq;
1599 tx_buff->indir_dma = dma_map_single(dev, tx_buff->indir_arr,
1600 sizeof(tx_buff->indir_arr),
1601 DMA_TO_DEVICE);
1602 if (dma_mapping_error(dev, tx_buff->indir_dma)) {
1603 dev_kfree_skb_any(skb);
1604 tx_buff->skb = NULL;
1605 if (!firmware_has_feature(FW_FEATURE_CMO))
1606 dev_err(dev, "tx: unable to map descriptor array\n");
1607 tx_map_failed++;
1608 tx_dropped++;
1609 ret = NETDEV_TX_OK;
1610 goto tx_err_out;
1611 }
1612 lpar_rc = send_subcrq_indirect(adapter, handle_array[queue_num],
1613 (u64)tx_buff->indir_dma,
1614 (u64)num_entries);
1615 dma_unmap_single(dev, tx_buff->indir_dma,
1616 sizeof(tx_buff->indir_arr), DMA_TO_DEVICE);
1617 } else {
1618 tx_buff->num_entries = num_entries;
1619 lpar_rc = send_subcrq(adapter, handle_array[queue_num],
1620 &tx_crq);
1621 }
1622 if (lpar_rc != H_SUCCESS) {
1623 if (lpar_rc != H_CLOSED && lpar_rc != H_PARAMETER)
1624 dev_err_ratelimited(dev, "tx: send failed\n");
1625 dev_kfree_skb_any(skb);
1626 tx_buff->skb = NULL;
1627
1628 if (lpar_rc == H_CLOSED || adapter->failover_pending) {
1629 /* Disable TX and report carrier off if queue is closed
1630 * or pending failover.
1631 * Firmware guarantees that a signal will be sent to the
1632 * driver, triggering a reset or some other action.
1633 */
1634 netif_tx_stop_all_queues(netdev);
1635 netif_carrier_off(netdev);
1636 }
1637
1638 tx_send_failed++;
1639 tx_dropped++;
1640 ret = NETDEV_TX_OK;
1641 goto tx_err_out;
1642 }
1643
1644 if (atomic_add_return(num_entries, &tx_scrq->used)
1645 >= adapter->req_tx_entries_per_subcrq) {
1646 netdev_dbg(netdev, "Stopping queue %d\n", queue_num);
1647 netif_stop_subqueue(netdev, queue_num);
1648 }
1649
1650 tx_packets++;
1651 tx_bytes += skb->len;
1652 txq->trans_start = jiffies;
1653 ret = NETDEV_TX_OK;
1654 goto out;
1655
1656tx_err_out:
 1657	/* roll back consumer index and map array */
1658 if (tx_pool->consumer_index == 0)
1659 tx_pool->consumer_index =
1660 tx_pool->num_buffers - 1;
1661 else
1662 tx_pool->consumer_index--;
1663 tx_pool->free_map[tx_pool->consumer_index] = index;
1664out:
1665 netdev->stats.tx_dropped += tx_dropped;
1666 netdev->stats.tx_bytes += tx_bytes;
1667 netdev->stats.tx_packets += tx_packets;
1668 adapter->tx_send_failed += tx_send_failed;
1669 adapter->tx_map_failed += tx_map_failed;
1670 adapter->tx_stats_buffers[queue_num].packets += tx_packets;
1671 adapter->tx_stats_buffers[queue_num].bytes += tx_bytes;
1672 adapter->tx_stats_buffers[queue_num].dropped_packets += tx_dropped;
1673
1674 return ret;
1675}
1676
1677static void ibmvnic_set_multi(struct net_device *netdev)
1678{
1679 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
1680 struct netdev_hw_addr *ha;
1681 union ibmvnic_crq crq;
1682
1683 memset(&crq, 0, sizeof(crq));
1684 crq.request_capability.first = IBMVNIC_CRQ_CMD;
1685 crq.request_capability.cmd = REQUEST_CAPABILITY;
1686
1687 if (netdev->flags & IFF_PROMISC) {
1688 if (!adapter->promisc_supported)
1689 return;
1690 } else {
1691 if (netdev->flags & IFF_ALLMULTI) {
1692 /* Accept all multicast */
1693 memset(&crq, 0, sizeof(crq));
1694 crq.multicast_ctrl.first = IBMVNIC_CRQ_CMD;
1695 crq.multicast_ctrl.cmd = MULTICAST_CTRL;
1696 crq.multicast_ctrl.flags = IBMVNIC_ENABLE_ALL;
1697 ibmvnic_send_crq(adapter, &crq);
1698 } else if (netdev_mc_empty(netdev)) {
1699 /* Reject all multicast */
1700 memset(&crq, 0, sizeof(crq));
1701 crq.multicast_ctrl.first = IBMVNIC_CRQ_CMD;
1702 crq.multicast_ctrl.cmd = MULTICAST_CTRL;
1703 crq.multicast_ctrl.flags = IBMVNIC_DISABLE_ALL;
1704 ibmvnic_send_crq(adapter, &crq);
1705 } else {
1706 /* Accept one or more multicast(s) */
1707 netdev_for_each_mc_addr(ha, netdev) {
1708 memset(&crq, 0, sizeof(crq));
1709 crq.multicast_ctrl.first = IBMVNIC_CRQ_CMD;
1710 crq.multicast_ctrl.cmd = MULTICAST_CTRL;
1711 crq.multicast_ctrl.flags = IBMVNIC_ENABLE_MC;
1712 ether_addr_copy(&crq.multicast_ctrl.mac_addr[0],
1713 ha->addr);
1714 ibmvnic_send_crq(adapter, &crq);
1715 }
1716 }
1717 }
1718}
1719
1720static int __ibmvnic_set_mac(struct net_device *netdev, u8 *dev_addr)
1721{
1722 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
1723 union ibmvnic_crq crq;
1724 int rc;
1725
1726 if (!is_valid_ether_addr(dev_addr)) {
1727 rc = -EADDRNOTAVAIL;
1728 goto err;
1729 }
1730
1731 memset(&crq, 0, sizeof(crq));
1732 crq.change_mac_addr.first = IBMVNIC_CRQ_CMD;
1733 crq.change_mac_addr.cmd = CHANGE_MAC_ADDR;
1734 ether_addr_copy(&crq.change_mac_addr.mac_addr[0], dev_addr);
1735
1736 reinit_completion(&adapter->fw_done);
1737 rc = ibmvnic_send_crq(adapter, &crq);
1738 if (rc) {
1739 rc = -EIO;
1740 goto err;
1741 }
1742
1743 wait_for_completion(&adapter->fw_done);
1744 /* netdev->dev_addr is changed in handle_change_mac_rsp function */
1745 if (adapter->fw_done_rc) {
1746 rc = -EIO;
1747 goto err;
1748 }
1749
1750 return 0;
1751err:
1752 ether_addr_copy(adapter->mac_addr, netdev->dev_addr);
1753 return rc;
1754}
1755
1756static int ibmvnic_set_mac(struct net_device *netdev, void *p)
1757{
1758 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
1759 struct sockaddr *addr = p;
1760 int rc;
1761
1762 rc = 0;
1763 if (!is_valid_ether_addr(addr->sa_data))
1764 return -EADDRNOTAVAIL;
1765
1766 ether_addr_copy(adapter->mac_addr, addr->sa_data);
1767 if (adapter->state != VNIC_PROBED)
1768 rc = __ibmvnic_set_mac(netdev, addr->sa_data);
1769
1770 return rc;
1771}
1772
1773/**
1774 * do_change_param_reset returns zero if we are able to keep processing reset
1775 * events, or non-zero if we hit a fatal error and must halt.
1776 */
1777static int do_change_param_reset(struct ibmvnic_adapter *adapter,
1778 struct ibmvnic_rwi *rwi,
1779 u32 reset_state)
1780{
1781 struct net_device *netdev = adapter->netdev;
1782 int i, rc;
1783
1784 netdev_dbg(adapter->netdev, "Change param resetting driver (%d)\n",
1785 rwi->reset_reason);
1786
1787 netif_carrier_off(netdev);
1788 adapter->reset_reason = rwi->reset_reason;
1789
1790 ibmvnic_cleanup(netdev);
1791
1792 if (reset_state == VNIC_OPEN) {
1793 rc = __ibmvnic_close(netdev);
1794 if (rc)
1795 return rc;
1796 }
1797
1798 release_resources(adapter);
1799 release_sub_crqs(adapter, 1);
1800 release_crq_queue(adapter);
1801
1802 adapter->state = VNIC_PROBED;
1803
1804 rc = init_crq_queue(adapter);
1805
1806 if (rc) {
1807 netdev_err(adapter->netdev,
1808 "Couldn't initialize crq. rc=%d\n", rc);
1809 return rc;
1810 }
1811
1812 rc = ibmvnic_reset_init(adapter);
1813 if (rc)
1814 return IBMVNIC_INIT_FAILED;
1815
1816 /* If the adapter was in PROBE state prior to the reset,
1817 * exit here.
1818 */
1819 if (reset_state == VNIC_PROBED)
1820 return 0;
1821
1822 rc = ibmvnic_login(netdev);
1823 if (rc) {
1824 adapter->state = reset_state;
1825 return rc;
1826 }
1827
1828 rc = init_resources(adapter);
1829 if (rc)
1830 return rc;
1831
1832 ibmvnic_disable_irqs(adapter);
1833
1834 adapter->state = VNIC_CLOSED;
1835
1836 if (reset_state == VNIC_CLOSED)
1837 return 0;
1838
1839 rc = __ibmvnic_open(netdev);
1840 if (rc)
1841 return IBMVNIC_OPEN_FAILED;
1842
1843 /* refresh device's multicast list */
1844 ibmvnic_set_multi(netdev);
1845
1846 /* kick napi */
1847 for (i = 0; i < adapter->req_rx_queues; i++)
1848 napi_schedule(&adapter->napi[i]);
1849
1850 return 0;
1851}
1852
1853/**
1854 * do_reset returns zero if we are able to keep processing reset events, or
1855 * non-zero if we hit a fatal error and must halt.
1856 */
1857static int do_reset(struct ibmvnic_adapter *adapter,
1858 struct ibmvnic_rwi *rwi, u32 reset_state)
1859{
1860 u64 old_num_rx_queues, old_num_tx_queues;
1861 u64 old_num_rx_slots, old_num_tx_slots;
1862 struct net_device *netdev = adapter->netdev;
1863 int rc;
1864
1865 netdev_dbg(adapter->netdev, "Re-setting driver (%d)\n",
1866 rwi->reset_reason);
1867
1868 rtnl_lock();
1869 /*
1870 * Now that we have the rtnl lock, clear any pending failover.
1871 * This will ensure ibmvnic_open() has either completed or will
1872 * block until failover is complete.
1873 */
1874 if (rwi->reset_reason == VNIC_RESET_FAILOVER)
1875 adapter->failover_pending = false;
1876
1877 netif_carrier_off(netdev);
1878 adapter->reset_reason = rwi->reset_reason;
1879
1880 old_num_rx_queues = adapter->req_rx_queues;
1881 old_num_tx_queues = adapter->req_tx_queues;
1882 old_num_rx_slots = adapter->req_rx_add_entries_per_subcrq;
1883 old_num_tx_slots = adapter->req_tx_entries_per_subcrq;
1884
1885 ibmvnic_cleanup(netdev);
1886
1887 if (reset_state == VNIC_OPEN &&
1888 adapter->reset_reason != VNIC_RESET_MOBILITY &&
1889 adapter->reset_reason != VNIC_RESET_FAILOVER) {
1890 adapter->state = VNIC_CLOSING;
1891
1892 /* Release the RTNL lock before link state change and
1893 * re-acquire after the link state change to allow
1894 * linkwatch_event to grab the RTNL lock and run during
1895 * a reset.
1896 */
1897 rtnl_unlock();
1898 rc = set_link_state(adapter, IBMVNIC_LOGICAL_LNK_DN);
1899 rtnl_lock();
1900 if (rc)
1901 goto out;
1902
1903 if (adapter->state != VNIC_CLOSING) {
1904 rc = -1;
1905 goto out;
1906 }
1907
1908 adapter->state = VNIC_CLOSED;
1909 }
1910
1911 if (adapter->reset_reason != VNIC_RESET_NON_FATAL) {
1912 /* remove the closed state so when we call open it appears
1913 * we are coming from the probed state.
1914 */
1915 adapter->state = VNIC_PROBED;
1916
1917 if (adapter->reset_reason == VNIC_RESET_MOBILITY) {
1918 rc = ibmvnic_reenable_crq_queue(adapter);
1919 release_sub_crqs(adapter, 1);
1920 } else {
1921 rc = ibmvnic_reset_crq(adapter);
1922 if (rc == H_CLOSED || rc == H_SUCCESS) {
1923 rc = vio_enable_interrupts(adapter->vdev);
1924 if (rc)
1925 netdev_err(adapter->netdev,
1926 "Reset failed to enable interrupts. rc=%d\n",
1927 rc);
1928 }
1929 }
1930
1931 if (rc) {
1932 netdev_err(adapter->netdev,
1933 "Reset couldn't initialize crq. rc=%d\n", rc);
1934 goto out;
1935 }
1936
1937 rc = ibmvnic_reset_init(adapter);
1938 if (rc) {
1939 rc = IBMVNIC_INIT_FAILED;
1940 goto out;
1941 }
1942
1943 /* If the adapter was in PROBE state prior to the reset,
1944 * exit here.
1945 */
1946 if (reset_state == VNIC_PROBED) {
1947 rc = 0;
1948 goto out;
1949 }
1950
1951 rc = ibmvnic_login(netdev);
1952 if (rc) {
1953 adapter->state = reset_state;
1954 goto out;
1955 }
1956
1957 if (adapter->req_rx_queues != old_num_rx_queues ||
1958 adapter->req_tx_queues != old_num_tx_queues ||
1959 adapter->req_rx_add_entries_per_subcrq !=
1960 old_num_rx_slots ||
1961 adapter->req_tx_entries_per_subcrq !=
1962 old_num_tx_slots ||
1963 !adapter->rx_pool ||
1964 !adapter->tso_pool ||
1965 !adapter->tx_pool) {
1966 release_rx_pools(adapter);
1967 release_tx_pools(adapter);
1968 release_napi(adapter);
1969 release_vpd_data(adapter);
1970
1971 rc = init_resources(adapter);
1972 if (rc)
1973 goto out;
1974
1975 } else {
1976 rc = reset_tx_pools(adapter);
1977 if (rc) {
1978 netdev_dbg(adapter->netdev, "reset tx pools failed (%d)\n",
1979 rc);
1980 goto out;
1981 }
1982
1983 rc = reset_rx_pools(adapter);
1984 if (rc) {
1985 netdev_dbg(adapter->netdev, "reset rx pools failed (%d)\n",
1986 rc);
1987 goto out;
1988 }
1989 }
1990 ibmvnic_disable_irqs(adapter);
1991 }
1992 adapter->state = VNIC_CLOSED;
1993
1994 if (reset_state == VNIC_CLOSED) {
1995 rc = 0;
1996 goto out;
1997 }
1998
1999 rc = __ibmvnic_open(netdev);
2000 if (rc) {
2001 rc = IBMVNIC_OPEN_FAILED;
2002 goto out;
2003 }
2004
2005 /* refresh device's multicast list */
2006 ibmvnic_set_multi(netdev);
2007
2008 if (adapter->reset_reason == VNIC_RESET_FAILOVER ||
2009 adapter->reset_reason == VNIC_RESET_MOBILITY) {
2010 call_netdevice_notifiers(NETDEV_NOTIFY_PEERS, netdev);
2011 call_netdevice_notifiers(NETDEV_RESEND_IGMP, netdev);
2012 }
2013
2014 rc = 0;
2015
2016out:
2017 rtnl_unlock();
2018
2019 return rc;
2020}
2021
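/* do_hard_reset - recover by rebuilding everything from scratch.
 *
 * Tear down all resources, the sub-CRQs and the main CRQ, re-register
 * the CRQ with the hypervisor, then log back in and reopen the device
 * as needed. Used when a transport event indicates the existing queues
 * are no longer usable.
 */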
2022static int do_hard_reset(struct ibmvnic_adapter *adapter,
2023 struct ibmvnic_rwi *rwi, u32 reset_state)
2024{
2025 struct net_device *netdev = adapter->netdev;
2026 int rc;
2027
2028 netdev_dbg(adapter->netdev, "Hard resetting driver (%d)\n",
2029 rwi->reset_reason);
2030
2031 netif_carrier_off(netdev);
2032 adapter->reset_reason = rwi->reset_reason;
2033
2034 ibmvnic_cleanup(netdev);
2035 release_resources(adapter);
2036 release_sub_crqs(adapter, 0);
2037 release_crq_queue(adapter);
2038
2039	/* remove the closed state so that when we call open, it appears
2040	 * we are coming from the probed state.
2041 */
2042 adapter->state = VNIC_PROBED;
2043
2044 reinit_completion(&adapter->init_done);
2045 rc = init_crq_queue(adapter);
2046 if (rc) {
2047 netdev_err(adapter->netdev,
2048 "Couldn't initialize crq. rc=%d\n", rc);
2049 return rc;
2050 }
2051
2052 rc = ibmvnic_init(adapter);
2053 if (rc)
2054 return rc;
2055
2056 /* If the adapter was in PROBE state prior to the reset,
2057 * exit here.
2058 */
2059 if (reset_state == VNIC_PROBED)
2060 return 0;
2061
2062 rc = ibmvnic_login(netdev);
2063 if (rc) {
2064 adapter->state = VNIC_PROBED;
2065 return 0;
2066 }
2067
2068 rc = init_resources(adapter);
2069 if (rc)
2070 return rc;
2071
2072 ibmvnic_disable_irqs(adapter);
2073 adapter->state = VNIC_CLOSED;
2074
2075 if (reset_state == VNIC_CLOSED)
2076 return 0;
2077
2078 rc = __ibmvnic_open(netdev);
2079 if (rc)
2080 return IBMVNIC_OPEN_FAILED;
2081
2082 call_netdevice_notifiers(NETDEV_NOTIFY_PEERS, netdev);
2083 call_netdevice_notifiers(NETDEV_RESEND_IGMP, netdev);
2084
2085 return 0;
2086}
2087
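/* Remove and return the next reset work item from the adapter's reset
 * queue, or NULL if the queue is empty. The caller is responsible for
 * freeing the returned item.
 */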
2088static struct ibmvnic_rwi *get_next_rwi(struct ibmvnic_adapter *adapter)
2089{
2090 struct ibmvnic_rwi *rwi;
2091 unsigned long flags;
2092
2093 spin_lock_irqsave(&adapter->rwi_lock, flags);
2094
2095 if (!list_empty(&adapter->rwi_list)) {
2096 rwi = list_first_entry(&adapter->rwi_list, struct ibmvnic_rwi,
2097 list);
2098 list_del(&rwi->list);
2099 } else {
2100 rwi = NULL;
2101 }
2102
2103 spin_unlock_irqrestore(&adapter->rwi_lock, flags);
2104 return rwi;
2105}
2106
2107static void free_all_rwi(struct ibmvnic_adapter *adapter)
2108{
2109 struct ibmvnic_rwi *rwi;
2110
2111 rwi = get_next_rwi(adapter);
2112 while (rwi) {
2113 kfree(rwi);
2114 rwi = get_next_rwi(adapter);
2115 }
2116}
2117
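/* Reset worker: drain the queue of pending reset work items. Only one
 * instance runs at a time; if the resetting bit is already held, the
 * work is deferred to the delayed reset worker.
 */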
2118static void __ibmvnic_reset(struct work_struct *work)
2119{
2120 struct ibmvnic_rwi *rwi;
2121 struct ibmvnic_adapter *adapter;
2122 u32 reset_state;
2123 int rc = 0;
2124
2125 adapter = container_of(work, struct ibmvnic_adapter, ibmvnic_reset);
2126
2127 if (test_and_set_bit_lock(0, &adapter->resetting)) {
2128 schedule_delayed_work(&adapter->ibmvnic_delayed_reset,
2129 IBMVNIC_RESET_DELAY);
2130 return;
2131 }
2132
2133 reset_state = adapter->state;
2134
2135 rwi = get_next_rwi(adapter);
2136 while (rwi) {
2137 if (adapter->state == VNIC_REMOVING ||
2138 adapter->state == VNIC_REMOVED) {
2139 kfree(rwi);
2140 rc = EBUSY;
2141 break;
2142 }
2143
2144 if (rwi->reset_reason == VNIC_RESET_CHANGE_PARAM) {
2145 /* CHANGE_PARAM requestor holds rtnl_lock */
2146 rc = do_change_param_reset(adapter, rwi, reset_state);
2147 } else if (adapter->force_reset_recovery) {
2148 /*
2149 * Since we are doing a hard reset now, clear the
2150 * failover_pending flag so we don't ignore any
2151 * future MOBILITY or other resets.
2152 */
2153 adapter->failover_pending = false;
2154
2155 /* Transport event occurred during previous reset */
2156 if (adapter->wait_for_reset) {
2157 /* Previous was CHANGE_PARAM; caller locked */
2158 adapter->force_reset_recovery = false;
2159 rc = do_hard_reset(adapter, rwi, reset_state);
2160 } else {
2161 rtnl_lock();
2162 adapter->force_reset_recovery = false;
2163 rc = do_hard_reset(adapter, rwi, reset_state);
2164 rtnl_unlock();
2165 }
2166 } else {
2167 rc = do_reset(adapter, rwi, reset_state);
2168 }
2169 kfree(rwi);
2170 if (rc == IBMVNIC_OPEN_FAILED) {
2171 if (list_empty(&adapter->rwi_list))
2172 adapter->state = VNIC_CLOSED;
2173 else
2174 adapter->state = reset_state;
2175 rc = 0;
2176 } else if (rc && rc != IBMVNIC_INIT_FAILED &&
2177 !adapter->force_reset_recovery)
2178 break;
2179
2180 rwi = get_next_rwi(adapter);
2181
2182 if (rwi && (rwi->reset_reason == VNIC_RESET_FAILOVER ||
2183 rwi->reset_reason == VNIC_RESET_MOBILITY))
2184 adapter->force_reset_recovery = true;
2185 }
2186
2187 if (adapter->wait_for_reset) {
2188 adapter->reset_done_rc = rc;
2189 complete(&adapter->reset_done);
2190 }
2191
2192 if (rc) {
2193 netdev_dbg(adapter->netdev, "Reset failed\n");
2194 free_all_rwi(adapter);
2195 }
2196
2197 clear_bit_unlock(0, &adapter->resetting);
2198}
2199
2200static void __ibmvnic_delayed_reset(struct work_struct *work)
2201{
2202 struct ibmvnic_adapter *adapter;
2203
2204 adapter = container_of(work, struct ibmvnic_adapter,
2205 ibmvnic_delayed_reset.work);
2206 __ibmvnic_reset(&adapter->ibmvnic_reset);
2207}
2208
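/* Queue a reset work item for the given reason and kick the reset
 * worker. Requests that duplicate an already queued reason are
 * dropped, and a pending failover suppresses every reason other than
 * FAILOVER. Returns 0 on success or a negative errno.
 */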
2209static int ibmvnic_reset(struct ibmvnic_adapter *adapter,
2210 enum ibmvnic_reset_reason reason)
2211{
2212 struct list_head *entry, *tmp_entry;
2213 struct ibmvnic_rwi *rwi, *tmp;
2214 struct net_device *netdev = adapter->netdev;
2215 unsigned long flags;
2216 int ret;
2217
2218 /*
2219	 * If failover is pending, don't schedule any other reset.
2220	 * Instead let the failover complete. If there is already a
2221	 * failover reset scheduled, we will detect and drop the
2222 * duplicate reset when walking the ->rwi_list below.
2223 */
2224 if (adapter->state == VNIC_REMOVING ||
2225 adapter->state == VNIC_REMOVED ||
2226 (adapter->failover_pending && reason != VNIC_RESET_FAILOVER)) {
2227 ret = EBUSY;
2228 netdev_dbg(netdev, "Adapter removing or pending failover, skipping reset\n");
2229 goto err;
2230 }
2231
2232 if (adapter->state == VNIC_PROBING) {
2233 netdev_warn(netdev, "Adapter reset during probe\n");
2234 ret = adapter->init_done_rc = EAGAIN;
2235 goto err;
2236 }
2237
2238 spin_lock_irqsave(&adapter->rwi_lock, flags);
2239
2240 list_for_each(entry, &adapter->rwi_list) {
2241 tmp = list_entry(entry, struct ibmvnic_rwi, list);
2242 if (tmp->reset_reason == reason) {
2243 netdev_dbg(netdev, "Skipping matching reset\n");
2244 spin_unlock_irqrestore(&adapter->rwi_lock, flags);
2245 ret = EBUSY;
2246 goto err;
2247 }
2248 }
2249
2250 rwi = kzalloc(sizeof(*rwi), GFP_ATOMIC);
2251 if (!rwi) {
2252 spin_unlock_irqrestore(&adapter->rwi_lock, flags);
2253 ibmvnic_close(netdev);
2254 ret = ENOMEM;
2255 goto err;
2256 }
2257 /* if we just received a transport event,
2258 * flush reset queue and process this reset
2259 */
2260 if (adapter->force_reset_recovery && !list_empty(&adapter->rwi_list)) {
2261 list_for_each_safe(entry, tmp_entry, &adapter->rwi_list) {
2262 list_del(entry);
2263 kfree(list_entry(entry, struct ibmvnic_rwi, list));
2264 }
2265 }
2266 rwi->reset_reason = reason;
2267 list_add_tail(&rwi->list, &adapter->rwi_list);
2268 spin_unlock_irqrestore(&adapter->rwi_lock, flags);
2269 netdev_dbg(adapter->netdev, "Scheduling reset (reason %d)\n", reason);
2270 schedule_work(&adapter->ibmvnic_reset);
2271
2272 return 0;
2273err:
2274 return -ret;
2275}
2276
2277static void ibmvnic_tx_timeout(struct net_device *dev)
2278{
2279 struct ibmvnic_adapter *adapter = netdev_priv(dev);
2280
2281 if (test_bit(0, &adapter->resetting)) {
2282 netdev_err(adapter->netdev,
2283 "Adapter is resetting, skip timeout reset\n");
2284 return;
2285 }
2286
2287 ibmvnic_reset(adapter, VNIC_RESET_TIMEOUT);
2288}
2289
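/* Return an rx buffer to its pool's free map so it can be paired with
 * a new skb on the next replenish cycle.
 */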
2290static void remove_buff_from_pool(struct ibmvnic_adapter *adapter,
2291 struct ibmvnic_rx_buff *rx_buff)
2292{
2293 struct ibmvnic_rx_pool *pool = &adapter->rx_pool[rx_buff->pool_index];
2294
2295 rx_buff->skb = NULL;
2296
2297 pool->free_map[pool->next_alloc] = (int)(rx_buff - pool->rx_buff);
2298 pool->next_alloc = (pool->next_alloc + 1) % pool->size;
2299
2300 atomic_dec(&pool->available);
2301}
2302
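/* NAPI poll handler: harvest completed rx descriptors from this
 * queue's sub-CRQ, hand the skbs to the stack via GRO and replenish
 * the rx pool. The sub-CRQ interrupt is re-enabled once fewer than
 * "budget" frames are processed.
 */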
2303static int ibmvnic_poll(struct napi_struct *napi, int budget)
2304{
2305 struct net_device *netdev = napi->dev;
2306 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2307 int scrq_num = (int)(napi - adapter->napi);
2308 int frames_processed = 0;
2309
2310restart_poll:
2311 while (frames_processed < budget) {
2312 struct sk_buff *skb;
2313 struct ibmvnic_rx_buff *rx_buff;
2314 union sub_crq *next;
2315 u32 length;
2316 u16 offset;
2317 u8 flags = 0;
2318
2319 if (unlikely(test_bit(0, &adapter->resetting) &&
2320 adapter->reset_reason != VNIC_RESET_NON_FATAL)) {
2321 enable_scrq_irq(adapter, adapter->rx_scrq[scrq_num]);
2322 napi_complete_done(napi, frames_processed);
2323 return frames_processed;
2324 }
2325
2326 if (!pending_scrq(adapter, adapter->rx_scrq[scrq_num]))
2327 break;
2328 /* The queue entry at the current index is peeked at above
2329 * to determine that there is a valid descriptor awaiting
2330 * processing. We want to be sure that the current slot
2331 * holds a valid descriptor before reading its contents.
2332 */
2333 dma_rmb();
2334 next = ibmvnic_next_scrq(adapter, adapter->rx_scrq[scrq_num]);
2335 rx_buff =
2336 (struct ibmvnic_rx_buff *)be64_to_cpu(next->
2337 rx_comp.correlator);
2338 /* do error checking */
2339 if (next->rx_comp.rc) {
2340 netdev_dbg(netdev, "rx buffer returned with rc %x\n",
2341 be16_to_cpu(next->rx_comp.rc));
2342 /* free the entry */
2343 next->rx_comp.first = 0;
2344 dev_kfree_skb_any(rx_buff->skb);
2345 remove_buff_from_pool(adapter, rx_buff);
2346 continue;
2347 } else if (!rx_buff->skb) {
2348 /* free the entry */
2349 next->rx_comp.first = 0;
2350 remove_buff_from_pool(adapter, rx_buff);
2351 continue;
2352 }
2353
2354 length = be32_to_cpu(next->rx_comp.len);
2355 offset = be16_to_cpu(next->rx_comp.off_frame_data);
2356 flags = next->rx_comp.flags;
2357 skb = rx_buff->skb;
2358 /* load long_term_buff before copying to skb */
2359 dma_rmb();
2360 skb_copy_to_linear_data(skb, rx_buff->data + offset,
2361 length);
2362
2363 /* VLAN Header has been stripped by the system firmware and
2364 * needs to be inserted by the driver
2365 */
2366 if (adapter->rx_vlan_header_insertion &&
2367 (flags & IBMVNIC_VLAN_STRIPPED))
2368 __vlan_hwaccel_put_tag(skb, htons(ETH_P_8021Q),
2369 ntohs(next->rx_comp.vlan_tci));
2370
2371 /* free the entry */
2372 next->rx_comp.first = 0;
2373 remove_buff_from_pool(adapter, rx_buff);
2374
2375 skb_put(skb, length);
2376 skb->protocol = eth_type_trans(skb, netdev);
2377 skb_record_rx_queue(skb, scrq_num);
2378
2379 if (flags & IBMVNIC_IP_CHKSUM_GOOD &&
2380 flags & IBMVNIC_TCP_UDP_CHKSUM_GOOD) {
2381 skb->ip_summed = CHECKSUM_UNNECESSARY;
2382 }
2383
2384 length = skb->len;
2385 napi_gro_receive(napi, skb); /* send it up */
2386 netdev->stats.rx_packets++;
2387 netdev->stats.rx_bytes += length;
2388 adapter->rx_stats_buffers[scrq_num].packets++;
2389 adapter->rx_stats_buffers[scrq_num].bytes += length;
2390 frames_processed++;
2391 }
2392
2393 if (adapter->state != VNIC_CLOSING)
2394 replenish_rx_pool(adapter, &adapter->rx_pool[scrq_num]);
2395
2396 if (frames_processed < budget) {
2397 enable_scrq_irq(adapter, adapter->rx_scrq[scrq_num]);
2398 napi_complete_done(napi, frames_processed);
2399 if (pending_scrq(adapter, adapter->rx_scrq[scrq_num]) &&
2400 napi_reschedule(napi)) {
2401 disable_scrq_irq(adapter, adapter->rx_scrq[scrq_num]);
2402 goto restart_poll;
2403 }
2404 }
2405 return frames_processed;
2406}
2407
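/* Trigger a CHANGE_PARAM reset to apply the values in adapter->desired
 * and wait for it to complete. If the reset fails, retry with the
 * previously active (fallback) settings and return -EIO.
 */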
2408static int wait_for_reset(struct ibmvnic_adapter *adapter)
2409{
2410 int rc, ret;
2411
2412 adapter->fallback.mtu = adapter->req_mtu;
2413 adapter->fallback.rx_queues = adapter->req_rx_queues;
2414 adapter->fallback.tx_queues = adapter->req_tx_queues;
2415 adapter->fallback.rx_entries = adapter->req_rx_add_entries_per_subcrq;
2416 adapter->fallback.tx_entries = adapter->req_tx_entries_per_subcrq;
2417
2418 reinit_completion(&adapter->reset_done);
2419 adapter->wait_for_reset = true;
2420 rc = ibmvnic_reset(adapter, VNIC_RESET_CHANGE_PARAM);
2421 if (rc)
2422 return rc;
2423 wait_for_completion(&adapter->reset_done);
2424
2425 ret = 0;
2426 if (adapter->reset_done_rc) {
2427 ret = -EIO;
2428 adapter->desired.mtu = adapter->fallback.mtu;
2429 adapter->desired.rx_queues = adapter->fallback.rx_queues;
2430 adapter->desired.tx_queues = adapter->fallback.tx_queues;
2431 adapter->desired.rx_entries = adapter->fallback.rx_entries;
2432 adapter->desired.tx_entries = adapter->fallback.tx_entries;
2433
2434 reinit_completion(&adapter->reset_done);
2435 adapter->wait_for_reset = true;
2436 rc = ibmvnic_reset(adapter, VNIC_RESET_CHANGE_PARAM);
2437 if (rc)
2438 return ret;
2439 wait_for_completion(&adapter->reset_done);
2440 }
2441 adapter->wait_for_reset = false;
2442
2443 return ret;
2444}
2445
2446static int ibmvnic_change_mtu(struct net_device *netdev, int new_mtu)
2447{
2448 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2449
2450 adapter->desired.mtu = new_mtu + ETH_HLEN;
2451
2452 return wait_for_reset(adapter);
2453}
2454
2455static netdev_features_t ibmvnic_features_check(struct sk_buff *skb,
2456 struct net_device *dev,
2457 netdev_features_t features)
2458{
2459	/* Some backing hardware adapters cannot
2460	 * handle packets with an MSS less than 224
2461	 * or with only one segment.
2462 */
2463 if (skb_is_gso(skb)) {
2464 if (skb_shinfo(skb)->gso_size < 224 ||
2465 skb_shinfo(skb)->gso_segs == 1)
2466 features &= ~NETIF_F_GSO_MASK;
2467 }
2468
2469 return features;
2470}
2471
2472static const struct net_device_ops ibmvnic_netdev_ops = {
2473 .ndo_open = ibmvnic_open,
2474 .ndo_stop = ibmvnic_close,
2475 .ndo_start_xmit = ibmvnic_xmit,
2476 .ndo_set_rx_mode = ibmvnic_set_multi,
2477 .ndo_set_mac_address = ibmvnic_set_mac,
2478 .ndo_validate_addr = eth_validate_addr,
2479 .ndo_tx_timeout = ibmvnic_tx_timeout,
2480 .ndo_change_mtu = ibmvnic_change_mtu,
2481 .ndo_features_check = ibmvnic_features_check,
2482};
2483
2484/* ethtool functions */
2485
2486static int ibmvnic_get_link_ksettings(struct net_device *netdev,
2487 struct ethtool_link_ksettings *cmd)
2488{
2489 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2490 int rc;
2491
2492 rc = send_query_phys_parms(adapter);
2493 if (rc) {
2494 adapter->speed = SPEED_UNKNOWN;
2495 adapter->duplex = DUPLEX_UNKNOWN;
2496 }
2497 cmd->base.speed = adapter->speed;
2498 cmd->base.duplex = adapter->duplex;
2499 cmd->base.port = PORT_FIBRE;
2500 cmd->base.phy_address = 0;
2501 cmd->base.autoneg = AUTONEG_ENABLE;
2502
2503 return 0;
2504}
2505
2506static void ibmvnic_get_drvinfo(struct net_device *netdev,
2507 struct ethtool_drvinfo *info)
2508{
2509 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2510
2511 strlcpy(info->driver, ibmvnic_driver_name, sizeof(info->driver));
2512 strlcpy(info->version, IBMVNIC_DRIVER_VERSION, sizeof(info->version));
2513 strlcpy(info->fw_version, adapter->fw_version,
2514 sizeof(info->fw_version));
2515}
2516
2517static u32 ibmvnic_get_msglevel(struct net_device *netdev)
2518{
2519 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2520
2521 return adapter->msg_enable;
2522}
2523
2524static void ibmvnic_set_msglevel(struct net_device *netdev, u32 data)
2525{
2526 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2527
2528 adapter->msg_enable = data;
2529}
2530
2531static u32 ibmvnic_get_link(struct net_device *netdev)
2532{
2533 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2534
2535	/* No need to send a query because we request a logical link up at
2536	 * init and then wait for link state indications.
2537 */
2538 return adapter->logical_link_state;
2539}
2540
2541static void ibmvnic_get_ringparam(struct net_device *netdev,
2542 struct ethtool_ringparam *ring)
2543{
2544 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2545
2546 if (adapter->priv_flags & IBMVNIC_USE_SERVER_MAXES) {
2547 ring->rx_max_pending = adapter->max_rx_add_entries_per_subcrq;
2548 ring->tx_max_pending = adapter->max_tx_entries_per_subcrq;
2549 } else {
2550 ring->rx_max_pending = IBMVNIC_MAX_QUEUE_SZ;
2551 ring->tx_max_pending = IBMVNIC_MAX_QUEUE_SZ;
2552 }
2553 ring->rx_mini_max_pending = 0;
2554 ring->rx_jumbo_max_pending = 0;
2555 ring->rx_pending = adapter->req_rx_add_entries_per_subcrq;
2556 ring->tx_pending = adapter->req_tx_entries_per_subcrq;
2557 ring->rx_mini_pending = 0;
2558 ring->rx_jumbo_pending = 0;
2559}
2560
2561static int ibmvnic_set_ringparam(struct net_device *netdev,
2562 struct ethtool_ringparam *ring)
2563{
2564 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2565 int ret;
2566
2567 ret = 0;
2568 adapter->desired.rx_entries = ring->rx_pending;
2569 adapter->desired.tx_entries = ring->tx_pending;
2570
2571 ret = wait_for_reset(adapter);
2572
2573 if (!ret &&
2574 (adapter->req_rx_add_entries_per_subcrq != ring->rx_pending ||
2575 adapter->req_tx_entries_per_subcrq != ring->tx_pending))
2576 netdev_info(netdev,
2577 "Could not match full ringsize request. Requested: RX %d, TX %d; Allowed: RX %llu, TX %llu\n",
2578 ring->rx_pending, ring->tx_pending,
2579 adapter->req_rx_add_entries_per_subcrq,
2580 adapter->req_tx_entries_per_subcrq);
2581 return ret;
2582}
2583
2584static void ibmvnic_get_channels(struct net_device *netdev,
2585 struct ethtool_channels *channels)
2586{
2587 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2588
2589 if (adapter->priv_flags & IBMVNIC_USE_SERVER_MAXES) {
2590 channels->max_rx = adapter->max_rx_queues;
2591 channels->max_tx = adapter->max_tx_queues;
2592 } else {
2593 channels->max_rx = IBMVNIC_MAX_QUEUES;
2594 channels->max_tx = IBMVNIC_MAX_QUEUES;
2595 }
2596
2597 channels->max_other = 0;
2598 channels->max_combined = 0;
2599 channels->rx_count = adapter->req_rx_queues;
2600 channels->tx_count = adapter->req_tx_queues;
2601 channels->other_count = 0;
2602 channels->combined_count = 0;
2603}
2604
2605static int ibmvnic_set_channels(struct net_device *netdev,
2606 struct ethtool_channels *channels)
2607{
2608 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2609 int ret;
2610
2611 ret = 0;
2612 adapter->desired.rx_queues = channels->rx_count;
2613 adapter->desired.tx_queues = channels->tx_count;
2614
2615 ret = wait_for_reset(adapter);
2616
2617 if (!ret &&
2618 (adapter->req_rx_queues != channels->rx_count ||
2619 adapter->req_tx_queues != channels->tx_count))
2620 netdev_info(netdev,
2621 "Could not match full channels request. Requested: RX %d, TX %d; Allowed: RX %llu, TX %llu\n",
2622 channels->rx_count, channels->tx_count,
2623 adapter->req_rx_queues, adapter->req_tx_queues);
2624 return ret;
2626}
2627
2628static void ibmvnic_get_strings(struct net_device *dev, u32 stringset, u8 *data)
2629{
2630 struct ibmvnic_adapter *adapter = netdev_priv(dev);
2631 int i;
2632
2633 switch (stringset) {
2634 case ETH_SS_STATS:
2635 for (i = 0; i < ARRAY_SIZE(ibmvnic_stats);
2636 i++, data += ETH_GSTRING_LEN)
2637 memcpy(data, ibmvnic_stats[i].name, ETH_GSTRING_LEN);
2638
2639 for (i = 0; i < adapter->req_tx_queues; i++) {
2640 snprintf(data, ETH_GSTRING_LEN, "tx%d_packets", i);
2641 data += ETH_GSTRING_LEN;
2642
2643 snprintf(data, ETH_GSTRING_LEN, "tx%d_bytes", i);
2644 data += ETH_GSTRING_LEN;
2645
2646 snprintf(data, ETH_GSTRING_LEN,
2647 "tx%d_dropped_packets", i);
2648 data += ETH_GSTRING_LEN;
2649 }
2650
2651 for (i = 0; i < adapter->req_rx_queues; i++) {
2652 snprintf(data, ETH_GSTRING_LEN, "rx%d_packets", i);
2653 data += ETH_GSTRING_LEN;
2654
2655 snprintf(data, ETH_GSTRING_LEN, "rx%d_bytes", i);
2656 data += ETH_GSTRING_LEN;
2657
2658 snprintf(data, ETH_GSTRING_LEN, "rx%d_interrupts", i);
2659 data += ETH_GSTRING_LEN;
2660 }
2661 break;
2662
2663 case ETH_SS_PRIV_FLAGS:
2664 for (i = 0; i < ARRAY_SIZE(ibmvnic_priv_flags); i++)
2665 strcpy(data + i * ETH_GSTRING_LEN,
2666 ibmvnic_priv_flags[i]);
2667 break;
2668 default:
2669 return;
2670 }
2671}
2672
2673static int ibmvnic_get_sset_count(struct net_device *dev, int sset)
2674{
2675 struct ibmvnic_adapter *adapter = netdev_priv(dev);
2676
2677 switch (sset) {
2678 case ETH_SS_STATS:
2679 return ARRAY_SIZE(ibmvnic_stats) +
2680 adapter->req_tx_queues * NUM_TX_STATS +
2681 adapter->req_rx_queues * NUM_RX_STATS;
2682 case ETH_SS_PRIV_FLAGS:
2683 return ARRAY_SIZE(ibmvnic_priv_flags);
2684 default:
2685 return -EOPNOTSUPP;
2686 }
2687}
2688
2689static void ibmvnic_get_ethtool_stats(struct net_device *dev,
2690 struct ethtool_stats *stats, u64 *data)
2691{
2692 struct ibmvnic_adapter *adapter = netdev_priv(dev);
2693 union ibmvnic_crq crq;
2694 int i, j;
2695 int rc;
2696
2697 memset(&crq, 0, sizeof(crq));
2698 crq.request_statistics.first = IBMVNIC_CRQ_CMD;
2699 crq.request_statistics.cmd = REQUEST_STATISTICS;
2700 crq.request_statistics.ioba = cpu_to_be32(adapter->stats_token);
2701 crq.request_statistics.len =
2702 cpu_to_be32(sizeof(struct ibmvnic_statistics));
2703
2704 /* Wait for data to be written */
2705 reinit_completion(&adapter->stats_done);
2706 rc = ibmvnic_send_crq(adapter, &crq);
2707 if (rc)
2708 return;
2709 wait_for_completion(&adapter->stats_done);
2710
2711 for (i = 0; i < ARRAY_SIZE(ibmvnic_stats); i++)
2712 data[i] = be64_to_cpu(IBMVNIC_GET_STAT(adapter,
2713 ibmvnic_stats[i].offset));
2714
2715 for (j = 0; j < adapter->req_tx_queues; j++) {
2716 data[i] = adapter->tx_stats_buffers[j].packets;
2717 i++;
2718 data[i] = adapter->tx_stats_buffers[j].bytes;
2719 i++;
2720 data[i] = adapter->tx_stats_buffers[j].dropped_packets;
2721 i++;
2722 }
2723
2724 for (j = 0; j < adapter->req_rx_queues; j++) {
2725 data[i] = adapter->rx_stats_buffers[j].packets;
2726 i++;
2727 data[i] = adapter->rx_stats_buffers[j].bytes;
2728 i++;
2729 data[i] = adapter->rx_stats_buffers[j].interrupts;
2730 i++;
2731 }
2732}
2733
2734static u32 ibmvnic_get_priv_flags(struct net_device *netdev)
2735{
2736 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2737
2738 return adapter->priv_flags;
2739}
2740
2741static int ibmvnic_set_priv_flags(struct net_device *netdev, u32 flags)
2742{
2743 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
2744 bool which_maxes = !!(flags & IBMVNIC_USE_SERVER_MAXES);
2745
2746 if (which_maxes)
2747 adapter->priv_flags |= IBMVNIC_USE_SERVER_MAXES;
2748 else
2749 adapter->priv_flags &= ~IBMVNIC_USE_SERVER_MAXES;
2750
2751 return 0;
2752}

2753static const struct ethtool_ops ibmvnic_ethtool_ops = {
2754 .get_drvinfo = ibmvnic_get_drvinfo,
2755 .get_msglevel = ibmvnic_get_msglevel,
2756 .set_msglevel = ibmvnic_set_msglevel,
2757 .get_link = ibmvnic_get_link,
2758 .get_ringparam = ibmvnic_get_ringparam,
2759 .set_ringparam = ibmvnic_set_ringparam,
2760 .get_channels = ibmvnic_get_channels,
2761 .set_channels = ibmvnic_set_channels,
2762 .get_strings = ibmvnic_get_strings,
2763 .get_sset_count = ibmvnic_get_sset_count,
2764 .get_ethtool_stats = ibmvnic_get_ethtool_stats,
2765 .get_link_ksettings = ibmvnic_get_link_ksettings,
2766 .get_priv_flags = ibmvnic_get_priv_flags,
2767 .set_priv_flags = ibmvnic_set_priv_flags,
2768};
2769
2770/* Routines for managing CRQs/sCRQs */
2771
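/* Free the sub-CRQ's interrupt mapping, clear its message buffer and
 * re-register the queue with the hypervisor so it can be reused after
 * a reset.
 */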
2772static int reset_one_sub_crq_queue(struct ibmvnic_adapter *adapter,
2773 struct ibmvnic_sub_crq_queue *scrq)
2774{
2775 int rc;
2776
2777 if (scrq->irq) {
2778 free_irq(scrq->irq, scrq);
2779 irq_dispose_mapping(scrq->irq);
2780 scrq->irq = 0;
2781 }
2782
2783 memset(scrq->msgs, 0, 4 * PAGE_SIZE);
2784 atomic_set(&scrq->used, 0);
2785 scrq->cur = 0;
2786
2787 rc = h_reg_sub_crq(adapter->vdev->unit_address, scrq->msg_token,
2788 4 * PAGE_SIZE, &scrq->crq_num, &scrq->hw_irq);
2789 return rc;
2790}
2791
2792static int reset_sub_crq_queues(struct ibmvnic_adapter *adapter)
2793{
2794 int i, rc;
2795
2796 if (!adapter->tx_scrq || !adapter->rx_scrq)
2797 return -EINVAL;
2798
2799 for (i = 0; i < adapter->req_tx_queues; i++) {
2800 netdev_dbg(adapter->netdev, "Re-setting tx_scrq[%d]\n", i);
2801 rc = reset_one_sub_crq_queue(adapter, adapter->tx_scrq[i]);
2802 if (rc)
2803 return rc;
2804 }
2805
2806 for (i = 0; i < adapter->req_rx_queues; i++) {
2807 netdev_dbg(adapter->netdev, "Re-setting rx_scrq[%d]\n", i);
2808 rc = reset_one_sub_crq_queue(adapter, adapter->rx_scrq[i]);
2809 if (rc)
2810 return rc;
2811 }
2812
2813 return rc;
2814}
2815
2816static void release_sub_crq_queue(struct ibmvnic_adapter *adapter,
2817 struct ibmvnic_sub_crq_queue *scrq,
2818 bool do_h_free)
2819{
2820 struct device *dev = &adapter->vdev->dev;
2821 long rc;
2822
2823 netdev_dbg(adapter->netdev, "Releasing sub-CRQ\n");
2824
2825 if (do_h_free) {
2826		/* Close the sub-CRQ */
2827 do {
2828 rc = plpar_hcall_norets(H_FREE_SUB_CRQ,
2829 adapter->vdev->unit_address,
2830 scrq->crq_num);
2831 } while (rc == H_BUSY || H_IS_LONG_BUSY(rc));
2832
2833 if (rc) {
2834 netdev_err(adapter->netdev,
2835 "Failed to release sub-CRQ %16lx, rc = %ld\n",
2836 scrq->crq_num, rc);
2837 }
2838 }
2839
2840 dma_unmap_single(dev, scrq->msg_token, 4 * PAGE_SIZE,
2841 DMA_BIDIRECTIONAL);
2842 free_pages((unsigned long)scrq->msgs, 2);
2843 kfree(scrq);
2844}
2845
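/* Allocate one sub-CRQ: four pages of zeroed, DMA-mapped message
 * buffers registered with the hypervisor through H_REG_SUB_CRQ.
 * Returns NULL on failure.
 */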
2846static struct ibmvnic_sub_crq_queue *init_sub_crq_queue(struct ibmvnic_adapter
2847 *adapter)
2848{
2849 struct device *dev = &adapter->vdev->dev;
2850 struct ibmvnic_sub_crq_queue *scrq;
2851 int rc;
2852
2853 scrq = kzalloc(sizeof(*scrq), GFP_KERNEL);
2854 if (!scrq)
2855 return NULL;
2856
2857 scrq->msgs =
2858 (union sub_crq *)__get_free_pages(GFP_KERNEL | __GFP_ZERO, 2);
2859 if (!scrq->msgs) {
2860 dev_warn(dev, "Couldn't allocate crq queue messages page\n");
2861 goto zero_page_failed;
2862 }
2863
2864 scrq->msg_token = dma_map_single(dev, scrq->msgs, 4 * PAGE_SIZE,
2865 DMA_BIDIRECTIONAL);
2866 if (dma_mapping_error(dev, scrq->msg_token)) {
2867 dev_warn(dev, "Couldn't map crq queue messages page\n");
2868 goto map_failed;
2869 }
2870
2871 rc = h_reg_sub_crq(adapter->vdev->unit_address, scrq->msg_token,
2872 4 * PAGE_SIZE, &scrq->crq_num, &scrq->hw_irq);
2873
2874 if (rc == H_RESOURCE)
2875 rc = ibmvnic_reset_crq(adapter);
2876
2877 if (rc == H_CLOSED) {
2878 dev_warn(dev, "Partner adapter not ready, waiting.\n");
2879 } else if (rc) {
2880 dev_warn(dev, "Error %d registering sub-crq\n", rc);
2881 goto reg_failed;
2882 }
2883
2884 scrq->adapter = adapter;
2885 scrq->size = 4 * PAGE_SIZE / sizeof(*scrq->msgs);
2886 spin_lock_init(&scrq->lock);
2887
2888 netdev_dbg(adapter->netdev,
2889 "sub-crq initialized, num %lx, hw_irq=%lx, irq=%x\n",
2890 scrq->crq_num, scrq->hw_irq, scrq->irq);
2891
2892 return scrq;
2893
2894reg_failed:
2895 dma_unmap_single(dev, scrq->msg_token, 4 * PAGE_SIZE,
2896 DMA_BIDIRECTIONAL);
2897map_failed:
2898 free_pages((unsigned long)scrq->msgs, 2);
2899zero_page_failed:
2900 kfree(scrq);
2901
2902 return NULL;
2903}
2904
2905static void release_sub_crqs(struct ibmvnic_adapter *adapter, bool do_h_free)
2906{
2907 int i;
2908
2909 if (adapter->tx_scrq) {
2910 for (i = 0; i < adapter->num_active_tx_scrqs; i++) {
2911 if (!adapter->tx_scrq[i])
2912 continue;
2913
2914 netdev_dbg(adapter->netdev, "Releasing tx_scrq[%d]\n",
2915 i);
2916 if (adapter->tx_scrq[i]->irq) {
2917 free_irq(adapter->tx_scrq[i]->irq,
2918 adapter->tx_scrq[i]);
2919 irq_dispose_mapping(adapter->tx_scrq[i]->irq);
2920 adapter->tx_scrq[i]->irq = 0;
2921 }
2922
2923 release_sub_crq_queue(adapter, adapter->tx_scrq[i],
2924 do_h_free);
2925 }
2926
2927 kfree(adapter->tx_scrq);
2928 adapter->tx_scrq = NULL;
2929 adapter->num_active_tx_scrqs = 0;
2930 }
2931
2932 if (adapter->rx_scrq) {
2933 for (i = 0; i < adapter->num_active_rx_scrqs; i++) {
2934 if (!adapter->rx_scrq[i])
2935 continue;
2936
2937 netdev_dbg(adapter->netdev, "Releasing rx_scrq[%d]\n",
2938 i);
2939 if (adapter->rx_scrq[i]->irq) {
2940 free_irq(adapter->rx_scrq[i]->irq,
2941 adapter->rx_scrq[i]);
2942 irq_dispose_mapping(adapter->rx_scrq[i]->irq);
2943 adapter->rx_scrq[i]->irq = 0;
2944 }
2945
2946 release_sub_crq_queue(adapter, adapter->rx_scrq[i],
2947 do_h_free);
2948 }
2949
2950 kfree(adapter->rx_scrq);
2951 adapter->rx_scrq = NULL;
2952 adapter->num_active_rx_scrqs = 0;
2953 }
2954}
2955
2956static int disable_scrq_irq(struct ibmvnic_adapter *adapter,
2957 struct ibmvnic_sub_crq_queue *scrq)
2958{
2959 struct device *dev = &adapter->vdev->dev;
2960 unsigned long rc;
2961
2962 rc = plpar_hcall_norets(H_VIOCTL, adapter->vdev->unit_address,
2963 H_DISABLE_VIO_INTERRUPT, scrq->hw_irq, 0, 0);
2964 if (rc)
2965 dev_err(dev, "Couldn't disable scrq irq 0x%lx. rc=%ld\n",
2966 scrq->hw_irq, rc);
2967 return rc;
2968}
2969
2970static int enable_scrq_irq(struct ibmvnic_adapter *adapter,
2971 struct ibmvnic_sub_crq_queue *scrq)
2972{
2973 struct device *dev = &adapter->vdev->dev;
2974 unsigned long rc;
2975
2976 if (scrq->hw_irq > 0x100000000ULL) {
2977 dev_err(dev, "bad hw_irq = %lx\n", scrq->hw_irq);
2978 return 1;
2979 }
2980
2981 if (test_bit(0, &adapter->resetting) &&
2982 adapter->reset_reason == VNIC_RESET_MOBILITY) {
2983 u64 val = (0xff000000) | scrq->hw_irq;
2984
2985 rc = plpar_hcall_norets(H_EOI, val);
2986		/* H_EOI would fail with rc = H_FUNCTION when running
2987		 * in XIVE mode, which is expected and not an error.
2988 */
2989 if (rc && (rc != H_FUNCTION))
2990 dev_err(dev, "H_EOI FAILED irq 0x%llx. rc=%ld\n",
2991 val, rc);
2992 }
2993
2994 rc = plpar_hcall_norets(H_VIOCTL, adapter->vdev->unit_address,
2995 H_ENABLE_VIO_INTERRUPT, scrq->hw_irq, 0, 0);
2996 if (rc)
2997 dev_err(dev, "Couldn't enable scrq irq 0x%lx. rc=%ld\n",
2998 scrq->hw_irq, rc);
2999 return rc;
3000}
3001
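/* Process tx completions for a sub-CRQ: free the completed skbs,
 * return their buffers to the tx pool's free map and wake the
 * corresponding netdev subqueue once enough entries have drained.
 */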
3002static int ibmvnic_complete_tx(struct ibmvnic_adapter *adapter,
3003 struct ibmvnic_sub_crq_queue *scrq)
3004{
3005 struct device *dev = &adapter->vdev->dev;
3006 struct ibmvnic_tx_pool *tx_pool;
3007 struct ibmvnic_tx_buff *txbuff;
3008 union sub_crq *next;
3009 int index;
3010 int i, j;
3011
3012restart_loop:
3013 while (pending_scrq(adapter, scrq)) {
3014 unsigned int pool = scrq->pool_index;
3015 int num_entries = 0;
3016
3017 /* The queue entry at the current index is peeked at above
3018 * to determine that there is a valid descriptor awaiting
3019 * processing. We want to be sure that the current slot
3020 * holds a valid descriptor before reading its contents.
3021 */
3022 dma_rmb();
3023
3024 next = ibmvnic_next_scrq(adapter, scrq);
3025 for (i = 0; i < next->tx_comp.num_comps; i++) {
3026 if (next->tx_comp.rcs[i])
3027 dev_err(dev, "tx error %x\n",
3028 next->tx_comp.rcs[i]);
3029 index = be32_to_cpu(next->tx_comp.correlators[i]);
3030 if (index & IBMVNIC_TSO_POOL_MASK) {
3031 tx_pool = &adapter->tso_pool[pool];
3032 index &= ~IBMVNIC_TSO_POOL_MASK;
3033 } else {
3034 tx_pool = &adapter->tx_pool[pool];
3035 }
3036
3037 txbuff = &tx_pool->tx_buff[index];
3038
3039 for (j = 0; j < IBMVNIC_MAX_FRAGS_PER_CRQ; j++) {
3040 if (!txbuff->data_dma[j])
3041 continue;
3042
3043 txbuff->data_dma[j] = 0;
3044 }
3045
3046 if (txbuff->last_frag) {
3047 dev_kfree_skb_any(txbuff->skb);
3048 txbuff->skb = NULL;
3049 }
3050
3051 num_entries += txbuff->num_entries;
3052
3053 tx_pool->free_map[tx_pool->producer_index] = index;
3054 tx_pool->producer_index =
3055 (tx_pool->producer_index + 1) %
3056 tx_pool->num_buffers;
3057 }
3058		/* remove tx_comp scrq */
3059 next->tx_comp.first = 0;
3060
3061 if (atomic_sub_return(num_entries, &scrq->used) <=
3062 (adapter->req_tx_entries_per_subcrq / 2) &&
3063 __netif_subqueue_stopped(adapter->netdev,
3064 scrq->pool_index)) {
3065 netif_wake_subqueue(adapter->netdev, scrq->pool_index);
3066 netdev_dbg(adapter->netdev, "Started queue %d\n",
3067 scrq->pool_index);
3068 }
3069 }
3070
3071 enable_scrq_irq(adapter, scrq);
3072
3073 if (pending_scrq(adapter, scrq)) {
3074 disable_scrq_irq(adapter, scrq);
3075 goto restart_loop;
3076 }
3077
3078 return 0;
3079}
3080
3081static irqreturn_t ibmvnic_interrupt_tx(int irq, void *instance)
3082{
3083 struct ibmvnic_sub_crq_queue *scrq = instance;
3084 struct ibmvnic_adapter *adapter = scrq->adapter;
3085
3086 disable_scrq_irq(adapter, scrq);
3087 ibmvnic_complete_tx(adapter, scrq);
3088
3089 return IRQ_HANDLED;
3090}
3091
3092static irqreturn_t ibmvnic_interrupt_rx(int irq, void *instance)
3093{
3094 struct ibmvnic_sub_crq_queue *scrq = instance;
3095 struct ibmvnic_adapter *adapter = scrq->adapter;
3096
3097 /* When booting a kdump kernel we can hit pending interrupts
3098 * prior to completing driver initialization.
3099 */
3100 if (unlikely(adapter->state != VNIC_OPEN))
3101 return IRQ_NONE;
3102
3103 adapter->rx_stats_buffers[scrq->scrq_num].interrupts++;
3104
3105 if (napi_schedule_prep(&adapter->napi[scrq->scrq_num])) {
3106 disable_scrq_irq(adapter, scrq);
3107 __napi_schedule(&adapter->napi[scrq->scrq_num]);
3108 }
3109
3110 return IRQ_HANDLED;
3111}
3112
3113static int init_sub_crq_irqs(struct ibmvnic_adapter *adapter)
3114{
3115 struct device *dev = &adapter->vdev->dev;
3116 struct ibmvnic_sub_crq_queue *scrq;
3117 int i = 0, j = 0;
3118 int rc = 0;
3119
3120 for (i = 0; i < adapter->req_tx_queues; i++) {
3121 netdev_dbg(adapter->netdev, "Initializing tx_scrq[%d] irq\n",
3122 i);
3123 scrq = adapter->tx_scrq[i];
3124 scrq->irq = irq_create_mapping(NULL, scrq->hw_irq);
3125
3126 if (!scrq->irq) {
3127 rc = -EINVAL;
3128 dev_err(dev, "Error mapping irq\n");
3129 goto req_tx_irq_failed;
3130 }
3131
3132 snprintf(scrq->name, sizeof(scrq->name), "ibmvnic-%x-tx%d",
3133 adapter->vdev->unit_address, i);
3134 rc = request_irq(scrq->irq, ibmvnic_interrupt_tx,
3135 0, scrq->name, scrq);
3136
3137 if (rc) {
3138 dev_err(dev, "Couldn't register tx irq 0x%x. rc=%d\n",
3139 scrq->irq, rc);
3140 irq_dispose_mapping(scrq->irq);
3141 goto req_tx_irq_failed;
3142 }
3143 }
3144
3145 for (i = 0; i < adapter->req_rx_queues; i++) {
3146 netdev_dbg(adapter->netdev, "Initializing rx_scrq[%d] irq\n",
3147 i);
3148 scrq = adapter->rx_scrq[i];
3149 scrq->irq = irq_create_mapping(NULL, scrq->hw_irq);
3150 if (!scrq->irq) {
3151 rc = -EINVAL;
3152 dev_err(dev, "Error mapping irq\n");
3153 goto req_rx_irq_failed;
3154 }
3155 snprintf(scrq->name, sizeof(scrq->name), "ibmvnic-%x-rx%d",
3156 adapter->vdev->unit_address, i);
3157 rc = request_irq(scrq->irq, ibmvnic_interrupt_rx,
3158 0, scrq->name, scrq);
3159 if (rc) {
3160 dev_err(dev, "Couldn't register rx irq 0x%x. rc=%d\n",
3161 scrq->irq, rc);
3162 irq_dispose_mapping(scrq->irq);
3163 goto req_rx_irq_failed;
3164 }
3165 }
3166 return rc;
3167
3168req_rx_irq_failed:
3169 for (j = 0; j < i; j++) {
3170 free_irq(adapter->rx_scrq[j]->irq, adapter->rx_scrq[j]);
3171 irq_dispose_mapping(adapter->rx_scrq[j]->irq);
3172 }
3173 i = adapter->req_tx_queues;
3174req_tx_irq_failed:
3175 for (j = 0; j < i; j++) {
3176 free_irq(adapter->tx_scrq[j]->irq, adapter->tx_scrq[j]);
3177 irq_dispose_mapping(adapter->tx_scrq[j]->irq);
3178 }
3179 release_sub_crqs(adapter, 1);
3180 return rc;
3181}
3182
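/* Allocate and register every requested tx and rx sub-CRQ. If fewer
 * queues than requested could be registered, scale the requested
 * counts back (but never below the advertised minimums) and split the
 * allocated queues between tx and rx.
 */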
3183static int init_sub_crqs(struct ibmvnic_adapter *adapter)
3184{
3185 struct device *dev = &adapter->vdev->dev;
3186 struct ibmvnic_sub_crq_queue **allqueues;
3187 int registered_queues = 0;
3188 int total_queues;
3189 int more = 0;
3190 int i;
3191
3192 total_queues = adapter->req_tx_queues + adapter->req_rx_queues;
3193
3194 allqueues = kcalloc(total_queues, sizeof(*allqueues), GFP_KERNEL);
3195 if (!allqueues)
3196 return -1;
3197
3198 for (i = 0; i < total_queues; i++) {
3199 allqueues[i] = init_sub_crq_queue(adapter);
3200 if (!allqueues[i]) {
3201 dev_warn(dev, "Couldn't allocate all sub-crqs\n");
3202 break;
3203 }
3204 registered_queues++;
3205 }
3206
3207 /* Make sure we were able to register the minimum number of queues */
3208 if (registered_queues <
3209 adapter->min_tx_queues + adapter->min_rx_queues) {
3210 dev_err(dev, "Fatal: Couldn't init min number of sub-crqs\n");
3211 goto tx_failed;
3212 }
3213
3214	/* Distribute the shortfall of allocated queues between tx and rx */
3215 for (i = 0; i < total_queues - registered_queues + more ; i++) {
3216 netdev_dbg(adapter->netdev, "Reducing number of queues\n");
3217 switch (i % 3) {
3218 case 0:
3219 if (adapter->req_rx_queues > adapter->min_rx_queues)
3220 adapter->req_rx_queues--;
3221 else
3222 more++;
3223 break;
3224 case 1:
3225 if (adapter->req_tx_queues > adapter->min_tx_queues)
3226 adapter->req_tx_queues--;
3227 else
3228 more++;
3229 break;
3230 }
3231 }
3232
3233 adapter->tx_scrq = kcalloc(adapter->req_tx_queues,
3234 sizeof(*adapter->tx_scrq), GFP_KERNEL);
3235 if (!adapter->tx_scrq)
3236 goto tx_failed;
3237
3238 for (i = 0; i < adapter->req_tx_queues; i++) {
3239 adapter->tx_scrq[i] = allqueues[i];
3240 adapter->tx_scrq[i]->pool_index = i;
3241 adapter->num_active_tx_scrqs++;
3242 }
3243
3244 adapter->rx_scrq = kcalloc(adapter->req_rx_queues,
3245 sizeof(*adapter->rx_scrq), GFP_KERNEL);
3246 if (!adapter->rx_scrq)
3247 goto rx_failed;
3248
3249 for (i = 0; i < adapter->req_rx_queues; i++) {
3250 adapter->rx_scrq[i] = allqueues[i + adapter->req_tx_queues];
3251 adapter->rx_scrq[i]->scrq_num = i;
3252 adapter->num_active_rx_scrqs++;
3253 }
3254
3255 kfree(allqueues);
3256 return 0;
3257
3258rx_failed:
3259 kfree(adapter->tx_scrq);
3260 adapter->tx_scrq = NULL;
3261tx_failed:
3262 for (i = 0; i < registered_queues; i++)
3263 release_sub_crq_queue(adapter, allqueues[i], 1);
3264 kfree(allqueues);
3265 return -1;
3266}
3267
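/* Send the REQUEST_CAPABILITY CRQs for queue counts, ring sizes, MTU
 * and promiscuous mode. On the first (non-retry) pass the requested
 * ring sizes are derived from the desired settings and clamped so that
 * a long term buffer never exceeds IBMVNIC_MAX_LTB_SIZE.
 */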
3268static void ibmvnic_send_req_caps(struct ibmvnic_adapter *adapter, int retry)
3269{
3270 struct device *dev = &adapter->vdev->dev;
3271 union ibmvnic_crq crq;
3272 int max_entries;
3273 int cap_reqs;
3274
3275 /* We send out 6 or 7 REQUEST_CAPABILITY CRQs below (depending on
3276 * the PROMISC flag). Initialize this count upfront. When the tasklet
3277 * receives a response to all of these, it will send the next protocol
3278 * message (QUERY_IP_OFFLOAD).
3279 */
3280 if (!(adapter->netdev->flags & IFF_PROMISC) ||
3281 adapter->promisc_supported)
3282 cap_reqs = 7;
3283 else
3284 cap_reqs = 6;
3285
3286 if (!retry) {
3287		/* Sub-CRQ entries are 32 bytes long */
3288 int entries_page = 4 * PAGE_SIZE / (sizeof(u64) * 4);
3289
3290 atomic_set(&adapter->running_cap_crqs, cap_reqs);
3291
3292 if (adapter->min_tx_entries_per_subcrq > entries_page ||
3293 adapter->min_rx_add_entries_per_subcrq > entries_page) {
3294 dev_err(dev, "Fatal, invalid entries per sub-crq\n");
3295 return;
3296 }
3297
3298 if (adapter->desired.mtu)
3299 adapter->req_mtu = adapter->desired.mtu;
3300 else
3301 adapter->req_mtu = adapter->netdev->mtu + ETH_HLEN;
3302
3303 if (!adapter->desired.tx_entries)
3304 adapter->desired.tx_entries =
3305 adapter->max_tx_entries_per_subcrq;
3306 if (!adapter->desired.rx_entries)
3307 adapter->desired.rx_entries =
3308 adapter->max_rx_add_entries_per_subcrq;
3309
3310 max_entries = IBMVNIC_MAX_LTB_SIZE /
3311 (adapter->req_mtu + IBMVNIC_BUFFER_HLEN);
3312
3313 if ((adapter->req_mtu + IBMVNIC_BUFFER_HLEN) *
3314 adapter->desired.tx_entries > IBMVNIC_MAX_LTB_SIZE) {
3315 adapter->desired.tx_entries = max_entries;
3316 }
3317
3318 if ((adapter->req_mtu + IBMVNIC_BUFFER_HLEN) *
3319 adapter->desired.rx_entries > IBMVNIC_MAX_LTB_SIZE) {
3320 adapter->desired.rx_entries = max_entries;
3321 }
3322
3323 if (adapter->desired.tx_entries)
3324 adapter->req_tx_entries_per_subcrq =
3325 adapter->desired.tx_entries;
3326 else
3327 adapter->req_tx_entries_per_subcrq =
3328 adapter->max_tx_entries_per_subcrq;
3329
3330 if (adapter->desired.rx_entries)
3331 adapter->req_rx_add_entries_per_subcrq =
3332 adapter->desired.rx_entries;
3333 else
3334 adapter->req_rx_add_entries_per_subcrq =
3335 adapter->max_rx_add_entries_per_subcrq;
3336
3337 if (adapter->desired.tx_queues)
3338 adapter->req_tx_queues =
3339 adapter->desired.tx_queues;
3340 else
3341 adapter->req_tx_queues =
3342 adapter->opt_tx_comp_sub_queues;
3343
3344 if (adapter->desired.rx_queues)
3345 adapter->req_rx_queues =
3346 adapter->desired.rx_queues;
3347 else
3348 adapter->req_rx_queues =
3349 adapter->opt_rx_comp_queues;
3350
3351 adapter->req_rx_add_queues = adapter->max_rx_add_queues;
3352 } else {
3353 atomic_add(cap_reqs, &adapter->running_cap_crqs);
3354 }
3355 memset(&crq, 0, sizeof(crq));
3356 crq.request_capability.first = IBMVNIC_CRQ_CMD;
3357 crq.request_capability.cmd = REQUEST_CAPABILITY;
3358
3359 crq.request_capability.capability = cpu_to_be16(REQ_TX_QUEUES);
3360 crq.request_capability.number = cpu_to_be64(adapter->req_tx_queues);
3361 cap_reqs--;
3362 ibmvnic_send_crq(adapter, &crq);
3363
3364 crq.request_capability.capability = cpu_to_be16(REQ_RX_QUEUES);
3365 crq.request_capability.number = cpu_to_be64(adapter->req_rx_queues);
3366 cap_reqs--;
3367 ibmvnic_send_crq(adapter, &crq);
3368
3369 crq.request_capability.capability = cpu_to_be16(REQ_RX_ADD_QUEUES);
3370 crq.request_capability.number = cpu_to_be64(adapter->req_rx_add_queues);
3371 cap_reqs--;
3372 ibmvnic_send_crq(adapter, &crq);
3373
3374 crq.request_capability.capability =
3375 cpu_to_be16(REQ_TX_ENTRIES_PER_SUBCRQ);
3376 crq.request_capability.number =
3377 cpu_to_be64(adapter->req_tx_entries_per_subcrq);
3378 cap_reqs--;
3379 ibmvnic_send_crq(adapter, &crq);
3380
3381 crq.request_capability.capability =
3382 cpu_to_be16(REQ_RX_ADD_ENTRIES_PER_SUBCRQ);
3383 crq.request_capability.number =
3384 cpu_to_be64(adapter->req_rx_add_entries_per_subcrq);
3385 cap_reqs--;
3386 ibmvnic_send_crq(adapter, &crq);
3387
3388 crq.request_capability.capability = cpu_to_be16(REQ_MTU);
3389 crq.request_capability.number = cpu_to_be64(adapter->req_mtu);
3390 cap_reqs--;
3391 ibmvnic_send_crq(adapter, &crq);
3392
3393 if (adapter->netdev->flags & IFF_PROMISC) {
3394 if (adapter->promisc_supported) {
3395 crq.request_capability.capability =
3396 cpu_to_be16(PROMISC_REQUESTED);
3397 crq.request_capability.number = cpu_to_be64(1);
3398 cap_reqs--;
3399 ibmvnic_send_crq(adapter, &crq);
3400 }
3401 } else {
3402 crq.request_capability.capability =
3403 cpu_to_be16(PROMISC_REQUESTED);
3404 crq.request_capability.number = cpu_to_be64(0);
3405 cap_reqs--;
3406 ibmvnic_send_crq(adapter, &crq);
3407 }
3408
3409 /* Keep at end to catch any discrepancy between expected and actual
3410 * CRQs sent.
3411 */
3412 WARN_ON(cap_reqs != 0);
3413}
3414
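/* Return nonzero if the entry at the sub-CRQ's current index holds a
 * valid descriptor awaiting processing.
 */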
3415static int pending_scrq(struct ibmvnic_adapter *adapter,
3416 struct ibmvnic_sub_crq_queue *scrq)
3417{
3418 union sub_crq *entry = &scrq->msgs[scrq->cur];
3419
3420 if (entry->generic.first & IBMVNIC_CRQ_CMD_RSP)
3421 return 1;
3422 else
3423 return 0;
3424}
3425
3426static union sub_crq *ibmvnic_next_scrq(struct ibmvnic_adapter *adapter,
3427 struct ibmvnic_sub_crq_queue *scrq)
3428{
3429 union sub_crq *entry;
3430 unsigned long flags;
3431
3432 spin_lock_irqsave(&scrq->lock, flags);
3433 entry = &scrq->msgs[scrq->cur];
3434 if (entry->generic.first & IBMVNIC_CRQ_CMD_RSP) {
3435 if (++scrq->cur == scrq->size)
3436 scrq->cur = 0;
3437 } else {
3438 entry = NULL;
3439 }
3440 spin_unlock_irqrestore(&scrq->lock, flags);
3441
3442 /* Ensure that the entire buffer descriptor has been
3443 * loaded before reading its contents
3444 */
3445 dma_rmb();
3446
3447 return entry;
3448}
3449
3450static union ibmvnic_crq *ibmvnic_next_crq(struct ibmvnic_adapter *adapter)
3451{
3452 struct ibmvnic_crq_queue *queue = &adapter->crq;
3453 union ibmvnic_crq *crq;
3454
3455 crq = &queue->msgs[queue->cur];
3456 if (crq->generic.first & IBMVNIC_CRQ_CMD_RSP) {
3457 if (++queue->cur == queue->size)
3458 queue->cur = 0;
3459 } else {
3460 crq = NULL;
3461 }
3462
3463 return crq;
3464}
3465
3466static void print_subcrq_error(struct device *dev, int rc, const char *func)
3467{
3468 switch (rc) {
3469 case H_PARAMETER:
3470 dev_warn_ratelimited(dev,
3471 "%s failed: Send request is malformed or adapter failover pending. (rc=%d)\n",
3472 func, rc);
3473 break;
3474 case H_CLOSED:
3475 dev_warn_ratelimited(dev,
3476 "%s failed: Backing queue closed. Adapter is down or failover pending. (rc=%d)\n",
3477 func, rc);
3478 break;
3479 default:
3480 dev_err_ratelimited(dev, "%s failed: (rc=%d)\n", func, rc);
3481 break;
3482 }
3483}
3484
3485static int send_subcrq(struct ibmvnic_adapter *adapter, u64 remote_handle,
3486 union sub_crq *sub_crq)
3487{
3488 unsigned int ua = adapter->vdev->unit_address;
3489 struct device *dev = &adapter->vdev->dev;
3490 u64 *u64_crq = (u64 *)sub_crq;
3491 int rc;
3492
3493 netdev_dbg(adapter->netdev,
3494 "Sending sCRQ %016lx: %016lx %016lx %016lx %016lx\n",
3495 (unsigned long int)cpu_to_be64(remote_handle),
3496 (unsigned long int)cpu_to_be64(u64_crq[0]),
3497 (unsigned long int)cpu_to_be64(u64_crq[1]),
3498 (unsigned long int)cpu_to_be64(u64_crq[2]),
3499 (unsigned long int)cpu_to_be64(u64_crq[3]));
3500
3501 /* Make sure the hypervisor sees the complete request */
3502 mb();
3503
3504 rc = plpar_hcall_norets(H_SEND_SUB_CRQ, ua,
3505 cpu_to_be64(remote_handle),
3506 cpu_to_be64(u64_crq[0]),
3507 cpu_to_be64(u64_crq[1]),
3508 cpu_to_be64(u64_crq[2]),
3509 cpu_to_be64(u64_crq[3]));
3510
3511 if (rc)
3512 print_subcrq_error(dev, rc, __func__);
3513
3514 return rc;
3515}
3516
3517static int send_subcrq_indirect(struct ibmvnic_adapter *adapter,
3518 u64 remote_handle, u64 ioba, u64 num_entries)
3519{
3520 unsigned int ua = adapter->vdev->unit_address;
3521 struct device *dev = &adapter->vdev->dev;
3522 int rc;
3523
3524 /* Make sure the hypervisor sees the complete request */
3525 mb();
3526 rc = plpar_hcall_norets(H_SEND_SUB_CRQ_INDIRECT, ua,
3527 cpu_to_be64(remote_handle),
3528 ioba, num_entries);
3529
3530 if (rc)
3531 print_subcrq_error(dev, rc, __func__);
3532
3533 return rc;
3534}
3535
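/* Post a single CRQ message to the hypervisor with H_SEND_CRQ. Only
 * the INIT command may be sent while the CRQ is inactive; an H_CLOSED
 * return triggers a fatal reset when a reset is already in progress.
 */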
3536static int ibmvnic_send_crq(struct ibmvnic_adapter *adapter,
3537 union ibmvnic_crq *crq)
3538{
3539 unsigned int ua = adapter->vdev->unit_address;
3540 struct device *dev = &adapter->vdev->dev;
3541 u64 *u64_crq = (u64 *)crq;
3542 int rc;
3543
3544 netdev_dbg(adapter->netdev, "Sending CRQ: %016lx %016lx\n",
3545 (unsigned long int)cpu_to_be64(u64_crq[0]),
3546 (unsigned long int)cpu_to_be64(u64_crq[1]));
3547
3548 if (!adapter->crq.active &&
3549 crq->generic.first != IBMVNIC_CRQ_INIT_CMD) {
3550 dev_warn(dev, "Invalid request detected while CRQ is inactive, possible device state change during reset\n");
3551 return -EINVAL;
3552 }
3553
3554 /* Make sure the hypervisor sees the complete request */
3555 mb();
3556
3557 rc = plpar_hcall_norets(H_SEND_CRQ, ua,
3558 cpu_to_be64(u64_crq[0]),
3559 cpu_to_be64(u64_crq[1]));
3560
3561 if (rc) {
3562 if (rc == H_CLOSED) {
3563 dev_warn(dev, "CRQ Queue closed\n");
3564 if (test_bit(0, &adapter->resetting))
3565 ibmvnic_reset(adapter, VNIC_RESET_FATAL);
3566 }
3567
3568 dev_warn(dev, "Send error (rc=%d)\n", rc);
3569 }
3570
3571 return rc;
3572}
3573
3574static int ibmvnic_send_crq_init(struct ibmvnic_adapter *adapter)
3575{
3576 union ibmvnic_crq crq;
3577
3578 memset(&crq, 0, sizeof(crq));
3579 crq.generic.first = IBMVNIC_CRQ_INIT_CMD;
3580 crq.generic.cmd = IBMVNIC_CRQ_INIT;
3581 netdev_dbg(adapter->netdev, "Sending CRQ init\n");
3582
3583 return ibmvnic_send_crq(adapter, &crq);
3584}
3585
3586static int send_version_xchg(struct ibmvnic_adapter *adapter)
3587{
3588 union ibmvnic_crq crq;
3589
3590 memset(&crq, 0, sizeof(crq));
3591 crq.version_exchange.first = IBMVNIC_CRQ_CMD;
3592 crq.version_exchange.cmd = VERSION_EXCHANGE;
3593 crq.version_exchange.version = cpu_to_be16(ibmvnic_version);
3594
3595 return ibmvnic_send_crq(adapter, &crq);
3596}
3597
3598struct vnic_login_client_data {
3599 u8 type;
3600 __be16 len;
3601 char name[];
3602} __packed;
3603
3604static int vnic_client_data_len(struct ibmvnic_adapter *adapter)
3605{
3606 int len;
3607
3608 /* Calculate the amount of buffer space needed for the
3609 * vnic client data in the login buffer. There are four entries,
3610 * OS name, LPAR name, device name, and a null last entry.
3611 */
3612 len = 4 * sizeof(struct vnic_login_client_data);
3613 len += 6; /* "Linux" plus NULL */
3614 len += strlen(utsname()->nodename) + 1;
3615 len += strlen(adapter->netdev->name) + 1;
3616
3617 return len;
3618}
3619
3620static void vnic_add_client_data(struct ibmvnic_adapter *adapter,
3621 struct vnic_login_client_data *vlcd)
3622{
3623 const char *os_name = "Linux";
3624 int len;
3625
3626 /* Type 1 - LPAR OS */
3627 vlcd->type = 1;
3628 len = strlen(os_name) + 1;
3629 vlcd->len = cpu_to_be16(len);
3630 strncpy(vlcd->name, os_name, len);
3631 vlcd = (struct vnic_login_client_data *)(vlcd->name + len);
3632
3633 /* Type 2 - LPAR name */
3634 vlcd->type = 2;
3635 len = strlen(utsname()->nodename) + 1;
3636 vlcd->len = cpu_to_be16(len);
3637 strncpy(vlcd->name, utsname()->nodename, len);
3638 vlcd = (struct vnic_login_client_data *)(vlcd->name + len);
3639
3640 /* Type 3 - device name */
3641 vlcd->type = 3;
3642 len = strlen(adapter->netdev->name) + 1;
3643 vlcd->len = cpu_to_be16(len);
3644 strncpy(vlcd->name, adapter->netdev->name, len);
3645}
3646
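/* Build and send the LOGIN CRQ. The login buffer carries the sub-CRQ
 * handles for all tx/rx queues plus client data (OS, LPAR and netdev
 * names); a response buffer is DMA-mapped for the server to fill in.
 */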
3647static int send_login(struct ibmvnic_adapter *adapter)
3648{
3649 struct ibmvnic_login_rsp_buffer *login_rsp_buffer;
3650 struct ibmvnic_login_buffer *login_buffer;
3651 struct device *dev = &adapter->vdev->dev;
3652 dma_addr_t rsp_buffer_token;
3653 dma_addr_t buffer_token;
3654 size_t rsp_buffer_size;
3655 union ibmvnic_crq crq;
3656 size_t buffer_size;
3657 __be64 *tx_list_p;
3658 __be64 *rx_list_p;
3659 int client_data_len;
3660 struct vnic_login_client_data *vlcd;
3661 int i;
3662
3663 if (!adapter->tx_scrq || !adapter->rx_scrq) {
3664 netdev_err(adapter->netdev,
3665 "RX or TX queues are not allocated, device login failed\n");
3666 return -1;
3667 }
3668
3669 release_login_rsp_buffer(adapter);
3670 client_data_len = vnic_client_data_len(adapter);
3671
3672 buffer_size =
3673 sizeof(struct ibmvnic_login_buffer) +
3674 sizeof(u64) * (adapter->req_tx_queues + adapter->req_rx_queues) +
3675 client_data_len;
3676
3677 login_buffer = kzalloc(buffer_size, GFP_ATOMIC);
3678 if (!login_buffer)
3679 goto buf_alloc_failed;
3680
3681 buffer_token = dma_map_single(dev, login_buffer, buffer_size,
3682 DMA_TO_DEVICE);
3683 if (dma_mapping_error(dev, buffer_token)) {
3684 dev_err(dev, "Couldn't map login buffer\n");
3685 goto buf_map_failed;
3686 }
3687
3688 rsp_buffer_size = sizeof(struct ibmvnic_login_rsp_buffer) +
3689 sizeof(u64) * adapter->req_tx_queues +
3690 sizeof(u64) * adapter->req_rx_queues +
3691 sizeof(u64) * adapter->req_rx_queues +
3692 sizeof(u8) * IBMVNIC_TX_DESC_VERSIONS;
3693
3694 login_rsp_buffer = kmalloc(rsp_buffer_size, GFP_ATOMIC);
3695 if (!login_rsp_buffer)
3696 goto buf_rsp_alloc_failed;
3697
3698 rsp_buffer_token = dma_map_single(dev, login_rsp_buffer,
3699 rsp_buffer_size, DMA_FROM_DEVICE);
3700 if (dma_mapping_error(dev, rsp_buffer_token)) {
3701 dev_err(dev, "Couldn't map login rsp buffer\n");
3702 goto buf_rsp_map_failed;
3703 }
3704
3705 adapter->login_buf = login_buffer;
3706 adapter->login_buf_token = buffer_token;
3707 adapter->login_buf_sz = buffer_size;
3708 adapter->login_rsp_buf = login_rsp_buffer;
3709 adapter->login_rsp_buf_token = rsp_buffer_token;
3710 adapter->login_rsp_buf_sz = rsp_buffer_size;
3711
3712 login_buffer->len = cpu_to_be32(buffer_size);
3713 login_buffer->version = cpu_to_be32(INITIAL_VERSION_LB);
3714 login_buffer->num_txcomp_subcrqs = cpu_to_be32(adapter->req_tx_queues);
3715 login_buffer->off_txcomp_subcrqs =
3716 cpu_to_be32(sizeof(struct ibmvnic_login_buffer));
3717 login_buffer->num_rxcomp_subcrqs = cpu_to_be32(adapter->req_rx_queues);
3718 login_buffer->off_rxcomp_subcrqs =
3719 cpu_to_be32(sizeof(struct ibmvnic_login_buffer) +
3720 sizeof(u64) * adapter->req_tx_queues);
3721 login_buffer->login_rsp_ioba = cpu_to_be32(rsp_buffer_token);
3722 login_buffer->login_rsp_len = cpu_to_be32(rsp_buffer_size);
3723
3724 tx_list_p = (__be64 *)((char *)login_buffer +
3725 sizeof(struct ibmvnic_login_buffer));
3726 rx_list_p = (__be64 *)((char *)login_buffer +
3727 sizeof(struct ibmvnic_login_buffer) +
3728 sizeof(u64) * adapter->req_tx_queues);
3729
3730 for (i = 0; i < adapter->req_tx_queues; i++) {
3731 if (adapter->tx_scrq[i]) {
3732 tx_list_p[i] = cpu_to_be64(adapter->tx_scrq[i]->
3733 crq_num);
3734 }
3735 }
3736
3737 for (i = 0; i < adapter->req_rx_queues; i++) {
3738 if (adapter->rx_scrq[i]) {
3739 rx_list_p[i] = cpu_to_be64(adapter->rx_scrq[i]->
3740 crq_num);
3741 }
3742 }
3743
3744 /* Insert vNIC login client data */
3745 vlcd = (struct vnic_login_client_data *)
3746 ((char *)rx_list_p + (sizeof(u64) * adapter->req_rx_queues));
3747 login_buffer->client_data_offset =
3748 cpu_to_be32((char *)vlcd - (char *)login_buffer);
3749 login_buffer->client_data_len = cpu_to_be32(client_data_len);
3750
3751 vnic_add_client_data(adapter, vlcd);
3752
3753 netdev_dbg(adapter->netdev, "Login Buffer:\n");
3754 for (i = 0; i < (adapter->login_buf_sz - 1) / 8 + 1; i++) {
3755 netdev_dbg(adapter->netdev, "%016lx\n",
3756 ((unsigned long int *)(adapter->login_buf))[i]);
3757 }
3758
3759 memset(&crq, 0, sizeof(crq));
3760 crq.login.first = IBMVNIC_CRQ_CMD;
3761 crq.login.cmd = LOGIN;
3762 crq.login.ioba = cpu_to_be32(buffer_token);
3763 crq.login.len = cpu_to_be32(buffer_size);
3764 ibmvnic_send_crq(adapter, &crq);
3765
3766 return 0;
3767
3768buf_rsp_map_failed:
3769 kfree(login_rsp_buffer);
3770buf_rsp_alloc_failed:
3771 dma_unmap_single(dev, buffer_token, buffer_size, DMA_TO_DEVICE);
3772buf_map_failed:
3773 kfree(login_buffer);
3774buf_alloc_failed:
3775 return -1;
3776}
3777
3778static int send_request_map(struct ibmvnic_adapter *adapter, dma_addr_t addr,
3779 u32 len, u8 map_id)
3780{
3781 union ibmvnic_crq crq;
3782
3783 memset(&crq, 0, sizeof(crq));
3784 crq.request_map.first = IBMVNIC_CRQ_CMD;
3785 crq.request_map.cmd = REQUEST_MAP;
3786 crq.request_map.map_id = map_id;
3787 crq.request_map.ioba = cpu_to_be32(addr);
3788 crq.request_map.len = cpu_to_be32(len);
3789 return ibmvnic_send_crq(adapter, &crq);
3790}
3791
3792static int send_request_unmap(struct ibmvnic_adapter *adapter, u8 map_id)
3793{
3794 union ibmvnic_crq crq;
3795
3796 memset(&crq, 0, sizeof(crq));
3797 crq.request_unmap.first = IBMVNIC_CRQ_CMD;
3798 crq.request_unmap.cmd = REQUEST_UNMAP;
3799 crq.request_unmap.map_id = map_id;
3800 return ibmvnic_send_crq(adapter, &crq);
3801}
3802
3803static void send_map_query(struct ibmvnic_adapter *adapter)
3804{
3805 union ibmvnic_crq crq;
3806
3807 memset(&crq, 0, sizeof(crq));
3808 crq.query_map.first = IBMVNIC_CRQ_CMD;
3809 crq.query_map.cmd = QUERY_MAP;
3810 ibmvnic_send_crq(adapter, &crq);
3811}
3812
3813/* Send a series of CRQs requesting various capabilities of the VNIC server */
3814static void send_cap_queries(struct ibmvnic_adapter *adapter)
3815{
3816 union ibmvnic_crq crq;
3817 int cap_reqs;
3818
3819 /* We send out 25 QUERY_CAPABILITY CRQs below. Initialize this count
3820 * upfront. When the tasklet receives a response to all of these, it
3821 * can send out the next protocol messaage (REQUEST_CAPABILITY).
3822	 * can send out the next protocol message (REQUEST_CAPABILITY).
3823 cap_reqs = 25;
3824
3825 atomic_set(&adapter->running_cap_crqs, cap_reqs);
3826
3827 memset(&crq, 0, sizeof(crq));
3828 crq.query_capability.first = IBMVNIC_CRQ_CMD;
3829 crq.query_capability.cmd = QUERY_CAPABILITY;
3830
3831 crq.query_capability.capability = cpu_to_be16(MIN_TX_QUEUES);
3832 ibmvnic_send_crq(adapter, &crq);
3833 cap_reqs--;
3834
3835 crq.query_capability.capability = cpu_to_be16(MIN_RX_QUEUES);
3836 ibmvnic_send_crq(adapter, &crq);
3837 cap_reqs--;
3838
3839 crq.query_capability.capability = cpu_to_be16(MIN_RX_ADD_QUEUES);
3840 ibmvnic_send_crq(adapter, &crq);
3841 cap_reqs--;
3842
3843 crq.query_capability.capability = cpu_to_be16(MAX_TX_QUEUES);
3844 ibmvnic_send_crq(adapter, &crq);
3845 cap_reqs--;
3846
3847 crq.query_capability.capability = cpu_to_be16(MAX_RX_QUEUES);
3848 ibmvnic_send_crq(adapter, &crq);
3849 cap_reqs--;
3850
3851 crq.query_capability.capability = cpu_to_be16(MAX_RX_ADD_QUEUES);
3852 ibmvnic_send_crq(adapter, &crq);
3853 cap_reqs--;
3854
3855 crq.query_capability.capability =
3856 cpu_to_be16(MIN_TX_ENTRIES_PER_SUBCRQ);
3857 ibmvnic_send_crq(adapter, &crq);
3858 cap_reqs--;
3859
3860 crq.query_capability.capability =
3861 cpu_to_be16(MIN_RX_ADD_ENTRIES_PER_SUBCRQ);
3862 ibmvnic_send_crq(adapter, &crq);
3863 cap_reqs--;
3864
3865 crq.query_capability.capability =
3866 cpu_to_be16(MAX_TX_ENTRIES_PER_SUBCRQ);
3867 ibmvnic_send_crq(adapter, &crq);
3868 cap_reqs--;
3869
3870 crq.query_capability.capability =
3871 cpu_to_be16(MAX_RX_ADD_ENTRIES_PER_SUBCRQ);
3872 ibmvnic_send_crq(adapter, &crq);
3873 cap_reqs--;
3874
3875 crq.query_capability.capability = cpu_to_be16(TCP_IP_OFFLOAD);
3876 ibmvnic_send_crq(adapter, &crq);
3877 cap_reqs--;
3878
3879 crq.query_capability.capability = cpu_to_be16(PROMISC_SUPPORTED);
3880 ibmvnic_send_crq(adapter, &crq);
3881 cap_reqs--;
3882
3883 crq.query_capability.capability = cpu_to_be16(MIN_MTU);
3884 ibmvnic_send_crq(adapter, &crq);
3885 cap_reqs--;
3886
3887 crq.query_capability.capability = cpu_to_be16(MAX_MTU);
3888 ibmvnic_send_crq(adapter, &crq);
3889 cap_reqs--;
3890
3891 crq.query_capability.capability = cpu_to_be16(MAX_MULTICAST_FILTERS);
3892 ibmvnic_send_crq(adapter, &crq);
3893 cap_reqs--;
3894
3895 crq.query_capability.capability = cpu_to_be16(VLAN_HEADER_INSERTION);
3896 ibmvnic_send_crq(adapter, &crq);
3897 cap_reqs--;
3898
3899 crq.query_capability.capability = cpu_to_be16(RX_VLAN_HEADER_INSERTION);
3900 ibmvnic_send_crq(adapter, &crq);
3901 cap_reqs--;
3902
3903 crq.query_capability.capability = cpu_to_be16(MAX_TX_SG_ENTRIES);
3904 ibmvnic_send_crq(adapter, &crq);
3905 cap_reqs--;
3906
3907 crq.query_capability.capability = cpu_to_be16(RX_SG_SUPPORTED);
3908 ibmvnic_send_crq(adapter, &crq);
3909 cap_reqs--;
3910
3911 crq.query_capability.capability = cpu_to_be16(OPT_TX_COMP_SUB_QUEUES);
3912 ibmvnic_send_crq(adapter, &crq);
3913 cap_reqs--;
3914
3915 crq.query_capability.capability = cpu_to_be16(OPT_RX_COMP_QUEUES);
3916 ibmvnic_send_crq(adapter, &crq);
3917 cap_reqs--;
3918
3919 crq.query_capability.capability =
3920 cpu_to_be16(OPT_RX_BUFADD_Q_PER_RX_COMP_Q);
3921 ibmvnic_send_crq(adapter, &crq);
3922 cap_reqs--;
3923
3924 crq.query_capability.capability =
3925 cpu_to_be16(OPT_TX_ENTRIES_PER_SUBCRQ);
3926 ibmvnic_send_crq(adapter, &crq);
3927 cap_reqs--;
3928
3929 crq.query_capability.capability =
3930 cpu_to_be16(OPT_RXBA_ENTRIES_PER_SUBCRQ);
3931 ibmvnic_send_crq(adapter, &crq);
3932 cap_reqs--;
3933
3934 crq.query_capability.capability = cpu_to_be16(TX_RX_DESC_REQ);
3935
3936 ibmvnic_send_crq(adapter, &crq);
3937 cap_reqs--;
3938
3939 /* Keep at end to catch any discrepancy between expected and actual
3940 * CRQs sent.
3941 */
3942 WARN_ON(cap_reqs != 0);
3943}
3944
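/* Record the VPD buffer length reported by the server and wake up the
 * waiter on fw_done.
 */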
3945static void handle_vpd_size_rsp(union ibmvnic_crq *crq,
3946 struct ibmvnic_adapter *adapter)
3947{
3948 struct device *dev = &adapter->vdev->dev;
3949
3950 if (crq->get_vpd_size_rsp.rc.code) {
3951 dev_err(dev, "Error retrieving VPD size, rc=%x\n",
3952 crq->get_vpd_size_rsp.rc.code);
3953 complete(&adapter->fw_done);
3954 return;
3955 }
3956
3957 adapter->vpd->len = be64_to_cpu(crq->get_vpd_size_rsp.len);
3958 complete(&adapter->fw_done);
3959}
3960
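/* Parse the VPD response: locate the firmware level that follows the
 * ASCII "RM" keyword and cache it in adapter->fw_version (or "N/A").
 */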
3961static void handle_vpd_rsp(union ibmvnic_crq *crq,
3962 struct ibmvnic_adapter *adapter)
3963{
3964 struct device *dev = &adapter->vdev->dev;
3965 unsigned char *substr = NULL;
3966 u8 fw_level_len = 0;
3967
3968 memset(adapter->fw_version, 0, 32);
3969
3970 dma_unmap_single(dev, adapter->vpd->dma_addr, adapter->vpd->len,
3971 DMA_FROM_DEVICE);
3972
3973 if (crq->get_vpd_rsp.rc.code) {
3974 dev_err(dev, "Error retrieving VPD from device, rc=%x\n",
3975 crq->get_vpd_rsp.rc.code);
3976 goto complete;
3977 }
3978
3979 /* get the position of the firmware version info
3980 * located after the ASCII 'RM' substring in the buffer
3981 */
3982 substr = strnstr(adapter->vpd->buff, "RM", adapter->vpd->len);
3983 if (!substr) {
3984 dev_info(dev, "Warning - No FW level has been provided in the VPD buffer by the VIOS Server\n");
3985 goto complete;
3986 }
3987
3988 /* get length of firmware level ASCII substring */
3989 if ((substr + 2) < (adapter->vpd->buff + adapter->vpd->len)) {
3990 fw_level_len = *(substr + 2);
3991 } else {
3992		dev_info(dev, "FW substr length field lies beyond end of VPD buffer\n");
3993 goto complete;
3994 }
3995
3996 /* copy firmware version string from vpd into adapter */
3997 if ((substr + 3 + fw_level_len) <
3998 (adapter->vpd->buff + adapter->vpd->len)) {
3999 strncpy((char *)adapter->fw_version, substr + 3, fw_level_len);
4000 } else {
4001		dev_info(dev, "FW substr extends beyond end of VPD buffer\n");
4002 }
4003
4004complete:
4005 if (adapter->fw_version[0] == '\0')
4006 strncpy((char *)adapter->fw_version, "N/A", 3 * sizeof(char));
4007 complete(&adapter->fw_done);
4008}
4009
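/* Examine the checksum/TSO capabilities reported by the server, build
 * the IP offload control buffer, update the netdev feature flags to
 * match, and send CONTROL_IP_OFFLOAD to enable the selected offloads.
 */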
4010static void handle_query_ip_offload_rsp(struct ibmvnic_adapter *adapter)
4011{
4012 struct device *dev = &adapter->vdev->dev;
4013 struct ibmvnic_query_ip_offload_buffer *buf = &adapter->ip_offload_buf;
4014 netdev_features_t old_hw_features = 0;
4015 union ibmvnic_crq crq;
4016 int i;
4017
4018 dma_unmap_single(dev, adapter->ip_offload_tok,
4019 sizeof(adapter->ip_offload_buf), DMA_FROM_DEVICE);
4020
4021 netdev_dbg(adapter->netdev, "Query IP Offload Buffer:\n");
4022 for (i = 0; i < (sizeof(adapter->ip_offload_buf) - 1) / 8 + 1; i++)
4023 netdev_dbg(adapter->netdev, "%016lx\n",
4024 ((unsigned long int *)(buf))[i]);
4025
4026 netdev_dbg(adapter->netdev, "ipv4_chksum = %d\n", buf->ipv4_chksum);
4027 netdev_dbg(adapter->netdev, "ipv6_chksum = %d\n", buf->ipv6_chksum);
4028 netdev_dbg(adapter->netdev, "tcp_ipv4_chksum = %d\n",
4029 buf->tcp_ipv4_chksum);
4030 netdev_dbg(adapter->netdev, "tcp_ipv6_chksum = %d\n",
4031 buf->tcp_ipv6_chksum);
4032 netdev_dbg(adapter->netdev, "udp_ipv4_chksum = %d\n",
4033 buf->udp_ipv4_chksum);
4034 netdev_dbg(adapter->netdev, "udp_ipv6_chksum = %d\n",
4035 buf->udp_ipv6_chksum);
4036 netdev_dbg(adapter->netdev, "large_tx_ipv4 = %d\n",
4037 buf->large_tx_ipv4);
4038 netdev_dbg(adapter->netdev, "large_tx_ipv6 = %d\n",
4039 buf->large_tx_ipv6);
4040 netdev_dbg(adapter->netdev, "large_rx_ipv4 = %d\n",
4041 buf->large_rx_ipv4);
4042 netdev_dbg(adapter->netdev, "large_rx_ipv6 = %d\n",
4043 buf->large_rx_ipv6);
4044 netdev_dbg(adapter->netdev, "max_ipv4_hdr_sz = %d\n",
4045 buf->max_ipv4_header_size);
4046 netdev_dbg(adapter->netdev, "max_ipv6_hdr_sz = %d\n",
4047 buf->max_ipv6_header_size);
4048 netdev_dbg(adapter->netdev, "max_tcp_hdr_size = %d\n",
4049 buf->max_tcp_header_size);
4050 netdev_dbg(adapter->netdev, "max_udp_hdr_size = %d\n",
4051 buf->max_udp_header_size);
4052 netdev_dbg(adapter->netdev, "max_large_tx_size = %d\n",
4053 buf->max_large_tx_size);
4054 netdev_dbg(adapter->netdev, "max_large_rx_size = %d\n",
4055 buf->max_large_rx_size);
4056 netdev_dbg(adapter->netdev, "ipv6_ext_hdr = %d\n",
4057 buf->ipv6_extension_header);
4058 netdev_dbg(adapter->netdev, "tcp_pseudosum_req = %d\n",
4059 buf->tcp_pseudosum_req);
4060 netdev_dbg(adapter->netdev, "num_ipv6_ext_hd = %d\n",
4061 buf->num_ipv6_ext_headers);
4062 netdev_dbg(adapter->netdev, "off_ipv6_ext_hd = %d\n",
4063 buf->off_ipv6_ext_headers);
4064
4065 adapter->ip_offload_ctrl_tok =
4066 dma_map_single(dev, &adapter->ip_offload_ctrl,
4067 sizeof(adapter->ip_offload_ctrl), DMA_TO_DEVICE);
4068
4069 if (dma_mapping_error(dev, adapter->ip_offload_ctrl_tok)) {
4070 dev_err(dev, "Couldn't map ip offload control buffer\n");
4071 return;
4072 }
4073
4074 adapter->ip_offload_ctrl.len =
4075 cpu_to_be32(sizeof(adapter->ip_offload_ctrl));
4076 adapter->ip_offload_ctrl.version = cpu_to_be32(INITIAL_VERSION_IOB);
4077 adapter->ip_offload_ctrl.ipv4_chksum = buf->ipv4_chksum;
4078 adapter->ip_offload_ctrl.ipv6_chksum = buf->ipv6_chksum;
4079 adapter->ip_offload_ctrl.tcp_ipv4_chksum = buf->tcp_ipv4_chksum;
4080 adapter->ip_offload_ctrl.udp_ipv4_chksum = buf->udp_ipv4_chksum;
4081 adapter->ip_offload_ctrl.tcp_ipv6_chksum = buf->tcp_ipv6_chksum;
4082 adapter->ip_offload_ctrl.udp_ipv6_chksum = buf->udp_ipv6_chksum;
4083 adapter->ip_offload_ctrl.large_tx_ipv4 = buf->large_tx_ipv4;
4084 adapter->ip_offload_ctrl.large_tx_ipv6 = buf->large_tx_ipv6;
4085
4086 /* large_rx disabled for now, additional features needed */
4087 adapter->ip_offload_ctrl.large_rx_ipv4 = 0;
4088 adapter->ip_offload_ctrl.large_rx_ipv6 = 0;
4089
4090 if (adapter->state != VNIC_PROBING) {
4091 old_hw_features = adapter->netdev->hw_features;
4092 adapter->netdev->hw_features = 0;
4093 }
4094
4095 adapter->netdev->hw_features = NETIF_F_SG | NETIF_F_GSO | NETIF_F_GRO;
4096
4097 if (buf->tcp_ipv4_chksum || buf->udp_ipv4_chksum)
4098 adapter->netdev->hw_features |= NETIF_F_IP_CSUM;
4099
4100 if (buf->tcp_ipv6_chksum || buf->udp_ipv6_chksum)
4101 adapter->netdev->hw_features |= NETIF_F_IPV6_CSUM;
4102
4103 if ((adapter->netdev->features &
4104 (NETIF_F_IP_CSUM | NETIF_F_IPV6_CSUM)))
4105 adapter->netdev->hw_features |= NETIF_F_RXCSUM;
4106
4107 if (buf->large_tx_ipv4)
4108 adapter->netdev->hw_features |= NETIF_F_TSO;
4109 if (buf->large_tx_ipv6)
4110 adapter->netdev->hw_features |= NETIF_F_TSO6;
4111
4112 if (adapter->state == VNIC_PROBING) {
4113 adapter->netdev->features |= adapter->netdev->hw_features;
4114 } else if (old_hw_features != adapter->netdev->hw_features) {
4115 netdev_features_t tmp = 0;
4116
4117 /* disable features no longer supported */
4118 adapter->netdev->features &= adapter->netdev->hw_features;
4119 /* turn on features now supported if previously enabled */
4120 tmp = (old_hw_features ^ adapter->netdev->hw_features) &
4121 adapter->netdev->hw_features;
4122 adapter->netdev->features |=
4123 tmp & adapter->netdev->wanted_features;
4124 }
4125
4126 memset(&crq, 0, sizeof(crq));
4127 crq.control_ip_offload.first = IBMVNIC_CRQ_CMD;
4128 crq.control_ip_offload.cmd = CONTROL_IP_OFFLOAD;
4129 crq.control_ip_offload.len =
4130 cpu_to_be32(sizeof(adapter->ip_offload_ctrl));
4131 crq.control_ip_offload.ioba = cpu_to_be32(adapter->ip_offload_ctrl_tok);
4132 ibmvnic_send_crq(adapter, &crq);
4133}
4134
4135static const char *ibmvnic_fw_err_cause(u16 cause)
4136{
4137 switch (cause) {
4138 case ADAPTER_PROBLEM:
4139 return "adapter problem";
4140 case BUS_PROBLEM:
4141 return "bus problem";
4142 case FW_PROBLEM:
4143 return "firmware problem";
4144 case DD_PROBLEM:
4145 return "device driver problem";
4146 case EEH_RECOVERY:
4147 return "EEH recovery";
4148 case FW_UPDATED:
4149 return "firmware updated";
4150 case LOW_MEMORY:
4151		return "low memory";
4152 default:
4153 return "unknown";
4154 }
4155}
4156
4157static void handle_error_indication(union ibmvnic_crq *crq,
4158 struct ibmvnic_adapter *adapter)
4159{
4160 struct device *dev = &adapter->vdev->dev;
4161 u16 cause;
4162
4163 cause = be16_to_cpu(crq->error_indication.error_cause);
4164
4165 dev_warn_ratelimited(dev,
4166 "Firmware reports %serror, cause: %s. Starting recovery...\n",
4167 crq->error_indication.flags
4168 & IBMVNIC_FATAL_ERROR ? "FATAL " : "",
4169 ibmvnic_fw_err_cause(cause));
4170
4171 if (crq->error_indication.flags & IBMVNIC_FATAL_ERROR)
4172 ibmvnic_reset(adapter, VNIC_RESET_FATAL);
4173 else
4174 ibmvnic_reset(adapter, VNIC_RESET_NON_FATAL);
4175}
4176
4177static int handle_change_mac_rsp(union ibmvnic_crq *crq,
4178 struct ibmvnic_adapter *adapter)
4179{
4180 struct net_device *netdev = adapter->netdev;
4181 struct device *dev = &adapter->vdev->dev;
4182 long rc;
4183
4184 rc = crq->change_mac_addr_rsp.rc.code;
4185 if (rc) {
4186 dev_err(dev, "Error %ld in CHANGE_MAC_ADDR_RSP\n", rc);
4187 goto out;
4188 }
4189 /* crq->change_mac_addr.mac_addr is the requested one
4190 * crq->change_mac_addr_rsp.mac_addr is the returned valid one.
4191 */
4192 ether_addr_copy(netdev->dev_addr,
4193 &crq->change_mac_addr_rsp.mac_addr[0]);
4194 ether_addr_copy(adapter->mac_addr,
4195 &crq->change_mac_addr_rsp.mac_addr[0]);
4196out:
4197 complete(&adapter->fw_done);
4198 return rc;
4199}
4200
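/* Handle a REQUEST_CAPABILITY response. On PARTIALSUCCESS retry with
 * the value the server can honor (reverting to the fallback MTU for
 * REQ_MTU); once every outstanding capability request has completed,
 * query IP offload support.
 */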
4201static void handle_request_cap_rsp(union ibmvnic_crq *crq,
4202 struct ibmvnic_adapter *adapter)
4203{
4204 struct device *dev = &adapter->vdev->dev;
4205 u64 *req_value;
4206 char *name;
4207
4208 atomic_dec(&adapter->running_cap_crqs);
4209 netdev_dbg(adapter->netdev, "Outstanding request-caps: %d\n",
4210 atomic_read(&adapter->running_cap_crqs));
4211 switch (be16_to_cpu(crq->request_capability_rsp.capability)) {
4212 case REQ_TX_QUEUES:
4213 req_value = &adapter->req_tx_queues;
4214 name = "tx";
4215 break;
4216 case REQ_RX_QUEUES:
4217 req_value = &adapter->req_rx_queues;
4218 name = "rx";
4219 break;
4220 case REQ_RX_ADD_QUEUES:
4221 req_value = &adapter->req_rx_add_queues;
4222 name = "rx_add";
4223 break;
4224 case REQ_TX_ENTRIES_PER_SUBCRQ:
4225 req_value = &adapter->req_tx_entries_per_subcrq;
4226 name = "tx_entries_per_subcrq";
4227 break;
4228 case REQ_RX_ADD_ENTRIES_PER_SUBCRQ:
4229 req_value = &adapter->req_rx_add_entries_per_subcrq;
4230 name = "rx_add_entries_per_subcrq";
4231 break;
4232 case REQ_MTU:
4233 req_value = &adapter->req_mtu;
4234 name = "mtu";
4235 break;
4236 case PROMISC_REQUESTED:
4237 req_value = &adapter->promisc;
4238 name = "promisc";
4239 break;
4240 default:
4241 dev_err(dev, "Got invalid cap request rsp %d\n",
4242 crq->request_capability.capability);
4243 return;
4244 }
4245
4246 switch (crq->request_capability_rsp.rc.code) {
4247 case SUCCESS:
4248 break;
4249 case PARTIALSUCCESS:
4250 dev_info(dev, "req=%lld, rsp=%ld in %s queue, retrying.\n",
4251 *req_value,
4252 (long int)be64_to_cpu(crq->request_capability_rsp.
4253 number), name);
4254
4255 if (be16_to_cpu(crq->request_capability_rsp.capability) ==
4256 REQ_MTU) {
4257 pr_err("mtu of %llu is not supported. Reverting.\n",
4258 *req_value);
4259 *req_value = adapter->fallback.mtu;
4260 } else {
4261 *req_value =
4262 be64_to_cpu(crq->request_capability_rsp.number);
4263 }
4264
4265 ibmvnic_send_req_caps(adapter, 1);
4266 return;
4267 default:
4268 dev_err(dev, "Error %d in request cap rsp\n",
4269 crq->request_capability_rsp.rc.code);
4270 return;
4271 }
4272
4273 /* Done receiving requested capabilities, query IP offload support */
4274 if (atomic_read(&adapter->running_cap_crqs) == 0) {
4275 union ibmvnic_crq newcrq;
4276 int buf_sz = sizeof(struct ibmvnic_query_ip_offload_buffer);
4277 struct ibmvnic_query_ip_offload_buffer *ip_offload_buf =
4278 &adapter->ip_offload_buf;
4279
4280 adapter->wait_capability = false;
4281 adapter->ip_offload_tok = dma_map_single(dev, ip_offload_buf,
4282 buf_sz,
4283 DMA_FROM_DEVICE);
4284
4285 if (dma_mapping_error(dev, adapter->ip_offload_tok)) {
4286 if (!firmware_has_feature(FW_FEATURE_CMO))
4287 dev_err(dev, "Couldn't map offload buffer\n");
4288 return;
4289 }
4290
4291 memset(&newcrq, 0, sizeof(newcrq));
4292 newcrq.query_ip_offload.first = IBMVNIC_CRQ_CMD;
4293 newcrq.query_ip_offload.cmd = QUERY_IP_OFFLOAD;
4294 newcrq.query_ip_offload.len = cpu_to_be32(buf_sz);
4295 newcrq.query_ip_offload.ioba =
4296 cpu_to_be32(adapter->ip_offload_tok);
4297
4298 ibmvnic_send_crq(adapter, &newcrq);
4299 }
4300}
4301
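/* Handle the LOGIN response: bail out early on a non-zero return code
 * or a pending failover, otherwise sanity-check the response against
 * the login request and wake the initialization waiter.
 */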
4302static int handle_login_rsp(union ibmvnic_crq *login_rsp_crq,
4303 struct ibmvnic_adapter *adapter)
4304{
4305 struct device *dev = &adapter->vdev->dev;
4306 struct net_device *netdev = adapter->netdev;
4307 struct ibmvnic_login_rsp_buffer *login_rsp = adapter->login_rsp_buf;
4308 struct ibmvnic_login_buffer *login = adapter->login_buf;
4309 int i;
4310
4311 /* If the number of queues requested can't be allocated by the
4312 * server, the login response will return with code 1. We will need
4313 * to resend the login buffer with fewer queues requested.
4314 */
4315 if (login_rsp_crq->generic.rc.code) {
4316 adapter->init_done_rc = login_rsp_crq->generic.rc.code;
4317 complete(&adapter->init_done);
4318 return 0;
4319 }
4320
4321 if (adapter->failover_pending) {
4322 adapter->init_done_rc = -EAGAIN;
4323 netdev_dbg(netdev, "Failover pending, ignoring login response\n");
4324 complete(&adapter->init_done);
4325 /* login response buffer will be released on reset */
4326 return 0;
4327 }
4328
4329 netdev->mtu = adapter->req_mtu - ETH_HLEN;
4330
4331 netdev_dbg(adapter->netdev, "Login Response Buffer:\n");
4332 for (i = 0; i < (adapter->login_rsp_buf_sz - 1) / 8 + 1; i++) {
4333 netdev_dbg(adapter->netdev, "%016lx\n",
4334 ((unsigned long int *)(adapter->login_rsp_buf))[i]);
4335 }
4336
4337 /* Sanity checks */
4338 if (login->num_txcomp_subcrqs != login_rsp->num_txsubm_subcrqs ||
4339 (be32_to_cpu(login->num_rxcomp_subcrqs) *
4340 adapter->req_rx_add_queues !=
4341 be32_to_cpu(login_rsp->num_rxadd_subcrqs))) {
4342 dev_err(dev, "FATAL: Inconsistent login and login rsp\n");
4343 ibmvnic_remove(adapter->vdev);
4344 return -EIO;
4345 }
4346 release_login_buffer(adapter);
4347 complete(&adapter->init_done);
4348
4349 return 0;
4350}
4351
4352static void handle_request_unmap_rsp(union ibmvnic_crq *crq,
4353 struct ibmvnic_adapter *adapter)
4354{
4355 struct device *dev = &adapter->vdev->dev;
4356 long rc;
4357
4358 rc = crq->request_unmap_rsp.rc.code;
4359 if (rc)
4360 dev_err(dev, "Error %ld in REQUEST_UNMAP_RSP\n", rc);
4361}
4362
4363static void handle_query_map_rsp(union ibmvnic_crq *crq,
4364 struct ibmvnic_adapter *adapter)
4365{
4366 struct net_device *netdev = adapter->netdev;
4367 struct device *dev = &adapter->vdev->dev;
4368 long rc;
4369
4370 rc = crq->query_map_rsp.rc.code;
4371 if (rc) {
4372 dev_err(dev, "Error %ld in QUERY_MAP_RSP\n", rc);
4373 return;
4374 }
4375 netdev_dbg(netdev, "page_size = %d\ntot_pages = %d\nfree_pages = %d\n",
4376 crq->query_map_rsp.page_size, crq->query_map_rsp.tot_pages,
4377 crq->query_map_rsp.free_pages);
4378}
4379
4380static void handle_query_cap_rsp(union ibmvnic_crq *crq,
4381 struct ibmvnic_adapter *adapter)
4382{
4383 struct net_device *netdev = adapter->netdev;
4384 struct device *dev = &adapter->vdev->dev;
4385 long rc;
4386
4387 atomic_dec(&adapter->running_cap_crqs);
4388 netdev_dbg(netdev, "Outstanding queries: %d\n",
4389 atomic_read(&adapter->running_cap_crqs));
4390 rc = crq->query_capability.rc.code;
4391 if (rc) {
4392 dev_err(dev, "Error %ld in QUERY_CAP_RSP\n", rc);
4393 goto out;
4394 }
4395
4396 switch (be16_to_cpu(crq->query_capability.capability)) {
4397 case MIN_TX_QUEUES:
4398 adapter->min_tx_queues =
4399 be64_to_cpu(crq->query_capability.number);
4400 netdev_dbg(netdev, "min_tx_queues = %lld\n",
4401 adapter->min_tx_queues);
4402 break;
4403 case MIN_RX_QUEUES:
4404 adapter->min_rx_queues =
4405 be64_to_cpu(crq->query_capability.number);
4406 netdev_dbg(netdev, "min_rx_queues = %lld\n",
4407 adapter->min_rx_queues);
4408 break;
4409 case MIN_RX_ADD_QUEUES:
4410 adapter->min_rx_add_queues =
4411 be64_to_cpu(crq->query_capability.number);
4412 netdev_dbg(netdev, "min_rx_add_queues = %lld\n",
4413 adapter->min_rx_add_queues);
4414 break;
4415 case MAX_TX_QUEUES:
4416 adapter->max_tx_queues =
4417 be64_to_cpu(crq->query_capability.number);
4418 netdev_dbg(netdev, "max_tx_queues = %lld\n",
4419 adapter->max_tx_queues);
4420 break;
4421 case MAX_RX_QUEUES:
4422 adapter->max_rx_queues =
4423 be64_to_cpu(crq->query_capability.number);
4424 netdev_dbg(netdev, "max_rx_queues = %lld\n",
4425 adapter->max_rx_queues);
4426 break;
4427 case MAX_RX_ADD_QUEUES:
4428 adapter->max_rx_add_queues =
4429 be64_to_cpu(crq->query_capability.number);
4430 netdev_dbg(netdev, "max_rx_add_queues = %lld\n",
4431 adapter->max_rx_add_queues);
4432 break;
4433 case MIN_TX_ENTRIES_PER_SUBCRQ:
4434 adapter->min_tx_entries_per_subcrq =
4435 be64_to_cpu(crq->query_capability.number);
4436 netdev_dbg(netdev, "min_tx_entries_per_subcrq = %lld\n",
4437 adapter->min_tx_entries_per_subcrq);
4438 break;
4439 case MIN_RX_ADD_ENTRIES_PER_SUBCRQ:
4440 adapter->min_rx_add_entries_per_subcrq =
4441 be64_to_cpu(crq->query_capability.number);
4442 netdev_dbg(netdev, "min_rx_add_entrs_per_subcrq = %lld\n",
4443 adapter->min_rx_add_entries_per_subcrq);
4444 break;
4445 case MAX_TX_ENTRIES_PER_SUBCRQ:
4446 adapter->max_tx_entries_per_subcrq =
4447 be64_to_cpu(crq->query_capability.number);
4448 netdev_dbg(netdev, "max_tx_entries_per_subcrq = %lld\n",
4449 adapter->max_tx_entries_per_subcrq);
4450 break;
4451 case MAX_RX_ADD_ENTRIES_PER_SUBCRQ:
4452 adapter->max_rx_add_entries_per_subcrq =
4453 be64_to_cpu(crq->query_capability.number);
4454 netdev_dbg(netdev, "max_rx_add_entrs_per_subcrq = %lld\n",
4455 adapter->max_rx_add_entries_per_subcrq);
4456 break;
4457 case TCP_IP_OFFLOAD:
4458 adapter->tcp_ip_offload =
4459 be64_to_cpu(crq->query_capability.number);
4460 netdev_dbg(netdev, "tcp_ip_offload = %lld\n",
4461 adapter->tcp_ip_offload);
4462 break;
4463 case PROMISC_SUPPORTED:
4464 adapter->promisc_supported =
4465 be64_to_cpu(crq->query_capability.number);
4466 netdev_dbg(netdev, "promisc_supported = %lld\n",
4467 adapter->promisc_supported);
4468 break;
4469 case MIN_MTU:
4470 adapter->min_mtu = be64_to_cpu(crq->query_capability.number);
4471 netdev->min_mtu = adapter->min_mtu - ETH_HLEN;
4472 netdev_dbg(netdev, "min_mtu = %lld\n", adapter->min_mtu);
4473 break;
4474 case MAX_MTU:
4475 adapter->max_mtu = be64_to_cpu(crq->query_capability.number);
4476 netdev->max_mtu = adapter->max_mtu - ETH_HLEN;
4477 netdev_dbg(netdev, "max_mtu = %lld\n", adapter->max_mtu);
4478 break;
4479 case MAX_MULTICAST_FILTERS:
4480 adapter->max_multicast_filters =
4481 be64_to_cpu(crq->query_capability.number);
4482 netdev_dbg(netdev, "max_multicast_filters = %lld\n",
4483 adapter->max_multicast_filters);
4484 break;
4485 case VLAN_HEADER_INSERTION:
4486 adapter->vlan_header_insertion =
4487 be64_to_cpu(crq->query_capability.number);
4488 if (adapter->vlan_header_insertion)
4489 netdev->features |= NETIF_F_HW_VLAN_STAG_TX;
4490 netdev_dbg(netdev, "vlan_header_insertion = %lld\n",
4491 adapter->vlan_header_insertion);
4492 break;
4493 case RX_VLAN_HEADER_INSERTION:
4494 adapter->rx_vlan_header_insertion =
4495 be64_to_cpu(crq->query_capability.number);
4496 netdev_dbg(netdev, "rx_vlan_header_insertion = %lld\n",
4497 adapter->rx_vlan_header_insertion);
4498 break;
4499 case MAX_TX_SG_ENTRIES:
4500 adapter->max_tx_sg_entries =
4501 be64_to_cpu(crq->query_capability.number);
4502 netdev_dbg(netdev, "max_tx_sg_entries = %lld\n",
4503 adapter->max_tx_sg_entries);
4504 break;
4505 case RX_SG_SUPPORTED:
4506 adapter->rx_sg_supported =
4507 be64_to_cpu(crq->query_capability.number);
4508 netdev_dbg(netdev, "rx_sg_supported = %lld\n",
4509 adapter->rx_sg_supported);
4510 break;
4511 case OPT_TX_COMP_SUB_QUEUES:
4512 adapter->opt_tx_comp_sub_queues =
4513 be64_to_cpu(crq->query_capability.number);
4514 netdev_dbg(netdev, "opt_tx_comp_sub_queues = %lld\n",
4515 adapter->opt_tx_comp_sub_queues);
4516 break;
4517 case OPT_RX_COMP_QUEUES:
4518 adapter->opt_rx_comp_queues =
4519 be64_to_cpu(crq->query_capability.number);
4520 netdev_dbg(netdev, "opt_rx_comp_queues = %lld\n",
4521 adapter->opt_rx_comp_queues);
4522 break;
4523 case OPT_RX_BUFADD_Q_PER_RX_COMP_Q:
4524 adapter->opt_rx_bufadd_q_per_rx_comp_q =
4525 be64_to_cpu(crq->query_capability.number);
4526 netdev_dbg(netdev, "opt_rx_bufadd_q_per_rx_comp_q = %lld\n",
4527 adapter->opt_rx_bufadd_q_per_rx_comp_q);
4528 break;
4529 case OPT_TX_ENTRIES_PER_SUBCRQ:
4530 adapter->opt_tx_entries_per_subcrq =
4531 be64_to_cpu(crq->query_capability.number);
4532 netdev_dbg(netdev, "opt_tx_entries_per_subcrq = %lld\n",
4533 adapter->opt_tx_entries_per_subcrq);
4534 break;
4535 case OPT_RXBA_ENTRIES_PER_SUBCRQ:
4536 adapter->opt_rxba_entries_per_subcrq =
4537 be64_to_cpu(crq->query_capability.number);
4538 netdev_dbg(netdev, "opt_rxba_entries_per_subcrq = %lld\n",
4539 adapter->opt_rxba_entries_per_subcrq);
4540 break;
4541 case TX_RX_DESC_REQ:
4542 adapter->tx_rx_desc_req = crq->query_capability.number;
4543 netdev_dbg(netdev, "tx_rx_desc_req = %llx\n",
4544 adapter->tx_rx_desc_req);
4545 break;
4546
4547 default:
4548 netdev_err(netdev, "Got invalid cap rsp %d\n",
4549 crq->query_capability.capability);
4550 }
4551
4552out:
4553 if (atomic_read(&adapter->running_cap_crqs) == 0) {
4554 adapter->wait_capability = false;
4555 ibmvnic_send_req_caps(adapter, 0);
4556 }
4557}
4558
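/* Synchronously query the physical port parameters (speed/duplex),
 * waiting on fw_done for the QUERY_PHYS_PARMS response.
 */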
4559static int send_query_phys_parms(struct ibmvnic_adapter *adapter)
4560{
4561 union ibmvnic_crq crq;
4562 int rc;
4563
4564 memset(&crq, 0, sizeof(crq));
4565 crq.query_phys_parms.first = IBMVNIC_CRQ_CMD;
4566 crq.query_phys_parms.cmd = QUERY_PHYS_PARMS;
4567 reinit_completion(&adapter->fw_done);
4568 rc = ibmvnic_send_crq(adapter, &crq);
4569 if (rc)
4570 return rc;
4571 wait_for_completion(&adapter->fw_done);
4572 return adapter->fw_done_rc ? -EIO : 0;
4573}
4574
4575static int handle_query_phys_parms_rsp(union ibmvnic_crq *crq,
4576 struct ibmvnic_adapter *adapter)
4577{
4578 struct net_device *netdev = adapter->netdev;
4579 int rc;
4580 __be32 rspeed = cpu_to_be32(crq->query_phys_parms_rsp.speed);
4581
4582 rc = crq->query_phys_parms_rsp.rc.code;
4583 if (rc) {
4584 netdev_err(netdev, "Error %d in QUERY_PHYS_PARMS\n", rc);
4585 return rc;
4586 }
4587 switch (rspeed) {
4588 case IBMVNIC_10MBPS:
4589 adapter->speed = SPEED_10;
4590 break;
4591 case IBMVNIC_100MBPS:
4592 adapter->speed = SPEED_100;
4593 break;
4594 case IBMVNIC_1GBPS:
4595 adapter->speed = SPEED_1000;
4596 break;
4597 case IBMVNIC_10GBPS:
4598 adapter->speed = SPEED_10000;
4599 break;
4600 case IBMVNIC_25GBPS:
4601 adapter->speed = SPEED_25000;
4602 break;
4603 case IBMVNIC_40GBPS:
4604 adapter->speed = SPEED_40000;
4605 break;
4606 case IBMVNIC_50GBPS:
4607 adapter->speed = SPEED_50000;
4608 break;
4609 case IBMVNIC_100GBPS:
4610 adapter->speed = SPEED_100000;
4611 break;
4612 case IBMVNIC_200GBPS:
4613 adapter->speed = SPEED_200000;
4614 break;
4615 default:
4616 if (netif_carrier_ok(netdev))
4617 netdev_warn(netdev, "Unknown speed 0x%08x\n", rspeed);
4618 adapter->speed = SPEED_UNKNOWN;
4619 }
4620 if (crq->query_phys_parms_rsp.flags1 & IBMVNIC_FULL_DUPLEX)
4621 adapter->duplex = DUPLEX_FULL;
4622 else if (crq->query_phys_parms_rsp.flags1 & IBMVNIC_HALF_DUPLEX)
4623 adapter->duplex = DUPLEX_HALF;
4624 else
4625 adapter->duplex = DUPLEX_UNKNOWN;
4626
4627 return rc;
4628}
4629
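/* Dispatch a single CRQ message: initialization and transport events
 * drive reset/failover handling, while command responses are routed
 * to their individual handlers.
 */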
4630static void ibmvnic_handle_crq(union ibmvnic_crq *crq,
4631 struct ibmvnic_adapter *adapter)
4632{
4633 struct ibmvnic_generic_crq *gen_crq = &crq->generic;
4634 struct net_device *netdev = adapter->netdev;
4635 struct device *dev = &adapter->vdev->dev;
4636 u64 *u64_crq = (u64 *)crq;
4637 long rc;
4638
4639 netdev_dbg(netdev, "Handling CRQ: %016lx %016lx\n",
4640 (unsigned long int)cpu_to_be64(u64_crq[0]),
4641 (unsigned long int)cpu_to_be64(u64_crq[1]));
4642 switch (gen_crq->first) {
4643 case IBMVNIC_CRQ_INIT_RSP:
4644 switch (gen_crq->cmd) {
4645 case IBMVNIC_CRQ_INIT:
4646 dev_info(dev, "Partner initialized\n");
4647 adapter->from_passive_init = true;
4648 if (!completion_done(&adapter->init_done)) {
4649 complete(&adapter->init_done);
4650 adapter->init_done_rc = -EIO;
4651 }
4652 rc = ibmvnic_reset(adapter, VNIC_RESET_FAILOVER);
4653 if (rc && rc != -EBUSY) {
4654 /* We were unable to schedule the failover
4655 * reset either because the adapter was still
4656				 * probing (e.g. during kexec) or we could not
4657 * allocate memory. Clear the failover_pending
4658 * flag since no one else will. We ignore
4659 * EBUSY because it means either FAILOVER reset
4660 * is already scheduled or the adapter is
4661 * being removed.
4662 */
4663 netdev_err(netdev,
4664 "Error %ld scheduling failover reset\n",
4665 rc);
4666 adapter->failover_pending = false;
4667 }
4668 break;
4669 case IBMVNIC_CRQ_INIT_COMPLETE:
4670 dev_info(dev, "Partner initialization complete\n");
4671 adapter->crq.active = true;
4672 send_version_xchg(adapter);
4673 break;
4674 default:
4675 dev_err(dev, "Unknown crq cmd: %d\n", gen_crq->cmd);
4676 }
4677 return;
4678 case IBMVNIC_CRQ_XPORT_EVENT:
4679 netif_carrier_off(netdev);
4680 adapter->crq.active = false;
4681 if (test_bit(0, &adapter->resetting))
4682 adapter->force_reset_recovery = true;
4683 if (gen_crq->cmd == IBMVNIC_PARTITION_MIGRATED) {
4684 dev_info(dev, "Migrated, re-enabling adapter\n");
4685 ibmvnic_reset(adapter, VNIC_RESET_MOBILITY);
4686 } else if (gen_crq->cmd == IBMVNIC_DEVICE_FAILOVER) {
4687 dev_info(dev, "Backing device failover detected\n");
4688 adapter->failover_pending = true;
4689 } else {
4690 /* The adapter lost the connection */
4691 dev_err(dev, "Virtual Adapter failed (rc=%d)\n",
4692 gen_crq->cmd);
4693 ibmvnic_reset(adapter, VNIC_RESET_FATAL);
4694 }
4695 return;
4696 case IBMVNIC_CRQ_CMD_RSP:
4697 break;
4698 default:
4699 dev_err(dev, "Got an invalid msg type 0x%02x\n",
4700 gen_crq->first);
4701 return;
4702 }
4703
4704 switch (gen_crq->cmd) {
4705 case VERSION_EXCHANGE_RSP:
4706 rc = crq->version_exchange_rsp.rc.code;
4707 if (rc) {
4708 dev_err(dev, "Error %ld in VERSION_EXCHG_RSP\n", rc);
4709 break;
4710 }
4711 ibmvnic_version =
4712 be16_to_cpu(crq->version_exchange_rsp.version);
4713 dev_info(dev, "Partner protocol version is %d\n",
4714 ibmvnic_version);
4715 send_cap_queries(adapter);
4716 break;
4717 case QUERY_CAPABILITY_RSP:
4718 handle_query_cap_rsp(crq, adapter);
4719 break;
4720 case QUERY_MAP_RSP:
4721 handle_query_map_rsp(crq, adapter);
4722 break;
4723 case REQUEST_MAP_RSP:
4724 adapter->fw_done_rc = crq->request_map_rsp.rc.code;
4725 complete(&adapter->fw_done);
4726 break;
4727 case REQUEST_UNMAP_RSP:
4728 handle_request_unmap_rsp(crq, adapter);
4729 break;
4730 case REQUEST_CAPABILITY_RSP:
4731 handle_request_cap_rsp(crq, adapter);
4732 break;
4733 case LOGIN_RSP:
4734 netdev_dbg(netdev, "Got Login Response\n");
4735 handle_login_rsp(crq, adapter);
4736 break;
4737 case LOGICAL_LINK_STATE_RSP:
4738 netdev_dbg(netdev,
4739 "Got Logical Link State Response, state: %d rc: %d\n",
4740 crq->logical_link_state_rsp.link_state,
4741 crq->logical_link_state_rsp.rc.code);
4742 adapter->logical_link_state =
4743 crq->logical_link_state_rsp.link_state;
4744 adapter->init_done_rc = crq->logical_link_state_rsp.rc.code;
4745 complete(&adapter->init_done);
4746 break;
4747 case LINK_STATE_INDICATION:
4748 netdev_dbg(netdev, "Got Logical Link State Indication\n");
4749 adapter->phys_link_state =
4750 crq->link_state_indication.phys_link_state;
4751 adapter->logical_link_state =
4752 crq->link_state_indication.logical_link_state;
4753 if (adapter->phys_link_state && adapter->logical_link_state)
4754 netif_carrier_on(netdev);
4755 else
4756 netif_carrier_off(netdev);
4757 break;
4758 case CHANGE_MAC_ADDR_RSP:
4759 netdev_dbg(netdev, "Got MAC address change Response\n");
4760 adapter->fw_done_rc = handle_change_mac_rsp(crq, adapter);
4761 break;
4762 case ERROR_INDICATION:
4763 netdev_dbg(netdev, "Got Error Indication\n");
4764 handle_error_indication(crq, adapter);
4765 break;
4766 case REQUEST_STATISTICS_RSP:
4767 netdev_dbg(netdev, "Got Statistics Response\n");
4768 complete(&adapter->stats_done);
4769 break;
4770 case QUERY_IP_OFFLOAD_RSP:
4771 netdev_dbg(netdev, "Got Query IP offload Response\n");
4772 handle_query_ip_offload_rsp(adapter);
4773 break;
4774 case MULTICAST_CTRL_RSP:
4775 netdev_dbg(netdev, "Got multicast control Response\n");
4776 break;
4777 case CONTROL_IP_OFFLOAD_RSP:
4778 netdev_dbg(netdev, "Got Control IP offload Response\n");
4779 dma_unmap_single(dev, adapter->ip_offload_ctrl_tok,
4780 sizeof(adapter->ip_offload_ctrl),
4781 DMA_TO_DEVICE);
4782 complete(&adapter->init_done);
4783 break;
4784 case COLLECT_FW_TRACE_RSP:
4785 netdev_dbg(netdev, "Got Collect firmware trace Response\n");
4786 complete(&adapter->fw_done);
4787 break;
4788 case GET_VPD_SIZE_RSP:
4789 handle_vpd_size_rsp(crq, adapter);
4790 break;
4791 case GET_VPD_RSP:
4792 handle_vpd_rsp(crq, adapter);
4793 break;
4794 case QUERY_PHYS_PARMS_RSP:
4795 adapter->fw_done_rc = handle_query_phys_parms_rsp(crq, adapter);
4796 complete(&adapter->fw_done);
4797 break;
4798 default:
4799 netdev_err(netdev, "Got an invalid cmd type 0x%02x\n",
4800 gen_crq->cmd);
4801 }
4802}
4803
4804static irqreturn_t ibmvnic_interrupt(int irq, void *instance)
4805{
4806 struct ibmvnic_adapter *adapter = instance;
4807
4808 tasklet_schedule(&adapter->tasklet);
4809 return IRQ_HANDLED;
4810}
4811
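/* Tasklet context: drain the main CRQ under its lock and hand each
 * valid message to ibmvnic_handle_crq().
 */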
4812static void ibmvnic_tasklet(void *data)
4813{
4814 struct ibmvnic_adapter *adapter = data;
4815 struct ibmvnic_crq_queue *queue = &adapter->crq;
4816 union ibmvnic_crq *crq;
4817 unsigned long flags;
4818 bool done = false;
4819
4820 spin_lock_irqsave(&queue->lock, flags);
4821 while (!done) {
4822 /* Pull all the valid messages off the CRQ */
4823 while ((crq = ibmvnic_next_crq(adapter)) != NULL) {
4824 /* This barrier makes sure ibmvnic_next_crq()'s
4825 * crq->generic.first & IBMVNIC_CRQ_CMD_RSP is loaded
4826 * before ibmvnic_handle_crq()'s
4827 * switch(gen_crq->first) and switch(gen_crq->cmd).
4828 */
4829 dma_rmb();
4830 ibmvnic_handle_crq(crq, adapter);
4831 crq->generic.first = 0;
4832 }
4833 }
4834	/* If capability CRQs were sent in this tasklet, the next tasklet
4835	 * run must wait until all responses are received
4836 */
4837 if (atomic_read(&adapter->running_cap_crqs) != 0)
4838 adapter->wait_capability = true;
4839 spin_unlock_irqrestore(&queue->lock, flags);
4840}
4841
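/* Ask the hypervisor to re-enable the main CRQ, retrying while the
 * hcall reports it is busy.
 */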
4842static int ibmvnic_reenable_crq_queue(struct ibmvnic_adapter *adapter)
4843{
4844 struct vio_dev *vdev = adapter->vdev;
4845 int rc;
4846
4847 do {
4848 rc = plpar_hcall_norets(H_ENABLE_CRQ, vdev->unit_address);
4849 } while (rc == H_IN_PROGRESS || rc == H_BUSY || H_IS_LONG_BUSY(rc));
4850
4851 if (rc)
4852 dev_err(&vdev->dev, "Error enabling adapter (rc=%d)\n", rc);
4853
4854 return rc;
4855}
4856
4857static int ibmvnic_reset_crq(struct ibmvnic_adapter *adapter)
4858{
4859 struct ibmvnic_crq_queue *crq = &adapter->crq;
4860 struct device *dev = &adapter->vdev->dev;
4861 struct vio_dev *vdev = adapter->vdev;
4862 int rc;
4863
4864 /* Close the CRQ */
4865 do {
4866 rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
4867 } while (rc == H_BUSY || H_IS_LONG_BUSY(rc));
4868
4869 /* Clean out the queue */
4870 if (!crq->msgs)
4871 return -EINVAL;
4872
4873 memset(crq->msgs, 0, PAGE_SIZE);
4874 crq->cur = 0;
4875 crq->active = false;
4876
4877 /* And re-open it again */
4878 rc = plpar_hcall_norets(H_REG_CRQ, vdev->unit_address,
4879 crq->msg_token, PAGE_SIZE);
4880
4881 if (rc == H_CLOSED)
4882 /* Adapter is good, but other end is not ready */
4883 dev_warn(dev, "Partner adapter not ready\n");
4884 else if (rc != 0)
4885 dev_warn(dev, "Couldn't register crq (rc=%d)\n", rc);
4886
4887 return rc;
4888}
4889
4890static void release_crq_queue(struct ibmvnic_adapter *adapter)
4891{
4892 struct ibmvnic_crq_queue *crq = &adapter->crq;
4893 struct vio_dev *vdev = adapter->vdev;
4894 long rc;
4895
4896 if (!crq->msgs)
4897 return;
4898
4899 netdev_dbg(adapter->netdev, "Releasing CRQ\n");
4900 free_irq(vdev->irq, adapter);
4901 tasklet_kill(&adapter->tasklet);
4902 do {
4903 rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
4904 } while (rc == H_BUSY || H_IS_LONG_BUSY(rc));
4905
4906 dma_unmap_single(&vdev->dev, crq->msg_token, PAGE_SIZE,
4907 DMA_BIDIRECTIONAL);
4908 free_page((unsigned long)crq->msgs);
4909 crq->msgs = NULL;
4910 crq->active = false;
4911}
4912
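/* Allocate the CRQ page, register it with the hypervisor, and set up
 * the CRQ interrupt handler and tasklet.
 */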
4913static int init_crq_queue(struct ibmvnic_adapter *adapter)
4914{
4915 struct ibmvnic_crq_queue *crq = &adapter->crq;
4916 struct device *dev = &adapter->vdev->dev;
4917 struct vio_dev *vdev = adapter->vdev;
4918 int rc, retrc = -ENOMEM;
4919
4920 if (crq->msgs)
4921 return 0;
4922
4923 crq->msgs = (union ibmvnic_crq *)get_zeroed_page(GFP_KERNEL);
4924 /* Should we allocate more than one page? */
4925
4926 if (!crq->msgs)
4927 return -ENOMEM;
4928
4929 crq->size = PAGE_SIZE / sizeof(*crq->msgs);
4930 crq->msg_token = dma_map_single(dev, crq->msgs, PAGE_SIZE,
4931 DMA_BIDIRECTIONAL);
4932 if (dma_mapping_error(dev, crq->msg_token))
4933 goto map_failed;
4934
4935 rc = plpar_hcall_norets(H_REG_CRQ, vdev->unit_address,
4936 crq->msg_token, PAGE_SIZE);
4937
4938 if (rc == H_RESOURCE)
4939 /* maybe kexecing and resource is busy. try a reset */
4940 rc = ibmvnic_reset_crq(adapter);
4941 retrc = rc;
4942
4943 if (rc == H_CLOSED) {
4944 dev_warn(dev, "Partner adapter not ready\n");
4945 } else if (rc) {
4946 dev_warn(dev, "Error %d opening adapter\n", rc);
4947 goto reg_crq_failed;
4948 }
4949
4950 retrc = 0;
4951
4952 tasklet_init(&adapter->tasklet, (void *)ibmvnic_tasklet,
4953 (unsigned long)adapter);
4954
4955 netdev_dbg(adapter->netdev, "registering irq 0x%x\n", vdev->irq);
4956 snprintf(crq->name, sizeof(crq->name), "ibmvnic-%x",
4957 adapter->vdev->unit_address);
4958 rc = request_irq(vdev->irq, ibmvnic_interrupt, 0, crq->name, adapter);
4959 if (rc) {
4960 dev_err(dev, "Couldn't register irq 0x%x. rc=%d\n",
4961 vdev->irq, rc);
4962 goto req_irq_failed;
4963 }
4964
4965 rc = vio_enable_interrupts(vdev);
4966 if (rc) {
4967 dev_err(dev, "Error %d enabling interrupts\n", rc);
4968 goto req_irq_failed;
4969 }
4970
4971 crq->cur = 0;
4972 spin_lock_init(&crq->lock);
4973
4974 /* process any CRQs that were queued before we enabled interrupts */
4975 tasklet_schedule(&adapter->tasklet);
4976
4977 return retrc;
4978
4979req_irq_failed:
4980 tasklet_kill(&adapter->tasklet);
4981 do {
4982 rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
4983 } while (rc == H_BUSY || H_IS_LONG_BUSY(rc));
4984reg_crq_failed:
4985 dma_unmap_single(dev, crq->msg_token, PAGE_SIZE, DMA_BIDIRECTIONAL);
4986map_failed:
4987 free_page((unsigned long)crq->msgs);
4988 crq->msgs = NULL;
4989 return retrc;
4990}
4991
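/* Reinitialize the adapter during a reset: renegotiate capabilities
 * with the server and either rebuild or simply reset the sub-CRQs,
 * depending on whether the negotiated queue counts changed.
 */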
4992static int ibmvnic_reset_init(struct ibmvnic_adapter *adapter)
4993{
4994 struct device *dev = &adapter->vdev->dev;
4995 unsigned long timeout = msecs_to_jiffies(30000);
4996 u64 old_num_rx_queues, old_num_tx_queues;
4997 int rc;
4998
4999 adapter->from_passive_init = false;
5000
5001 old_num_rx_queues = adapter->req_rx_queues;
5002 old_num_tx_queues = adapter->req_tx_queues;
5003
5004 reinit_completion(&adapter->init_done);
5005 adapter->init_done_rc = 0;
5006 ibmvnic_send_crq_init(adapter);
5007 if (!wait_for_completion_timeout(&adapter->init_done, timeout)) {
5008 dev_err(dev, "Initialization sequence timed out\n");
5009 return -1;
5010 }
5011
5012 if (adapter->init_done_rc) {
5013 release_crq_queue(adapter);
5014 return adapter->init_done_rc;
5015 }
5016
5017 if (adapter->from_passive_init) {
5018 adapter->state = VNIC_OPEN;
5019 adapter->from_passive_init = false;
5020 return -1;
5021 }
5022
5023 if (test_bit(0, &adapter->resetting) && !adapter->wait_for_reset &&
5024 adapter->reset_reason != VNIC_RESET_MOBILITY) {
5025 if (adapter->req_rx_queues != old_num_rx_queues ||
5026 adapter->req_tx_queues != old_num_tx_queues) {
5027 release_sub_crqs(adapter, 0);
5028 rc = init_sub_crqs(adapter);
5029 } else {
5030 /* no need to reinitialize completely, but we do
5031 * need to clean up transmits that were in flight
5032 * when we processed the reset. Failure to do so
5033 * will confound the upper layer, usually TCP, by
5034 * creating the illusion of transmits that are
5035 * awaiting completion.
5036 */
5037 clean_tx_pools(adapter);
5038
5039 rc = reset_sub_crq_queues(adapter);
5040 }
5041 } else {
5042 rc = init_sub_crqs(adapter);
5043 }
5044
5045 if (rc) {
5046 dev_err(dev, "Initialization of sub crqs failed\n");
5047 release_crq_queue(adapter);
5048 return rc;
5049 }
5050
5051 rc = init_sub_crq_irqs(adapter);
5052 if (rc) {
5053 dev_err(dev, "Failed to initialize sub crq irqs\n");
5054 release_crq_queue(adapter);
5055 }
5056
5057 return rc;
5058}
5059
5060static int ibmvnic_init(struct ibmvnic_adapter *adapter)
5061{
5062 struct device *dev = &adapter->vdev->dev;
5063 unsigned long timeout = msecs_to_jiffies(30000);
5064 int rc;
5065
5066 adapter->from_passive_init = false;
5067
5068 adapter->init_done_rc = 0;
5069 ibmvnic_send_crq_init(adapter);
5070 if (!wait_for_completion_timeout(&adapter->init_done, timeout)) {
5071 dev_err(dev, "Initialization sequence timed out\n");
5072 return -1;
5073 }
5074
5075 if (adapter->init_done_rc) {
5076 release_crq_queue(adapter);
5077 return adapter->init_done_rc;
5078 }
5079
5080 if (adapter->from_passive_init) {
5081 adapter->state = VNIC_OPEN;
5082 adapter->from_passive_init = false;
5083 return -1;
5084 }
5085
5086 rc = init_sub_crqs(adapter);
5087 if (rc) {
5088 dev_err(dev, "Initialization of sub crqs failed\n");
5089 release_crq_queue(adapter);
5090 return rc;
5091 }
5092
5093 rc = init_sub_crq_irqs(adapter);
5094 if (rc) {
5095 dev_err(dev, "Failed to initialize sub crq irqs\n");
5096 release_crq_queue(adapter);
5097 }
5098
5099 return rc;
5100}
5101
5102static struct device_attribute dev_attr_failover;
5103
5104static int ibmvnic_probe(struct vio_dev *dev, const struct vio_device_id *id)
5105{
5106 struct ibmvnic_adapter *adapter;
5107 struct net_device *netdev;
5108 unsigned char *mac_addr_p;
5109 int rc;
5110
5111 dev_dbg(&dev->dev, "entering ibmvnic_probe for UA 0x%x\n",
5112 dev->unit_address);
5113
5114 mac_addr_p = (unsigned char *)vio_get_attribute(dev,
5115 VETH_MAC_ADDR, NULL);
5116 if (!mac_addr_p) {
5117 dev_err(&dev->dev,
5118 "(%s:%3.3d) ERROR: Can't find MAC_ADDR attribute\n",
5119 __FILE__, __LINE__);
5120 return 0;
5121 }
5122
5123 netdev = alloc_etherdev_mq(sizeof(struct ibmvnic_adapter),
5124 IBMVNIC_MAX_QUEUES);
5125 if (!netdev)
5126 return -ENOMEM;
5127
5128 adapter = netdev_priv(netdev);
5129 adapter->state = VNIC_PROBING;
5130 dev_set_drvdata(&dev->dev, netdev);
5131 adapter->vdev = dev;
5132 adapter->netdev = netdev;
5133
5134 ether_addr_copy(adapter->mac_addr, mac_addr_p);
5135 ether_addr_copy(netdev->dev_addr, adapter->mac_addr);
5136 netdev->irq = dev->irq;
5137 netdev->netdev_ops = &ibmvnic_netdev_ops;
5138 netdev->ethtool_ops = &ibmvnic_ethtool_ops;
5139 SET_NETDEV_DEV(netdev, &dev->dev);
5140
5141 spin_lock_init(&adapter->stats_lock);
5142
5143 INIT_WORK(&adapter->ibmvnic_reset, __ibmvnic_reset);
5144 INIT_DELAYED_WORK(&adapter->ibmvnic_delayed_reset,
5145 __ibmvnic_delayed_reset);
5146 INIT_LIST_HEAD(&adapter->rwi_list);
5147 spin_lock_init(&adapter->rwi_lock);
5148 init_completion(&adapter->init_done);
5149 init_completion(&adapter->fw_done);
5150 init_completion(&adapter->reset_done);
5151 init_completion(&adapter->stats_done);
5152 clear_bit(0, &adapter->resetting);
5153
5154 do {
5155 rc = init_crq_queue(adapter);
5156 if (rc) {
5157 dev_err(&dev->dev, "Couldn't initialize crq. rc=%d\n",
5158 rc);
5159 goto ibmvnic_init_fail;
5160 }
5161
5162 rc = ibmvnic_init(adapter);
5163 if (rc && rc != EAGAIN)
5164 goto ibmvnic_init_fail;
5165 } while (rc == EAGAIN);
5166
5167 rc = init_stats_buffers(adapter);
5168 if (rc)
5169 goto ibmvnic_init_fail;
5170
5171 rc = init_stats_token(adapter);
5172 if (rc)
5173 goto ibmvnic_stats_fail;
5174
5175 netdev->mtu = adapter->req_mtu - ETH_HLEN;
5176 netdev->min_mtu = adapter->min_mtu - ETH_HLEN;
5177 netdev->max_mtu = adapter->max_mtu - ETH_HLEN;
5178
5179 rc = device_create_file(&dev->dev, &dev_attr_failover);
5180 if (rc)
5181 goto ibmvnic_dev_file_err;
5182
5183 netif_carrier_off(netdev);
5184 rc = register_netdev(netdev);
5185 if (rc) {
5186 dev_err(&dev->dev, "failed to register netdev rc=%d\n", rc);
5187 goto ibmvnic_register_fail;
5188 }
5189 dev_info(&dev->dev, "ibmvnic registered\n");
5190
5191 adapter->state = VNIC_PROBED;
5192
5193 adapter->wait_for_reset = false;
5194
5195 return 0;
5196
5197ibmvnic_register_fail:
5198 device_remove_file(&dev->dev, &dev_attr_failover);
5199
5200ibmvnic_dev_file_err:
5201 release_stats_token(adapter);
5202
5203ibmvnic_stats_fail:
5204 release_stats_buffers(adapter);
5205
5206ibmvnic_init_fail:
5207 release_sub_crqs(adapter, 1);
5208 release_crq_queue(adapter);
5209 free_netdev(netdev);
5210
5211 return rc;
5212}
5213
5214static int ibmvnic_remove(struct vio_dev *dev)
5215{
5216 struct net_device *netdev = dev_get_drvdata(&dev->dev);
5217 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
5218
5219 adapter->state = VNIC_REMOVING;
5220 rtnl_lock();
5221 unregister_netdevice(netdev);
5222
5223 release_resources(adapter);
5224 release_sub_crqs(adapter, 1);
5225 release_crq_queue(adapter);
5226
5227 release_stats_token(adapter);
5228 release_stats_buffers(adapter);
5229
5230 adapter->state = VNIC_REMOVED;
5231
5232 rtnl_unlock();
5233 device_remove_file(&dev->dev, &dev_attr_failover);
5234 free_netdev(netdev);
5235 dev_set_drvdata(&dev->dev, NULL);
5236
5237 return 0;
5238}
5239
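/* sysfs "failover" attribute: writing 1 obtains the session token and
 * asks the hypervisor to signal a session error, triggering a
 * client-initiated failover.
 */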
5240static ssize_t failover_store(struct device *dev, struct device_attribute *attr,
5241 const char *buf, size_t count)
5242{
5243 struct net_device *netdev = dev_get_drvdata(dev);
5244 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
5245 unsigned long retbuf[PLPAR_HCALL_BUFSIZE];
5246 __be64 session_token;
5247 long rc;
5248
5249 if (!sysfs_streq(buf, "1"))
5250 return -EINVAL;
5251
5252 rc = plpar_hcall(H_VIOCTL, retbuf, adapter->vdev->unit_address,
5253 H_GET_SESSION_TOKEN, 0, 0, 0);
5254 if (rc) {
5255 netdev_err(netdev, "Couldn't retrieve session token, rc %ld\n",
5256 rc);
5257 return -EINVAL;
5258 }
5259
5260 session_token = (__be64)retbuf[0];
5261 netdev_dbg(netdev, "Initiating client failover, session id %llx\n",
5262 be64_to_cpu(session_token));
5263 rc = plpar_hcall_norets(H_VIOCTL, adapter->vdev->unit_address,
5264 H_SESSION_ERR_DETECTED, session_token, 0, 0);
5265 if (rc) {
5266 netdev_err(netdev, "Client initiated failover failed, rc %ld\n",
5267 rc);
5268 return -EINVAL;
5269 }
5270
5271 return count;
5272}
5273
5274static DEVICE_ATTR_WO(failover);
5275
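/* Report the IO entitlement (DMA window space) the device wants: the
 * CRQ page, the statistics buffer, the sub-CRQ queues, and the RX
 * buffer pools.
 */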
5276static unsigned long ibmvnic_get_desired_dma(struct vio_dev *vdev)
5277{
5278 struct net_device *netdev = dev_get_drvdata(&vdev->dev);
5279 struct ibmvnic_adapter *adapter;
5280 struct iommu_table *tbl;
5281 unsigned long ret = 0;
5282 int i;
5283
5284 tbl = get_iommu_table_base(&vdev->dev);
5285
5286	/* netdev inits at probe time along with the structures we need below */
5287 if (!netdev)
5288 return IOMMU_PAGE_ALIGN(IBMVNIC_IO_ENTITLEMENT_DEFAULT, tbl);
5289
5290 adapter = netdev_priv(netdev);
5291
5292 ret += PAGE_SIZE; /* the crq message queue */
5293 ret += IOMMU_PAGE_ALIGN(sizeof(struct ibmvnic_statistics), tbl);
5294
5295 for (i = 0; i < adapter->req_tx_queues + adapter->req_rx_queues; i++)
5296 ret += 4 * PAGE_SIZE; /* the scrq message queue */
5297
5298 for (i = 0; i < be32_to_cpu(adapter->login_rsp_buf->num_rxadd_subcrqs);
5299 i++)
5300 ret += adapter->rx_pool[i].size *
5301 IOMMU_PAGE_ALIGN(adapter->rx_pool[i].buff_size, tbl);
5302
5303 return ret;
5304}
5305
5306static int ibmvnic_resume(struct device *dev)
5307{
5308 struct net_device *netdev = dev_get_drvdata(dev);
5309 struct ibmvnic_adapter *adapter = netdev_priv(netdev);
5310
5311 if (adapter->state != VNIC_OPEN)
5312 return 0;
5313
5314 tasklet_schedule(&adapter->tasklet);
5315
5316 return 0;
5317}
5318
5319static const struct vio_device_id ibmvnic_device_table[] = {
5320 {"network", "IBM,vnic"},
5321 {"", "" }
5322};
5323MODULE_DEVICE_TABLE(vio, ibmvnic_device_table);
5324
5325static const struct dev_pm_ops ibmvnic_pm_ops = {
5326 .resume = ibmvnic_resume
5327};
5328
5329static struct vio_driver ibmvnic_driver = {
5330 .id_table = ibmvnic_device_table,
5331 .probe = ibmvnic_probe,
5332 .remove = ibmvnic_remove,
5333 .get_desired_dma = ibmvnic_get_desired_dma,
5334 .name = ibmvnic_driver_name,
5335 .pm = &ibmvnic_pm_ops,
5336};
5337
5338/* module functions */
5339static int __init ibmvnic_module_init(void)
5340{
5341 pr_info("%s: %s %s\n", ibmvnic_driver_name, ibmvnic_driver_string,
5342 IBMVNIC_DRIVER_VERSION);
5343
5344 return vio_register_driver(&ibmvnic_driver);
5345}
5346
5347static void __exit ibmvnic_module_exit(void)
5348{
5349 vio_unregister_driver(&ibmvnic_driver);
5350}
5351
5352module_init(ibmvnic_module_init);
5353module_exit(ibmvnic_module_exit);