blob: e60822f07653ec5e32d84db426ea8b56e762a4a0 [file] [log] [blame]
xjb04a4022021-11-25 15:01:52 +08001/* ------------------------------------------------------------
2 * ibmvscsi.c
3 * (C) Copyright IBM Corporation 1994, 2004
4 * Authors: Colin DeVilbiss (devilbis@us.ibm.com)
5 * Santiago Leon (santil@us.ibm.com)
6 * Dave Boutcher (sleddog@us.ibm.com)
7 *
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License as published by
10 * the Free Software Foundation; either version 2 of the License, or
11 * (at your option) any later version.
12 *
13 * This program is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 * GNU General Public License for more details.
17 *
18 * You should have received a copy of the GNU General Public License
19 * along with this program; if not, write to the Free Software
20 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307
21 * USA
22 *
23 * ------------------------------------------------------------
24 * Emulation of a SCSI host adapter for Virtual I/O devices
25 *
26 * This driver supports the SCSI adapter implemented by the IBM
27 * Power5 firmware. That SCSI adapter is not a physical adapter,
28 * but allows Linux SCSI peripheral drivers to directly
29 * access devices in another logical partition on the physical system.
30 *
31 * The virtual adapter(s) are present in the open firmware device
32 * tree just like real adapters.
33 *
34 * One of the capabilities provided on these systems is the ability
35 * to DMA between partitions. The architecture states that for VSCSI,
36 * the server side is allowed to DMA to and from the client. The client
37 * is never trusted to DMA to or from the server directly.
38 *
39 * Messages are sent between partitions on a "Command/Response Queue"
 * (CRQ), which is just a buffer of 16 byte entries in the receiver's
 * memory. Senders cannot access the buffer directly, but send messages by
42 * making a hypervisor call and passing in the 16 bytes. The hypervisor
43 * puts the message in the next 16 byte space in round-robin fashion,
44 * turns on the high order bit of the message (the valid bit), and
45 * generates an interrupt to the receiver (if interrupts are turned on.)
46 * The receiver just turns off the valid bit when they have copied out
47 * the message.
48 *
49 * The VSCSI client builds a SCSI Remote Protocol (SRP) Information Unit
50 * (IU) (as defined in the T10 standard available at www.t10.org), gets
51 * a DMA address for the message, and sends it to the server as the
52 * payload of a CRQ message. The server DMAs the SRP IU and processes it,
53 * including doing any additional data transfers. When it is done, it
54 * DMAs the SRP response back to the same address as the request came from,
55 * and sends a CRQ message back to inform the client that the request has
56 * completed.
57 *
58 * TODO: This is currently pretty tied to the IBM pSeries hypervisor
59 * interfaces. It would be really nice to abstract this above an RDMA
60 * layer.
61 */
62
63#include <linux/module.h>
64#include <linux/moduleparam.h>
65#include <linux/dma-mapping.h>
66#include <linux/delay.h>
67#include <linux/slab.h>
68#include <linux/of.h>
69#include <linux/pm.h>
70#include <linux/kthread.h>
71#include <asm/firmware.h>
72#include <asm/vio.h>
73#include <scsi/scsi.h>
74#include <scsi/scsi_cmnd.h>
75#include <scsi/scsi_host.h>
76#include <scsi/scsi_device.h>
77#include <scsi/scsi_transport_srp.h>
78#include "ibmvscsi.h"
79
80/* The values below are somewhat arbitrary default values, but
81 * OS/400 will use 3 busses (disks, CDs, tapes, I think.)
82 * Note that there are 3 bits of channel value, 6 bits of id, and
83 * 5 bits of LUN.
84 */
85static int max_id = 64;
86static int max_channel = 3;
87static int init_timeout = 300;
88static int login_timeout = 60;
89static int info_timeout = 30;
90static int abort_timeout = 60;
91static int reset_timeout = 60;
92static int max_requests = IBMVSCSI_MAX_REQUESTS_DEFAULT;
93static int max_events = IBMVSCSI_MAX_REQUESTS_DEFAULT + 2;
94static int fast_fail = 1;
95static int client_reserve = 1;
96static char partition_name[96] = "UNKNOWN";
97static unsigned int partition_number = -1;
98static LIST_HEAD(ibmvscsi_head);
99static DEFINE_SPINLOCK(ibmvscsi_driver_lock);
100
101static struct scsi_transport_template *ibmvscsi_transport_template;
102
103#define IBMVSCSI_VERSION "1.5.9"
104
105MODULE_DESCRIPTION("IBM Virtual SCSI");
106MODULE_AUTHOR("Dave Boutcher");
107MODULE_LICENSE("GPL");
108MODULE_VERSION(IBMVSCSI_VERSION);
109
110module_param_named(max_id, max_id, int, S_IRUGO | S_IWUSR);
111MODULE_PARM_DESC(max_id, "Largest ID value for each channel [Default=64]");
112module_param_named(max_channel, max_channel, int, S_IRUGO | S_IWUSR);
113MODULE_PARM_DESC(max_channel, "Largest channel value [Default=3]");
114module_param_named(init_timeout, init_timeout, int, S_IRUGO | S_IWUSR);
115MODULE_PARM_DESC(init_timeout, "Initialization timeout in seconds");
116module_param_named(max_requests, max_requests, int, S_IRUGO);
117MODULE_PARM_DESC(max_requests, "Maximum requests for this adapter");
118module_param_named(fast_fail, fast_fail, int, S_IRUGO | S_IWUSR);
119MODULE_PARM_DESC(fast_fail, "Enable fast fail. [Default=1]");
120module_param_named(client_reserve, client_reserve, int, S_IRUGO );
121MODULE_PARM_DESC(client_reserve, "Attempt client managed reserve/release");
122
123static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
124 struct ibmvscsi_host_data *hostdata);
125
126/* ------------------------------------------------------------
127 * Routines for managing the command/response queue
128 */
129/**
130 * ibmvscsi_handle_event: - Interrupt handler for crq events
131 * @irq: number of irq to handle, not used
132 * @dev_instance: ibmvscsi_host_data of host that received interrupt
133 *
134 * Disables interrupts and schedules srp_task
135 * Always returns IRQ_HANDLED
136 */
137static irqreturn_t ibmvscsi_handle_event(int irq, void *dev_instance)
138{
139 struct ibmvscsi_host_data *hostdata =
140 (struct ibmvscsi_host_data *)dev_instance;
141 vio_disable_interrupts(to_vio_dev(hostdata->dev));
142 tasklet_schedule(&hostdata->srp_task);
143 return IRQ_HANDLED;
144}
145
146/**
147 * release_crq_queue: - Deallocates data and unregisters CRQ
148 * @queue: crq_queue to initialize and register
149 * @host_data: ibmvscsi_host_data of host
150 *
151 * Frees irq, deallocates a page for messages, unmaps dma, and unregisters
152 * the crq with the hypervisor.
153 */
154static void ibmvscsi_release_crq_queue(struct crq_queue *queue,
155 struct ibmvscsi_host_data *hostdata,
156 int max_requests)
157{
158 long rc = 0;
159 struct vio_dev *vdev = to_vio_dev(hostdata->dev);
160 free_irq(vdev->irq, (void *)hostdata);
161 tasklet_kill(&hostdata->srp_task);
162 do {
163 if (rc)
164 msleep(100);
165 rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
166 } while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
167 dma_unmap_single(hostdata->dev,
168 queue->msg_token,
169 queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
170 free_page((unsigned long)queue->msgs);
171}
172
173/**
174 * crq_queue_next_crq: - Returns the next entry in message queue
175 * @queue: crq_queue to use
176 *
177 * Returns pointer to next entry in queue, or NULL if there are no new
178 * entried in the CRQ.
179 */
180static struct viosrp_crq *crq_queue_next_crq(struct crq_queue *queue)
181{
182 struct viosrp_crq *crq;
183 unsigned long flags;
184
185 spin_lock_irqsave(&queue->lock, flags);
186 crq = &queue->msgs[queue->cur];
187 if (crq->valid != VIOSRP_CRQ_FREE) {
188 if (++queue->cur == queue->size)
189 queue->cur = 0;
190
191 /* Ensure the read of the valid bit occurs before reading any
192 * other bits of the CRQ entry
193 */
194 rmb();
195 } else
196 crq = NULL;
197 spin_unlock_irqrestore(&queue->lock, flags);
198
199 return crq;
200}
201
202/**
203 * ibmvscsi_send_crq: - Send a CRQ
204 * @hostdata: the adapter
205 * @word1: the first 64 bits of the data
206 * @word2: the second 64 bits of the data
207 */
208static int ibmvscsi_send_crq(struct ibmvscsi_host_data *hostdata,
209 u64 word1, u64 word2)
210{
211 struct vio_dev *vdev = to_vio_dev(hostdata->dev);
212
213 /*
214 * Ensure the command buffer is flushed to memory before handing it
215 * over to the VIOS to prevent it from fetching any stale data.
216 */
217 mb();
218 return plpar_hcall_norets(H_SEND_CRQ, vdev->unit_address, word1, word2);
219}
220
221/**
222 * ibmvscsi_task: - Process srps asynchronously
223 * @data: ibmvscsi_host_data of host
224 */
225static void ibmvscsi_task(void *data)
226{
227 struct ibmvscsi_host_data *hostdata = (struct ibmvscsi_host_data *)data;
228 struct vio_dev *vdev = to_vio_dev(hostdata->dev);
229 struct viosrp_crq *crq;
230 int done = 0;
231
232 while (!done) {
233 /* Pull all the valid messages off the CRQ */
234 while ((crq = crq_queue_next_crq(&hostdata->queue)) != NULL) {
235 ibmvscsi_handle_crq(crq, hostdata);
236 crq->valid = VIOSRP_CRQ_FREE;
237 wmb();
238 }
239
240 vio_enable_interrupts(vdev);
241 crq = crq_queue_next_crq(&hostdata->queue);
242 if (crq != NULL) {
243 vio_disable_interrupts(vdev);
244 ibmvscsi_handle_crq(crq, hostdata);
245 crq->valid = VIOSRP_CRQ_FREE;
246 wmb();
247 } else {
248 done = 1;
249 }
250 }
251}
252
253static void gather_partition_info(void)
254{
255 const char *ppartition_name;
256 const __be32 *p_number_ptr;
257
258 /* Retrieve information about this partition */
259 if (!of_root)
260 return;
261
262 of_node_get(of_root);
263
264 ppartition_name = of_get_property(of_root, "ibm,partition-name", NULL);
265 if (ppartition_name)
266 strlcpy(partition_name, ppartition_name,
267 sizeof(partition_name));
268 p_number_ptr = of_get_property(of_root, "ibm,partition-no", NULL);
269 if (p_number_ptr)
270 partition_number = of_read_number(p_number_ptr, 1);
271 of_node_put(of_root);
272}
273
274static void set_adapter_info(struct ibmvscsi_host_data *hostdata)
275{
276 memset(&hostdata->madapter_info, 0x00,
277 sizeof(hostdata->madapter_info));
278
279 dev_info(hostdata->dev, "SRP_VERSION: %s\n", SRP_VERSION);
280 strcpy(hostdata->madapter_info.srp_version, SRP_VERSION);
281
282 strncpy(hostdata->madapter_info.partition_name, partition_name,
283 sizeof(hostdata->madapter_info.partition_name));
284
285 hostdata->madapter_info.partition_number =
286 cpu_to_be32(partition_number);
287
288 hostdata->madapter_info.mad_version = cpu_to_be32(SRP_MAD_VERSION_1);
289 hostdata->madapter_info.os_type = cpu_to_be32(SRP_MAD_OS_LINUX);
290}
291
292/**
293 * reset_crq_queue: - resets a crq after a failure
294 * @queue: crq_queue to initialize and register
295 * @hostdata: ibmvscsi_host_data of host
296 *
297 */
298static int ibmvscsi_reset_crq_queue(struct crq_queue *queue,
299 struct ibmvscsi_host_data *hostdata)
300{
301 int rc = 0;
302 struct vio_dev *vdev = to_vio_dev(hostdata->dev);
303
304 /* Close the CRQ */
305 do {
306 if (rc)
307 msleep(100);
308 rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
309 } while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
310
311 /* Clean out the queue */
312 memset(queue->msgs, 0x00, PAGE_SIZE);
313 queue->cur = 0;
314
315 set_adapter_info(hostdata);
316
317 /* And re-open it again */
318 rc = plpar_hcall_norets(H_REG_CRQ,
319 vdev->unit_address,
320 queue->msg_token, PAGE_SIZE);
321 if (rc == H_CLOSED) {
322 /* Adapter is good, but other end is not ready */
323 dev_warn(hostdata->dev, "Partner adapter not ready\n");
324 } else if (rc != 0) {
325 dev_warn(hostdata->dev, "couldn't register crq--rc 0x%x\n", rc);
326 }
327 return rc;
328}
329
330/**
331 * initialize_crq_queue: - Initializes and registers CRQ with hypervisor
332 * @queue: crq_queue to initialize and register
333 * @hostdata: ibmvscsi_host_data of host
334 *
335 * Allocates a page for messages, maps it for dma, and registers
336 * the crq with the hypervisor.
337 * Returns zero on success.
338 */
339static int ibmvscsi_init_crq_queue(struct crq_queue *queue,
340 struct ibmvscsi_host_data *hostdata,
341 int max_requests)
342{
343 int rc;
344 int retrc;
345 struct vio_dev *vdev = to_vio_dev(hostdata->dev);
346
347 queue->msgs = (struct viosrp_crq *)get_zeroed_page(GFP_KERNEL);
348
349 if (!queue->msgs)
350 goto malloc_failed;
351 queue->size = PAGE_SIZE / sizeof(*queue->msgs);
352
353 queue->msg_token = dma_map_single(hostdata->dev, queue->msgs,
354 queue->size * sizeof(*queue->msgs),
355 DMA_BIDIRECTIONAL);
356
357 if (dma_mapping_error(hostdata->dev, queue->msg_token))
358 goto map_failed;
359
360 gather_partition_info();
361 set_adapter_info(hostdata);
362
363 retrc = rc = plpar_hcall_norets(H_REG_CRQ,
364 vdev->unit_address,
365 queue->msg_token, PAGE_SIZE);
366 if (rc == H_RESOURCE)
367 /* maybe kexecing and resource is busy. try a reset */
368 rc = ibmvscsi_reset_crq_queue(queue,
369 hostdata);
370
371 if (rc == H_CLOSED) {
372 /* Adapter is good, but other end is not ready */
373 dev_warn(hostdata->dev, "Partner adapter not ready\n");
374 retrc = 0;
375 } else if (rc != 0) {
376 dev_warn(hostdata->dev, "Error %d opening adapter\n", rc);
377 goto reg_crq_failed;
378 }
379
380 queue->cur = 0;
381 spin_lock_init(&queue->lock);
382
383 tasklet_init(&hostdata->srp_task, (void *)ibmvscsi_task,
384 (unsigned long)hostdata);
385
386 if (request_irq(vdev->irq,
387 ibmvscsi_handle_event,
388 0, "ibmvscsi", (void *)hostdata) != 0) {
389 dev_err(hostdata->dev, "couldn't register irq 0x%x\n",
390 vdev->irq);
391 goto req_irq_failed;
392 }
393
394 rc = vio_enable_interrupts(vdev);
395 if (rc != 0) {
396 dev_err(hostdata->dev, "Error %d enabling interrupts!!!\n", rc);
397 goto req_irq_failed;
398 }
399
400 return retrc;
401
402 req_irq_failed:
403 tasklet_kill(&hostdata->srp_task);
404 rc = 0;
405 do {
406 if (rc)
407 msleep(100);
408 rc = plpar_hcall_norets(H_FREE_CRQ, vdev->unit_address);
409 } while ((rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
410 reg_crq_failed:
411 dma_unmap_single(hostdata->dev,
412 queue->msg_token,
413 queue->size * sizeof(*queue->msgs), DMA_BIDIRECTIONAL);
414 map_failed:
415 free_page((unsigned long)queue->msgs);
416 malloc_failed:
417 return -1;
418}
419
420/**
421 * reenable_crq_queue: - reenables a crq after
422 * @queue: crq_queue to initialize and register
423 * @hostdata: ibmvscsi_host_data of host
424 *
425 */
426static int ibmvscsi_reenable_crq_queue(struct crq_queue *queue,
427 struct ibmvscsi_host_data *hostdata)
428{
429 int rc = 0;
430 struct vio_dev *vdev = to_vio_dev(hostdata->dev);
431
432 /* Re-enable the CRQ */
433 do {
434 if (rc)
435 msleep(100);
436 rc = plpar_hcall_norets(H_ENABLE_CRQ, vdev->unit_address);
437 } while ((rc == H_IN_PROGRESS) || (rc == H_BUSY) || (H_IS_LONG_BUSY(rc)));
438
439 if (rc)
440 dev_err(hostdata->dev, "Error %d enabling adapter\n", rc);
441 return rc;
442}
443
444/* ------------------------------------------------------------
445 * Routines for the event pool and event structs
446 */
447/**
448 * initialize_event_pool: - Allocates and initializes the event pool for a host
449 * @pool: event_pool to be initialized
450 * @size: Number of events in pool
451 * @hostdata: ibmvscsi_host_data who owns the event pool
452 *
453 * Returns zero on success.
454*/
455static int initialize_event_pool(struct event_pool *pool,
456 int size, struct ibmvscsi_host_data *hostdata)
457{
458 int i;
459
460 pool->size = size;
461 pool->next = 0;
462 pool->events = kcalloc(pool->size, sizeof(*pool->events), GFP_KERNEL);
463 if (!pool->events)
464 return -ENOMEM;
465
466 pool->iu_storage =
467 dma_alloc_coherent(hostdata->dev,
468 pool->size * sizeof(*pool->iu_storage),
469 &pool->iu_token, 0);
470 if (!pool->iu_storage) {
471 kfree(pool->events);
472 return -ENOMEM;
473 }
474
475 for (i = 0; i < pool->size; ++i) {
476 struct srp_event_struct *evt = &pool->events[i];
477 memset(&evt->crq, 0x00, sizeof(evt->crq));
478 atomic_set(&evt->free, 1);
479 evt->crq.valid = VIOSRP_CRQ_CMD_RSP;
480 evt->crq.IU_length = cpu_to_be16(sizeof(*evt->xfer_iu));
481 evt->crq.IU_data_ptr = cpu_to_be64(pool->iu_token +
482 sizeof(*evt->xfer_iu) * i);
483 evt->xfer_iu = pool->iu_storage + i;
484 evt->hostdata = hostdata;
485 evt->ext_list = NULL;
486 evt->ext_list_token = 0;
487 }
488
489 return 0;
490}
491
492/**
493 * release_event_pool: - Frees memory of an event pool of a host
494 * @pool: event_pool to be released
495 * @hostdata: ibmvscsi_host_data who owns the even pool
496 *
497 * Returns zero on success.
498*/
499static void release_event_pool(struct event_pool *pool,
500 struct ibmvscsi_host_data *hostdata)
501{
502 int i, in_use = 0;
503 for (i = 0; i < pool->size; ++i) {
504 if (atomic_read(&pool->events[i].free) != 1)
505 ++in_use;
506 if (pool->events[i].ext_list) {
507 dma_free_coherent(hostdata->dev,
508 SG_ALL * sizeof(struct srp_direct_buf),
509 pool->events[i].ext_list,
510 pool->events[i].ext_list_token);
511 }
512 }
513 if (in_use)
514 dev_warn(hostdata->dev, "releasing event pool with %d "
515 "events still in use?\n", in_use);
516 kfree(pool->events);
517 dma_free_coherent(hostdata->dev,
518 pool->size * sizeof(*pool->iu_storage),
519 pool->iu_storage, pool->iu_token);
520}
521
522/**
523 * valid_event_struct: - Determines if event is valid.
524 * @pool: event_pool that contains the event
525 * @evt: srp_event_struct to be checked for validity
526 *
527 * Returns zero if event is invalid, one otherwise.
528*/
529static int valid_event_struct(struct event_pool *pool,
530 struct srp_event_struct *evt)
531{
532 int index = evt - pool->events;
533 if (index < 0 || index >= pool->size) /* outside of bounds */
534 return 0;
535 if (evt != pool->events + index) /* unaligned */
536 return 0;
537 return 1;
538}
539
540/**
541 * ibmvscsi_free-event_struct: - Changes status of event to "free"
542 * @pool: event_pool that contains the event
543 * @evt: srp_event_struct to be modified
544 *
545*/
546static void free_event_struct(struct event_pool *pool,
547 struct srp_event_struct *evt)
548{
549 if (!valid_event_struct(pool, evt)) {
550 dev_err(evt->hostdata->dev, "Freeing invalid event_struct %p "
551 "(not in pool %p)\n", evt, pool->events);
552 return;
553 }
554 if (atomic_inc_return(&evt->free) != 1) {
555 dev_err(evt->hostdata->dev, "Freeing event_struct %p "
556 "which is not in use!\n", evt);
557 return;
558 }
559}
560
561/**
562 * get_evt_struct: - Gets the next free event in pool
563 * @pool: event_pool that contains the events to be searched
564 *
565 * Returns the next event in "free" state, and NULL if none are free.
566 * Note that no synchronization is done here, we assume the host_lock
567 * will syncrhonze things.
568*/
569static struct srp_event_struct *get_event_struct(struct event_pool *pool)
570{
571 int i;
572 int poolsize = pool->size;
573 int offset = pool->next;
574
575 for (i = 0; i < poolsize; i++) {
576 offset = (offset + 1) % poolsize;
577 if (!atomic_dec_if_positive(&pool->events[offset].free)) {
578 pool->next = offset;
579 return &pool->events[offset];
580 }
581 }
582
583 printk(KERN_ERR "ibmvscsi: found no event struct in pool!\n");
584 return NULL;
585}
586
587/**
588 * init_event_struct: Initialize fields in an event struct that are always
589 * required.
590 * @evt: The event
591 * @done: Routine to call when the event is responded to
592 * @format: SRP or MAD format
593 * @timeout: timeout value set in the CRQ
594 */
595static void init_event_struct(struct srp_event_struct *evt_struct,
596 void (*done) (struct srp_event_struct *),
597 u8 format,
598 int timeout)
599{
600 evt_struct->cmnd = NULL;
601 evt_struct->cmnd_done = NULL;
602 evt_struct->sync_srp = NULL;
603 evt_struct->crq.format = format;
604 evt_struct->crq.timeout = cpu_to_be16(timeout);
605 evt_struct->done = done;
606}
607
608/* ------------------------------------------------------------
609 * Routines for receiving SCSI responses from the hosting partition
610 */
611
612/**
613 * set_srp_direction: Set the fields in the srp related to data
614 * direction and number of buffers based on the direction in
615 * the scsi_cmnd and the number of buffers
616 */
617static void set_srp_direction(struct scsi_cmnd *cmd,
618 struct srp_cmd *srp_cmd,
619 int numbuf)
620{
621 u8 fmt;
622
623 if (numbuf == 0)
624 return;
625
626 if (numbuf == 1)
627 fmt = SRP_DATA_DESC_DIRECT;
628 else {
629 fmt = SRP_DATA_DESC_INDIRECT;
630 numbuf = min(numbuf, MAX_INDIRECT_BUFS);
631
632 if (cmd->sc_data_direction == DMA_TO_DEVICE)
633 srp_cmd->data_out_desc_cnt = numbuf;
634 else
635 srp_cmd->data_in_desc_cnt = numbuf;
636 }
637
638 if (cmd->sc_data_direction == DMA_TO_DEVICE)
639 srp_cmd->buf_fmt = fmt << 4;
640 else
641 srp_cmd->buf_fmt = fmt;
642}
643
644/**
645 * unmap_cmd_data: - Unmap data pointed in srp_cmd based on the format
646 * @cmd: srp_cmd whose additional_data member will be unmapped
647 * @dev: device for which the memory is mapped
648 *
649*/
650static void unmap_cmd_data(struct srp_cmd *cmd,
651 struct srp_event_struct *evt_struct,
652 struct device *dev)
653{
654 u8 out_fmt, in_fmt;
655
656 out_fmt = cmd->buf_fmt >> 4;
657 in_fmt = cmd->buf_fmt & ((1U << 4) - 1);
658
659 if (out_fmt == SRP_NO_DATA_DESC && in_fmt == SRP_NO_DATA_DESC)
660 return;
661
662 if (evt_struct->cmnd)
663 scsi_dma_unmap(evt_struct->cmnd);
664}
665
666static int map_sg_list(struct scsi_cmnd *cmd, int nseg,
667 struct srp_direct_buf *md)
668{
669 int i;
670 struct scatterlist *sg;
671 u64 total_length = 0;
672
673 scsi_for_each_sg(cmd, sg, nseg, i) {
674 struct srp_direct_buf *descr = md + i;
675 descr->va = cpu_to_be64(sg_dma_address(sg));
676 descr->len = cpu_to_be32(sg_dma_len(sg));
677 descr->key = 0;
678 total_length += sg_dma_len(sg);
679 }
680 return total_length;
681}
682
683/**
684 * map_sg_data: - Maps dma for a scatterlist and initializes decriptor fields
685 * @cmd: struct scsi_cmnd with the scatterlist
686 * @srp_cmd: srp_cmd that contains the memory descriptor
687 * @dev: device for which to map dma memory
688 *
689 * Called by map_data_for_srp_cmd() when building srp cmd from scsi cmd.
690 * Returns 1 on success.
691*/
692static int map_sg_data(struct scsi_cmnd *cmd,
693 struct srp_event_struct *evt_struct,
694 struct srp_cmd *srp_cmd, struct device *dev)
695{
696
697 int sg_mapped;
698 u64 total_length = 0;
699 struct srp_direct_buf *data =
700 (struct srp_direct_buf *) srp_cmd->add_data;
701 struct srp_indirect_buf *indirect =
702 (struct srp_indirect_buf *) data;
703
704 sg_mapped = scsi_dma_map(cmd);
705 if (!sg_mapped)
706 return 1;
707 else if (sg_mapped < 0)
708 return 0;
709
710 set_srp_direction(cmd, srp_cmd, sg_mapped);
711
712 /* special case; we can use a single direct descriptor */
713 if (sg_mapped == 1) {
714 map_sg_list(cmd, sg_mapped, data);
715 return 1;
716 }
717
718 indirect->table_desc.va = 0;
719 indirect->table_desc.len = cpu_to_be32(sg_mapped *
720 sizeof(struct srp_direct_buf));
721 indirect->table_desc.key = 0;
722
723 if (sg_mapped <= MAX_INDIRECT_BUFS) {
724 total_length = map_sg_list(cmd, sg_mapped,
725 &indirect->desc_list[0]);
726 indirect->len = cpu_to_be32(total_length);
727 return 1;
728 }
729
730 /* get indirect table */
731 if (!evt_struct->ext_list) {
732 evt_struct->ext_list = (struct srp_direct_buf *)
733 dma_alloc_coherent(dev,
734 SG_ALL * sizeof(struct srp_direct_buf),
735 &evt_struct->ext_list_token, 0);
736 if (!evt_struct->ext_list) {
737 if (!firmware_has_feature(FW_FEATURE_CMO))
738 sdev_printk(KERN_ERR, cmd->device,
739 "Can't allocate memory "
740 "for indirect table\n");
741 scsi_dma_unmap(cmd);
742 return 0;
743 }
744 }
745
746 total_length = map_sg_list(cmd, sg_mapped, evt_struct->ext_list);
747
748 indirect->len = cpu_to_be32(total_length);
749 indirect->table_desc.va = cpu_to_be64(evt_struct->ext_list_token);
750 indirect->table_desc.len = cpu_to_be32(sg_mapped *
751 sizeof(indirect->desc_list[0]));
752 memcpy(indirect->desc_list, evt_struct->ext_list,
753 MAX_INDIRECT_BUFS * sizeof(struct srp_direct_buf));
754 return 1;
755}
756
757/**
758 * map_data_for_srp_cmd: - Calls functions to map data for srp cmds
759 * @cmd: struct scsi_cmnd with the memory to be mapped
760 * @srp_cmd: srp_cmd that contains the memory descriptor
761 * @dev: dma device for which to map dma memory
762 *
763 * Called by scsi_cmd_to_srp_cmd() when converting scsi cmds to srp cmds
764 * Returns 1 on success.
765*/
766static int map_data_for_srp_cmd(struct scsi_cmnd *cmd,
767 struct srp_event_struct *evt_struct,
768 struct srp_cmd *srp_cmd, struct device *dev)
769{
770 switch (cmd->sc_data_direction) {
771 case DMA_FROM_DEVICE:
772 case DMA_TO_DEVICE:
773 break;
774 case DMA_NONE:
775 return 1;
776 case DMA_BIDIRECTIONAL:
777 sdev_printk(KERN_ERR, cmd->device,
778 "Can't map DMA_BIDIRECTIONAL to read/write\n");
779 return 0;
780 default:
781 sdev_printk(KERN_ERR, cmd->device,
782 "Unknown data direction 0x%02x; can't map!\n",
783 cmd->sc_data_direction);
784 return 0;
785 }
786
787 return map_sg_data(cmd, evt_struct, srp_cmd, dev);
788}
789
790/**
791 * purge_requests: Our virtual adapter just shut down. purge any sent requests
792 * @hostdata: the adapter
793 */
794static void purge_requests(struct ibmvscsi_host_data *hostdata, int error_code)
795{
796 struct srp_event_struct *evt;
797 unsigned long flags;
798
799 spin_lock_irqsave(hostdata->host->host_lock, flags);
800 while (!list_empty(&hostdata->sent)) {
801 evt = list_first_entry(&hostdata->sent, struct srp_event_struct, list);
802 list_del(&evt->list);
803 del_timer(&evt->timer);
804
805 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
806 if (evt->cmnd) {
807 evt->cmnd->result = (error_code << 16);
808 unmap_cmd_data(&evt->iu.srp.cmd, evt,
809 evt->hostdata->dev);
810 if (evt->cmnd_done)
811 evt->cmnd_done(evt->cmnd);
812 } else if (evt->done && evt->crq.format != VIOSRP_MAD_FORMAT &&
813 evt->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
814 evt->done(evt);
815 free_event_struct(&evt->hostdata->pool, evt);
816 spin_lock_irqsave(hostdata->host->host_lock, flags);
817 }
818 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
819}
820
821/**
822 * ibmvscsi_reset_host - Reset the connection to the server
823 * @hostdata: struct ibmvscsi_host_data to reset
824*/
825static void ibmvscsi_reset_host(struct ibmvscsi_host_data *hostdata)
826{
827 scsi_block_requests(hostdata->host);
828 atomic_set(&hostdata->request_limit, 0);
829
830 purge_requests(hostdata, DID_ERROR);
831 hostdata->reset_crq = 1;
832 wake_up(&hostdata->work_wait_q);
833}
834
835/**
836 * ibmvscsi_timeout - Internal command timeout handler
837 * @evt_struct: struct srp_event_struct that timed out
838 *
839 * Called when an internally generated command times out
840*/
841static void ibmvscsi_timeout(struct timer_list *t)
842{
843 struct srp_event_struct *evt_struct = from_timer(evt_struct, t, timer);
844 struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
845
846 dev_err(hostdata->dev, "Command timed out (%x). Resetting connection\n",
847 evt_struct->iu.srp.cmd.opcode);
848
849 ibmvscsi_reset_host(hostdata);
850}
851
852
853/* ------------------------------------------------------------
854 * Routines for sending and receiving SRPs
855 */
856/**
857 * ibmvscsi_send_srp_event: - Transforms event to u64 array and calls send_crq()
858 * @evt_struct: evt_struct to be sent
859 * @hostdata: ibmvscsi_host_data of host
860 * @timeout: timeout in seconds - 0 means do not time command
861 *
862 * Returns the value returned from ibmvscsi_send_crq(). (Zero for success)
863 * Note that this routine assumes that host_lock is held for synchronization
864*/
865static int ibmvscsi_send_srp_event(struct srp_event_struct *evt_struct,
866 struct ibmvscsi_host_data *hostdata,
867 unsigned long timeout)
868{
869 __be64 *crq_as_u64 = (__be64 *)&evt_struct->crq;
870 int request_status = 0;
871 int rc;
872 int srp_req = 0;
873
874 /* If we have exhausted our request limit, just fail this request,
875 * unless it is for a reset or abort.
876 * Note that there are rare cases involving driver generated requests
877 * (such as task management requests) that the mid layer may think we
878 * can handle more requests (can_queue) when we actually can't
879 */
880 if (evt_struct->crq.format == VIOSRP_SRP_FORMAT) {
881 srp_req = 1;
882 request_status =
883 atomic_dec_if_positive(&hostdata->request_limit);
884 /* If request limit was -1 when we started, it is now even
885 * less than that
886 */
887 if (request_status < -1)
888 goto send_error;
889 /* Otherwise, we may have run out of requests. */
890 /* If request limit was 0 when we started the adapter is in the
891 * process of performing a login with the server adapter, or
892 * we may have run out of requests.
893 */
894 else if (request_status == -1 &&
895 evt_struct->iu.srp.login_req.opcode != SRP_LOGIN_REQ)
896 goto send_busy;
897 /* Abort and reset calls should make it through.
898 * Nothing except abort and reset should use the last two
899 * slots unless we had two or less to begin with.
900 */
901 else if (request_status < 2 &&
902 evt_struct->iu.srp.cmd.opcode != SRP_TSK_MGMT) {
903 /* In the case that we have less than two requests
904 * available, check the server limit as a combination
905 * of the request limit and the number of requests
906 * in-flight (the size of the send list). If the
907 * server limit is greater than 2, return busy so
908 * that the last two are reserved for reset and abort.
909 */
910 int server_limit = request_status;
911 struct srp_event_struct *tmp_evt;
912
913 list_for_each_entry(tmp_evt, &hostdata->sent, list) {
914 server_limit++;
915 }
916
917 if (server_limit > 2)
918 goto send_busy;
919 }
920 }
921
922 /* Copy the IU into the transfer area */
923 *evt_struct->xfer_iu = evt_struct->iu;
924 evt_struct->xfer_iu->srp.rsp.tag = (u64)evt_struct;
925
926 /* Add this to the sent list. We need to do this
927 * before we actually send
928 * in case it comes back REALLY fast
929 */
930 list_add_tail(&evt_struct->list, &hostdata->sent);
931
932 timer_setup(&evt_struct->timer, ibmvscsi_timeout, 0);
933 if (timeout) {
934 evt_struct->timer.expires = jiffies + (timeout * HZ);
935 add_timer(&evt_struct->timer);
936 }
937
938 rc = ibmvscsi_send_crq(hostdata, be64_to_cpu(crq_as_u64[0]),
939 be64_to_cpu(crq_as_u64[1]));
940 if (rc != 0) {
941 list_del(&evt_struct->list);
942 del_timer(&evt_struct->timer);
943
944 /* If send_crq returns H_CLOSED, return SCSI_MLQUEUE_HOST_BUSY.
945 * Firmware will send a CRQ with a transport event (0xFF) to
946 * tell this client what has happened to the transport. This
947 * will be handled in ibmvscsi_handle_crq()
948 */
949 if (rc == H_CLOSED) {
950 dev_warn(hostdata->dev, "send warning. "
951 "Receive queue closed, will retry.\n");
952 goto send_busy;
953 }
954 dev_err(hostdata->dev, "send error %d\n", rc);
955 if (srp_req)
956 atomic_inc(&hostdata->request_limit);
957 goto send_error;
958 }
959
960 return 0;
961
962 send_busy:
963 unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
964
965 free_event_struct(&hostdata->pool, evt_struct);
966 if (srp_req && request_status != -1)
967 atomic_inc(&hostdata->request_limit);
968 return SCSI_MLQUEUE_HOST_BUSY;
969
970 send_error:
971 unmap_cmd_data(&evt_struct->iu.srp.cmd, evt_struct, hostdata->dev);
972
973 if (evt_struct->cmnd != NULL) {
974 evt_struct->cmnd->result = DID_ERROR << 16;
975 evt_struct->cmnd_done(evt_struct->cmnd);
976 } else if (evt_struct->done)
977 evt_struct->done(evt_struct);
978
979 free_event_struct(&hostdata->pool, evt_struct);
980 return 0;
981}
982
983/**
984 * handle_cmd_rsp: - Handle responses from commands
985 * @evt_struct: srp_event_struct to be handled
986 *
987 * Used as a callback by when sending scsi cmds.
988 * Gets called by ibmvscsi_handle_crq()
989*/
990static void handle_cmd_rsp(struct srp_event_struct *evt_struct)
991{
992 struct srp_rsp *rsp = &evt_struct->xfer_iu->srp.rsp;
993 struct scsi_cmnd *cmnd = evt_struct->cmnd;
994
995 if (unlikely(rsp->opcode != SRP_RSP)) {
996 if (printk_ratelimit())
997 dev_warn(evt_struct->hostdata->dev,
998 "bad SRP RSP type %#02x\n", rsp->opcode);
999 }
1000
1001 if (cmnd) {
1002 cmnd->result |= rsp->status;
1003 if (((cmnd->result >> 1) & 0x1f) == CHECK_CONDITION)
1004 memcpy(cmnd->sense_buffer,
1005 rsp->data,
1006 be32_to_cpu(rsp->sense_data_len));
1007 unmap_cmd_data(&evt_struct->iu.srp.cmd,
1008 evt_struct,
1009 evt_struct->hostdata->dev);
1010
1011 if (rsp->flags & SRP_RSP_FLAG_DOOVER)
1012 scsi_set_resid(cmnd,
1013 be32_to_cpu(rsp->data_out_res_cnt));
1014 else if (rsp->flags & SRP_RSP_FLAG_DIOVER)
1015 scsi_set_resid(cmnd, be32_to_cpu(rsp->data_in_res_cnt));
1016 }
1017
1018 if (evt_struct->cmnd_done)
1019 evt_struct->cmnd_done(cmnd);
1020}
1021
1022/**
1023 * lun_from_dev: - Returns the lun of the scsi device
1024 * @dev: struct scsi_device
1025 *
1026*/
1027static inline u16 lun_from_dev(struct scsi_device *dev)
1028{
1029 return (0x2 << 14) | (dev->id << 8) | (dev->channel << 5) | dev->lun;
1030}
1031
1032/**
1033 * ibmvscsi_queue: - The queuecommand function of the scsi template
1034 * @cmd: struct scsi_cmnd to be executed
1035 * @done: Callback function to be called when cmd is completed
1036*/
1037static int ibmvscsi_queuecommand_lck(struct scsi_cmnd *cmnd,
1038 void (*done) (struct scsi_cmnd *))
1039{
1040 struct srp_cmd *srp_cmd;
1041 struct srp_event_struct *evt_struct;
1042 struct srp_indirect_buf *indirect;
1043 struct ibmvscsi_host_data *hostdata = shost_priv(cmnd->device->host);
1044 u16 lun = lun_from_dev(cmnd->device);
1045 u8 out_fmt, in_fmt;
1046
1047 cmnd->result = (DID_OK << 16);
1048 evt_struct = get_event_struct(&hostdata->pool);
1049 if (!evt_struct)
1050 return SCSI_MLQUEUE_HOST_BUSY;
1051
1052 /* Set up the actual SRP IU */
1053 srp_cmd = &evt_struct->iu.srp.cmd;
1054 memset(srp_cmd, 0x00, SRP_MAX_IU_LEN);
1055 srp_cmd->opcode = SRP_CMD;
1056 memcpy(srp_cmd->cdb, cmnd->cmnd, sizeof(srp_cmd->cdb));
1057 int_to_scsilun(lun, &srp_cmd->lun);
1058
1059 if (!map_data_for_srp_cmd(cmnd, evt_struct, srp_cmd, hostdata->dev)) {
1060 if (!firmware_has_feature(FW_FEATURE_CMO))
1061 sdev_printk(KERN_ERR, cmnd->device,
1062 "couldn't convert cmd to srp_cmd\n");
1063 free_event_struct(&hostdata->pool, evt_struct);
1064 return SCSI_MLQUEUE_HOST_BUSY;
1065 }
1066
1067 init_event_struct(evt_struct,
1068 handle_cmd_rsp,
1069 VIOSRP_SRP_FORMAT,
1070 cmnd->request->timeout/HZ);
1071
1072 evt_struct->cmnd = cmnd;
1073 evt_struct->cmnd_done = done;
1074
1075 /* Fix up dma address of the buffer itself */
1076 indirect = (struct srp_indirect_buf *) srp_cmd->add_data;
1077 out_fmt = srp_cmd->buf_fmt >> 4;
1078 in_fmt = srp_cmd->buf_fmt & ((1U << 4) - 1);
1079 if ((in_fmt == SRP_DATA_DESC_INDIRECT ||
1080 out_fmt == SRP_DATA_DESC_INDIRECT) &&
1081 indirect->table_desc.va == 0) {
1082 indirect->table_desc.va =
1083 cpu_to_be64(be64_to_cpu(evt_struct->crq.IU_data_ptr) +
1084 offsetof(struct srp_cmd, add_data) +
1085 offsetof(struct srp_indirect_buf, desc_list));
1086 }
1087
1088 return ibmvscsi_send_srp_event(evt_struct, hostdata, 0);
1089}
1090
1091static DEF_SCSI_QCMD(ibmvscsi_queuecommand)
1092
1093/* ------------------------------------------------------------
1094 * Routines for driver initialization
1095 */
1096
1097/**
1098 * map_persist_bufs: - Pre-map persistent data for adapter logins
1099 * @hostdata: ibmvscsi_host_data of host
1100 *
1101 * Map the capabilities and adapter info DMA buffers to avoid runtime failures.
1102 * Return 1 on error, 0 on success.
1103 */
1104static int map_persist_bufs(struct ibmvscsi_host_data *hostdata)
1105{
1106
1107 hostdata->caps_addr = dma_map_single(hostdata->dev, &hostdata->caps,
1108 sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1109
1110 if (dma_mapping_error(hostdata->dev, hostdata->caps_addr)) {
1111 dev_err(hostdata->dev, "Unable to map capabilities buffer!\n");
1112 return 1;
1113 }
1114
1115 hostdata->adapter_info_addr = dma_map_single(hostdata->dev,
1116 &hostdata->madapter_info,
1117 sizeof(hostdata->madapter_info),
1118 DMA_BIDIRECTIONAL);
1119 if (dma_mapping_error(hostdata->dev, hostdata->adapter_info_addr)) {
1120 dev_err(hostdata->dev, "Unable to map adapter info buffer!\n");
1121 dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1122 sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1123 return 1;
1124 }
1125
1126 return 0;
1127}
1128
1129/**
1130 * unmap_persist_bufs: - Unmap persistent data needed for adapter logins
1131 * @hostdata: ibmvscsi_host_data of host
1132 *
1133 * Unmap the capabilities and adapter info DMA buffers
1134 */
1135static void unmap_persist_bufs(struct ibmvscsi_host_data *hostdata)
1136{
1137 dma_unmap_single(hostdata->dev, hostdata->caps_addr,
1138 sizeof(hostdata->caps), DMA_BIDIRECTIONAL);
1139
1140 dma_unmap_single(hostdata->dev, hostdata->adapter_info_addr,
1141 sizeof(hostdata->madapter_info), DMA_BIDIRECTIONAL);
1142}
1143
1144/**
1145 * login_rsp: - Handle response to SRP login request
1146 * @evt_struct: srp_event_struct with the response
1147 *
1148 * Used as a "done" callback by when sending srp_login. Gets called
1149 * by ibmvscsi_handle_crq()
1150*/
1151static void login_rsp(struct srp_event_struct *evt_struct)
1152{
1153 struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1154 switch (evt_struct->xfer_iu->srp.login_rsp.opcode) {
1155 case SRP_LOGIN_RSP: /* it worked! */
1156 break;
1157 case SRP_LOGIN_REJ: /* refused! */
1158 dev_info(hostdata->dev, "SRP_LOGIN_REJ reason %u\n",
1159 evt_struct->xfer_iu->srp.login_rej.reason);
1160 /* Login failed. */
1161 atomic_set(&hostdata->request_limit, -1);
1162 return;
1163 default:
1164 dev_err(hostdata->dev, "Invalid login response typecode 0x%02x!\n",
1165 evt_struct->xfer_iu->srp.login_rsp.opcode);
1166 /* Login failed. */
1167 atomic_set(&hostdata->request_limit, -1);
1168 return;
1169 }
1170
1171 dev_info(hostdata->dev, "SRP_LOGIN succeeded\n");
1172 hostdata->client_migrated = 0;
1173
1174 /* Now we know what the real request-limit is.
1175 * This value is set rather than added to request_limit because
1176 * request_limit could have been set to -1 by this client.
1177 */
1178 atomic_set(&hostdata->request_limit,
1179 be32_to_cpu(evt_struct->xfer_iu->srp.login_rsp.req_lim_delta));
1180
1181 /* If we had any pending I/Os, kick them */
1182 scsi_unblock_requests(hostdata->host);
1183}
1184
1185/**
1186 * send_srp_login: - Sends the srp login
1187 * @hostdata: ibmvscsi_host_data of host
1188 *
1189 * Returns zero if successful.
1190*/
1191static int send_srp_login(struct ibmvscsi_host_data *hostdata)
1192{
1193 int rc;
1194 unsigned long flags;
1195 struct srp_login_req *login;
1196 struct srp_event_struct *evt_struct = get_event_struct(&hostdata->pool);
1197
1198 BUG_ON(!evt_struct);
1199 init_event_struct(evt_struct, login_rsp,
1200 VIOSRP_SRP_FORMAT, login_timeout);
1201
1202 login = &evt_struct->iu.srp.login_req;
1203 memset(login, 0, sizeof(*login));
1204 login->opcode = SRP_LOGIN_REQ;
1205 login->req_it_iu_len = cpu_to_be32(sizeof(union srp_iu));
1206 login->req_buf_fmt = cpu_to_be16(SRP_BUF_FORMAT_DIRECT |
1207 SRP_BUF_FORMAT_INDIRECT);
1208
1209 spin_lock_irqsave(hostdata->host->host_lock, flags);
1210 /* Start out with a request limit of 0, since this is negotiated in
1211 * the login request we are just sending and login requests always
1212 * get sent by the driver regardless of request_limit.
1213 */
1214 atomic_set(&hostdata->request_limit, 0);
1215
1216 rc = ibmvscsi_send_srp_event(evt_struct, hostdata, login_timeout * 2);
1217 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1218 dev_info(hostdata->dev, "sent SRP login\n");
1219 return rc;
1220};
1221
1222/**
1223 * capabilities_rsp: - Handle response to MAD adapter capabilities request
1224 * @evt_struct: srp_event_struct with the response
1225 *
1226 * Used as a "done" callback by when sending adapter_info.
1227 */
1228static void capabilities_rsp(struct srp_event_struct *evt_struct)
1229{
1230 struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1231
1232 if (evt_struct->xfer_iu->mad.capabilities.common.status) {
1233 dev_err(hostdata->dev, "error 0x%X getting capabilities info\n",
1234 evt_struct->xfer_iu->mad.capabilities.common.status);
1235 } else {
1236 if (hostdata->caps.migration.common.server_support !=
1237 cpu_to_be16(SERVER_SUPPORTS_CAP))
1238 dev_info(hostdata->dev, "Partition migration not supported\n");
1239
1240 if (client_reserve) {
1241 if (hostdata->caps.reserve.common.server_support ==
1242 cpu_to_be16(SERVER_SUPPORTS_CAP))
1243 dev_info(hostdata->dev, "Client reserve enabled\n");
1244 else
1245 dev_info(hostdata->dev, "Client reserve not supported\n");
1246 }
1247 }
1248
1249 send_srp_login(hostdata);
1250}
1251
1252/**
1253 * send_mad_capabilities: - Sends the mad capabilities request
1254 * and stores the result so it can be retrieved with
1255 * @hostdata: ibmvscsi_host_data of host
1256 */
1257static void send_mad_capabilities(struct ibmvscsi_host_data *hostdata)
1258{
1259 struct viosrp_capabilities *req;
1260 struct srp_event_struct *evt_struct;
1261 unsigned long flags;
1262 struct device_node *of_node = hostdata->dev->of_node;
1263 const char *location;
1264
1265 evt_struct = get_event_struct(&hostdata->pool);
1266 BUG_ON(!evt_struct);
1267
1268 init_event_struct(evt_struct, capabilities_rsp,
1269 VIOSRP_MAD_FORMAT, info_timeout);
1270
1271 req = &evt_struct->iu.mad.capabilities;
1272 memset(req, 0, sizeof(*req));
1273
1274 hostdata->caps.flags = cpu_to_be32(CAP_LIST_SUPPORTED);
1275 if (hostdata->client_migrated)
1276 hostdata->caps.flags |= cpu_to_be32(CLIENT_MIGRATED);
1277
1278 strlcpy(hostdata->caps.name, dev_name(&hostdata->host->shost_gendev),
1279 sizeof(hostdata->caps.name));
1280
1281 location = of_get_property(of_node, "ibm,loc-code", NULL);
1282 location = location ? location : dev_name(hostdata->dev);
1283 strlcpy(hostdata->caps.loc, location, sizeof(hostdata->caps.loc));
1284
1285 req->common.type = cpu_to_be32(VIOSRP_CAPABILITIES_TYPE);
1286 req->buffer = cpu_to_be64(hostdata->caps_addr);
1287
1288 hostdata->caps.migration.common.cap_type =
1289 cpu_to_be32(MIGRATION_CAPABILITIES);
1290 hostdata->caps.migration.common.length =
1291 cpu_to_be16(sizeof(hostdata->caps.migration));
1292 hostdata->caps.migration.common.server_support =
1293 cpu_to_be16(SERVER_SUPPORTS_CAP);
1294 hostdata->caps.migration.ecl = cpu_to_be32(1);
1295
1296 if (client_reserve) {
1297 hostdata->caps.reserve.common.cap_type =
1298 cpu_to_be32(RESERVATION_CAPABILITIES);
1299 hostdata->caps.reserve.common.length =
1300 cpu_to_be16(sizeof(hostdata->caps.reserve));
1301 hostdata->caps.reserve.common.server_support =
1302 cpu_to_be16(SERVER_SUPPORTS_CAP);
1303 hostdata->caps.reserve.type =
1304 cpu_to_be32(CLIENT_RESERVE_SCSI_2);
1305 req->common.length =
1306 cpu_to_be16(sizeof(hostdata->caps));
1307 } else
1308 req->common.length = cpu_to_be16(sizeof(hostdata->caps) -
1309 sizeof(hostdata->caps.reserve));
1310
1311 spin_lock_irqsave(hostdata->host->host_lock, flags);
1312 if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1313 dev_err(hostdata->dev, "couldn't send CAPABILITIES_REQ!\n");
1314 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1315};
1316
1317/**
1318 * fast_fail_rsp: - Handle response to MAD enable fast fail
1319 * @evt_struct: srp_event_struct with the response
1320 *
1321 * Used as a "done" callback by when sending enable fast fail. Gets called
1322 * by ibmvscsi_handle_crq()
1323 */
1324static void fast_fail_rsp(struct srp_event_struct *evt_struct)
1325{
1326 struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1327 u16 status = be16_to_cpu(evt_struct->xfer_iu->mad.fast_fail.common.status);
1328
1329 if (status == VIOSRP_MAD_NOT_SUPPORTED)
1330 dev_err(hostdata->dev, "fast_fail not supported in server\n");
1331 else if (status == VIOSRP_MAD_FAILED)
1332 dev_err(hostdata->dev, "fast_fail request failed\n");
1333 else if (status != VIOSRP_MAD_SUCCESS)
1334 dev_err(hostdata->dev, "error 0x%X enabling fast_fail\n", status);
1335
1336 send_mad_capabilities(hostdata);
1337}
1338
1339/**
1340 * init_host - Start host initialization
1341 * @hostdata: ibmvscsi_host_data of host
1342 *
1343 * Returns zero if successful.
1344 */
1345static int enable_fast_fail(struct ibmvscsi_host_data *hostdata)
1346{
1347 int rc;
1348 unsigned long flags;
1349 struct viosrp_fast_fail *fast_fail_mad;
1350 struct srp_event_struct *evt_struct;
1351
1352 if (!fast_fail) {
1353 send_mad_capabilities(hostdata);
1354 return 0;
1355 }
1356
1357 evt_struct = get_event_struct(&hostdata->pool);
1358 BUG_ON(!evt_struct);
1359
1360 init_event_struct(evt_struct, fast_fail_rsp, VIOSRP_MAD_FORMAT, info_timeout);
1361
1362 fast_fail_mad = &evt_struct->iu.mad.fast_fail;
1363 memset(fast_fail_mad, 0, sizeof(*fast_fail_mad));
1364 fast_fail_mad->common.type = cpu_to_be32(VIOSRP_ENABLE_FAST_FAIL);
1365 fast_fail_mad->common.length = cpu_to_be16(sizeof(*fast_fail_mad));
1366
1367 spin_lock_irqsave(hostdata->host->host_lock, flags);
1368 rc = ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2);
1369 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1370 return rc;
1371}
1372
1373/**
1374 * adapter_info_rsp: - Handle response to MAD adapter info request
1375 * @evt_struct: srp_event_struct with the response
1376 *
1377 * Used as a "done" callback by when sending adapter_info. Gets called
1378 * by ibmvscsi_handle_crq()
1379*/
1380static void adapter_info_rsp(struct srp_event_struct *evt_struct)
1381{
1382 struct ibmvscsi_host_data *hostdata = evt_struct->hostdata;
1383
1384 if (evt_struct->xfer_iu->mad.adapter_info.common.status) {
1385 dev_err(hostdata->dev, "error %d getting adapter info\n",
1386 evt_struct->xfer_iu->mad.adapter_info.common.status);
1387 } else {
1388 dev_info(hostdata->dev, "host srp version: %s, "
1389 "host partition %s (%d), OS %d, max io %u\n",
1390 hostdata->madapter_info.srp_version,
1391 hostdata->madapter_info.partition_name,
1392 be32_to_cpu(hostdata->madapter_info.partition_number),
1393 be32_to_cpu(hostdata->madapter_info.os_type),
1394 be32_to_cpu(hostdata->madapter_info.port_max_txu[0]));
1395
1396 if (hostdata->madapter_info.port_max_txu[0])
1397 hostdata->host->max_sectors =
1398 be32_to_cpu(hostdata->madapter_info.port_max_txu[0]) >> 9;
1399
1400 if (be32_to_cpu(hostdata->madapter_info.os_type) == SRP_MAD_OS_AIX &&
1401 strcmp(hostdata->madapter_info.srp_version, "1.6a") <= 0) {
1402 dev_err(hostdata->dev, "host (Ver. %s) doesn't support large transfers\n",
1403 hostdata->madapter_info.srp_version);
1404 dev_err(hostdata->dev, "limiting scatterlists to %d\n",
1405 MAX_INDIRECT_BUFS);
1406 hostdata->host->sg_tablesize = MAX_INDIRECT_BUFS;
1407 }
1408
1409 if (be32_to_cpu(hostdata->madapter_info.os_type) == SRP_MAD_OS_AIX) {
1410 enable_fast_fail(hostdata);
1411 return;
1412 }
1413 }
1414
1415 send_srp_login(hostdata);
1416}
1417
1418/**
1419 * send_mad_adapter_info: - Sends the mad adapter info request
1420 * and stores the result so it can be retrieved with
1421 * sysfs. We COULD consider causing a failure if the
1422 * returned SRP version doesn't match ours.
1423 * @hostdata: ibmvscsi_host_data of host
1424 *
1425 * Returns zero if successful.
1426*/
1427static void send_mad_adapter_info(struct ibmvscsi_host_data *hostdata)
1428{
1429 struct viosrp_adapter_info *req;
1430 struct srp_event_struct *evt_struct;
1431 unsigned long flags;
1432
1433 evt_struct = get_event_struct(&hostdata->pool);
1434 BUG_ON(!evt_struct);
1435
1436 init_event_struct(evt_struct,
1437 adapter_info_rsp,
1438 VIOSRP_MAD_FORMAT,
1439 info_timeout);
1440
1441 req = &evt_struct->iu.mad.adapter_info;
1442 memset(req, 0x00, sizeof(*req));
1443
1444 req->common.type = cpu_to_be32(VIOSRP_ADAPTER_INFO_TYPE);
1445 req->common.length = cpu_to_be16(sizeof(hostdata->madapter_info));
1446 req->buffer = cpu_to_be64(hostdata->adapter_info_addr);
1447
1448 spin_lock_irqsave(hostdata->host->host_lock, flags);
1449 if (ibmvscsi_send_srp_event(evt_struct, hostdata, info_timeout * 2))
1450 dev_err(hostdata->dev, "couldn't send ADAPTER_INFO_REQ!\n");
1451 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1452};
1453
/**
 * init_adapter: - Start virtual adapter initialization sequence
 * @hostdata:	ibmvscsi_host_data of host
 *
 * The sequence begins with the MAD adapter info request; the following
 * steps are chained from that request's completion callback.
 */
static void init_adapter(struct ibmvscsi_host_data *hostdata)
{
	send_mad_adapter_info(hostdata);
}
1462
1463/**
1464 * sync_completion: Signal that a synchronous command has completed
1465 * Note that after returning from this call, the evt_struct is freed.
1466 * the caller waiting on this completion shouldn't touch the evt_struct
1467 * again.
1468 */
1469static void sync_completion(struct srp_event_struct *evt_struct)
1470{
1471 /* copy the response back */
1472 if (evt_struct->sync_srp)
1473 *evt_struct->sync_srp = *evt_struct->xfer_iu;
1474
1475 complete(&evt_struct->comp);
1476}
1477
1478/**
1479 * ibmvscsi_abort: Abort a command...from scsi host template
1480 * send this over to the server and wait synchronously for the response
1481 */
1482static int ibmvscsi_eh_abort_handler(struct scsi_cmnd *cmd)
1483{
1484 struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1485 struct srp_tsk_mgmt *tsk_mgmt;
1486 struct srp_event_struct *evt;
1487 struct srp_event_struct *tmp_evt, *found_evt;
1488 union viosrp_iu srp_rsp;
1489 int rsp_rc;
1490 unsigned long flags;
1491 u16 lun = lun_from_dev(cmd->device);
1492 unsigned long wait_switch = 0;
1493
1494 /* First, find this command in our sent list so we can figure
1495 * out the correct tag
1496 */
1497 spin_lock_irqsave(hostdata->host->host_lock, flags);
1498 wait_switch = jiffies + (init_timeout * HZ);
1499 do {
1500 found_evt = NULL;
1501 list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1502 if (tmp_evt->cmnd == cmd) {
1503 found_evt = tmp_evt;
1504 break;
1505 }
1506 }
1507
1508 if (!found_evt) {
1509 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1510 return SUCCESS;
1511 }
1512
1513 evt = get_event_struct(&hostdata->pool);
1514 if (evt == NULL) {
1515 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1516 sdev_printk(KERN_ERR, cmd->device,
1517 "failed to allocate abort event\n");
1518 return FAILED;
1519 }
1520
1521 init_event_struct(evt,
1522 sync_completion,
1523 VIOSRP_SRP_FORMAT,
1524 abort_timeout);
1525
1526 tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1527
1528 /* Set up an abort SRP command */
1529 memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1530 tsk_mgmt->opcode = SRP_TSK_MGMT;
1531 int_to_scsilun(lun, &tsk_mgmt->lun);
1532 tsk_mgmt->tsk_mgmt_func = SRP_TSK_ABORT_TASK;
1533 tsk_mgmt->task_tag = (u64) found_evt;
1534
1535 evt->sync_srp = &srp_rsp;
1536
1537 init_completion(&evt->comp);
1538 rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, abort_timeout * 2);
1539
1540 if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1541 break;
1542
1543 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1544 msleep(10);
1545 spin_lock_irqsave(hostdata->host->host_lock, flags);
1546 } while (time_before(jiffies, wait_switch));
1547
1548 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1549
1550 if (rsp_rc != 0) {
1551 sdev_printk(KERN_ERR, cmd->device,
1552 "failed to send abort() event. rc=%d\n", rsp_rc);
1553 return FAILED;
1554 }
1555
1556 sdev_printk(KERN_INFO, cmd->device,
1557 "aborting command. lun 0x%llx, tag 0x%llx\n",
1558 (((u64) lun) << 48), (u64) found_evt);
1559
1560 wait_for_completion(&evt->comp);
1561
1562 /* make sure we got a good response */
1563 if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1564 if (printk_ratelimit())
1565 sdev_printk(KERN_WARNING, cmd->device, "abort bad SRP RSP type %d\n",
1566 srp_rsp.srp.rsp.opcode);
1567 return FAILED;
1568 }
1569
1570 if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1571 rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1572 else
1573 rsp_rc = srp_rsp.srp.rsp.status;
1574
1575 if (rsp_rc) {
1576 if (printk_ratelimit())
1577 sdev_printk(KERN_WARNING, cmd->device,
1578 "abort code %d for task tag 0x%llx\n",
1579 rsp_rc, tsk_mgmt->task_tag);
1580 return FAILED;
1581 }
1582
1583 /* Because we dropped the spinlock above, it's possible
1584 * The event is no longer in our list. Make sure it didn't
1585 * complete while we were aborting
1586 */
1587 spin_lock_irqsave(hostdata->host->host_lock, flags);
1588 found_evt = NULL;
1589 list_for_each_entry(tmp_evt, &hostdata->sent, list) {
1590 if (tmp_evt->cmnd == cmd) {
1591 found_evt = tmp_evt;
1592 break;
1593 }
1594 }
1595
1596 if (found_evt == NULL) {
1597 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1598 sdev_printk(KERN_INFO, cmd->device, "aborted task tag 0x%llx completed\n",
1599 tsk_mgmt->task_tag);
1600 return SUCCESS;
1601 }
1602
1603 sdev_printk(KERN_INFO, cmd->device, "successfully aborted task tag 0x%llx\n",
1604 tsk_mgmt->task_tag);
1605
1606 cmd->result = (DID_ABORT << 16);
1607 list_del(&found_evt->list);
1608 unmap_cmd_data(&found_evt->iu.srp.cmd, found_evt,
1609 found_evt->hostdata->dev);
1610 free_event_struct(&found_evt->hostdata->pool, found_evt);
1611 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1612 atomic_inc(&hostdata->request_limit);
1613 return SUCCESS;
1614}
1615
1616/**
1617 * ibmvscsi_eh_device_reset_handler: Reset a single LUN...from scsi host
1618 * template send this over to the server and wait synchronously for the
1619 * response
1620 */
1621static int ibmvscsi_eh_device_reset_handler(struct scsi_cmnd *cmd)
1622{
1623 struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1624 struct srp_tsk_mgmt *tsk_mgmt;
1625 struct srp_event_struct *evt;
1626 struct srp_event_struct *tmp_evt, *pos;
1627 union viosrp_iu srp_rsp;
1628 int rsp_rc;
1629 unsigned long flags;
1630 u16 lun = lun_from_dev(cmd->device);
1631 unsigned long wait_switch = 0;
1632
1633 spin_lock_irqsave(hostdata->host->host_lock, flags);
1634 wait_switch = jiffies + (init_timeout * HZ);
1635 do {
1636 evt = get_event_struct(&hostdata->pool);
1637 if (evt == NULL) {
1638 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1639 sdev_printk(KERN_ERR, cmd->device,
1640 "failed to allocate reset event\n");
1641 return FAILED;
1642 }
1643
1644 init_event_struct(evt,
1645 sync_completion,
1646 VIOSRP_SRP_FORMAT,
1647 reset_timeout);
1648
1649 tsk_mgmt = &evt->iu.srp.tsk_mgmt;
1650
1651 /* Set up a lun reset SRP command */
1652 memset(tsk_mgmt, 0x00, sizeof(*tsk_mgmt));
1653 tsk_mgmt->opcode = SRP_TSK_MGMT;
1654 int_to_scsilun(lun, &tsk_mgmt->lun);
1655 tsk_mgmt->tsk_mgmt_func = SRP_TSK_LUN_RESET;
1656
1657 evt->sync_srp = &srp_rsp;
1658
1659 init_completion(&evt->comp);
1660 rsp_rc = ibmvscsi_send_srp_event(evt, hostdata, reset_timeout * 2);
1661
1662 if (rsp_rc != SCSI_MLQUEUE_HOST_BUSY)
1663 break;
1664
1665 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1666 msleep(10);
1667 spin_lock_irqsave(hostdata->host->host_lock, flags);
1668 } while (time_before(jiffies, wait_switch));
1669
1670 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1671
1672 if (rsp_rc != 0) {
1673 sdev_printk(KERN_ERR, cmd->device,
1674 "failed to send reset event. rc=%d\n", rsp_rc);
1675 return FAILED;
1676 }
1677
1678 sdev_printk(KERN_INFO, cmd->device, "resetting device. lun 0x%llx\n",
1679 (((u64) lun) << 48));
1680
1681 wait_for_completion(&evt->comp);
1682
1683 /* make sure we got a good response */
1684 if (unlikely(srp_rsp.srp.rsp.opcode != SRP_RSP)) {
1685 if (printk_ratelimit())
1686 sdev_printk(KERN_WARNING, cmd->device, "reset bad SRP RSP type %d\n",
1687 srp_rsp.srp.rsp.opcode);
1688 return FAILED;
1689 }
1690
1691 if (srp_rsp.srp.rsp.flags & SRP_RSP_FLAG_RSPVALID)
1692 rsp_rc = *((int *)srp_rsp.srp.rsp.data);
1693 else
1694 rsp_rc = srp_rsp.srp.rsp.status;
1695
1696 if (rsp_rc) {
1697 if (printk_ratelimit())
1698 sdev_printk(KERN_WARNING, cmd->device,
1699 "reset code %d for task tag 0x%llx\n",
1700 rsp_rc, tsk_mgmt->task_tag);
1701 return FAILED;
1702 }
1703
1704 /* We need to find all commands for this LUN that have not yet been
1705 * responded to, and fail them with DID_RESET
1706 */
1707 spin_lock_irqsave(hostdata->host->host_lock, flags);
1708 list_for_each_entry_safe(tmp_evt, pos, &hostdata->sent, list) {
1709 if ((tmp_evt->cmnd) && (tmp_evt->cmnd->device == cmd->device)) {
1710 if (tmp_evt->cmnd)
1711 tmp_evt->cmnd->result = (DID_RESET << 16);
1712 list_del(&tmp_evt->list);
1713 unmap_cmd_data(&tmp_evt->iu.srp.cmd, tmp_evt,
1714 tmp_evt->hostdata->dev);
1715 free_event_struct(&tmp_evt->hostdata->pool,
1716 tmp_evt);
1717 atomic_inc(&hostdata->request_limit);
1718 if (tmp_evt->cmnd_done)
1719 tmp_evt->cmnd_done(tmp_evt->cmnd);
1720 else if (tmp_evt->done)
1721 tmp_evt->done(tmp_evt);
1722 }
1723 }
1724 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
1725 return SUCCESS;
1726}
1727
1728/**
1729 * ibmvscsi_eh_host_reset_handler - Reset the connection to the server
1730 * @cmd: struct scsi_cmnd having problems
1731*/
1732static int ibmvscsi_eh_host_reset_handler(struct scsi_cmnd *cmd)
1733{
1734 unsigned long wait_switch = 0;
1735 struct ibmvscsi_host_data *hostdata = shost_priv(cmd->device->host);
1736
1737 dev_err(hostdata->dev, "Resetting connection due to error recovery\n");
1738
1739 ibmvscsi_reset_host(hostdata);
1740
1741 for (wait_switch = jiffies + (init_timeout * HZ);
1742 time_before(jiffies, wait_switch) &&
1743 atomic_read(&hostdata->request_limit) < 2;) {
1744
1745 msleep(10);
1746 }
1747
1748 if (atomic_read(&hostdata->request_limit) <= 0)
1749 return FAILED;
1750
1751 return SUCCESS;
1752}
1753
1754/**
1755 * ibmvscsi_handle_crq: - Handles and frees received events in the CRQ
1756 * @crq: Command/Response queue
1757 * @hostdata: ibmvscsi_host_data of host
1758 *
1759*/
1760static void ibmvscsi_handle_crq(struct viosrp_crq *crq,
1761 struct ibmvscsi_host_data *hostdata)
1762{
1763 long rc;
1764 unsigned long flags;
1765 /* The hypervisor copies our tag value here so no byteswapping */
1766 struct srp_event_struct *evt_struct =
1767 (__force struct srp_event_struct *)crq->IU_data_ptr;
1768 switch (crq->valid) {
1769 case VIOSRP_CRQ_INIT_RSP: /* initialization */
1770 switch (crq->format) {
1771 case VIOSRP_CRQ_INIT: /* Initialization message */
1772 dev_info(hostdata->dev, "partner initialized\n");
1773 /* Send back a response */
1774 rc = ibmvscsi_send_crq(hostdata, 0xC002000000000000LL, 0);
1775 if (rc == 0) {
1776 /* Now login */
1777 init_adapter(hostdata);
1778 } else {
1779 dev_err(hostdata->dev, "Unable to send init rsp. rc=%ld\n", rc);
1780 }
1781
1782 break;
1783 case VIOSRP_CRQ_INIT_COMPLETE: /* Initialization response */
1784 dev_info(hostdata->dev, "partner initialization complete\n");
1785
1786 /* Now login */
1787 init_adapter(hostdata);
1788 break;
1789 default:
1790 dev_err(hostdata->dev, "unknown crq message type: %d\n", crq->format);
1791 }
1792 return;
1793 case VIOSRP_CRQ_XPORT_EVENT: /* Hypervisor telling us the connection is closed */
1794 scsi_block_requests(hostdata->host);
1795 atomic_set(&hostdata->request_limit, 0);
1796 if (crq->format == 0x06) {
1797 /* We need to re-setup the interpartition connection */
1798 dev_info(hostdata->dev, "Re-enabling adapter!\n");
1799 hostdata->client_migrated = 1;
1800 hostdata->reenable_crq = 1;
1801 purge_requests(hostdata, DID_REQUEUE);
1802 wake_up(&hostdata->work_wait_q);
1803 } else {
1804 dev_err(hostdata->dev, "Virtual adapter failed rc %d!\n",
1805 crq->format);
1806 ibmvscsi_reset_host(hostdata);
1807 }
1808 return;
1809 case VIOSRP_CRQ_CMD_RSP: /* real payload */
1810 break;
1811 default:
1812 dev_err(hostdata->dev, "got an invalid message type 0x%02x\n",
1813 crq->valid);
1814 return;
1815 }
1816
1817 /* The only kind of payload CRQs we should get are responses to
1818 * things we send. Make sure this response is to something we
1819 * actually sent
1820 */
1821 if (!valid_event_struct(&hostdata->pool, evt_struct)) {
1822 dev_err(hostdata->dev, "returned correlation_token 0x%p is invalid!\n",
1823 evt_struct);
1824 return;
1825 }
1826
1827 if (atomic_read(&evt_struct->free)) {
1828 dev_err(hostdata->dev, "received duplicate correlation_token 0x%p!\n",
1829 evt_struct);
1830 return;
1831 }
1832
1833 if (crq->format == VIOSRP_SRP_FORMAT)
1834 atomic_add(be32_to_cpu(evt_struct->xfer_iu->srp.rsp.req_lim_delta),
1835 &hostdata->request_limit);
1836
1837 del_timer(&evt_struct->timer);
1838
1839 if ((crq->status != VIOSRP_OK && crq->status != VIOSRP_OK2) && evt_struct->cmnd)
1840 evt_struct->cmnd->result = DID_ERROR << 16;
1841 if (evt_struct->done)
1842 evt_struct->done(evt_struct);
1843 else
1844 dev_err(hostdata->dev, "returned done() is NULL; not running it!\n");
1845
1846 /*
1847 * Lock the host_lock before messing with these structures, since we
1848 * are running in a task context
1849 */
1850 spin_lock_irqsave(evt_struct->hostdata->host->host_lock, flags);
1851 list_del(&evt_struct->list);
1852 free_event_struct(&evt_struct->hostdata->pool, evt_struct);
1853 spin_unlock_irqrestore(evt_struct->hostdata->host->host_lock, flags);
1854}
1855
1856/**
1857 * ibmvscsi_slave_configure: Set the "allow_restart" flag for each disk.
1858 * @sdev: struct scsi_device device to configure
1859 *
1860 * Enable allow_restart for a device if it is a disk. Adjust the
1861 * queue_depth here also as is required by the documentation for
1862 * struct scsi_host_template.
1863 */
1864static int ibmvscsi_slave_configure(struct scsi_device *sdev)
1865{
1866 struct Scsi_Host *shost = sdev->host;
1867 unsigned long lock_flags = 0;
1868
1869 spin_lock_irqsave(shost->host_lock, lock_flags);
1870 if (sdev->type == TYPE_DISK) {
1871 sdev->allow_restart = 1;
1872 blk_queue_rq_timeout(sdev->request_queue, 120 * HZ);
1873 }
1874 spin_unlock_irqrestore(shost->host_lock, lock_flags);
1875 return 0;
1876}
1877
1878/**
1879 * ibmvscsi_change_queue_depth - Change the device's queue depth
1880 * @sdev: scsi device struct
1881 * @qdepth: depth to set
1882 * @reason: calling context
1883 *
1884 * Return value:
1885 * actual depth set
1886 **/
1887static int ibmvscsi_change_queue_depth(struct scsi_device *sdev, int qdepth)
1888{
1889 if (qdepth > IBMVSCSI_MAX_CMDS_PER_LUN)
1890 qdepth = IBMVSCSI_MAX_CMDS_PER_LUN;
1891 return scsi_change_queue_depth(sdev, qdepth);
1892}
1893
1894/* ------------------------------------------------------------
1895 * sysfs attributes
1896 */
1897static ssize_t show_host_vhost_loc(struct device *dev,
1898 struct device_attribute *attr, char *buf)
1899{
1900 struct Scsi_Host *shost = class_to_shost(dev);
1901 struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1902 int len;
1903
1904 len = snprintf(buf, sizeof(hostdata->caps.loc), "%s\n",
1905 hostdata->caps.loc);
1906 return len;
1907}
1908
1909static struct device_attribute ibmvscsi_host_vhost_loc = {
1910 .attr = {
1911 .name = "vhost_loc",
1912 .mode = S_IRUGO,
1913 },
1914 .show = show_host_vhost_loc,
1915};
1916
1917static ssize_t show_host_vhost_name(struct device *dev,
1918 struct device_attribute *attr, char *buf)
1919{
1920 struct Scsi_Host *shost = class_to_shost(dev);
1921 struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1922 int len;
1923
1924 len = snprintf(buf, sizeof(hostdata->caps.name), "%s\n",
1925 hostdata->caps.name);
1926 return len;
1927}
1928
1929static struct device_attribute ibmvscsi_host_vhost_name = {
1930 .attr = {
1931 .name = "vhost_name",
1932 .mode = S_IRUGO,
1933 },
1934 .show = show_host_vhost_name,
1935};
1936
1937static ssize_t show_host_srp_version(struct device *dev,
1938 struct device_attribute *attr, char *buf)
1939{
1940 struct Scsi_Host *shost = class_to_shost(dev);
1941 struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1942 int len;
1943
1944 len = snprintf(buf, PAGE_SIZE, "%s\n",
1945 hostdata->madapter_info.srp_version);
1946 return len;
1947}
1948
1949static struct device_attribute ibmvscsi_host_srp_version = {
1950 .attr = {
1951 .name = "srp_version",
1952 .mode = S_IRUGO,
1953 },
1954 .show = show_host_srp_version,
1955};
1956
1957static ssize_t show_host_partition_name(struct device *dev,
1958 struct device_attribute *attr,
1959 char *buf)
1960{
1961 struct Scsi_Host *shost = class_to_shost(dev);
1962 struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1963 int len;
1964
1965 len = snprintf(buf, PAGE_SIZE, "%s\n",
1966 hostdata->madapter_info.partition_name);
1967 return len;
1968}
1969
1970static struct device_attribute ibmvscsi_host_partition_name = {
1971 .attr = {
1972 .name = "partition_name",
1973 .mode = S_IRUGO,
1974 },
1975 .show = show_host_partition_name,
1976};
1977
1978static ssize_t show_host_partition_number(struct device *dev,
1979 struct device_attribute *attr,
1980 char *buf)
1981{
1982 struct Scsi_Host *shost = class_to_shost(dev);
1983 struct ibmvscsi_host_data *hostdata = shost_priv(shost);
1984 int len;
1985
1986 len = snprintf(buf, PAGE_SIZE, "%d\n",
1987 be32_to_cpu(hostdata->madapter_info.partition_number));
1988 return len;
1989}
1990
1991static struct device_attribute ibmvscsi_host_partition_number = {
1992 .attr = {
1993 .name = "partition_number",
1994 .mode = S_IRUGO,
1995 },
1996 .show = show_host_partition_number,
1997};
1998
1999static ssize_t show_host_mad_version(struct device *dev,
2000 struct device_attribute *attr, char *buf)
2001{
2002 struct Scsi_Host *shost = class_to_shost(dev);
2003 struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2004 int len;
2005
2006 len = snprintf(buf, PAGE_SIZE, "%d\n",
2007 be32_to_cpu(hostdata->madapter_info.mad_version));
2008 return len;
2009}
2010
2011static struct device_attribute ibmvscsi_host_mad_version = {
2012 .attr = {
2013 .name = "mad_version",
2014 .mode = S_IRUGO,
2015 },
2016 .show = show_host_mad_version,
2017};
2018
2019static ssize_t show_host_os_type(struct device *dev,
2020 struct device_attribute *attr, char *buf)
2021{
2022 struct Scsi_Host *shost = class_to_shost(dev);
2023 struct ibmvscsi_host_data *hostdata = shost_priv(shost);
2024 int len;
2025
2026 len = snprintf(buf, PAGE_SIZE, "%d\n",
2027 be32_to_cpu(hostdata->madapter_info.os_type));
2028 return len;
2029}
2030
2031static struct device_attribute ibmvscsi_host_os_type = {
2032 .attr = {
2033 .name = "os_type",
2034 .mode = S_IRUGO,
2035 },
2036 .show = show_host_os_type,
2037};
2038
2039static ssize_t show_host_config(struct device *dev,
2040 struct device_attribute *attr, char *buf)
2041{
2042 return 0;
2043}
2044
2045static struct device_attribute ibmvscsi_host_config = {
2046 .attr = {
2047 .name = "config",
2048 .mode = S_IRUGO,
2049 },
2050 .show = show_host_config,
2051};
2052
2053static struct device_attribute *ibmvscsi_attrs[] = {
2054 &ibmvscsi_host_vhost_loc,
2055 &ibmvscsi_host_vhost_name,
2056 &ibmvscsi_host_srp_version,
2057 &ibmvscsi_host_partition_name,
2058 &ibmvscsi_host_partition_number,
2059 &ibmvscsi_host_mad_version,
2060 &ibmvscsi_host_os_type,
2061 &ibmvscsi_host_config,
2062 NULL
2063};
2064
2065/* ------------------------------------------------------------
2066 * SCSI driver registration
2067 */
2068static struct scsi_host_template driver_template = {
2069 .module = THIS_MODULE,
2070 .name = "IBM POWER Virtual SCSI Adapter " IBMVSCSI_VERSION,
2071 .proc_name = "ibmvscsi",
2072 .queuecommand = ibmvscsi_queuecommand,
2073 .eh_timed_out = srp_timed_out,
2074 .eh_abort_handler = ibmvscsi_eh_abort_handler,
2075 .eh_device_reset_handler = ibmvscsi_eh_device_reset_handler,
2076 .eh_host_reset_handler = ibmvscsi_eh_host_reset_handler,
2077 .slave_configure = ibmvscsi_slave_configure,
2078 .change_queue_depth = ibmvscsi_change_queue_depth,
2079 .cmd_per_lun = IBMVSCSI_CMDS_PER_LUN_DEFAULT,
2080 .can_queue = IBMVSCSI_MAX_REQUESTS_DEFAULT,
2081 .this_id = -1,
2082 .sg_tablesize = SG_ALL,
2083 .use_clustering = ENABLE_CLUSTERING,
2084 .shost_attrs = ibmvscsi_attrs,
2085};
2086
2087/**
2088 * ibmvscsi_get_desired_dma - Calculate IO memory desired by the driver
2089 *
2090 * @vdev: struct vio_dev for the device whose desired IO mem is to be returned
2091 *
2092 * Return value:
2093 * Number of bytes of IO data the driver will need to perform well.
2094 */
2095static unsigned long ibmvscsi_get_desired_dma(struct vio_dev *vdev)
2096{
2097 /* iu_storage data allocated in initialize_event_pool */
2098 unsigned long desired_io = max_events * sizeof(union viosrp_iu);
2099
2100 /* add io space for sg data */
2101 desired_io += (IBMVSCSI_MAX_SECTORS_DEFAULT * 512 *
2102 IBMVSCSI_CMDS_PER_LUN_DEFAULT);
2103
2104 return desired_io;
2105}
2106
2107static void ibmvscsi_do_work(struct ibmvscsi_host_data *hostdata)
2108{
2109 int rc;
2110 char *action = "reset";
2111
2112 if (hostdata->reset_crq) {
2113 smp_rmb();
2114 hostdata->reset_crq = 0;
2115
2116 rc = ibmvscsi_reset_crq_queue(&hostdata->queue, hostdata);
2117 if (!rc)
2118 rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
2119 vio_enable_interrupts(to_vio_dev(hostdata->dev));
2120 } else if (hostdata->reenable_crq) {
2121 smp_rmb();
2122 action = "enable";
2123 rc = ibmvscsi_reenable_crq_queue(&hostdata->queue, hostdata);
2124 hostdata->reenable_crq = 0;
2125 if (!rc)
2126 rc = ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0);
2127 } else
2128 return;
2129
2130 if (rc) {
2131 atomic_set(&hostdata->request_limit, -1);
2132 dev_err(hostdata->dev, "error after %s\n", action);
2133 }
2134
2135 scsi_unblock_requests(hostdata->host);
2136}
2137
2138static int ibmvscsi_work_to_do(struct ibmvscsi_host_data *hostdata)
2139{
2140 if (kthread_should_stop())
2141 return 1;
2142 else if (hostdata->reset_crq) {
2143 smp_rmb();
2144 return 1;
2145 } else if (hostdata->reenable_crq) {
2146 smp_rmb();
2147 return 1;
2148 }
2149
2150 return 0;
2151}
2152
2153static int ibmvscsi_work(void *data)
2154{
2155 struct ibmvscsi_host_data *hostdata = data;
2156 int rc;
2157
2158 set_user_nice(current, MIN_NICE);
2159
2160 while (1) {
2161 rc = wait_event_interruptible(hostdata->work_wait_q,
2162 ibmvscsi_work_to_do(hostdata));
2163
2164 BUG_ON(rc);
2165
2166 if (kthread_should_stop())
2167 break;
2168
2169 ibmvscsi_do_work(hostdata);
2170 }
2171
2172 return 0;
2173}
2174
2175/**
2176 * Called by bus code for each adapter
2177 */
2178static int ibmvscsi_probe(struct vio_dev *vdev, const struct vio_device_id *id)
2179{
2180 struct ibmvscsi_host_data *hostdata;
2181 struct Scsi_Host *host;
2182 struct device *dev = &vdev->dev;
2183 struct srp_rport_identifiers ids;
2184 struct srp_rport *rport;
2185 unsigned long wait_switch = 0;
2186 int rc;
2187
2188 dev_set_drvdata(&vdev->dev, NULL);
2189
2190 host = scsi_host_alloc(&driver_template, sizeof(*hostdata));
2191 if (!host) {
2192 dev_err(&vdev->dev, "couldn't allocate host data\n");
2193 goto scsi_host_alloc_failed;
2194 }
2195
2196 host->transportt = ibmvscsi_transport_template;
2197 hostdata = shost_priv(host);
2198 memset(hostdata, 0x00, sizeof(*hostdata));
2199 INIT_LIST_HEAD(&hostdata->sent);
2200 init_waitqueue_head(&hostdata->work_wait_q);
2201 hostdata->host = host;
2202 hostdata->dev = dev;
2203 atomic_set(&hostdata->request_limit, -1);
2204 hostdata->host->max_sectors = IBMVSCSI_MAX_SECTORS_DEFAULT;
2205
2206 if (map_persist_bufs(hostdata)) {
2207 dev_err(&vdev->dev, "couldn't map persistent buffers\n");
2208 goto persist_bufs_failed;
2209 }
2210
2211 hostdata->work_thread = kthread_run(ibmvscsi_work, hostdata, "%s_%d",
2212 "ibmvscsi", host->host_no);
2213
2214 if (IS_ERR(hostdata->work_thread)) {
2215 dev_err(&vdev->dev, "couldn't initialize kthread. rc=%ld\n",
2216 PTR_ERR(hostdata->work_thread));
2217 goto init_crq_failed;
2218 }
2219
2220 rc = ibmvscsi_init_crq_queue(&hostdata->queue, hostdata, max_events);
2221 if (rc != 0 && rc != H_RESOURCE) {
2222 dev_err(&vdev->dev, "couldn't initialize crq. rc=%d\n", rc);
2223 goto kill_kthread;
2224 }
2225 if (initialize_event_pool(&hostdata->pool, max_events, hostdata) != 0) {
2226 dev_err(&vdev->dev, "couldn't initialize event pool\n");
2227 goto init_pool_failed;
2228 }
2229
2230 host->max_lun = IBMVSCSI_MAX_LUN;
2231 host->max_id = max_id;
2232 host->max_channel = max_channel;
2233 host->max_cmd_len = 16;
2234
2235 dev_info(dev,
2236 "Maximum ID: %d Maximum LUN: %llu Maximum Channel: %d\n",
2237 host->max_id, host->max_lun, host->max_channel);
2238
2239 if (scsi_add_host(hostdata->host, hostdata->dev))
2240 goto add_host_failed;
2241
2242 /* we don't have a proper target_port_id so let's use the fake one */
2243 memcpy(ids.port_id, hostdata->madapter_info.partition_name,
2244 sizeof(ids.port_id));
2245 ids.roles = SRP_RPORT_ROLE_TARGET;
2246 rport = srp_rport_add(host, &ids);
2247 if (IS_ERR(rport))
2248 goto add_srp_port_failed;
2249
2250 /* Try to send an initialization message. Note that this is allowed
2251 * to fail if the other end is not acive. In that case we don't
2252 * want to scan
2253 */
2254 if (ibmvscsi_send_crq(hostdata, 0xC001000000000000LL, 0) == 0
2255 || rc == H_RESOURCE) {
2256 /*
2257 * Wait around max init_timeout secs for the adapter to finish
2258 * initializing. When we are done initializing, we will have a
2259 * valid request_limit. We don't want Linux scanning before
2260 * we are ready.
2261 */
2262 for (wait_switch = jiffies + (init_timeout * HZ);
2263 time_before(jiffies, wait_switch) &&
2264 atomic_read(&hostdata->request_limit) < 2;) {
2265
2266 msleep(10);
2267 }
2268
2269 /* if we now have a valid request_limit, initiate a scan */
2270 if (atomic_read(&hostdata->request_limit) > 0)
2271 scsi_scan_host(host);
2272 }
2273
2274 dev_set_drvdata(&vdev->dev, hostdata);
2275 spin_lock(&ibmvscsi_driver_lock);
2276 list_add_tail(&hostdata->host_list, &ibmvscsi_head);
2277 spin_unlock(&ibmvscsi_driver_lock);
2278 return 0;
2279
2280 add_srp_port_failed:
2281 scsi_remove_host(hostdata->host);
2282 add_host_failed:
2283 release_event_pool(&hostdata->pool, hostdata);
2284 init_pool_failed:
2285 ibmvscsi_release_crq_queue(&hostdata->queue, hostdata, max_events);
2286 kill_kthread:
2287 kthread_stop(hostdata->work_thread);
2288 init_crq_failed:
2289 unmap_persist_bufs(hostdata);
2290 persist_bufs_failed:
2291 scsi_host_put(host);
2292 scsi_host_alloc_failed:
2293 return -1;
2294}
2295
2296static int ibmvscsi_remove(struct vio_dev *vdev)
2297{
2298 struct ibmvscsi_host_data *hostdata = dev_get_drvdata(&vdev->dev);
2299 unsigned long flags;
2300
2301 srp_remove_host(hostdata->host);
2302 scsi_remove_host(hostdata->host);
2303
2304 purge_requests(hostdata, DID_ERROR);
2305
2306 spin_lock_irqsave(hostdata->host->host_lock, flags);
2307 release_event_pool(&hostdata->pool, hostdata);
2308 spin_unlock_irqrestore(hostdata->host->host_lock, flags);
2309
2310 ibmvscsi_release_crq_queue(&hostdata->queue, hostdata,
2311 max_events);
2312
2313 kthread_stop(hostdata->work_thread);
2314 unmap_persist_bufs(hostdata);
2315
2316 spin_lock(&ibmvscsi_driver_lock);
2317 list_del(&hostdata->host_list);
2318 spin_unlock(&ibmvscsi_driver_lock);
2319
2320 scsi_host_put(hostdata->host);
2321
2322 return 0;
2323}
2324
2325/**
2326 * ibmvscsi_resume: Resume from suspend
2327 * @dev: device struct
2328 *
2329 * We may have lost an interrupt across suspend/resume, so kick the
2330 * interrupt handler
2331 */
2332static int ibmvscsi_resume(struct device *dev)
2333{
2334 struct ibmvscsi_host_data *hostdata = dev_get_drvdata(dev);
2335 vio_disable_interrupts(to_vio_dev(hostdata->dev));
2336 tasklet_schedule(&hostdata->srp_task);
2337
2338 return 0;
2339}
2340
2341/**
2342 * ibmvscsi_device_table: Used by vio.c to match devices in the device tree we
2343 * support.
2344 */
2345static const struct vio_device_id ibmvscsi_device_table[] = {
2346 {"vscsi", "IBM,v-scsi"},
2347 { "", "" }
2348};
2349MODULE_DEVICE_TABLE(vio, ibmvscsi_device_table);
2350
2351static const struct dev_pm_ops ibmvscsi_pm_ops = {
2352 .resume = ibmvscsi_resume
2353};
2354
2355static struct vio_driver ibmvscsi_driver = {
2356 .id_table = ibmvscsi_device_table,
2357 .probe = ibmvscsi_probe,
2358 .remove = ibmvscsi_remove,
2359 .get_desired_dma = ibmvscsi_get_desired_dma,
2360 .name = "ibmvscsi",
2361 .pm = &ibmvscsi_pm_ops,
2362};
2363
2364static struct srp_function_template ibmvscsi_transport_functions = {
2365};
2366
2367int __init ibmvscsi_module_init(void)
2368{
2369 int ret;
2370
2371 /* Ensure we have two requests to do error recovery */
2372 driver_template.can_queue = max_requests;
2373 max_events = max_requests + 2;
2374
2375 if (!firmware_has_feature(FW_FEATURE_VIO))
2376 return -ENODEV;
2377
2378 ibmvscsi_transport_template =
2379 srp_attach_transport(&ibmvscsi_transport_functions);
2380 if (!ibmvscsi_transport_template)
2381 return -ENOMEM;
2382
2383 ret = vio_register_driver(&ibmvscsi_driver);
2384 if (ret)
2385 srp_release_transport(ibmvscsi_transport_template);
2386 return ret;
2387}
2388
2389void __exit ibmvscsi_module_exit(void)
2390{
2391 vio_unregister_driver(&ibmvscsi_driver);
2392 srp_release_transport(ibmvscsi_transport_template);
2393}
2394
2395module_init(ibmvscsi_module_init);
2396module_exit(ibmvscsi_module_exit);