1 From: Gerald Schaefer <geraldsc@de.ibm.com>
2 Subject: cio: failing set online/offline processing
3 References: bnc#533267,LTC#55510
5 Symptom: A set online or set offline fails for a DASD device.
6 Afterwards this device can neither be set online nor offline.
7 Problem: When unit checks trigger sensing, the device state is set to W4SENSE
8 until sense completion; then the device state is set back to
9 ONLINE. If a unit check occurs while set online or set offline
10 requests are processed then it might happen that the device's
11 temporary W4SENSE state causes these functions to terminate,
12 leaving the device in an inconsistent state when the state is set
13 back to ONLINE later on so that the device cannot be set online or offline.
15 Solution: Process set online/offline and related rollback or error routines
16 only if the device is in a final or DISCONNECTED state.
18 Acked-by: John Jolly <jjolly@suse.de>
20 Index: linux-sles11/drivers/s390/cio/device.c
21 ===================================================================
22 --- linux-sles11.orig/drivers/s390/cio/device.c 2009-08-18 13:31:25.000000000 +0200
23 +++ linux-sles11/drivers/s390/cio/device.c 2009-08-18 13:36:48.000000000 +0200
27 spin_lock_irq(cdev->ccwlock);
28 - ret = ccw_device_offline(cdev);
29 - if (ret == -ENODEV) {
30 - if (cdev->private->state != DEV_STATE_NOT_OPER) {
31 - cdev->private->state = DEV_STATE_OFFLINE;
32 - dev_fsm_event(cdev, DEV_EVENT_NOTOPER);
34 + /* Wait until a final state or DISCONNECTED is reached */
35 + while (!dev_fsm_final_state(cdev) &&
36 + cdev->private->state != DEV_STATE_DISCONNECTED) {
37 spin_unlock_irq(cdev->ccwlock);
39 + wait_event(cdev->private->wait_q, (dev_fsm_final_state(cdev) ||
40 + cdev->private->state == DEV_STATE_DISCONNECTED));
41 + spin_lock_irq(cdev->ccwlock);
43 + ret = ccw_device_offline(cdev);
46 spin_unlock_irq(cdev->ccwlock);
48 - wait_event(cdev->private->wait_q, dev_fsm_final_state(cdev));
50 - CIO_MSG_EVENT(0, "ccw_device_offline returned %d, "
51 - "device 0.%x.%04x\n",
52 - ret, cdev->private->dev_id.ssid,
53 - cdev->private->dev_id.devno);
57 + wait_event(cdev->private->wait_q, (dev_fsm_final_state(cdev) ||
58 + cdev->private->state == DEV_STATE_DISCONNECTED));
62 + CIO_MSG_EVENT(0, "ccw_device_offline returned %d, device 0.%x.%04x\n",
63 + ret, cdev->private->dev_id.ssid,
64 + cdev->private->dev_id.devno);
65 + cdev->private->state = DEV_STATE_OFFLINE;
66 + dev_fsm_event(cdev, DEV_EVENT_NOTOPER);
67 + spin_unlock_irq(cdev->ccwlock);
73 int ccw_device_set_online(struct ccw_device *cdev)
81 cdev->private->dev_id.devno);
84 - if (cdev->private->state != DEV_STATE_ONLINE)
85 + spin_lock_irq(cdev->ccwlock);
86 + /* Check if online processing was successful */
87 + if ((cdev->private->state != DEV_STATE_ONLINE) &&
88 + (cdev->private->state != DEV_STATE_W4SENSE)) {
89 + spin_unlock_irq(cdev->ccwlock);
91 - if (!cdev->drv->set_online || cdev->drv->set_online(cdev) == 0) {
95 + spin_unlock_irq(cdev->ccwlock);
96 + if (cdev->drv->set_online)
97 + ret = cdev->drv->set_online(cdev);
104 spin_lock_irq(cdev->ccwlock);
105 - ret = ccw_device_offline(cdev);
106 + /* Wait until a final state or DISCONNECTED is reached */
107 + while (!dev_fsm_final_state(cdev) &&
108 + cdev->private->state != DEV_STATE_DISCONNECTED) {
109 + spin_unlock_irq(cdev->ccwlock);
110 + wait_event(cdev->private->wait_q, (dev_fsm_final_state(cdev) ||
111 + cdev->private->state == DEV_STATE_DISCONNECTED));
112 + spin_lock_irq(cdev->ccwlock);
114 + ret2 = ccw_device_offline(cdev);
117 spin_unlock_irq(cdev->ccwlock);
119 - wait_event(cdev->private->wait_q, dev_fsm_final_state(cdev));
121 - CIO_MSG_EVENT(0, "ccw_device_offline returned %d, "
122 - "device 0.%x.%04x\n",
123 - ret, cdev->private->dev_id.ssid,
124 - cdev->private->dev_id.devno);
125 - return (ret == 0) ? -ENODEV : ret;
126 + wait_event(cdev->private->wait_q, (dev_fsm_final_state(cdev) ||
127 + cdev->private->state == DEV_STATE_DISCONNECTED));
131 + CIO_MSG_EVENT(0, "rollback ccw_device_offline returned %d, "
132 + "device 0.%x.%04x\n",
133 + ret2, cdev->private->dev_id.ssid,
134 + cdev->private->dev_id.devno);
135 + cdev->private->state = DEV_STATE_OFFLINE;
136 + spin_unlock_irq(cdev->ccwlock);
140 static void online_store_handle_offline(struct ccw_device *cdev)
141 Index: linux-sles11/drivers/s390/cio/device_fsm.c
142 ===================================================================
143 --- linux-sles11.orig/drivers/s390/cio/device_fsm.c 2009-08-18 13:31:26.000000000 +0200
144 +++ linux-sles11/drivers/s390/cio/device_fsm.c 2009-08-18 13:32:47.000000000 +0200
148 cdev->private->state = DEV_STATE_ONLINE;
149 + /* In case sensing interfered with setting the device online */
150 + wake_up(&cdev->private->wait_q);
151 /* Call the handler. */
152 if (ccw_device_call_handler(cdev) && cdev->private->flags.doverify)
153 /* Start delayed path verification. */