2 * File...........: linux/drivers/s390/block/dasd_3990_erp.c
3 * Author(s)......: Horst Hummel <Horst.Hummel@de.ibm.com>
4 * Holger Smolinski <Holger.Smolinski@de.ibm.com>
5 * Bugreports.to..: <Linux390@de.ibm.com>
6 * (C) IBM Corporation, IBM Deutschland Entwicklung GmbH, 2000, 2001
10 #define KMSG_COMPONENT "dasd-eckd"
12 #include <linux/timer.h>
13 #include <linux/slab.h>
14 #include <asm/idals.h>
16 #define PRINTK_HEADER "dasd_erp(3990): "
19 #include "dasd_eckd.h"
23 unsigned char subcommand; /* e.g Inhibit Write, Enable Write,... */
24 unsigned char modifier; /* Subcommand modifier */
25 unsigned short res; /* reserved */
26 } __attribute__ ((packed));
29 *****************************************************************************
30 * SECTION ERP HANDLING
31 *****************************************************************************
34 *****************************************************************************
35 * 24 and 32 byte sense ERP functions
36 *****************************************************************************
40 * DASD_3990_ERP_CLEANUP
43 * Removes the already built but no longer necessary ERP request and sets
44 * the status of the original cqr / erp to the given (final) status
47 * erp request to be removed
48 * final_status either DASD_CQR_DONE or DASD_CQR_FAILED
53 static struct dasd_ccw_req *
54 dasd_3990_erp_cleanup(struct dasd_ccw_req * erp, char final_status)
56 struct dasd_ccw_req *cqr = erp->refers;
58 dasd_free_erp_request(erp, erp->memdev);
59 cqr->status = final_status;
62 } /* end dasd_3990_erp_cleanup */
65 * DASD_3990_ERP_BLOCK_QUEUE
68 * Block the given device request queue to prevent further
69 * processing until the started timer has expired or a related
70 * interrupt has been received.
72 static void dasd_3990_erp_block_queue(struct dasd_ccw_req *erp, int expires)
75 struct dasd_device *device = erp->startdev;
78 DBF_DEV_EVENT(DBF_INFO, device,
79 "blocking request queue for %is", expires/HZ);
81 spin_lock_irqsave(get_ccwdev_lock(device->cdev), flags);
82 dasd_device_set_stop_bits(device, DASD_STOPPED_PENDING);
83 spin_unlock_irqrestore(get_ccwdev_lock(device->cdev), flags);
84 erp->status = DASD_CQR_FILLED;
86 dasd_block_set_timer(erp->block, expires);
88 dasd_device_set_timer(device, expires);
92 * DASD_3990_ERP_INT_REQ
95 * Handles 'Intervention Required' error.
96 * This means either device offline or not installed.
103 static struct dasd_ccw_req *
104 dasd_3990_erp_int_req(struct dasd_ccw_req * erp)
107 struct dasd_device *device = erp->startdev;
109 /* first time set initial retry counter and erp_function */
110 /* and retry once without blocking queue */
111 /* (this enables easier enqueueing of the cqr) */
112 if (erp->function != dasd_3990_erp_int_req) {
115 erp->function = dasd_3990_erp_int_req;
119 /* issue a message and wait for 'device ready' interrupt */
120 dev_err(&device->cdev->dev,
121 "is offline or not installed - "
122 "INTERVENTION REQUIRED!!\n");
124 dasd_3990_erp_block_queue(erp, 60*HZ);
129 } /* end dasd_3990_erp_int_req */
132 * DASD_3990_ERP_ALTERNATE_PATH
135 * Repeat the operation on a different channel path.
136 * If all alternate paths have been tried, the request is posted with a
140 * erp pointer to the current ERP
143 * erp modified pointer to the ERP
146 dasd_3990_erp_alternate_path(struct dasd_ccw_req * erp)
148 struct dasd_device *device = erp->startdev;
152 /* try alternate valid path */
153 spin_lock_irqsave(get_ccwdev_lock(device->cdev), flags);
154 opm = ccw_device_get_path_mask(device->cdev);
155 spin_unlock_irqrestore(get_ccwdev_lock(device->cdev), flags);
156 //FIXME: start with get_opm ?
158 erp->lpm = LPM_ANYPATH & ~(erp->irb.esw.esw0.sublog.lpum);
160 erp->lpm &= ~(erp->irb.esw.esw0.sublog.lpum);
162 if ((erp->lpm & opm) != 0x00) {
164 DBF_DEV_EVENT(DBF_WARNING, device,
165 "try alternate lpm=%x (lpum=%x / opm=%x)",
166 erp->lpm, erp->irb.esw.esw0.sublog.lpum, opm);
168 /* reset status to submit the request again... */
169 erp->status = DASD_CQR_FILLED;
172 dev_err(&device->cdev->dev,
173 "The DASD cannot be reached on any path (lpum=%x"
174 "/opm=%x)\n", erp->irb.esw.esw0.sublog.lpum, opm);
176 /* post request with permanent error */
177 erp->status = DASD_CQR_FAILED;
179 } /* end dasd_3990_erp_alternate_path */
185 * Setup cqr to do the Diagnostic Control (DCTL) command with an
186 * Inhibit Write subcommand (0x02) and the given modifier.
189 * erp pointer to the current (failed) ERP
190 * modifier subcommand modifier
193 * dctl_cqr pointer to NEW dctl_cqr
196 static struct dasd_ccw_req *
197 dasd_3990_erp_DCTL(struct dasd_ccw_req * erp, char modifier)
200 struct dasd_device *device = erp->startdev;
201 struct DCTL_data *DCTL_data;
203 struct dasd_ccw_req *dctl_cqr;
205 dctl_cqr = dasd_alloc_erp_request((char *) &erp->magic, 1,
206 sizeof(struct DCTL_data),
208 if (IS_ERR(dctl_cqr)) {
209 dev_err(&device->cdev->dev,
210 "Unable to allocate DCTL-CQR\n");
211 erp->status = DASD_CQR_FAILED;
215 DCTL_data = dctl_cqr->data;
217 DCTL_data->subcommand = 0x02; /* Inhibit Write */
218 DCTL_data->modifier = modifier;
220 ccw = dctl_cqr->cpaddr;
221 memset(ccw, 0, sizeof(struct ccw1));
222 ccw->cmd_code = CCW_CMD_DCTL;
224 ccw->cda = (__u32)(addr_t) DCTL_data;
225 dctl_cqr->function = dasd_3990_erp_DCTL;
226 dctl_cqr->refers = erp;
227 dctl_cqr->startdev = device;
228 dctl_cqr->memdev = device;
229 dctl_cqr->magic = erp->magic;
230 dctl_cqr->expires = 5 * 60 * HZ;
231 dctl_cqr->retries = 2;
233 dctl_cqr->buildclk = get_clock();
235 dctl_cqr->status = DASD_CQR_FILLED;
239 } /* end dasd_3990_erp_DCTL */
242 * DASD_3990_ERP_ACTION_1
245 * Setup ERP to do the ERP action 1 (see Reference manual).
246 * Repeat the operation on a different channel path.
247 * As deviation from the recommended recovery action, we reset the path mask
248 * after we have tried each path and go through all paths a second time.
249 * This will cover situations where only one path at a time is actually down,
250 * but all paths fail and recover just with the same sequence and timing as
251 * we try to use them (flapping links).
252 * If all alternate paths have been tried twice, the request is posted with
256 * erp pointer to the current ERP
259 * erp pointer to the ERP
262 static struct dasd_ccw_req *dasd_3990_erp_action_1_sec(struct dasd_ccw_req *erp)
264 erp->function = dasd_3990_erp_action_1_sec;
265 dasd_3990_erp_alternate_path(erp);
269 static struct dasd_ccw_req *dasd_3990_erp_action_1(struct dasd_ccw_req *erp)
271 erp->function = dasd_3990_erp_action_1;
272 dasd_3990_erp_alternate_path(erp);
273 if (erp->status == DASD_CQR_FAILED) {
274 erp->status = DASD_CQR_FILLED;
276 erp->lpm = LPM_ANYPATH;
277 erp->function = dasd_3990_erp_action_1_sec;
280 } /* end dasd_3990_erp_action_1(b) */
283 * DASD_3990_ERP_ACTION_4
286 * Setup ERP to do the ERP action 4 (see Reference manual).
287 * Set the current request to PENDING to block the CQR queue for that device
288 * until the state change interrupt appears.
289 * Use a timer (30 seconds) to retry the cqr if the interrupt is still
293 * sense sense data of the actual error
294 * erp pointer to the current ERP
297 * erp pointer to the ERP
300 static struct dasd_ccw_req *
301 dasd_3990_erp_action_4(struct dasd_ccw_req * erp, char *sense)
304 struct dasd_device *device = erp->startdev;
306 /* first time set initial retry counter and erp_function */
307 /* and retry once without waiting for state change pending */
308 /* interrupt (this enables easier enqueueing of the cqr) */
309 if (erp->function != dasd_3990_erp_action_4) {
311 DBF_DEV_EVENT(DBF_INFO, device, "%s",
312 "dasd_3990_erp_action_4: first time retry");
315 erp->function = dasd_3990_erp_action_4;
318 if (sense && (sense[25] == 0x1D)) { /* state change pending */
320 DBF_DEV_EVENT(DBF_INFO, device,
321 "waiting for state change pending "
322 "interrupt, %d retries left",
325 dasd_3990_erp_block_queue(erp, 30*HZ);
327 } else if (sense && (sense[25] == 0x1E)) { /* busy */
328 DBF_DEV_EVENT(DBF_INFO, device,
329 "busy - redriving request later, "
332 dasd_3990_erp_block_queue(erp, HZ);
334 /* no state change pending - retry */
335 DBF_DEV_EVENT(DBF_INFO, device,
336 "redriving request immediately, "
339 erp->status = DASD_CQR_FILLED;
345 } /* end dasd_3990_erp_action_4 */
348 *****************************************************************************
349 * 24 byte sense ERP functions (only)
350 *****************************************************************************
354 * DASD_3990_ERP_ACTION_5
357 * Setup ERP to do the ERP action 5 (see Reference manual).
358 * NOTE: Further handling is done in xxx_further_erp after the retries.
361 * erp pointer to the current ERP
364 * erp pointer to the ERP
367 static struct dasd_ccw_req *
368 dasd_3990_erp_action_5(struct dasd_ccw_req * erp)
371 /* first of all retry */
373 erp->function = dasd_3990_erp_action_5;
377 } /* end dasd_3990_erp_action_5 */
380 * DASD_3990_HANDLE_ENV_DATA
383 * Handles 24 byte 'Environmental data present'.
384 * Does an analysis of the sense data (message format)
385 * and prints the error messages.
388 * sense current sense data
394 dasd_3990_handle_env_data(struct dasd_ccw_req * erp, char *sense)
397 struct dasd_device *device = erp->startdev;
398 char msg_format = (sense[7] & 0xF0);
399 char msg_no = (sense[7] & 0x0F);
400 char errorstring[ERRORLENGTH];
402 switch (msg_format) {
403 case 0x00: /* Format 0 - Program or System Checks */
405 if (sense[1] & 0x10) { /* check message to operator bit */
408 case 0x00: /* No Message */
411 dev_warn(&device->cdev->dev,
412 "FORMAT 0 - Invalid Command\n");
415 dev_warn(&device->cdev->dev,
416 "FORMAT 0 - Invalid Command "
420 dev_warn(&device->cdev->dev,
421 "FORMAT 0 - CCW Count less than "
425 dev_warn(&device->cdev->dev,
426 "FORMAT 0 - Invalid Parameter\n");
429 dev_warn(&device->cdev->dev,
430 "FORMAT 0 - Diagnostic of Special"
431 " Command Violates File Mask\n");
434 dev_warn(&device->cdev->dev,
435 "FORMAT 0 - Channel Returned with "
436 "Incorrect retry CCW\n");
439 dev_warn(&device->cdev->dev,
440 "FORMAT 0 - Reset Notification\n");
443 dev_warn(&device->cdev->dev,
444 "FORMAT 0 - Storage Path Restart\n");
447 dev_warn(&device->cdev->dev,
448 "FORMAT 0 - Channel requested "
449 "... %02x\n", sense[8]);
452 dev_warn(&device->cdev->dev,
453 "FORMAT 0 - Invalid Defective/"
454 "Alternate Track Pointer\n");
457 dev_warn(&device->cdev->dev,
458 "FORMAT 0 - DPS Installation "
462 dev_warn(&device->cdev->dev,
463 "FORMAT 0 - Command Invalid on "
464 "Secondary Address\n");
467 dev_warn(&device->cdev->dev,
468 "FORMAT 0 - Status Not As "
469 "Required: reason %02x\n",
473 dev_warn(&device->cdev->dev,
474 "FORMAT 0 - Reserved\n");
478 case 0x00: /* No Message */
481 dev_warn(&device->cdev->dev,
482 "FORMAT 0 - Device Error "
486 dev_warn(&device->cdev->dev,
487 "FORMAT 0 - Reserved\n");
490 dev_warn(&device->cdev->dev,
491 "FORMAT 0 - Device Fenced - "
492 "device = %02x\n", sense[4]);
495 dev_warn(&device->cdev->dev,
496 "FORMAT 0 - Data Pinned for "
500 dev_warn(&device->cdev->dev,
501 "FORMAT 0 - Reserved\n");
506 case 0x10: /* Format 1 - Device Equipment Checks */
508 case 0x00: /* No Message */
511 dev_warn(&device->cdev->dev,
512 "FORMAT 1 - Device Status 1 not as "
516 dev_warn(&device->cdev->dev,
517 "FORMAT 1 - Index missing\n");
520 dev_warn(&device->cdev->dev,
521 "FORMAT 1 - Interruption cannot be "
525 dev_warn(&device->cdev->dev,
526 "FORMAT 1 - Device did not respond to "
530 dev_warn(&device->cdev->dev,
531 "FORMAT 1 - Device check-2 error or Set "
532 "Sector is not complete\n");
535 dev_warn(&device->cdev->dev,
536 "FORMAT 1 - Head address does not "
540 dev_warn(&device->cdev->dev,
541 "FORMAT 1 - Device status 1 not valid\n");
544 dev_warn(&device->cdev->dev,
545 "FORMAT 1 - Device not ready\n");
548 dev_warn(&device->cdev->dev,
549 "FORMAT 1 - Track physical address did "
553 dev_warn(&device->cdev->dev,
554 "FORMAT 1 - Missing device address bit\n");
557 dev_warn(&device->cdev->dev,
558 "FORMAT 1 - Drive motor switch is off\n");
561 dev_warn(&device->cdev->dev,
562 "FORMAT 1 - Seek incomplete\n");
565 dev_warn(&device->cdev->dev,
566 "FORMAT 1 - Cylinder address did not "
570 dev_warn(&device->cdev->dev,
571 "FORMAT 1 - Offset active cannot be "
575 dev_warn(&device->cdev->dev,
576 "FORMAT 1 - Reserved\n");
580 case 0x20: /* Format 2 - 3990 Equipment Checks */
583 dev_warn(&device->cdev->dev,
584 "FORMAT 2 - 3990 check-2 error\n");
587 dev_warn(&device->cdev->dev,
588 "FORMAT 2 - Support facility errors\n");
591 dev_warn(&device->cdev->dev,
592 "FORMAT 2 - Microcode detected error "
597 dev_warn(&device->cdev->dev,
598 "FORMAT 2 - Reserved\n");
602 case 0x30: /* Format 3 - 3990 Control Checks */
605 dev_warn(&device->cdev->dev,
606 "FORMAT 3 - Allegiance terminated\n");
609 dev_warn(&device->cdev->dev,
610 "FORMAT 3 - Reserved\n");
614 case 0x40: /* Format 4 - Data Checks */
617 dev_warn(&device->cdev->dev,
618 "FORMAT 4 - Home address area error\n");
621 dev_warn(&device->cdev->dev,
622 "FORMAT 4 - Count area error\n");
625 dev_warn(&device->cdev->dev,
626 "FORMAT 4 - Key area error\n");
629 dev_warn(&device->cdev->dev,
630 "FORMAT 4 - Data area error\n");
633 dev_warn(&device->cdev->dev,
634 "FORMAT 4 - No sync byte in home address "
638 dev_warn(&device->cdev->dev,
639 "FORMAT 4 - No sync byte in count address "
643 dev_warn(&device->cdev->dev,
644 "FORMAT 4 - No sync byte in key area\n");
647 dev_warn(&device->cdev->dev,
648 "FORMAT 4 - No sync byte in data area\n");
651 dev_warn(&device->cdev->dev,
652 "FORMAT 4 - Home address area error; "
656 dev_warn(&device->cdev->dev,
657 "FORMAT 4 - Count area error; offset "
661 dev_warn(&device->cdev->dev,
662 "FORMAT 4 - Key area error; offset "
666 dev_warn(&device->cdev->dev,
667 "FORMAT 4 - Data area error; "
671 dev_warn(&device->cdev->dev,
672 "FORMAT 4 - No sync byte in home "
673 "address area; offset active\n");
676 dev_warn(&device->cdev->dev,
677 "FORMAT 4 - No sync byte in count "
678 "address area; offset active\n");
681 dev_warn(&device->cdev->dev,
682 "FORMAT 4 - No sync byte in key area; "
686 dev_warn(&device->cdev->dev,
687 "FORMAT 4 - No sync byte in data area; "
691 dev_warn(&device->cdev->dev,
692 "FORMAT 4 - Reserved\n");
696 case 0x50: /* Format 5 - Data Check with displacement information */
699 dev_warn(&device->cdev->dev,
700 "FORMAT 5 - Data Check in the "
701 "home address area\n");
704 dev_warn(&device->cdev->dev,
705 "FORMAT 5 - Data Check in the count "
709 dev_warn(&device->cdev->dev,
710 "FORMAT 5 - Data Check in the key area\n");
713 dev_warn(&device->cdev->dev,
714 "FORMAT 5 - Data Check in the data "
718 dev_warn(&device->cdev->dev,
719 "FORMAT 5 - Data Check in the "
720 "home address area; offset active\n");
723 dev_warn(&device->cdev->dev,
724 "FORMAT 5 - Data Check in the count area; "
728 dev_warn(&device->cdev->dev,
729 "FORMAT 5 - Data Check in the key area; "
733 dev_warn(&device->cdev->dev,
734 "FORMAT 5 - Data Check in the data area; "
738 dev_warn(&device->cdev->dev,
739 "FORMAT 5 - Reserved\n");
743 case 0x60: /* Format 6 - Usage Statistics/Overrun Errors */
746 dev_warn(&device->cdev->dev,
747 "FORMAT 6 - Overrun on channel A\n");
750 dev_warn(&device->cdev->dev,
751 "FORMAT 6 - Overrun on channel B\n");
754 dev_warn(&device->cdev->dev,
755 "FORMAT 6 - Overrun on channel C\n");
758 dev_warn(&device->cdev->dev,
759 "FORMAT 6 - Overrun on channel D\n");
762 dev_warn(&device->cdev->dev,
763 "FORMAT 6 - Overrun on channel E\n");
766 dev_warn(&device->cdev->dev,
767 "FORMAT 6 - Overrun on channel F\n");
770 dev_warn(&device->cdev->dev,
771 "FORMAT 6 - Overrun on channel G\n");
774 dev_warn(&device->cdev->dev,
775 "FORMAT 6 - Overrun on channel H\n");
778 dev_warn(&device->cdev->dev,
779 "FORMAT 6 - Reserved\n");
783 case 0x70: /* Format 7 - Device Connection Control Checks */
786 dev_warn(&device->cdev->dev,
787 "FORMAT 7 - RCC initiated by a connection "
791 dev_warn(&device->cdev->dev,
792 "FORMAT 7 - RCC 1 sequence not "
796 dev_warn(&device->cdev->dev,
797 "FORMAT 7 - RCC 1 and RCC 2 sequences not "
801 dev_warn(&device->cdev->dev,
802 "FORMAT 7 - Invalid tag-in during "
803 "selection sequence\n");
806 dev_warn(&device->cdev->dev,
807 "FORMAT 7 - extra RCC required\n");
810 dev_warn(&device->cdev->dev,
811 "FORMAT 7 - Invalid DCC selection "
812 "response or timeout\n");
815 dev_warn(&device->cdev->dev,
816 "FORMAT 7 - Missing end operation; device "
817 "transfer complete\n");
820 dev_warn(&device->cdev->dev,
821 "FORMAT 7 - Missing end operation; device "
822 "transfer incomplete\n");
825 dev_warn(&device->cdev->dev,
826 "FORMAT 7 - Invalid tag-in for an "
827 "immediate command sequence\n");
830 dev_warn(&device->cdev->dev,
831 "FORMAT 7 - Invalid tag-in for an "
832 "extended command sequence\n");
835 dev_warn(&device->cdev->dev,
836 "FORMAT 7 - 3990 microcode time out when "
837 "stopping selection\n");
840 dev_warn(&device->cdev->dev,
841 "FORMAT 7 - No response to selection "
842 "after a poll interruption\n");
845 dev_warn(&device->cdev->dev,
846 "FORMAT 7 - Permanent path error (DASD "
847 "controller not available)\n");
850 dev_warn(&device->cdev->dev,
851 "FORMAT 7 - DASD controller not available"
852 " on disconnected command chain\n");
855 dev_warn(&device->cdev->dev,
856 "FORMAT 7 - Reserved\n");
860 case 0x80: /* Format 8 - Additional Device Equipment Checks */
862 case 0x00: /* No Message */
864 dev_warn(&device->cdev->dev,
865 "FORMAT 8 - Error correction code "
869 dev_warn(&device->cdev->dev,
870 "FORMAT 8 - Unexpected end operation "
874 dev_warn(&device->cdev->dev,
875 "FORMAT 8 - End operation with transfer "
879 dev_warn(&device->cdev->dev,
880 "FORMAT 8 - End operation with transfer "
884 dev_warn(&device->cdev->dev,
885 "FORMAT 8 - DPS checks after a system "
886 "reset or selective reset\n");
889 dev_warn(&device->cdev->dev,
890 "FORMAT 8 - DPS cannot be filled\n");
893 dev_warn(&device->cdev->dev,
894 "FORMAT 8 - Short busy time-out during "
895 "device selection\n");
898 dev_warn(&device->cdev->dev,
899 "FORMAT 8 - DASD controller failed to "
900 "set or reset the long busy latch\n");
903 dev_warn(&device->cdev->dev,
904 "FORMAT 8 - No interruption from device "
905 "during a command chain\n");
908 dev_warn(&device->cdev->dev,
909 "FORMAT 8 - Reserved\n");
913 case 0x90: /* Format 9 - Device Read, Write, and Seek Checks */
916 break; /* No Message */
918 dev_warn(&device->cdev->dev,
919 "FORMAT 9 - Device check-2 error\n");
922 dev_warn(&device->cdev->dev,
923 "FORMAT 9 - Head address did not "
927 dev_warn(&device->cdev->dev,
928 "FORMAT 9 - Track physical address did "
929 "not compare while oriented\n");
932 dev_warn(&device->cdev->dev,
933 "FORMAT 9 - Cylinder address did not "
937 dev_warn(&device->cdev->dev,
938 "FORMAT 9 - Reserved\n");
942 case 0xF0: /* Format F - Cache Storage Checks */
945 dev_warn(&device->cdev->dev,
946 "FORMAT F - Operation Terminated\n");
949 dev_warn(&device->cdev->dev,
950 "FORMAT F - Subsystem Processing Error\n");
953 dev_warn(&device->cdev->dev,
954 "FORMAT F - Cache or nonvolatile storage "
955 "equipment failure\n");
958 dev_warn(&device->cdev->dev,
959 "FORMAT F - Caching terminated\n");
962 dev_warn(&device->cdev->dev,
963 "FORMAT F - Cache fast write access not "
967 dev_warn(&device->cdev->dev,
968 "FORMAT F - Track format incorrect\n");
971 dev_warn(&device->cdev->dev,
972 "FORMAT F - Caching reinitiated\n");
975 dev_warn(&device->cdev->dev,
976 "FORMAT F - Nonvolatile storage "
980 dev_warn(&device->cdev->dev,
981 "FORMAT F - Volume is suspended duplex\n");
982 /* call extended error reporting (EER) */
983 dasd_eer_write(device, erp->refers,
984 DASD_EER_PPRCSUSPEND);
987 dev_warn(&device->cdev->dev,
988 "FORMAT F - Subsystem status cannot be "
992 dev_warn(&device->cdev->dev,
993 "FORMAT F - Caching status reset to "
997 dev_warn(&device->cdev->dev,
998 "FORMAT F - DASD Fast Write inhibited\n");
1001 dev_warn(&device->cdev->dev,
1002 "FORMAT F - Reserved\n");
1006 default: /* unknown message format - should not happen
1007 internal error 03 - reason is "03 " plus the format byte as two hex digits */
1008 snprintf(errorstring, ERRORLENGTH, "03 %02x", msg_format);
1009 dev_err(&device->cdev->dev,
1010 "An error occurred in the DASD device driver, "
1011 "reason=%s\n", errorstring);
1013 } /* end switch message format */
1015 } /* end dasd_3990_handle_env_data */
1018 * DASD_3990_ERP_COM_REJ
1021 * Handles 24 byte 'Command Reject' error.
1024 * erp current erp_head
1025 * sense current sense data
1028 * erp 'new' erp_head - pointer to new ERP
1030 static struct dasd_ccw_req *
1031 dasd_3990_erp_com_rej(struct dasd_ccw_req * erp, char *sense)
1034 struct dasd_device *device = erp->startdev;
1036 erp->function = dasd_3990_erp_com_rej;
1038 /* env data present (ACTION 10 - retry should work) */
1039 if (sense[2] & SNS2_ENV_DATA_PRESENT) {
1041 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1042 "Command Reject - environmental data present");
1044 dasd_3990_handle_env_data(erp, sense);
1049 /* fatal error - set status to FAILED
1050 internal error 09 - Command Reject */
1051 dev_err(&device->cdev->dev, "An error occurred in the DASD "
1052 "device driver, reason=%s\n", "09");
1054 erp = dasd_3990_erp_cleanup(erp, DASD_CQR_FAILED);
1059 } /* end dasd_3990_erp_com_rej */
1062 * DASD_3990_ERP_BUS_OUT
1065 * Handles 24 byte 'Bus Out Parity Check' error.
1068 * erp current erp_head
1070 * erp new erp_head - pointer to new ERP
1072 static struct dasd_ccw_req *
1073 dasd_3990_erp_bus_out(struct dasd_ccw_req * erp)
1076 struct dasd_device *device = erp->startdev;
1078 /* first time set initial retry counter and erp_function */
1079 /* and retry once without blocking queue */
1080 /* (this enables easier enqueueing of the cqr) */
1081 if (erp->function != dasd_3990_erp_bus_out) {
1083 erp->function = dasd_3990_erp_bus_out;
1087 /* issue a message and wait for 'device ready' interrupt */
1088 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1089 "bus out parity error or BOPC requested by "
1092 dasd_3990_erp_block_queue(erp, 60*HZ);
1098 } /* end dasd_3990_erp_bus_out */
1101 * DASD_3990_ERP_EQUIP_CHECK
1104 * Handles 24 byte 'Equipment Check' error.
1107 * erp current erp_head
1109 * erp new erp_head - pointer to new ERP
1111 static struct dasd_ccw_req *
1112 dasd_3990_erp_equip_check(struct dasd_ccw_req * erp, char *sense)
1115 struct dasd_device *device = erp->startdev;
1117 erp->function = dasd_3990_erp_equip_check;
1119 if (sense[1] & SNS1_WRITE_INHIBITED) {
1120 dev_info(&device->cdev->dev,
1121 "Write inhibited path encountered\n");
1123 /* vary path offline
1124 internal error 04 - Path should be varied off-line.*/
1125 dev_err(&device->cdev->dev, "An error occurred in the DASD "
1126 "device driver, reason=%s\n", "04");
1128 erp = dasd_3990_erp_action_1(erp);
1130 } else if (sense[2] & SNS2_ENV_DATA_PRESENT) {
1132 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1133 "Equipment Check - " "environmental data present");
1135 dasd_3990_handle_env_data(erp, sense);
1137 erp = dasd_3990_erp_action_4(erp, sense);
1139 } else if (sense[1] & SNS1_PERM_ERR) {
1141 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1142 "Equipment Check - retry exhausted or "
1145 erp = dasd_3990_erp_action_1(erp);
1148 /* all other equipment checks - Action 5 */
1149 /* rest is done when retries == 0 */
1150 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1151 "Equipment check or processing error");
1153 erp = dasd_3990_erp_action_5(erp);
1157 } /* end dasd_3990_erp_equip_check */
1160 * DASD_3990_ERP_DATA_CHECK
1163 * Handles 24 byte 'Data Check' error.
1166 * erp current erp_head
1168 * erp new erp_head - pointer to new ERP
1170 static struct dasd_ccw_req *
1171 dasd_3990_erp_data_check(struct dasd_ccw_req * erp, char *sense)
1174 struct dasd_device *device = erp->startdev;
1176 erp->function = dasd_3990_erp_data_check;
1178 if (sense[2] & SNS2_CORRECTABLE) { /* correctable data check */
1180 /* issue message that the data has been corrected */
1181 dev_emerg(&device->cdev->dev,
1182 "Data recovered during retry with PCI "
1183 "fetch mode active\n");
1185 /* not possible to handle this situation in Linux */
1186 panic("No way to inform application about the possibly "
1189 } else if (sense[2] & SNS2_ENV_DATA_PRESENT) {
1191 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1192 "Uncorrectable data check recovered secondary "
1193 "addr of duplex pair");
1195 erp = dasd_3990_erp_action_4(erp, sense);
1197 } else if (sense[1] & SNS1_PERM_ERR) {
1199 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1200 "Uncorrectable data check with internal "
1203 erp = dasd_3990_erp_action_1(erp);
1206 /* all other data checks */
1207 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1208 "Uncorrectable data check with retry count "
1211 erp = dasd_3990_erp_action_5(erp);
1216 } /* end dasd_3990_erp_data_check */
1219 * DASD_3990_ERP_OVERRUN
1222 * Handles 24 byte 'Overrun' error.
1225 * erp current erp_head
1227 * erp new erp_head - pointer to new ERP
1229 static struct dasd_ccw_req *
1230 dasd_3990_erp_overrun(struct dasd_ccw_req * erp, char *sense)
1233 struct dasd_device *device = erp->startdev;
1235 erp->function = dasd_3990_erp_overrun;
1237 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1238 "Overrun - service overrun or overrun"
1239 " error requested by channel");
1241 erp = dasd_3990_erp_action_5(erp);
1245 } /* end dasd_3990_erp_overrun */
1248 * DASD_3990_ERP_INV_FORMAT
1251 * Handles 24 byte 'Invalid Track Format' error.
1254 * erp current erp_head
1256 * erp new erp_head - pointer to new ERP
1258 static struct dasd_ccw_req *
1259 dasd_3990_erp_inv_format(struct dasd_ccw_req * erp, char *sense)
1262 struct dasd_device *device = erp->startdev;
1264 erp->function = dasd_3990_erp_inv_format;
1266 if (sense[2] & SNS2_ENV_DATA_PRESENT) {
1268 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1269 "Track format error when destaging or "
1272 dasd_3990_handle_env_data(erp, sense);
1274 erp = dasd_3990_erp_action_4(erp, sense);
1277 /* internal error 06 - The track format is not valid*/
1278 dev_err(&device->cdev->dev,
1279 "An error occurred in the DASD device driver, "
1280 "reason=%s\n", "06");
1282 erp = dasd_3990_erp_cleanup(erp, DASD_CQR_FAILED);
1287 } /* end dasd_3990_erp_inv_format */
1293 * Handles 24 byte 'End-of-Cylinder' error.
1296 * erp already added default erp
1298 * erp pointer to original (failed) cqr.
1300 static struct dasd_ccw_req *
1301 dasd_3990_erp_EOC(struct dasd_ccw_req * default_erp, char *sense)
1304 struct dasd_device *device = default_erp->startdev;
1306 dev_err(&device->cdev->dev,
1307 "The cylinder data for accessing the DASD is inconsistent\n");
1309 /* implement action 7 - BUG */
1310 return dasd_3990_erp_cleanup(default_erp, DASD_CQR_FAILED);
1312 } /* end dasd_3990_erp_EOC */
1315 * DASD_3990_ERP_ENV_DATA
1318 * Handles 24 byte 'Environmental-Data Present' error.
1321 * erp current erp_head
1323 * erp new erp_head - pointer to new ERP
1325 static struct dasd_ccw_req *
1326 dasd_3990_erp_env_data(struct dasd_ccw_req * erp, char *sense)
1329 struct dasd_device *device = erp->startdev;
1331 erp->function = dasd_3990_erp_env_data;
1333 DBF_DEV_EVENT(DBF_WARNING, device, "%s", "Environmental data present");
1335 dasd_3990_handle_env_data(erp, sense);
1337 /* don't retry on disabled interface */
1338 if (sense[7] != 0x0F) {
1339 erp = dasd_3990_erp_action_4(erp, sense);
1341 erp->status = DASD_CQR_FILLED;
1346 } /* end dasd_3990_erp_env_data */
1349 * DASD_3990_ERP_NO_REC
1352 * Handles 24 byte 'No Record Found' error.
1355 * erp already added default ERP
1358 * erp new erp_head - pointer to new ERP
1360 static struct dasd_ccw_req *
1361 dasd_3990_erp_no_rec(struct dasd_ccw_req * default_erp, char *sense)
1364 struct dasd_device *device = default_erp->startdev;
1366 dev_err(&device->cdev->dev,
1367 "The specified record was not found\n");
1369 return dasd_3990_erp_cleanup(default_erp, DASD_CQR_FAILED);
1371 } /* end dasd_3990_erp_no_rec */
1374 * DASD_3990_ERP_FILE_PROT
1377 * Handles 24 byte 'File Protected' error.
1378 * Note: Seek related recovery is not implemented because
1379 * we don't use the seek command yet.
1382 * erp current erp_head
1384 * erp new erp_head - pointer to new ERP
1386 static struct dasd_ccw_req *
1387 dasd_3990_erp_file_prot(struct dasd_ccw_req * erp)
1390 struct dasd_device *device = erp->startdev;
1392 dev_err(&device->cdev->dev, "Accessing the DASD failed because of "
1393 "a hardware error\n");
1395 return dasd_3990_erp_cleanup(erp, DASD_CQR_FAILED);
1397 } /* end dasd_3990_erp_file_prot */
1400 * DASD_3990_ERP_INSPECT_ALIAS
1403 * Checks if the original request was started on an alias device.
1404 * If yes, it modifies the original and the erp request so that
1405 * the erp request can be started on a base device.
1408 * erp pointer to the currently created default ERP
1411 * erp pointer to the modified ERP, or NULL
1414 static struct dasd_ccw_req *dasd_3990_erp_inspect_alias(
1415 struct dasd_ccw_req *erp)
1417 struct dasd_ccw_req *cqr = erp->refers;
1420 (cqr->block->base != cqr->startdev)) {
1421 if (cqr->startdev->features & DASD_FEATURE_ERPLOG) {
1422 DBF_DEV_EVENT(DBF_ERR, cqr->startdev,
1423 "ERP on alias device for request %p,"
1424 " recover on base device %s", cqr,
1425 dev_name(&cqr->block->base->cdev->dev));
1427 dasd_eckd_reset_ccw_to_base_io(cqr);
1428 erp->startdev = cqr->block->base;
1429 erp->function = dasd_3990_erp_inspect_alias;
1437 * DASD_3990_ERP_INSPECT_24
1440 * Does a detailed inspection of the 24 byte sense data
1441 * and sets up a related error recovery action.
1444 * sense sense data of the actual error
1445 * erp pointer to the currently created default ERP
1448 * erp pointer to the (additional) ERP
1450 static struct dasd_ccw_req *
1451 dasd_3990_erp_inspect_24(struct dasd_ccw_req * erp, char *sense)
1454 struct dasd_ccw_req *erp_filled = NULL;
1456 /* Check sense for .... */
1457 /* 'Command Reject' */
1458 if ((erp_filled == NULL) && (sense[0] & SNS0_CMD_REJECT)) {
1459 erp_filled = dasd_3990_erp_com_rej(erp, sense);
1461 /* 'Intervention Required' */
1462 if ((erp_filled == NULL) && (sense[0] & SNS0_INTERVENTION_REQ)) {
1463 erp_filled = dasd_3990_erp_int_req(erp);
1465 /* 'Bus Out Parity Check' */
1466 if ((erp_filled == NULL) && (sense[0] & SNS0_BUS_OUT_CHECK)) {
1467 erp_filled = dasd_3990_erp_bus_out(erp);
1469 /* 'Equipment Check' */
1470 if ((erp_filled == NULL) && (sense[0] & SNS0_EQUIPMENT_CHECK)) {
1471 erp_filled = dasd_3990_erp_equip_check(erp, sense);
1474 if ((erp_filled == NULL) && (sense[0] & SNS0_DATA_CHECK)) {
1475 erp_filled = dasd_3990_erp_data_check(erp, sense);
1478 if ((erp_filled == NULL) && (sense[0] & SNS0_OVERRUN)) {
1479 erp_filled = dasd_3990_erp_overrun(erp, sense);
1481 /* 'Invalid Track Format' */
1482 if ((erp_filled == NULL) && (sense[1] & SNS1_INV_TRACK_FORMAT)) {
1483 erp_filled = dasd_3990_erp_inv_format(erp, sense);
1485 /* 'End-of-Cylinder' */
1486 if ((erp_filled == NULL) && (sense[1] & SNS1_EOC)) {
1487 erp_filled = dasd_3990_erp_EOC(erp, sense);
1489 /* 'Environmental Data' */
1490 if ((erp_filled == NULL) && (sense[2] & SNS2_ENV_DATA_PRESENT)) {
1491 erp_filled = dasd_3990_erp_env_data(erp, sense);
1493 /* 'No Record Found' */
1494 if ((erp_filled == NULL) && (sense[1] & SNS1_NO_REC_FOUND)) {
1495 erp_filled = dasd_3990_erp_no_rec(erp, sense);
1497 /* 'File Protected' */
1498 if ((erp_filled == NULL) && (sense[1] & SNS1_FILE_PROTECTED)) {
1499 erp_filled = dasd_3990_erp_file_prot(erp);
1501 /* other (unknown) error - do default ERP */
1502 if (erp_filled == NULL) {
1509 } /* END dasd_3990_erp_inspect_24 */
1512 *****************************************************************************
1513 * 32 byte sense ERP functions (only)
1514 *****************************************************************************
1518 * DASD_3990_ERP_ACTION_10_32
1521 * Handles 32 byte 'Action 10' of Single Program Action Codes.
1522 * Just retry and if retry doesn't work, return with error.
1525 * erp current erp_head
1526 * sense current sense data
1528 * erp modified erp_head
/*
 * Records this routine as the handler of erp (erp->function) and writes
 * "Perform logging requested" to the device debug log.
 * NOTE(review): the embedded line numbers jump (1531 -> 1534 -> 1537 ->
 * 1539 -> 1543), so short lines such as braces and the return statement
 * are absent from this listing - check the complete file before editing.
 */
1530 static struct dasd_ccw_req *
1531 dasd_3990_erp_action_10_32(struct dasd_ccw_req * erp, char *sense)
1534 struct dasd_device *device = erp->startdev;
1537 erp->function = dasd_3990_erp_action_10_32;
1539 DBF_DEV_EVENT(DBF_WARNING, device, "%s", "Perform logging requested");
1543 } /* end dasd_3990_erp_action_10_32 */
1546 * DASD_3990_ERP_ACTION_1B_32
1549 * Handles 32 byte 'Action 1B' of Single Program Action Codes.
1550 * A write operation could not be finished because of an unexpected
1552 * The already created 'default erp' is used to get the link to
1553 * the erp chain, but it can not be used for this recovery
1554 * action because it contains no DE/LO data space.
1557 * default_erp already added default erp.
1558 * sense current sense data
1562 * default_erp in case of imprecise ending or error
/*
 * Builds a dedicated ERP request for sense action 1B: a Define Extent CCW,
 * a Locate Record CCW and a TIC CCW (see the "2 + 1" CCW count passed to
 * dasd_alloc_erp_request()). The Define Extent data is copied from the
 * original request, the Locate Record data is filled from the sense bytes,
 * and default_erp is freed once the new request has been set up.
 * Several paths instead finish via
 * dasd_3990_erp_cleanup(default_erp, DASD_CQR_FAILED).
 * NOTE(review): the embedded line numbers show gaps, i.e. short lines
 * (braces, returns, short assignments) are absent from this listing -
 * check the complete file before editing.
 */
1564 static struct dasd_ccw_req *
1565 dasd_3990_erp_action_1B_32(struct dasd_ccw_req * default_erp, char *sense)
1568 struct dasd_device *device = default_erp->startdev;
1570 struct dasd_ccw_req *cqr;
1571 struct dasd_ccw_req *erp;
1572 struct DE_eckd_data *DE_data;
1573 struct PFX_eckd_data *PFX_data;
1574 char *LO_data; /* LO_eckd_data_t */
1575 struct ccw1 *ccw, *oldccw;
1577 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1578 "Write not finished because of unexpected condition");
1580 default_erp->function = dasd_3990_erp_action_1B_32;
1582 /* determine the original cqr */
1585 while (cqr->refers != NULL) {
1589 if (scsw_is_tm(&cqr->irb.scsw)) {
1590 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1591 "32 bit sense, action 1B is not defined"
1592 " in transport mode - just retry");
1596 /* for imprecise ending just do default erp */
1597 if (sense[1] & 0x01) {
1598 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1599 "Imprecise ending is set - just retry");
1604 /* determine the address of the CCW to be restarted */
1605 /* Imprecise ending is not set -> addr from IRB-SCSW */
1606 cpa = default_erp->refers->irb.scsw.cmd.cpa;
1609 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1610 "Unable to determine address of the CCW "
1613 return dasd_3990_erp_cleanup(default_erp, DASD_CQR_FAILED);
1616 /* Build new ERP request including DE/LO */
1617 erp = dasd_alloc_erp_request((char *) &cqr->magic,
1618 2 + 1,/* DE/LO + TIC */
1619 sizeof(struct DE_eckd_data) +
1620 sizeof(struct LO_eckd_data), device);
1623 /* internal error 01 - Unable to allocate ERP */
1624 dev_err(&device->cdev->dev, "An error occurred in the DASD "
1625 "device driver, reason=%s\n", "01");
1626 return dasd_3990_erp_cleanup(default_erp, DASD_CQR_FAILED);
1629 /* use original DE */
1630 DE_data = erp->data;
1631 oldccw = cqr->cpaddr;
/* a channel program starting with PFX carries its define extent inside the
 * prefix data; otherwise the define extent is the start of cqr->data */
1632 if (oldccw->cmd_code == DASD_ECKD_CCW_PFX) {
1633 PFX_data = cqr->data;
1634 memcpy(DE_data, &PFX_data->define_extent,
1635 sizeof(struct DE_eckd_data));
1637 memcpy(DE_data, cqr->data, sizeof(struct DE_eckd_data));
/* the Locate Record data lives directly behind the Define Extent data */
1640 LO_data = erp->data + sizeof(struct DE_eckd_data);
/* NOTE(review): no dasd_free_erp_request(erp, ...) is visible before the
 * return below and only one inner line (1643) is missing here, so the
 * request allocated above may be leaked on this path - confirm.
 * LO_data[1] is also read before the visible assignment at inner line
 * 1659 - confirm what erp->data holds at this point. */
1642 if ((sense[3] == 0x01) && (LO_data[1] & 0x01)) {
1644 return dasd_3990_erp_cleanup(default_erp, DASD_CQR_FAILED);
1647 if ((sense[7] & 0x3F) == 0x01) {
1648 /* operation code is WRITE DATA -> data area orientation */
1651 } else if ((sense[7] & 0x3F) == 0x03) {
1652 /* operation code is FORMAT WRITE -> index orientation */
1656 LO_data[0] = sense[7]; /* operation */
1659 LO_data[1] = sense[8]; /* auxiliary */
1660 LO_data[2] = sense[9];
1661 LO_data[3] = sense[3]; /* count */
1662 LO_data[4] = sense[29]; /* seek_addr.cyl */
1663 LO_data[5] = sense[30]; /* seek_addr.cyl 2nd byte */
1664 LO_data[7] = sense[31]; /* seek_addr.head 2nd byte */
1666 memcpy(&(LO_data[8]), &(sense[11]), 8);
1670 memset(ccw, 0, sizeof(struct ccw1));
1671 ccw->cmd_code = DASD_ECKD_CCW_DEFINE_EXTENT;
1672 ccw->flags = CCW_FLAG_CC;
1674 ccw->cda = (__u32)(addr_t) DE_data;
1678 memset(ccw, 0, sizeof(struct ccw1));
1679 ccw->cmd_code = DASD_ECKD_CCW_LOCATE_RECORD;
1680 ccw->flags = CCW_FLAG_CC;
1682 ccw->cda = (__u32)(addr_t) LO_data;
1684 /* TIC to the failed ccw */
1686 ccw->cmd_code = CCW_CMD_TIC;
1689 /* fill erp related fields */
1690 erp->function = dasd_3990_erp_action_1B_32;
1691 erp->refers = default_erp->refers;
1692 erp->startdev = device;
1693 erp->memdev = device;
1694 erp->magic = default_erp->magic;
1697 erp->buildclk = get_clock();
1698 erp->status = DASD_CQR_FILLED;
1700 /* remove the default erp */
1701 dasd_free_erp_request(default_erp, device);
1705 } /* end dasd_3990_erp_action_1B_32 */
1708 * DASD_3990_UPDATE_1B
1711 * Handles the update to the 32 byte 'Action 1B' of Single Program
1712 * Action Codes in case the first action was not successful.
1713 * The already created 'previous_erp' is the currently not successful
1717 * previous_erp already created previous erp.
1718 * sense current sense data
/*
 * Refreshes an existing action-1B ERP after it failed again: the Locate
 * Record data behind the Define Extent data is rewritten from the new
 * sense bytes and the request is set back to DASD_CQR_FILLED.
 * Visible early exits all return previous_erp: unchanged in transport
 * mode, with status DASD_CQR_FILLED for imprecise ending, and with status
 * DASD_CQR_FAILED on the two error paths.
 * NOTE(review): the embedded line numbers show gaps, i.e. short lines
 * (braces, short assignments, some conditions) are absent from this
 * listing - check the complete file before editing.
 */
1722 static struct dasd_ccw_req *
1723 dasd_3990_update_1B(struct dasd_ccw_req * previous_erp, char *sense)
1726 struct dasd_device *device = previous_erp->startdev;
1728 struct dasd_ccw_req *cqr;
1729 struct dasd_ccw_req *erp;
1730 char *LO_data; /* struct LO_eckd_data */
1733 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1734 "Write not finished because of unexpected condition"
1737 /* determine the original cqr */
1740 while (cqr->refers != NULL) {
1744 if (scsw_is_tm(&cqr->irb.scsw)) {
1745 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1746 "32 bit sense, action 1B, update,"
1747 " in transport mode - just retry");
1748 return previous_erp;
1751 /* for imprecise ending just do default erp */
1752 if (sense[1] & 0x01) {
1753 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
1754 "Imprecise ending is set - just retry");
1756 previous_erp->status = DASD_CQR_FILLED;
1758 return previous_erp;
1761 /* determine the address of the CCW to be restarted */
1762 /* Imprecise ending is not set -> addr from IRB-SCSW */
1763 cpa = previous_erp->irb.scsw.cmd.cpa;
1766 /* internal error 02 -
1767 Unable to determine address of the CCW to be restarted */
1768 dev_err(&device->cdev->dev, "An error occurred in the DASD "
1769 "device driver, reason=%s\n", "02");
1771 previous_erp->status = DASD_CQR_FAILED;
1773 return previous_erp;
/* NOTE(review): erp is dereferenced below, but its assignment is not
 * visible in this listing (inner lines 1774-1777 are absent) - confirm
 * where it is set. */
1778 /* update the LO with the new returned sense data */
1779 LO_data = erp->data + sizeof(struct DE_eckd_data);
1781 if ((sense[3] == 0x01) && (LO_data[1] & 0x01)) {
1782 /* should not happen */
1783 previous_erp->status = DASD_CQR_FAILED;
1785 return previous_erp;
1788 if ((sense[7] & 0x3F) == 0x01) {
1789 /* operation code is WRITE DATA -> data area orientation */
1792 } else if ((sense[7] & 0x3F) == 0x03) {
1793 /* operation code is FORMAT WRITE -> index orientation */
1797 LO_data[0] = sense[7]; /* operation */
1800 LO_data[1] = sense[8]; /* auxiliary */
1801 LO_data[2] = sense[9];
1802 LO_data[3] = sense[3]; /* count */
1803 LO_data[4] = sense[29]; /* seek_addr.cyl */
1804 LO_data[5] = sense[30]; /* seek_addr.cyl 2nd byte */
1805 LO_data[7] = sense[31]; /* seek_addr.head 2nd byte */
1807 memcpy(&(LO_data[8]), &(sense[11]), 8);
1809 /* TIC to the failed ccw */
1810 ccw = erp->cpaddr; /* addr of DE ccw */
1811 ccw++; /* addr of LE ccw */
1812 ccw++; /* addr of TIC ccw */
1815 erp->status = DASD_CQR_FILLED;
1819 } /* end dasd_3990_update_1B */
1822 * DASD_3990_ERP_COMPOUND_RETRY
1825 * Handles the compound ERP action retry code.
1826 * NOTE: At least one retry is done even if zero is specified
1827 * by the sense data. This makes enqueueing of the request
1831 * sense sense data of the actual error
1832 * erp pointer to the currently created ERP
1835 * erp modified ERP pointer
/*
 * Selects a retry class from the two low-order bits of sense byte 25 and
 * records this routine as the handler of erp (erp->function).
 * NOTE(review): the statements inside the case branches (inner lines
 * 1844-1846, 1848-1850, ...) and the return type line are absent from this
 * listing; the retry counts are only known from the case comments - check
 * the complete file before editing.
 */
1839 dasd_3990_erp_compound_retry(struct dasd_ccw_req * erp, char *sense)
1842 switch (sense[25] & 0x03) {
1843 case 0x00: /* do not retry */
1847 case 0x01: /* retry 2 times */
1851 case 0x02: /* retry 10 times */
1855 case 0x03: /* retry 256 times */
1863 erp->function = dasd_3990_erp_compound_retry;
1865 } /* end dasd_3990_erp_compound_retry */
1868 * DASD_3990_ERP_COMPOUND_PATH
1871 * Handles the compound ERP action for retry on alternate
1875 * sense sense data of the actual error
1876 * erp pointer to the currently created ERP
1879 * erp modified ERP pointer
/*
 * When DASD_SENSE_BIT_3 is set in sense byte 25, tries an alternate path
 * via dasd_3990_erp_alternate_path(). If that leaves erp in status
 * DASD_CQR_FAILED, the status is put back to DASD_CQR_NEED_ERP so that
 * further compound actions can still be tried. Finally records this
 * routine as the handler of erp (erp->function).
 * NOTE(review): inner lines 1892-1893 (the lpm reset mentioned in the
 * comment below) and the braces are absent from this listing.
 */
1883 dasd_3990_erp_compound_path(struct dasd_ccw_req * erp, char *sense)
1886 if (sense[25] & DASD_SENSE_BIT_3) {
1887 dasd_3990_erp_alternate_path(erp);
1889 if (erp->status == DASD_CQR_FAILED) {
1890 /* reset the lpm and the status to be able to
1891 * try further actions. */
1894 erp->status = DASD_CQR_NEED_ERP;
1898 erp->function = dasd_3990_erp_compound_path;
1900 } /* end dasd_3990_erp_compound_path */
1903 * DASD_3990_ERP_COMPOUND_CODE
1906 * Handles the compound ERP action for retry code.
1909 * sense sense data of the actual error
1910 * erp pointer to the currently created ERP
1913 * erp NEW ERP pointer
/*
 * When DASD_SENSE_BIT_2 is set in sense byte 25, dispatches on sense byte
 * 28: one branch issues a Diagnostic Control command through
 * dasd_3990_erp_DCTL(erp, 0x20), another blocks the request queue for
 * 5*HZ before the retry. Finally records this routine as the handler of
 * erp (erp->function).
 * NOTE(review): the case labels of the switch are absent from this
 * listing (inner lines 1923, 1929, 1936 are missing), so the sense[28]
 * values that select each branch cannot be read from here.
 */
1916 static struct dasd_ccw_req *
1917 dasd_3990_erp_compound_code(struct dasd_ccw_req * erp, char *sense)
1920 if (sense[25] & DASD_SENSE_BIT_2) {
1922 switch (sense[28]) {
1924 /* issue a Diagnostic Control command with an
1925 * Inhibit Write subcommand and controller modifier */
1926 erp = dasd_3990_erp_DCTL(erp, 0x20);
1930 /* wait for 5 seconds and retry again */
1933 dasd_3990_erp_block_queue (erp, 5*HZ);
1937 /* should not happen - continue */
1942 erp->function = dasd_3990_erp_compound_code;
1946 } /* end dasd_3990_erp_compound_code */
1949 * DASD_3990_ERP_COMPOUND_CONFIG
1952 * Handles the compound ERP action for configuration
1954 * Note: duplex handling is not implemented (yet).
1957 * sense sense data of the actual error
1958 * erp pointer to the currently created ERP
1961 * erp modified ERP pointer
/*
 * When sense byte 25 has DASD_SENSE_BIT_1 and sense byte 26 has
 * DASD_SENSE_BIT_2 set, reports internal error "05" with dev_err(); no
 * recovery action is visible in that branch. Finally records this routine
 * as the handler of erp (erp->function).
 * NOTE(review): the closing line of the comment that starts at inner line
 * 1970 is absent from this listing (inner line 1972 is missing), as are
 * the braces - check the complete file before editing.
 */
1965 dasd_3990_erp_compound_config(struct dasd_ccw_req * erp, char *sense)
1968 if ((sense[25] & DASD_SENSE_BIT_1) && (sense[26] & DASD_SENSE_BIT_2)) {
1970 /* set to suspended duplex state then restart
1971 internal error 05 - Set device to suspended duplex state
1973 struct dasd_device *device = erp->startdev;
1974 dev_err(&device->cdev->dev,
1975 "An error occurred in the DASD device driver, "
1976 "reason=%s\n", "05");
1980 erp->function = dasd_3990_erp_compound_config;
1982 } /* end dasd_3990_erp_compound_config */
1985 * DASD_3990_ERP_COMPOUND
1988 * Does the further compound program action if
1989 * compound retry was not successful.
1992 * sense sense data of the actual error
1993 * erp pointer to the current (failed) ERP
1996 * erp (additional) ERP pointer
/*
 * Steps through the compound actions in a fixed order: path, code, config.
 * Each step runs only when the previous step is the recorded handler
 * (erp->function) and erp is still in status DASD_CQR_NEED_ERP. If the
 * status is still DASD_CQR_NEED_ERP after all steps, the request is set
 * to DASD_CQR_FAILED.
 * NOTE(review): braces and the return statement are absent from this
 * listing (gaps in the embedded line numbers).
 */
1999 static struct dasd_ccw_req *
2000 dasd_3990_erp_compound(struct dasd_ccw_req * erp, char *sense)
2003 if ((erp->function == dasd_3990_erp_compound_retry) &&
2004 (erp->status == DASD_CQR_NEED_ERP)) {
2006 dasd_3990_erp_compound_path(erp, sense);
2009 if ((erp->function == dasd_3990_erp_compound_path) &&
2010 (erp->status == DASD_CQR_NEED_ERP)) {
/* only this step may replace erp with a different request */
2012 erp = dasd_3990_erp_compound_code(erp, sense);
2015 if ((erp->function == dasd_3990_erp_compound_code) &&
2016 (erp->status == DASD_CQR_NEED_ERP)) {
2018 dasd_3990_erp_compound_config(erp, sense);
2021 /* if no compound action ERP specified, the request failed */
2022 if (erp->status == DASD_CQR_NEED_ERP)
2023 erp->status = DASD_CQR_FAILED;
2027 } /* end dasd_3990_erp_compound */
2030 * DASD_3990_ERP_HANDLE_SIM
2033 * inspects the SIM SENSE data and starts an appropriate action
2036 * sense sense data of the actual error
/*
 * Prints the SIM reference code, built from sense bytes 22, 23, 11 and 12.
 * It is printed with dev_err() when sense byte 24 has DASD_SIM_MSG_TO_OP
 * set or sense byte 1 has bit 0x10 set; otherwise with dev_warn() when
 * sense byte 24 has DASD_SIM_LOG set. Nothing is printed in other cases.
 * NOTE(review): the return type line and the braces are absent from this
 * listing (gaps in the embedded line numbers).
 */
2042 dasd_3990_erp_handle_sim(struct dasd_device *device, char *sense)
2044 /* print message according to log or message to operator mode */
2045 if ((sense[24] & DASD_SIM_MSG_TO_OP) || (sense[1] & 0x10)) {
2046 /* print SIM SRC from RefCode */
2047 dev_err(&device->cdev->dev, "SIM - SRC: "
2048 "%02x%02x%02x%02x\n", sense[22],
2049 sense[23], sense[11], sense[12]);
2050 } else if (sense[24] & DASD_SIM_LOG) {
2051 /* print SIM SRC Refcode */
2052 dev_warn(&device->cdev->dev, "log SIM - SRC: "
2053 "%02x%02x%02x%02x\n", sense[22],
2054 sense[23], sense[11], sense[12]);
2059 * DASD_3990_ERP_INSPECT_32
2062 * Does a detailed inspection of the 32 byte sense data
2063 * and sets up a related error recovery action.
2066 * sense sense data of the actual error
2067 * erp pointer to the currently created default ERP
2070 * erp_filled pointer to the ERP
/*
 * Inspects 32 byte sense data. SIM sense (sense byte 6) is reported first
 * through dasd_3990_erp_handle_sim(). If DASD_SENSE_BIT_0 is set in sense
 * byte 25 the compound retry handler is used; otherwise sense byte 25 is
 * treated as a single program action code and dispatched by the switch
 * below.
 * NOTE(review): break statements, braces, the call that precedes the
 * string at inner line 2147, the body of the default case and the return
 * statement are absent from this listing (gaps in the embedded line
 * numbers) - check the complete file before editing.
 */
2073 static struct dasd_ccw_req *
2074 dasd_3990_erp_inspect_32(struct dasd_ccw_req * erp, char *sense)
2077 struct dasd_device *device = erp->startdev;
2079 erp->function = dasd_3990_erp_inspect_32;
2081 /* check for SIM sense data */
2082 if ((sense[6] & DASD_SIM_SENSE) == DASD_SIM_SENSE)
2083 dasd_3990_erp_handle_sim(device, sense);
2085 if (sense[25] & DASD_SENSE_BIT_0) {
2087 /* compound program action codes (byte25 bit 0 == '1') */
2088 dasd_3990_erp_compound_retry(erp, sense);
2092 /* single program action codes (byte25 bit 0 == '0') */
2093 switch (sense[25]) {
2095 case 0x00: /* success - use default ERP for retries */
2096 DBF_DEV_EVENT(DBF_DEBUG, device, "%s",
2097 "ERP called for successful request"
2101 case 0x01: /* fatal error */
2102 dev_err(&device->cdev->dev,
2103 "ERP failed for the DASD\n");
2105 erp = dasd_3990_erp_cleanup(erp, DASD_CQR_FAILED);
2108 case 0x02: /* intervention required */
2109 case 0x03: /* intervention required during dual copy */
2110 erp = dasd_3990_erp_int_req(erp);
2113 case 0x0F: /* length mismatch during update write command
2114 internal error 08 - update write command error*/
2115 dev_err(&device->cdev->dev, "An error occurred in the "
2116 "DASD device driver, reason=%s\n", "08");
2118 erp = dasd_3990_erp_cleanup(erp, DASD_CQR_FAILED);
2121 case 0x10: /* logging required for other channel program */
2122 erp = dasd_3990_erp_action_10_32(erp, sense);
2125 case 0x15: /* next track outside defined extent
2126 internal error 07 - The next track is not
2127 within the defined storage extent */
2128 dev_err(&device->cdev->dev,
2129 "An error occurred in the DASD device driver, "
2130 "reason=%s\n", "07");
2132 erp = dasd_3990_erp_cleanup(erp, DASD_CQR_FAILED);
2135 case 0x1B: /* unexpected condition during write */
2137 erp = dasd_3990_erp_action_1B_32(erp, sense);
2140 case 0x1C: /* invalid data */
2141 dev_emerg(&device->cdev->dev,
2142 "Data recovered during retry with PCI "
2143 "fetch mode active\n");
2145 /* not possible to handle this situation in Linux */
2147 ("Invalid data - No way to inform application "
2148 "about the possibly incorrect data");
2151 case 0x1D: /* state-change pending */
2152 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
2153 "A State change pending condition exists "
2154 "for the subsystem or device");
2156 erp = dasd_3990_erp_action_4(erp, sense);
2159 case 0x1E: /* busy */
2160 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
2161 "Busy condition exists "
2162 "for the subsystem or device");
2163 erp = dasd_3990_erp_action_4(erp, sense);
2166 default: /* all other errors - default erp */
2173 } /* end dasd_3990_erp_inspect_32 */
2176 *****************************************************************************
2177 * main ERP control functions (24 and 32 byte sense)
2178 *****************************************************************************
2182 * DASD_3990_ERP_CONTROL_CHECK
2185 * Does a generic inspection if a control check occurred and sets up
2186 * the related error recovery procedure
2189 * erp pointer to the currently created default ERP
2192 * erp_filled pointer to the erp
/*
 * If the subchannel status of the request erp refers to shows an
 * interface control check or a channel control check, logs that to the
 * device debug log and hands erp to dasd_3990_erp_action_4() without
 * sense data (NULL).
 * NOTE(review): braces and the return statement are absent from this
 * listing (gaps in the embedded line numbers).
 */
2195 static struct dasd_ccw_req *
2196 dasd_3990_erp_control_check(struct dasd_ccw_req *erp)
2198 struct dasd_device *device = erp->startdev;
2200 if (scsw_cstat(&erp->refers->irb.scsw) & (SCHN_STAT_INTF_CTRL_CHK
2201 | SCHN_STAT_CHN_CTRL_CHK)) {
2202 DBF_DEV_EVENT(DBF_WARNING, device, "%s",
2203 "channel or interface control check");
2204 erp = dasd_3990_erp_action_4(erp, NULL);
2210 * DASD_3990_ERP_INSPECT
2213 * Does a detailed inspection for sense data by calling either
2214 * the 24-byte or the 32-byte inspection routine.
2217 * erp pointer to the currently created default ERP
2219 * erp_new contents were possibly modified
/*
 * Chooses the inspection routine for erp. dasd_3990_erp_inspect_alias()
 * is consulted first; the sense data is then taken from the irb of the
 * request erp refers to, and the control check routine, the 24 byte
 * routine (when sense byte 27 has DASD_SENSE_BIT_0 set) or the 32 byte
 * routine is called.
 * NOTE(review): the conditions guarding the alias result and the
 * control-check call, the declaration of sense, the closing line of the
 * comment starting at inner line 2233 and the return statement are absent
 * from this listing - check the complete file before editing.
 */
2221 static struct dasd_ccw_req *
2222 dasd_3990_erp_inspect(struct dasd_ccw_req *erp)
2225 struct dasd_ccw_req *erp_new = NULL;
2228 /* if this problem occurred on an alias retry on base */
2229 erp_new = dasd_3990_erp_inspect_alias(erp);
2233 /* sense data are located in the refers record of the
2234 * already set up new ERP !
2235 * check if concurrent sense is available
2237 sense = dasd_get_sense(&erp->refers->irb);
2239 erp_new = dasd_3990_erp_control_check(erp);
2240 /* distinguish between 24 and 32 byte sense data */
2241 else if (sense[27] & DASD_SENSE_BIT_0) {
2243 /* inspect the 24 byte sense data */
2244 erp_new = dasd_3990_erp_inspect_24(erp, sense);
2248 /* inspect the 32 byte sense data */
2249 erp_new = dasd_3990_erp_inspect_32(erp, sense);
2251 } /* end distinguish between 24 and 32 byte sense data */
2257 * DASD_3990_ERP_ADD_ERP
2260 * This function adds an additional request block (ERP) to the head of
2261 * the given cqr (or erp).
2262 * For a command mode cqr the erp is initialized as a default erp
2264 * For transport mode we make a copy of the original TCW (points to
2265 * the original TCCB, TIDALs, etc.) but give it a fresh
2266 * TSB so the original sense data will not be changed.
2269 * cqr head of the current ERP-chain (or single cqr if
2272 * erp pointer to new ERP-chain head
/*
 * Allocates a new ERP request for cqr with dasd_alloc_erp_request() and
 * initializes it in one of three ways:
 *  - cqr->cpmode == 1: the original TCW is copied into erp->data and
 *    pointed at a new TSB located directly behind the TCW copy;
 *  - first CCW is DASD_ECKD_CCW_PSF: the original channel program is
 *    reused (erp->cpaddr = cqr->cpaddr);
 *  - otherwise: a NOOP CCW chained to a TIC CCW that points to
 *    cqr->cpaddr.
 * In the visible failure path cqr is set to DASD_CQR_FAILED when
 * cqr->retries <= 0, and the block timer is set to HZ << 3.
 * NOTE(review): several short lines (declarations of ccw/tcw/tsb, the
 * cplength assignments, the allocation check, braces and returns) are
 * absent from this listing - check the complete file before editing.
 */
2274 static struct dasd_ccw_req *dasd_3990_erp_add_erp(struct dasd_ccw_req *cqr)
2277 struct dasd_device *device = cqr->startdev;
2279 struct dasd_ccw_req *erp;
2280 int cplength, datasize;
2284 if (cqr->cpmode == 1) {
2286 datasize = sizeof(struct tcw) + sizeof(struct tsb);
2292 /* allocate additional request block */
2293 erp = dasd_alloc_erp_request((char *) &cqr->magic,
2294 cplength, datasize, device);
2296 if (cqr->retries <= 0) {
2297 DBF_DEV_EVENT(DBF_ERR, device, "%s",
2298 "Unable to allocate ERP request");
2299 cqr->status = DASD_CQR_FAILED;
2300 cqr->stopclk = get_clock ();
2302 DBF_DEV_EVENT(DBF_ERR, device,
2303 "Unable to allocate ERP request "
2304 "(%i retries left)",
2306 dasd_block_set_timer(device->block, (HZ << 3));
2312 if (cqr->cpmode == 1) {
2313 /* make a shallow copy of the original tcw but set new tsb */
2315 erp->cpaddr = erp->data;
/* &tcw[1] is the first byte behind the TCW copy, matching the datasize of
 * sizeof(struct tcw) + sizeof(struct tsb) requested above */
2317 tsb = (struct tsb *) &tcw[1];
2318 *tcw = *((struct tcw *)cqr->cpaddr);
2319 tcw->tsb = (long)tsb;
2320 } else if (ccw->cmd_code == DASD_ECKD_CCW_PSF) {
2321 /* PSF cannot be chained from NOOP/TIC */
2322 erp->cpaddr = cqr->cpaddr;
2324 /* initialize request with default TIC to current ERP/CQR */
2326 ccw->cmd_code = CCW_CMD_NOOP;
2327 ccw->flags = CCW_FLAG_CC;
2329 ccw->cmd_code = CCW_CMD_TIC;
2330 ccw->cda = (long)(cqr->cpaddr);
2333 erp->function = dasd_3990_erp_add_erp;
2335 erp->startdev = device;
2336 erp->memdev = device;
2337 erp->block = cqr->block;
2338 erp->magic = cqr->magic;
2341 erp->buildclk = get_clock();
2342 erp->status = DASD_CQR_FILLED;
2348 * DASD_3990_ERP_ADDITIONAL_ERP
2351 * An additional ERP is needed to handle the current error.
2352 * Add ERP to the head of the ERP-chain containing the ERP processing
2353 * determined based on the sense data.
2356 * cqr head of the current ERP-chain (or single cqr if
2360 * erp pointer to new ERP-chain head
/*
 * Creates a default ERP for cqr with dasd_3990_erp_add_erp() and then lets
 * dasd_3990_erp_inspect() replace or refine it based on the sense data.
 * NOTE(review): the condition between the two calls (inner lines
 * 2372-2373) and the return statement are absent from this listing -
 * check the complete file before editing.
 */
2362 static struct dasd_ccw_req *
2363 dasd_3990_erp_additional_erp(struct dasd_ccw_req * cqr)
2366 struct dasd_ccw_req *erp = NULL;
2368 /* add erp and initialize with default TIC */
2369 erp = dasd_3990_erp_add_erp(cqr);
2371 /* inspect sense, determine specific ERP if possible */
2374 erp = dasd_3990_erp_inspect(erp);
2379 } /* end dasd_3990_erp_additional_erp */
2382 * DASD_3990_ERP_ERROR_MATCH
2385 * Check if the device status of the given cqr is the same.
2386 * This means that the failed CCW and the relevant sense data
2388 * I don't distinguish between 24 and 32 byte sense because in case of
2389 * 24 byte sense bytes 25 and 27 are set as well.
2392 * cqr1 first cqr, which will be compared with the
2396 * match 'boolean' for match found
2397 * returns 1 if match found, otherwise 0.
/*
 * Compares the error state of two requests. The start devices are
 * compared first. If neither request has sense data, the interface /
 * channel control check bits of the subchannel status are compared.
 * Otherwise sense bytes 0-2, 25 and 27 must be equal for a match.
 * Returns 1 for a match and 0 otherwise.
 * NOTE(review): the short "return 0;" lines after the first two checks
 * and the braces are absent from this listing (gaps in the embedded line
 * numbers) - check the complete file before editing.
 */
2399 static int dasd_3990_erp_error_match(struct dasd_ccw_req *cqr1,
2400 struct dasd_ccw_req *cqr2)
2402 char *sense1, *sense2;
2404 if (cqr1->startdev != cqr2->startdev)
2407 sense1 = dasd_get_sense(&cqr1->irb);
2408 sense2 = dasd_get_sense(&cqr2->irb);
2410 /* one request has sense data, the other not -> no match, return 0 */
/* !p normalizes each pointer to 0/1, so this is true when exactly one of
 * the two sense pointers is NULL */
2411 if (!sense1 != !sense2)
2413 /* no sense data in both cases -> check cstat for IFCC */
2414 if (!sense1 && !sense2) {
2415 if ((scsw_cstat(&cqr1->irb.scsw) & (SCHN_STAT_INTF_CTRL_CHK |
2416 SCHN_STAT_CHN_CTRL_CHK)) ==
2417 (scsw_cstat(&cqr2->irb.scsw) & (SCHN_STAT_INTF_CTRL_CHK |
2418 SCHN_STAT_CHN_CTRL_CHK)))
2419 return 1; /* match with ifcc*/
2421 /* check sense data; byte 0-2,25,27 */
2422 if (!(sense1 && sense2 &&
2423 (memcmp(sense1, sense2, 3) == 0) &&
2424 (sense1[27] == sense2[27]) &&
2425 (sense1[25] == sense2[25]))) {
2427 return 0; /* sense doesn't match */
2430 return 1; /* match */
2432 } /* end dasd_3990_erp_error_match */
2435 * DASD_3990_ERP_IN_ERP
2438 * check if the current error already happened before.
2439 * quick exit if current cqr is not an ERP (cqr->refers=NULL)
2442 * cqr failed cqr (either original cqr or already an erp)
2445 * erp erp-pointer to the already defined error
2446 * recovery procedure OR
2447 * NULL if a 'new' error occurred.
/*
 * Walks the ERP chain starting at cqr and compares the error of the chain
 * head with each request further down the chain (cqr->refers) by calling
 * dasd_3990_erp_error_match(). The loop stops at the first match or when
 * the end of the chain is reached. Returns the saved matching erp, or NULL
 * when no match was found.
 * NOTE(review): the early return for cqr->refers == NULL, the "do {" line
 * and the "if (!match)" line are absent from this listing (gaps in the
 * embedded line numbers) - check the complete file before editing.
 */
2449 static struct dasd_ccw_req *
2450 dasd_3990_erp_in_erp(struct dasd_ccw_req *cqr)
2453 struct dasd_ccw_req *erp_head = cqr, /* save erp chain head */
2454 *erp_match = NULL; /* matching erp, if any */
2455 int match = 0; /* 'boolean' for matching error found */
2457 if (cqr->refers == NULL) { /* return if not in erp */
2461 /* check the erp/cqr chain for current error */
2463 match = dasd_3990_erp_error_match(erp_head, cqr->refers);
2464 erp_match = cqr; /* save possible matching erp */
2465 cqr = cqr->refers; /* check next erp/cqr in queue */
2467 } while ((cqr->refers != NULL) && (!match));
2470 return NULL; /* no match was found */
2473 return erp_match; /* return address of matching erp */
2475 } /* END dasd_3990_erp_in_erp */
2478 * DASD_3990_ERP_FURTHER_ERP (24 & 32 byte sense)
2481 * No retry is left for the current ERP. Check what has to be done
2483 * - do further defined ERP action or
2484 * - wait for interrupt or
2485 * - exit with permanent error
2488 * erp ERP which is in progress with no retry left
2491 * erp modified/additional ERP
/*
 * Decides what to do with an ERP that has no retries left, based on the
 * handler recorded in erp->function:
 *  - bus_out, action_1 or action_4: continue with
 *    dasd_3990_erp_action_1();
 *  - action_1_sec: continue with dasd_3990_erp_action_1_sec();
 *  - action_5: continue with dasd_3990_erp_action_1() and, when sense is
 *    available and DASD_SENSE_BIT_0 is clear in sense byte 2, issue a
 *    Diagnostic Control command whose modifier depends on sense byte 25;
 *  - one of the compound handlers: continue with
 *    dasd_3990_erp_compound();
 *  - anything else: log the failure and set erp to DASD_CQR_FAILED.
 * NOTE(review): break statements, braces, the start of the condition at
 * inner line 2545, the default label of the switch and the return
 * statement are absent from this listing - check the complete file before
 * editing.
 */
2493 static struct dasd_ccw_req *
2494 dasd_3990_erp_further_erp(struct dasd_ccw_req *erp)
2497 struct dasd_device *device = erp->startdev;
2498 char *sense = dasd_get_sense(&erp->irb);
2500 /* check for 24 byte sense ERP */
2501 if ((erp->function == dasd_3990_erp_bus_out) ||
2502 (erp->function == dasd_3990_erp_action_1) ||
2503 (erp->function == dasd_3990_erp_action_4)) {
2505 erp = dasd_3990_erp_action_1(erp);
2507 } else if (erp->function == dasd_3990_erp_action_1_sec) {
2508 erp = dasd_3990_erp_action_1_sec(erp);
2509 } else if (erp->function == dasd_3990_erp_action_5) {
2511 /* retries have not been successful */
2512 /* prepare erp for retry on different channel path */
2513 erp = dasd_3990_erp_action_1(erp);
2515 if (sense && !(sense[2] & DASD_SENSE_BIT_0)) {
2517 /* issue a Diagnostic Control command with an
2518 * Inhibit Write subcommand */
2520 switch (sense[25]) {
2522 case 0x57:{ /* controller */
2523 erp = dasd_3990_erp_DCTL(erp, 0x20);
2527 case 0x58:{ /* channel path */
2528 erp = dasd_3990_erp_DCTL(erp, 0x40);
2532 case 0x59:{ /* storage director */
2533 erp = dasd_3990_erp_DCTL(erp, 0x80);
2537 DBF_DEV_EVENT(DBF_WARNING, device,
2538 "invalid subcommand modifier 0x%x "
2539 "for Diagnostic Control Command",
2544 /* check for 32 byte sense ERP */
2546 ((erp->function == dasd_3990_erp_compound_retry) ||
2547 (erp->function == dasd_3990_erp_compound_path) ||
2548 (erp->function == dasd_3990_erp_compound_code) ||
2549 (erp->function == dasd_3990_erp_compound_config))) {
2551 erp = dasd_3990_erp_compound(erp, sense);
2555 * No retry left and no additional special handling
2558 dev_err(&device->cdev->dev,
2559 "ERP %p has run out of retries and failed\n", erp);
2561 erp->status = DASD_CQR_FAILED;
2566 } /* end dasd_3990_erp_further_erp */
2569 * DASD_3990_ERP_HANDLE_MATCH_ERP
2572 * An error occurred again and an ERP has been detected which is already
2573 * used to handle this error (e.g. retries).
2574 * All prior ERP's are assumed to be successful and therefore removed
2576 * If retry counter of matching erp is already 0, it is checked if further
2577 * action is needed (besides retry) or if the ERP has failed.
2580 * erp_head first ERP in ERP-chain
2581 * erp ERP that handles the actual error.
2585 * erp modified/additional ERP
/*
 * Handles an error for which a matching ERP already exists in the chain.
 * Every request in front of erp (walking from erp_head via ->refers) is
 * unlinked from its blocklist and freed; reaching the end of the chain
 * without finding erp is treated as a programming error (panic).
 * If erp still has retries, action 4, action 1B and intervention-required
 * ERPs get their specific re-handling and the request is set back to
 * DASD_CQR_FILLED; otherwise dasd_3990_erp_further_erp() decides what
 * happens next.
 * NOTE(review): braces, the "else" lines, part of the condition at inner
 * line 2623 and the return statement are absent from this listing - check
 * the complete file before editing.
 */
2587 static struct dasd_ccw_req *
2588 dasd_3990_erp_handle_match_erp(struct dasd_ccw_req *erp_head,
2589 struct dasd_ccw_req *erp)
2592 struct dasd_device *device = erp_head->startdev;
2593 struct dasd_ccw_req *erp_done = erp_head; /* finished req */
2594 struct dasd_ccw_req *erp_free = NULL; /* req to be freed */
2596 /* loop over successful ERPs and remove them from chanq */
2597 while (erp_done != erp) {
2599 if (erp_done == NULL) /* end of chain reached */
2600 panic(PRINTK_HEADER "Programming error in ERP! The "
2601 "original request was lost\n");
2603 /* remove the request from the device queue */
2604 list_del(&erp_done->blocklist);
/* advance to the next request before freeing the current one */
2606 erp_free = erp_done;
2607 erp_done = erp_done->refers;
2609 /* free the finished erp request */
2610 dasd_free_erp_request(erp_free, erp_free->memdev);
2614 if (erp->retries > 0) {
2616 char *sense = dasd_get_sense(&erp->refers->irb);
2618 /* check for special retries */
2619 if (sense && erp->function == dasd_3990_erp_action_4) {
2621 erp = dasd_3990_erp_action_4(erp, sense);
2624 erp->function == dasd_3990_erp_action_1B_32) {
2626 erp = dasd_3990_update_1B(erp, sense);
2628 } else if (sense && erp->function == dasd_3990_erp_int_req) {
2630 erp = dasd_3990_erp_int_req(erp);
2634 DBF_DEV_EVENT(DBF_DEBUG, device,
2635 "%i retries left for erp %p",
2638 /* handle the request again... */
2639 erp->status = DASD_CQR_FILLED;
2643 /* no retry left - check for further necessary action */
2644 /* if no further actions, handle rest as permanent error */
2645 erp = dasd_3990_erp_further_erp(erp);
2650 } /* end dasd_3990_erp_handle_match_erp */
2653 * DASD_3990_ERP_ACTION
2656 * control routine for 3990 erp actions.
2657 * Has to be called with the queue lock (namely the s390_irq_lock) acquired.
2660 * cqr failed cqr (either original cqr or already an erp)
2663 * erp erp-pointer to the head of the ERP action chain.
2665 * - either a ptr to an additional ERP cqr or
2666 * - the original given cqr (whose status might
/*
 * Entry point of the 3990 error recovery for a failed request.
 *  1. With DASD_FEATURE_ERPLOG set, the ERP chain is printed before and
 *     after processing.
 *  2. A request whose channel status is 0 and whose device status is
 *     exactly channel end + device end is treated as successful and set
 *     to DASD_CQR_DONE.
 *  3. dasd_3990_erp_in_erp() looks for an ERP that already handles this
 *     error; depending on the result either a new ERP is built with
 *     dasd_3990_erp_additional_erp() or the matching one is continued with
 *     dasd_3990_erp_handle_match_erp().
 *  4. An ERP that is not yet on a list is queued directly in front of cqr
 *     and cqr is set to DASD_CQR_IN_ERP.
 * NOTE(review): braces, the "if (erp == NULL)" / "else" lines around the
 * two ERP calls, the last dev_err() arguments and the return statements
 * are absent from this listing - check the complete file before editing.
 */
2669 struct dasd_ccw_req *
2670 dasd_3990_erp_action(struct dasd_ccw_req * cqr)
2672 struct dasd_ccw_req *erp = NULL;
2673 struct dasd_device *device = cqr->startdev;
2674 struct dasd_ccw_req *temp_erp = NULL;
2676 if (device->features & DASD_FEATURE_ERPLOG) {
2677 /* print current erp_chain */
2678 dev_err(&device->cdev->dev,
2679 "ERP chain at BEGINNING of ERP-ACTION\n");
2680 for (temp_erp = cqr;
2681 temp_erp != NULL; temp_erp = temp_erp->refers) {
2683 dev_err(&device->cdev->dev,
2684 "ERP %p (%02x) refers to %p\n",
2685 temp_erp, temp_erp->status,
2690 /* double-check if current erp/cqr was successful */
2691 if ((scsw_cstat(&cqr->irb.scsw) == 0x00) &&
2692 (scsw_dstat(&cqr->irb.scsw) ==
2693 (DEV_STAT_CHN_END | DEV_STAT_DEV_END))) {
2695 DBF_DEV_EVENT(DBF_DEBUG, device,
2696 "ERP called for successful request %p"
2697 " - NO ERP necessary", cqr);
2699 cqr->status = DASD_CQR_DONE;
2704 /* check if error happened before */
2705 erp = dasd_3990_erp_in_erp(cqr);
2708 /* no matching erp found - set up erp */
2709 erp = dasd_3990_erp_additional_erp(cqr);
2711 /* matching erp found - set all leading erp's to DONE */
2712 erp = dasd_3990_erp_handle_match_erp(cqr, erp);
2715 if (device->features & DASD_FEATURE_ERPLOG) {
2716 /* print current erp_chain */
2717 dev_err(&device->cdev->dev,
2718 "ERP chain at END of ERP-ACTION\n");
2719 for (temp_erp = erp;
2720 temp_erp != NULL; temp_erp = temp_erp->refers) {
2722 dev_err(&device->cdev->dev,
2723 "ERP %p (%02x) refers to %p\n",
2724 temp_erp, temp_erp->status,
2729 /* enqueue ERP request if it's a new one */
2730 if (list_empty(&erp->blocklist)) {
2731 cqr->status = DASD_CQR_IN_ERP;
2732 /* add erp request before the cqr */
/* list_add_tail() with cqr's own list node as the head inserts erp
 * immediately before cqr */
2733 list_add_tail(&erp->blocklist, &cqr->blocklist);
2740 } /* end dasd_3990_erp_action */