SCSI: sd: Update WRITE SAME heuristics
[firefly-linux-kernel-4.4.55.git] / drivers / scsi / sd.c
1 /*
2  *      sd.c Copyright (C) 1992 Drew Eckhardt
3  *           Copyright (C) 1993, 1994, 1995, 1999 Eric Youngdale
4  *
5  *      Linux scsi disk driver
6  *              Initial versions: Drew Eckhardt
7  *              Subsequent revisions: Eric Youngdale
8  *      Modification history:
9  *       - Drew Eckhardt <drew@colorado.edu> original
10  *       - Eric Youngdale <eric@andante.org> add scatter-gather, multiple 
11  *         outstanding request, and other enhancements.
12  *         Support loadable low-level scsi drivers.
13  *       - Jirka Hanika <geo@ff.cuni.cz> support more scsi disks using 
14  *         eight major numbers.
15  *       - Richard Gooch <rgooch@atnf.csiro.au> support devfs.
16  *       - Torben Mathiasen <tmm@image.dk> Resource allocation fixes in 
17  *         sd_init and cleanups.
18  *       - Alex Davis <letmein@erols.com> Fix problem where partition info
19  *         not being read in sd_open. Fix problem where removable media 
20  *         could be ejected after sd_open.
21  *       - Douglas Gilbert <dgilbert@interlog.com> cleanup for lk 2.5.x
22  *       - Badari Pulavarty <pbadari@us.ibm.com>, Matthew Wilcox 
23  *         <willy@debian.org>, Kurt Garloff <garloff@suse.de>: 
24  *         Support 32k/1M disks.
25  *
26  *      Logging policy (needs CONFIG_SCSI_LOGGING defined):
27  *       - setting up transfer: SCSI_LOG_HLQUEUE levels 1 and 2
28  *       - end of transfer (bh + scsi_lib): SCSI_LOG_HLCOMPLETE level 1
29  *       - entering sd_ioctl: SCSI_LOG_IOCTL level 1
30  *       - entering other commands: SCSI_LOG_HLQUEUE level 3
31  *      Note: when the logging level is set by the user, it must be greater
32  *      than the level indicated above to trigger output.       
33  */
34
35 #include <linux/module.h>
36 #include <linux/fs.h>
37 #include <linux/kernel.h>
38 #include <linux/mm.h>
39 #include <linux/bio.h>
40 #include <linux/genhd.h>
41 #include <linux/hdreg.h>
42 #include <linux/errno.h>
43 #include <linux/idr.h>
44 #include <linux/interrupt.h>
45 #include <linux/init.h>
46 #include <linux/blkdev.h>
47 #include <linux/blkpg.h>
48 #include <linux/delay.h>
49 #include <linux/mutex.h>
50 #include <linux/string_helpers.h>
51 #include <linux/async.h>
52 #include <linux/slab.h>
53 #include <linux/pm_runtime.h>
54 #include <asm/uaccess.h>
55 #include <asm/unaligned.h>
56
57 #include <scsi/scsi.h>
58 #include <scsi/scsi_cmnd.h>
59 #include <scsi/scsi_dbg.h>
60 #include <scsi/scsi_device.h>
61 #include <scsi/scsi_driver.h>
62 #include <scsi/scsi_eh.h>
63 #include <scsi/scsi_host.h>
64 #include <scsi/scsi_ioctl.h>
65 #include <scsi/scsicam.h>
66
67 #include "sd.h"
68 #include "scsi_priv.h"
69 #include "scsi_logging.h"
70
71 MODULE_AUTHOR("Eric Youngdale");
72 MODULE_DESCRIPTION("SCSI disk (sd) driver");
73 MODULE_LICENSE("GPL");
74
75 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK0_MAJOR);
76 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK1_MAJOR);
77 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK2_MAJOR);
78 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK3_MAJOR);
79 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK4_MAJOR);
80 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK5_MAJOR);
81 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK6_MAJOR);
82 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK7_MAJOR);
83 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK8_MAJOR);
84 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK9_MAJOR);
85 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK10_MAJOR);
86 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK11_MAJOR);
87 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK12_MAJOR);
88 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK13_MAJOR);
89 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK14_MAJOR);
90 MODULE_ALIAS_BLOCKDEV_MAJOR(SCSI_DISK15_MAJOR);
91 MODULE_ALIAS_SCSI_DEVICE(TYPE_DISK);
92 MODULE_ALIAS_SCSI_DEVICE(TYPE_MOD);
93 MODULE_ALIAS_SCSI_DEVICE(TYPE_RBC);
94
95 #if !defined(CONFIG_DEBUG_BLOCK_EXT_DEVT)
96 #define SD_MINORS       16
97 #else
98 #define SD_MINORS       0
99 #endif
100
101 static void sd_config_discard(struct scsi_disk *, unsigned int);
102 static void sd_config_write_same(struct scsi_disk *);
103 static int  sd_revalidate_disk(struct gendisk *);
104 static void sd_unlock_native_capacity(struct gendisk *disk);
105 static int  sd_probe(struct device *);
106 static int  sd_remove(struct device *);
107 static void sd_shutdown(struct device *);
108 static int sd_suspend(struct device *);
109 static int sd_resume(struct device *);
110 static void sd_rescan(struct device *);
111 static int sd_done(struct scsi_cmnd *);
112 static int sd_eh_action(struct scsi_cmnd *, unsigned char *, int, int);
113 static void sd_read_capacity(struct scsi_disk *sdkp, unsigned char *buffer);
114 static void scsi_disk_release(struct device *cdev);
115 static void sd_print_sense_hdr(struct scsi_disk *, struct scsi_sense_hdr *);
116 static void sd_print_result(struct scsi_disk *, int);
117
118 static DEFINE_SPINLOCK(sd_index_lock);
119 static DEFINE_IDA(sd_index_ida);
120
121 /* This semaphore is used to mediate the 0->1 reference get in the
122  * face of object destruction (i.e. we can't allow a get on an
123  * object after last put) */
124 static DEFINE_MUTEX(sd_ref_mutex);
125
126 static struct kmem_cache *sd_cdb_cache;
127 static mempool_t *sd_cdb_pool;
128
129 static const char *sd_cache_types[] = {
130         "write through", "none", "write back",
131         "write back, no read (daft)"
132 };
133
134 static ssize_t
135 sd_store_cache_type(struct device *dev, struct device_attribute *attr,
136                     const char *buf, size_t count)
137 {
138         int i, ct = -1, rcd, wce, sp;
139         struct scsi_disk *sdkp = to_scsi_disk(dev);
140         struct scsi_device *sdp = sdkp->device;
141         char buffer[64];
142         char *buffer_data;
143         struct scsi_mode_data data;
144         struct scsi_sense_hdr sshdr;
145         static const char temp[] = "temporary ";
146         int len;
147
148         if (sdp->type != TYPE_DISK)
149                 /* no cache control on RBC devices; theoretically they
150                  * can do it, but there's probably so many exceptions
151                  * it's not worth the risk */
152                 return -EINVAL;
153
154         if (strncmp(buf, temp, sizeof(temp) - 1) == 0) {
155                 buf += sizeof(temp) - 1;
156                 sdkp->cache_override = 1;
157         } else {
158                 sdkp->cache_override = 0;
159         }
160
161         for (i = 0; i < ARRAY_SIZE(sd_cache_types); i++) {
162                 len = strlen(sd_cache_types[i]);
163                 if (strncmp(sd_cache_types[i], buf, len) == 0 &&
164                     buf[len] == '\n') {
165                         ct = i;
166                         break;
167                 }
168         }
169         if (ct < 0)
170                 return -EINVAL;
171         rcd = ct & 0x01 ? 1 : 0;
172         wce = ct & 0x02 ? 1 : 0;
173
174         if (sdkp->cache_override) {
175                 sdkp->WCE = wce;
176                 sdkp->RCD = rcd;
177                 return count;
178         }
179
180         if (scsi_mode_sense(sdp, 0x08, 8, buffer, sizeof(buffer), SD_TIMEOUT,
181                             SD_MAX_RETRIES, &data, NULL))
182                 return -EINVAL;
183         len = min_t(size_t, sizeof(buffer), data.length - data.header_length -
184                   data.block_descriptor_length);
185         buffer_data = buffer + data.header_length +
186                 data.block_descriptor_length;
187         buffer_data[2] &= ~0x05;
188         buffer_data[2] |= wce << 2 | rcd;
189         sp = buffer_data[0] & 0x80 ? 1 : 0;
190
191         if (scsi_mode_select(sdp, 1, sp, 8, buffer_data, len, SD_TIMEOUT,
192                              SD_MAX_RETRIES, &data, &sshdr)) {
193                 if (scsi_sense_valid(&sshdr))
194                         sd_print_sense_hdr(sdkp, &sshdr);
195                 return -EINVAL;
196         }
197         revalidate_disk(sdkp->disk);
198         return count;
199 }
200
201 static ssize_t
202 sd_store_manage_start_stop(struct device *dev, struct device_attribute *attr,
203                            const char *buf, size_t count)
204 {
205         struct scsi_disk *sdkp = to_scsi_disk(dev);
206         struct scsi_device *sdp = sdkp->device;
207
208         if (!capable(CAP_SYS_ADMIN))
209                 return -EACCES;
210
211         sdp->manage_start_stop = simple_strtoul(buf, NULL, 10);
212
213         return count;
214 }
215
216 static ssize_t
217 sd_store_allow_restart(struct device *dev, struct device_attribute *attr,
218                        const char *buf, size_t count)
219 {
220         struct scsi_disk *sdkp = to_scsi_disk(dev);
221         struct scsi_device *sdp = sdkp->device;
222
223         if (!capable(CAP_SYS_ADMIN))
224                 return -EACCES;
225
226         if (sdp->type != TYPE_DISK)
227                 return -EINVAL;
228
229         sdp->allow_restart = simple_strtoul(buf, NULL, 10);
230
231         return count;
232 }
233
234 static ssize_t
235 sd_show_cache_type(struct device *dev, struct device_attribute *attr,
236                    char *buf)
237 {
238         struct scsi_disk *sdkp = to_scsi_disk(dev);
239         int ct = sdkp->RCD + 2*sdkp->WCE;
240
241         return snprintf(buf, 40, "%s\n", sd_cache_types[ct]);
242 }
243
244 static ssize_t
245 sd_show_fua(struct device *dev, struct device_attribute *attr, char *buf)
246 {
247         struct scsi_disk *sdkp = to_scsi_disk(dev);
248
249         return snprintf(buf, 20, "%u\n", sdkp->DPOFUA);
250 }
251
252 static ssize_t
253 sd_show_manage_start_stop(struct device *dev, struct device_attribute *attr,
254                           char *buf)
255 {
256         struct scsi_disk *sdkp = to_scsi_disk(dev);
257         struct scsi_device *sdp = sdkp->device;
258
259         return snprintf(buf, 20, "%u\n", sdp->manage_start_stop);
260 }
261
262 static ssize_t
263 sd_show_allow_restart(struct device *dev, struct device_attribute *attr,
264                       char *buf)
265 {
266         struct scsi_disk *sdkp = to_scsi_disk(dev);
267
268         return snprintf(buf, 40, "%d\n", sdkp->device->allow_restart);
269 }
270
271 static ssize_t
272 sd_show_protection_type(struct device *dev, struct device_attribute *attr,
273                         char *buf)
274 {
275         struct scsi_disk *sdkp = to_scsi_disk(dev);
276
277         return snprintf(buf, 20, "%u\n", sdkp->protection_type);
278 }
279
280 static ssize_t
281 sd_store_protection_type(struct device *dev, struct device_attribute *attr,
282                          const char *buf, size_t count)
283 {
284         struct scsi_disk *sdkp = to_scsi_disk(dev);
285         unsigned int val;
286         int err;
287
288         if (!capable(CAP_SYS_ADMIN))
289                 return -EACCES;
290
291         err = kstrtouint(buf, 10, &val);
292
293         if (err)
294                 return err;
295
296         if (val >= 0 && val <= SD_DIF_TYPE3_PROTECTION)
297                 sdkp->protection_type = val;
298
299         return count;
300 }
301
302 static ssize_t
303 sd_show_protection_mode(struct device *dev, struct device_attribute *attr,
304                         char *buf)
305 {
306         struct scsi_disk *sdkp = to_scsi_disk(dev);
307         struct scsi_device *sdp = sdkp->device;
308         unsigned int dif, dix;
309
310         dif = scsi_host_dif_capable(sdp->host, sdkp->protection_type);
311         dix = scsi_host_dix_capable(sdp->host, sdkp->protection_type);
312
313         if (!dix && scsi_host_dix_capable(sdp->host, SD_DIF_TYPE0_PROTECTION)) {
314                 dif = 0;
315                 dix = 1;
316         }
317
318         if (!dif && !dix)
319                 return snprintf(buf, 20, "none\n");
320
321         return snprintf(buf, 20, "%s%u\n", dix ? "dix" : "dif", dif);
322 }
323
324 static ssize_t
325 sd_show_app_tag_own(struct device *dev, struct device_attribute *attr,
326                     char *buf)
327 {
328         struct scsi_disk *sdkp = to_scsi_disk(dev);
329
330         return snprintf(buf, 20, "%u\n", sdkp->ATO);
331 }
332
333 static ssize_t
334 sd_show_thin_provisioning(struct device *dev, struct device_attribute *attr,
335                           char *buf)
336 {
337         struct scsi_disk *sdkp = to_scsi_disk(dev);
338
339         return snprintf(buf, 20, "%u\n", sdkp->lbpme);
340 }
341
342 static const char *lbp_mode[] = {
343         [SD_LBP_FULL]           = "full",
344         [SD_LBP_UNMAP]          = "unmap",
345         [SD_LBP_WS16]           = "writesame_16",
346         [SD_LBP_WS10]           = "writesame_10",
347         [SD_LBP_ZERO]           = "writesame_zero",
348         [SD_LBP_DISABLE]        = "disabled",
349 };
350
351 static ssize_t
352 sd_show_provisioning_mode(struct device *dev, struct device_attribute *attr,
353                           char *buf)
354 {
355         struct scsi_disk *sdkp = to_scsi_disk(dev);
356
357         return snprintf(buf, 20, "%s\n", lbp_mode[sdkp->provisioning_mode]);
358 }
359
360 static ssize_t
361 sd_store_provisioning_mode(struct device *dev, struct device_attribute *attr,
362                            const char *buf, size_t count)
363 {
364         struct scsi_disk *sdkp = to_scsi_disk(dev);
365         struct scsi_device *sdp = sdkp->device;
366
367         if (!capable(CAP_SYS_ADMIN))
368                 return -EACCES;
369
370         if (sdp->type != TYPE_DISK)
371                 return -EINVAL;
372
373         if (!strncmp(buf, lbp_mode[SD_LBP_UNMAP], 20))
374                 sd_config_discard(sdkp, SD_LBP_UNMAP);
375         else if (!strncmp(buf, lbp_mode[SD_LBP_WS16], 20))
376                 sd_config_discard(sdkp, SD_LBP_WS16);
377         else if (!strncmp(buf, lbp_mode[SD_LBP_WS10], 20))
378                 sd_config_discard(sdkp, SD_LBP_WS10);
379         else if (!strncmp(buf, lbp_mode[SD_LBP_ZERO], 20))
380                 sd_config_discard(sdkp, SD_LBP_ZERO);
381         else if (!strncmp(buf, lbp_mode[SD_LBP_DISABLE], 20))
382                 sd_config_discard(sdkp, SD_LBP_DISABLE);
383         else
384                 return -EINVAL;
385
386         return count;
387 }
388
389 static ssize_t
390 sd_show_max_medium_access_timeouts(struct device *dev,
391                                    struct device_attribute *attr, char *buf)
392 {
393         struct scsi_disk *sdkp = to_scsi_disk(dev);
394
395         return snprintf(buf, 20, "%u\n", sdkp->max_medium_access_timeouts);
396 }
397
398 static ssize_t
399 sd_store_max_medium_access_timeouts(struct device *dev,
400                                     struct device_attribute *attr,
401                                     const char *buf, size_t count)
402 {
403         struct scsi_disk *sdkp = to_scsi_disk(dev);
404         int err;
405
406         if (!capable(CAP_SYS_ADMIN))
407                 return -EACCES;
408
409         err = kstrtouint(buf, 10, &sdkp->max_medium_access_timeouts);
410
411         return err ? err : count;
412 }
413
414 static ssize_t
415 sd_show_write_same_blocks(struct device *dev, struct device_attribute *attr,
416                           char *buf)
417 {
418         struct scsi_disk *sdkp = to_scsi_disk(dev);
419
420         return snprintf(buf, 20, "%u\n", sdkp->max_ws_blocks);
421 }
422
423 static ssize_t
424 sd_store_write_same_blocks(struct device *dev, struct device_attribute *attr,
425                            const char *buf, size_t count)
426 {
427         struct scsi_disk *sdkp = to_scsi_disk(dev);
428         struct scsi_device *sdp = sdkp->device;
429         unsigned long max;
430         int err;
431
432         if (!capable(CAP_SYS_ADMIN))
433                 return -EACCES;
434
435         if (sdp->type != TYPE_DISK)
436                 return -EINVAL;
437
438         err = kstrtoul(buf, 10, &max);
439
440         if (err)
441                 return err;
442
443         if (max == 0)
444                 sdp->no_write_same = 1;
445         else if (max <= SD_MAX_WS16_BLOCKS) {
446                 sdp->no_write_same = 0;
447                 sdkp->max_ws_blocks = max;
448         }
449
450         sd_config_write_same(sdkp);
451
452         return count;
453 }
454
455 static struct device_attribute sd_disk_attrs[] = {
456         __ATTR(cache_type, S_IRUGO|S_IWUSR, sd_show_cache_type,
457                sd_store_cache_type),
458         __ATTR(FUA, S_IRUGO, sd_show_fua, NULL),
459         __ATTR(allow_restart, S_IRUGO|S_IWUSR, sd_show_allow_restart,
460                sd_store_allow_restart),
461         __ATTR(manage_start_stop, S_IRUGO|S_IWUSR, sd_show_manage_start_stop,
462                sd_store_manage_start_stop),
463         __ATTR(protection_type, S_IRUGO|S_IWUSR, sd_show_protection_type,
464                sd_store_protection_type),
465         __ATTR(protection_mode, S_IRUGO, sd_show_protection_mode, NULL),
466         __ATTR(app_tag_own, S_IRUGO, sd_show_app_tag_own, NULL),
467         __ATTR(thin_provisioning, S_IRUGO, sd_show_thin_provisioning, NULL),
468         __ATTR(provisioning_mode, S_IRUGO|S_IWUSR, sd_show_provisioning_mode,
469                sd_store_provisioning_mode),
470         __ATTR(max_write_same_blocks, S_IRUGO|S_IWUSR,
471                sd_show_write_same_blocks, sd_store_write_same_blocks),
472         __ATTR(max_medium_access_timeouts, S_IRUGO|S_IWUSR,
473                sd_show_max_medium_access_timeouts,
474                sd_store_max_medium_access_timeouts),
475         __ATTR_NULL,
476 };
477
478 static struct class sd_disk_class = {
479         .name           = "scsi_disk",
480         .owner          = THIS_MODULE,
481         .dev_release    = scsi_disk_release,
482         .dev_attrs      = sd_disk_attrs,
483 };
484
485 static const struct dev_pm_ops sd_pm_ops = {
486         .suspend                = sd_suspend,
487         .resume                 = sd_resume,
488         .poweroff               = sd_suspend,
489         .restore                = sd_resume,
490         .runtime_suspend        = sd_suspend,
491         .runtime_resume         = sd_resume,
492 };
493
494 static struct scsi_driver sd_template = {
495         .owner                  = THIS_MODULE,
496         .gendrv = {
497                 .name           = "sd",
498                 .probe          = sd_probe,
499                 .remove         = sd_remove,
500                 .shutdown       = sd_shutdown,
501                 .pm             = &sd_pm_ops,
502         },
503         .rescan                 = sd_rescan,
504         .done                   = sd_done,
505         .eh_action              = sd_eh_action,
506 };
507
508 /*
509  * Device no to disk mapping:
510  * 
511  *       major         disc2     disc  p1
512  *   |............|.............|....|....| <- dev_t
513  *    31        20 19          8 7  4 3  0
514  * 
515  * Inside a major, we have 16k disks, however mapped non-
516  * contiguously. The first 16 disks are for major0, the next
517  * ones with major1, ... Disk 256 is for major0 again, disk 272 
518  * for major1, ... 
519  * As we stay compatible with our numbering scheme, we can reuse 
520  * the well-know SCSI majors 8, 65--71, 136--143.
521  */
522 static int sd_major(int major_idx)
523 {
524         switch (major_idx) {
525         case 0:
526                 return SCSI_DISK0_MAJOR;
527         case 1 ... 7:
528                 return SCSI_DISK1_MAJOR + major_idx - 1;
529         case 8 ... 15:
530                 return SCSI_DISK8_MAJOR + major_idx - 8;
531         default:
532                 BUG();
533                 return 0;       /* shut up gcc */
534         }
535 }
536
537 static struct scsi_disk *__scsi_disk_get(struct gendisk *disk)
538 {
539         struct scsi_disk *sdkp = NULL;
540
541         if (disk->private_data) {
542                 sdkp = scsi_disk(disk);
543                 if (scsi_device_get(sdkp->device) == 0)
544                         get_device(&sdkp->dev);
545                 else
546                         sdkp = NULL;
547         }
548         return sdkp;
549 }
550
551 static struct scsi_disk *scsi_disk_get(struct gendisk *disk)
552 {
553         struct scsi_disk *sdkp;
554
555         mutex_lock(&sd_ref_mutex);
556         sdkp = __scsi_disk_get(disk);
557         mutex_unlock(&sd_ref_mutex);
558         return sdkp;
559 }
560
561 static struct scsi_disk *scsi_disk_get_from_dev(struct device *dev)
562 {
563         struct scsi_disk *sdkp;
564
565         mutex_lock(&sd_ref_mutex);
566         sdkp = dev_get_drvdata(dev);
567         if (sdkp)
568                 sdkp = __scsi_disk_get(sdkp->disk);
569         mutex_unlock(&sd_ref_mutex);
570         return sdkp;
571 }
572
573 static void scsi_disk_put(struct scsi_disk *sdkp)
574 {
575         struct scsi_device *sdev = sdkp->device;
576
577         mutex_lock(&sd_ref_mutex);
578         put_device(&sdkp->dev);
579         scsi_device_put(sdev);
580         mutex_unlock(&sd_ref_mutex);
581 }
582
583 static void sd_prot_op(struct scsi_cmnd *scmd, unsigned int dif)
584 {
585         unsigned int prot_op = SCSI_PROT_NORMAL;
586         unsigned int dix = scsi_prot_sg_count(scmd);
587
588         if (scmd->sc_data_direction == DMA_FROM_DEVICE) {
589                 if (dif && dix)
590                         prot_op = SCSI_PROT_READ_PASS;
591                 else if (dif && !dix)
592                         prot_op = SCSI_PROT_READ_STRIP;
593                 else if (!dif && dix)
594                         prot_op = SCSI_PROT_READ_INSERT;
595         } else {
596                 if (dif && dix)
597                         prot_op = SCSI_PROT_WRITE_PASS;
598                 else if (dif && !dix)
599                         prot_op = SCSI_PROT_WRITE_INSERT;
600                 else if (!dif && dix)
601                         prot_op = SCSI_PROT_WRITE_STRIP;
602         }
603
604         scsi_set_prot_op(scmd, prot_op);
605         scsi_set_prot_type(scmd, dif);
606 }
607
608 static void sd_config_discard(struct scsi_disk *sdkp, unsigned int mode)
609 {
610         struct request_queue *q = sdkp->disk->queue;
611         unsigned int logical_block_size = sdkp->device->sector_size;
612         unsigned int max_blocks = 0;
613
614         q->limits.discard_zeroes_data = sdkp->lbprz;
615         q->limits.discard_alignment = sdkp->unmap_alignment *
616                 logical_block_size;
617         q->limits.discard_granularity =
618                 max(sdkp->physical_block_size,
619                     sdkp->unmap_granularity * logical_block_size);
620
621         sdkp->provisioning_mode = mode;
622
623         switch (mode) {
624
625         case SD_LBP_DISABLE:
626                 q->limits.max_discard_sectors = 0;
627                 queue_flag_clear_unlocked(QUEUE_FLAG_DISCARD, q);
628                 return;
629
630         case SD_LBP_UNMAP:
631                 max_blocks = min_not_zero(sdkp->max_unmap_blocks,
632                                           (u32)SD_MAX_WS16_BLOCKS);
633                 break;
634
635         case SD_LBP_WS16:
636                 max_blocks = min_not_zero(sdkp->max_ws_blocks,
637                                           (u32)SD_MAX_WS16_BLOCKS);
638                 break;
639
640         case SD_LBP_WS10:
641                 max_blocks = min_not_zero(sdkp->max_ws_blocks,
642                                           (u32)SD_MAX_WS10_BLOCKS);
643                 break;
644
645         case SD_LBP_ZERO:
646                 max_blocks = min_not_zero(sdkp->max_ws_blocks,
647                                           (u32)SD_MAX_WS10_BLOCKS);
648                 q->limits.discard_zeroes_data = 1;
649                 break;
650         }
651
652         q->limits.max_discard_sectors = max_blocks * (logical_block_size >> 9);
653         queue_flag_set_unlocked(QUEUE_FLAG_DISCARD, q);
654 }
655
656 /**
657  * sd_setup_discard_cmnd - unmap blocks on thinly provisioned device
658  * @sdp: scsi device to operate one
659  * @rq: Request to prepare
660  *
661  * Will issue either UNMAP or WRITE SAME(16) depending on preference
662  * indicated by target device.
663  **/
664 static int sd_setup_discard_cmnd(struct scsi_device *sdp, struct request *rq)
665 {
666         struct scsi_disk *sdkp = scsi_disk(rq->rq_disk);
667         sector_t sector = blk_rq_pos(rq);
668         unsigned int nr_sectors = blk_rq_sectors(rq);
669         unsigned int nr_bytes = blk_rq_bytes(rq);
670         unsigned int len;
671         int ret;
672         char *buf;
673         struct page *page;
674
675         sector >>= ilog2(sdp->sector_size) - 9;
676         nr_sectors >>= ilog2(sdp->sector_size) - 9;
677         rq->timeout = SD_TIMEOUT;
678
679         memset(rq->cmd, 0, rq->cmd_len);
680
681         page = alloc_page(GFP_ATOMIC | __GFP_ZERO);
682         if (!page)
683                 return BLKPREP_DEFER;
684
685         switch (sdkp->provisioning_mode) {
686         case SD_LBP_UNMAP:
687                 buf = page_address(page);
688
689                 rq->cmd_len = 10;
690                 rq->cmd[0] = UNMAP;
691                 rq->cmd[8] = 24;
692
693                 put_unaligned_be16(6 + 16, &buf[0]);
694                 put_unaligned_be16(16, &buf[2]);
695                 put_unaligned_be64(sector, &buf[8]);
696                 put_unaligned_be32(nr_sectors, &buf[16]);
697
698                 len = 24;
699                 break;
700
701         case SD_LBP_WS16:
702                 rq->cmd_len = 16;
703                 rq->cmd[0] = WRITE_SAME_16;
704                 rq->cmd[1] = 0x8; /* UNMAP */
705                 put_unaligned_be64(sector, &rq->cmd[2]);
706                 put_unaligned_be32(nr_sectors, &rq->cmd[10]);
707
708                 len = sdkp->device->sector_size;
709                 break;
710
711         case SD_LBP_WS10:
712         case SD_LBP_ZERO:
713                 rq->cmd_len = 10;
714                 rq->cmd[0] = WRITE_SAME;
715                 if (sdkp->provisioning_mode == SD_LBP_WS10)
716                         rq->cmd[1] = 0x8; /* UNMAP */
717                 put_unaligned_be32(sector, &rq->cmd[2]);
718                 put_unaligned_be16(nr_sectors, &rq->cmd[7]);
719
720                 len = sdkp->device->sector_size;
721                 break;
722
723         default:
724                 ret = BLKPREP_KILL;
725                 goto out;
726         }
727
728         blk_add_request_payload(rq, page, len);
729         ret = scsi_setup_blk_pc_cmnd(sdp, rq);
730         rq->buffer = page_address(page);
731         rq->__data_len = nr_bytes;
732
733 out:
734         if (ret != BLKPREP_OK) {
735                 __free_page(page);
736                 rq->buffer = NULL;
737         }
738         return ret;
739 }
740
741 static void sd_config_write_same(struct scsi_disk *sdkp)
742 {
743         struct request_queue *q = sdkp->disk->queue;
744         unsigned int logical_block_size = sdkp->device->sector_size;
745
746         if (sdkp->device->no_write_same) {
747                 sdkp->max_ws_blocks = 0;
748                 goto out;
749         }
750
751         /* Some devices can not handle block counts above 0xffff despite
752          * supporting WRITE SAME(16). Consequently we default to 64k
753          * blocks per I/O unless the device explicitly advertises a
754          * bigger limit.
755          */
756         if (sdkp->max_ws_blocks > SD_MAX_WS10_BLOCKS)
757                 sdkp->max_ws_blocks = min_not_zero(sdkp->max_ws_blocks,
758                                                    (u32)SD_MAX_WS16_BLOCKS);
759         else if (sdkp->ws16 || sdkp->ws10 || sdkp->device->no_report_opcodes)
760                 sdkp->max_ws_blocks = min_not_zero(sdkp->max_ws_blocks,
761                                                    (u32)SD_MAX_WS10_BLOCKS);
762         else {
763                 sdkp->device->no_write_same = 1;
764                 sdkp->max_ws_blocks = 0;
765         }
766
767 out:
768         blk_queue_max_write_same_sectors(q, sdkp->max_ws_blocks *
769                                          (logical_block_size >> 9));
770 }
771
772 /**
773  * sd_setup_write_same_cmnd - write the same data to multiple blocks
774  * @sdp: scsi device to operate one
775  * @rq: Request to prepare
776  *
777  * Will issue either WRITE SAME(10) or WRITE SAME(16) depending on
778  * preference indicated by target device.
779  **/
780 static int sd_setup_write_same_cmnd(struct scsi_device *sdp, struct request *rq)
781 {
782         struct scsi_disk *sdkp = scsi_disk(rq->rq_disk);
783         struct bio *bio = rq->bio;
784         sector_t sector = blk_rq_pos(rq);
785         unsigned int nr_sectors = blk_rq_sectors(rq);
786         unsigned int nr_bytes = blk_rq_bytes(rq);
787         int ret;
788
789         if (sdkp->device->no_write_same)
790                 return BLKPREP_KILL;
791
792         BUG_ON(bio_offset(bio) || bio_iovec(bio)->bv_len != sdp->sector_size);
793
794         sector >>= ilog2(sdp->sector_size) - 9;
795         nr_sectors >>= ilog2(sdp->sector_size) - 9;
796
797         rq->__data_len = sdp->sector_size;
798         rq->timeout = SD_WRITE_SAME_TIMEOUT;
799         memset(rq->cmd, 0, rq->cmd_len);
800
801         if (sdkp->ws16 || sector > 0xffffffff || nr_sectors > 0xffff) {
802                 rq->cmd_len = 16;
803                 rq->cmd[0] = WRITE_SAME_16;
804                 put_unaligned_be64(sector, &rq->cmd[2]);
805                 put_unaligned_be32(nr_sectors, &rq->cmd[10]);
806         } else {
807                 rq->cmd_len = 10;
808                 rq->cmd[0] = WRITE_SAME;
809                 put_unaligned_be32(sector, &rq->cmd[2]);
810                 put_unaligned_be16(nr_sectors, &rq->cmd[7]);
811         }
812
813         ret = scsi_setup_blk_pc_cmnd(sdp, rq);
814         rq->__data_len = nr_bytes;
815
816         return ret;
817 }
818
819 static int scsi_setup_flush_cmnd(struct scsi_device *sdp, struct request *rq)
820 {
821         rq->timeout = SD_FLUSH_TIMEOUT;
822         rq->retries = SD_MAX_RETRIES;
823         rq->cmd[0] = SYNCHRONIZE_CACHE;
824         rq->cmd_len = 10;
825
826         return scsi_setup_blk_pc_cmnd(sdp, rq);
827 }
828
829 static void sd_unprep_fn(struct request_queue *q, struct request *rq)
830 {
831         if (rq->cmd_flags & REQ_DISCARD) {
832                 free_page((unsigned long)rq->buffer);
833                 rq->buffer = NULL;
834         }
835 }
836
837 /**
838  *      sd_prep_fn - build a scsi (read or write) command from
839  *      information in the request structure.
840  *      @SCpnt: pointer to mid-level's per scsi command structure that
841  *      contains request and into which the scsi command is written
842  *
843  *      Returns 1 if successful and 0 if error (or cannot be done now).
844  **/
845 static int sd_prep_fn(struct request_queue *q, struct request *rq)
846 {
847         struct scsi_cmnd *SCpnt;
848         struct scsi_device *sdp = q->queuedata;
849         struct gendisk *disk = rq->rq_disk;
850         struct scsi_disk *sdkp;
851         sector_t block = blk_rq_pos(rq);
852         sector_t threshold;
853         unsigned int this_count = blk_rq_sectors(rq);
854         int ret, host_dif;
855         unsigned char protect;
856
857         /*
858          * Discard request come in as REQ_TYPE_FS but we turn them into
859          * block PC requests to make life easier.
860          */
861         if (rq->cmd_flags & REQ_DISCARD) {
862                 ret = sd_setup_discard_cmnd(sdp, rq);
863                 goto out;
864         } else if (rq->cmd_flags & REQ_WRITE_SAME) {
865                 ret = sd_setup_write_same_cmnd(sdp, rq);
866                 goto out;
867         } else if (rq->cmd_flags & REQ_FLUSH) {
868                 ret = scsi_setup_flush_cmnd(sdp, rq);
869                 goto out;
870         } else if (rq->cmd_type == REQ_TYPE_BLOCK_PC) {
871                 ret = scsi_setup_blk_pc_cmnd(sdp, rq);
872                 goto out;
873         } else if (rq->cmd_type != REQ_TYPE_FS) {
874                 ret = BLKPREP_KILL;
875                 goto out;
876         }
877         ret = scsi_setup_fs_cmnd(sdp, rq);
878         if (ret != BLKPREP_OK)
879                 goto out;
880         SCpnt = rq->special;
881         sdkp = scsi_disk(disk);
882
883         /* from here on until we're complete, any goto out
884          * is used for a killable error condition */
885         ret = BLKPREP_KILL;
886
887         SCSI_LOG_HLQUEUE(1, scmd_printk(KERN_INFO, SCpnt,
888                                         "sd_prep_fn: block=%llu, "
889                                         "count=%d\n",
890                                         (unsigned long long)block,
891                                         this_count));
892
893         if (!sdp || !scsi_device_online(sdp) ||
894             block + blk_rq_sectors(rq) > get_capacity(disk)) {
895                 SCSI_LOG_HLQUEUE(2, scmd_printk(KERN_INFO, SCpnt,
896                                                 "Finishing %u sectors\n",
897                                                 blk_rq_sectors(rq)));
898                 SCSI_LOG_HLQUEUE(2, scmd_printk(KERN_INFO, SCpnt,
899                                                 "Retry with 0x%p\n", SCpnt));
900                 goto out;
901         }
902
903         if (sdp->changed) {
904                 /*
905                  * quietly refuse to do anything to a changed disc until 
906                  * the changed bit has been reset
907                  */
908                 /* printk("SCSI disk has been changed or is not present. Prohibiting further I/O.\n"); */
909                 goto out;
910         }
911
912         /*
913          * Some SD card readers can't handle multi-sector accesses which touch
914          * the last one or two hardware sectors.  Split accesses as needed.
915          */
916         threshold = get_capacity(disk) - SD_LAST_BUGGY_SECTORS *
917                 (sdp->sector_size / 512);
918
919         if (unlikely(sdp->last_sector_bug && block + this_count > threshold)) {
920                 if (block < threshold) {
921                         /* Access up to the threshold but not beyond */
922                         this_count = threshold - block;
923                 } else {
924                         /* Access only a single hardware sector */
925                         this_count = sdp->sector_size / 512;
926                 }
927         }
928
929         SCSI_LOG_HLQUEUE(2, scmd_printk(KERN_INFO, SCpnt, "block=%llu\n",
930                                         (unsigned long long)block));
931
932         /*
933          * If we have a 1K hardware sectorsize, prevent access to single
934          * 512 byte sectors.  In theory we could handle this - in fact
935          * the scsi cdrom driver must be able to handle this because
936          * we typically use 1K blocksizes, and cdroms typically have
937          * 2K hardware sectorsizes.  Of course, things are simpler
938          * with the cdrom, since it is read-only.  For performance
939          * reasons, the filesystems should be able to handle this
940          * and not force the scsi disk driver to use bounce buffers
941          * for this.
942          */
943         if (sdp->sector_size == 1024) {
944                 if ((block & 1) || (blk_rq_sectors(rq) & 1)) {
945                         scmd_printk(KERN_ERR, SCpnt,
946                                     "Bad block number requested\n");
947                         goto out;
948                 } else {
949                         block = block >> 1;
950                         this_count = this_count >> 1;
951                 }
952         }
953         if (sdp->sector_size == 2048) {
954                 if ((block & 3) || (blk_rq_sectors(rq) & 3)) {
955                         scmd_printk(KERN_ERR, SCpnt,
956                                     "Bad block number requested\n");
957                         goto out;
958                 } else {
959                         block = block >> 2;
960                         this_count = this_count >> 2;
961                 }
962         }
963         if (sdp->sector_size == 4096) {
964                 if ((block & 7) || (blk_rq_sectors(rq) & 7)) {
965                         scmd_printk(KERN_ERR, SCpnt,
966                                     "Bad block number requested\n");
967                         goto out;
968                 } else {
969                         block = block >> 3;
970                         this_count = this_count >> 3;
971                 }
972         }
973         if (rq_data_dir(rq) == WRITE) {
974                 if (!sdp->writeable) {
975                         goto out;
976                 }
977                 SCpnt->cmnd[0] = WRITE_6;
978                 SCpnt->sc_data_direction = DMA_TO_DEVICE;
979
980                 if (blk_integrity_rq(rq))
981                         sd_dif_prepare(rq, block, sdp->sector_size);
982
983         } else if (rq_data_dir(rq) == READ) {
984                 SCpnt->cmnd[0] = READ_6;
985                 SCpnt->sc_data_direction = DMA_FROM_DEVICE;
986         } else {
987                 scmd_printk(KERN_ERR, SCpnt, "Unknown command %x\n", rq->cmd_flags);
988                 goto out;
989         }
990
991         SCSI_LOG_HLQUEUE(2, scmd_printk(KERN_INFO, SCpnt,
992                                         "%s %d/%u 512 byte blocks.\n",
993                                         (rq_data_dir(rq) == WRITE) ?
994                                         "writing" : "reading", this_count,
995                                         blk_rq_sectors(rq)));
996
997         /* Set RDPROTECT/WRPROTECT if disk is formatted with DIF */
998         host_dif = scsi_host_dif_capable(sdp->host, sdkp->protection_type);
999         if (host_dif)
1000                 protect = 1 << 5;
1001         else
1002                 protect = 0;
1003
1004         if (host_dif == SD_DIF_TYPE2_PROTECTION) {
1005                 SCpnt->cmnd = mempool_alloc(sd_cdb_pool, GFP_ATOMIC);
1006
1007                 if (unlikely(SCpnt->cmnd == NULL)) {
1008                         ret = BLKPREP_DEFER;
1009                         goto out;
1010                 }
1011
1012                 SCpnt->cmd_len = SD_EXT_CDB_SIZE;
1013                 memset(SCpnt->cmnd, 0, SCpnt->cmd_len);
1014                 SCpnt->cmnd[0] = VARIABLE_LENGTH_CMD;
1015                 SCpnt->cmnd[7] = 0x18;
1016                 SCpnt->cmnd[9] = (rq_data_dir(rq) == READ) ? READ_32 : WRITE_32;
1017                 SCpnt->cmnd[10] = protect | ((rq->cmd_flags & REQ_FUA) ? 0x8 : 0);
1018
1019                 /* LBA */
1020                 SCpnt->cmnd[12] = sizeof(block) > 4 ? (unsigned char) (block >> 56) & 0xff : 0;
1021                 SCpnt->cmnd[13] = sizeof(block) > 4 ? (unsigned char) (block >> 48) & 0xff : 0;
1022                 SCpnt->cmnd[14] = sizeof(block) > 4 ? (unsigned char) (block >> 40) & 0xff : 0;
1023                 SCpnt->cmnd[15] = sizeof(block) > 4 ? (unsigned char) (block >> 32) & 0xff : 0;
1024                 SCpnt->cmnd[16] = (unsigned char) (block >> 24) & 0xff;
1025                 SCpnt->cmnd[17] = (unsigned char) (block >> 16) & 0xff;
1026                 SCpnt->cmnd[18] = (unsigned char) (block >> 8) & 0xff;
1027                 SCpnt->cmnd[19] = (unsigned char) block & 0xff;
1028
1029                 /* Expected Indirect LBA */
1030                 SCpnt->cmnd[20] = (unsigned char) (block >> 24) & 0xff;
1031                 SCpnt->cmnd[21] = (unsigned char) (block >> 16) & 0xff;
1032                 SCpnt->cmnd[22] = (unsigned char) (block >> 8) & 0xff;
1033                 SCpnt->cmnd[23] = (unsigned char) block & 0xff;
1034
1035                 /* Transfer length */
1036                 SCpnt->cmnd[28] = (unsigned char) (this_count >> 24) & 0xff;
1037                 SCpnt->cmnd[29] = (unsigned char) (this_count >> 16) & 0xff;
1038                 SCpnt->cmnd[30] = (unsigned char) (this_count >> 8) & 0xff;
1039                 SCpnt->cmnd[31] = (unsigned char) this_count & 0xff;
1040         } else if (sdp->use_16_for_rw) {
1041                 SCpnt->cmnd[0] += READ_16 - READ_6;
1042                 SCpnt->cmnd[1] = protect | ((rq->cmd_flags & REQ_FUA) ? 0x8 : 0);
1043                 SCpnt->cmnd[2] = sizeof(block) > 4 ? (unsigned char) (block >> 56) & 0xff : 0;
1044                 SCpnt->cmnd[3] = sizeof(block) > 4 ? (unsigned char) (block >> 48) & 0xff : 0;
1045                 SCpnt->cmnd[4] = sizeof(block) > 4 ? (unsigned char) (block >> 40) & 0xff : 0;
1046                 SCpnt->cmnd[5] = sizeof(block) > 4 ? (unsigned char) (block >> 32) & 0xff : 0;
1047                 SCpnt->cmnd[6] = (unsigned char) (block >> 24) & 0xff;
1048                 SCpnt->cmnd[7] = (unsigned char) (block >> 16) & 0xff;
1049                 SCpnt->cmnd[8] = (unsigned char) (block >> 8) & 0xff;
1050                 SCpnt->cmnd[9] = (unsigned char) block & 0xff;
1051                 SCpnt->cmnd[10] = (unsigned char) (this_count >> 24) & 0xff;
1052                 SCpnt->cmnd[11] = (unsigned char) (this_count >> 16) & 0xff;
1053                 SCpnt->cmnd[12] = (unsigned char) (this_count >> 8) & 0xff;
1054                 SCpnt->cmnd[13] = (unsigned char) this_count & 0xff;
1055                 SCpnt->cmnd[14] = SCpnt->cmnd[15] = 0;
1056         } else if ((this_count > 0xff) || (block > 0x1fffff) ||
1057                    scsi_device_protection(SCpnt->device) ||
1058                    SCpnt->device->use_10_for_rw) {
1059                 if (this_count > 0xffff)
1060                         this_count = 0xffff;
1061
1062                 SCpnt->cmnd[0] += READ_10 - READ_6;
1063                 SCpnt->cmnd[1] = protect | ((rq->cmd_flags & REQ_FUA) ? 0x8 : 0);
1064                 SCpnt->cmnd[2] = (unsigned char) (block >> 24) & 0xff;
1065                 SCpnt->cmnd[3] = (unsigned char) (block >> 16) & 0xff;
1066                 SCpnt->cmnd[4] = (unsigned char) (block >> 8) & 0xff;
1067                 SCpnt->cmnd[5] = (unsigned char) block & 0xff;
1068                 SCpnt->cmnd[6] = SCpnt->cmnd[9] = 0;
1069                 SCpnt->cmnd[7] = (unsigned char) (this_count >> 8) & 0xff;
1070                 SCpnt->cmnd[8] = (unsigned char) this_count & 0xff;
1071         } else {
1072                 if (unlikely(rq->cmd_flags & REQ_FUA)) {
1073                         /*
1074                          * This happens only if this drive failed
1075                          * 10byte rw command with ILLEGAL_REQUEST
1076                          * during operation and thus turned off
1077                          * use_10_for_rw.
1078                          */
1079                         scmd_printk(KERN_ERR, SCpnt,
1080                                     "FUA write on READ/WRITE(6) drive\n");
1081                         goto out;
1082                 }
1083
1084                 SCpnt->cmnd[1] |= (unsigned char) ((block >> 16) & 0x1f);
1085                 SCpnt->cmnd[2] = (unsigned char) ((block >> 8) & 0xff);
1086                 SCpnt->cmnd[3] = (unsigned char) block & 0xff;
1087                 SCpnt->cmnd[4] = (unsigned char) this_count;
1088                 SCpnt->cmnd[5] = 0;
1089         }
1090         SCpnt->sdb.length = this_count * sdp->sector_size;
1091
1092         /* If DIF or DIX is enabled, tell HBA how to handle request */
1093         if (host_dif || scsi_prot_sg_count(SCpnt))
1094                 sd_prot_op(SCpnt, host_dif);
1095
1096         /*
1097          * We shouldn't disconnect in the middle of a sector, so with a dumb
1098          * host adapter, it's safe to assume that we can at least transfer
1099          * this many bytes between each connect / disconnect.
1100          */
1101         SCpnt->transfersize = sdp->sector_size;
1102         SCpnt->underflow = this_count << 9;
1103         SCpnt->allowed = SD_MAX_RETRIES;
1104
1105         /*
1106          * This indicates that the command is ready from our end to be
1107          * queued.
1108          */
1109         ret = BLKPREP_OK;
1110  out:
1111         return scsi_prep_return(q, rq, ret);
1112 }
1113
1114 /**
1115  *      sd_open - open a scsi disk device
1116  *      @inode: only i_rdev member may be used
1117  *      @filp: only f_mode and f_flags may be used
1118  *
1119  *      Returns 0 if successful. Returns a negated errno value in case 
1120  *      of error.
1121  *
1122  *      Note: This can be called from a user context (e.g. fsck(1) )
1123  *      or from within the kernel (e.g. as a result of a mount(1) ).
1124  *      In the latter case @inode and @filp carry an abridged amount
1125  *      of information as noted above.
1126  *
1127  *      Locking: called with bdev->bd_mutex held.
1128  **/
1129 static int sd_open(struct block_device *bdev, fmode_t mode)
1130 {
1131         struct scsi_disk *sdkp = scsi_disk_get(bdev->bd_disk);
1132         struct scsi_device *sdev;
1133         int retval;
1134
1135         if (!sdkp)
1136                 return -ENXIO;
1137
1138         SCSI_LOG_HLQUEUE(3, sd_printk(KERN_INFO, sdkp, "sd_open\n"));
1139
1140         sdev = sdkp->device;
1141
1142         /*
1143          * If the device is in error recovery, wait until it is done.
1144          * If the device is offline, then disallow any access to it.
1145          */
1146         retval = -ENXIO;
1147         if (!scsi_block_when_processing_errors(sdev))
1148                 goto error_out;
1149
1150         if (sdev->removable || sdkp->write_prot)
1151                 check_disk_change(bdev);
1152
1153         /*
1154          * If the drive is empty, just let the open fail.
1155          */
1156         retval = -ENOMEDIUM;
1157         if (sdev->removable && !sdkp->media_present && !(mode & FMODE_NDELAY))
1158                 goto error_out;
1159
1160         /*
1161          * If the device has the write protect tab set, have the open fail
1162          * if the user expects to be able to write to the thing.
1163          */
1164         retval = -EROFS;
1165         if (sdkp->write_prot && (mode & FMODE_WRITE))
1166                 goto error_out;
1167
1168         /*
1169          * It is possible that the disk changing stuff resulted in
1170          * the device being taken offline.  If this is the case,
1171          * report this to the user, and don't pretend that the
1172          * open actually succeeded.
1173          */
1174         retval = -ENXIO;
1175         if (!scsi_device_online(sdev))
1176                 goto error_out;
1177
1178         if ((atomic_inc_return(&sdkp->openers) == 1) && sdev->removable) {
1179                 if (scsi_block_when_processing_errors(sdev))
1180                         scsi_set_medium_removal(sdev, SCSI_REMOVAL_PREVENT);
1181         }
1182
1183         return 0;
1184
1185 error_out:
1186         scsi_disk_put(sdkp);
1187         return retval;  
1188 }
1189
1190 /**
1191  *      sd_release - invoked when the (last) close(2) is called on this
1192  *      scsi disk.
1193  *      @inode: only i_rdev member may be used
1194  *      @filp: only f_mode and f_flags may be used
1195  *
1196  *      Returns 0. 
1197  *
1198  *      Note: may block (uninterruptible) if error recovery is underway
1199  *      on this disk.
1200  *
1201  *      Locking: called with bdev->bd_mutex held.
1202  **/
1203 static void sd_release(struct gendisk *disk, fmode_t mode)
1204 {
1205         struct scsi_disk *sdkp = scsi_disk(disk);
1206         struct scsi_device *sdev = sdkp->device;
1207
1208         SCSI_LOG_HLQUEUE(3, sd_printk(KERN_INFO, sdkp, "sd_release\n"));
1209
1210         if (atomic_dec_return(&sdkp->openers) == 0 && sdev->removable) {
1211                 if (scsi_block_when_processing_errors(sdev))
1212                         scsi_set_medium_removal(sdev, SCSI_REMOVAL_ALLOW);
1213         }
1214
1215         /*
1216          * XXX and what if there are packets in flight and this close()
1217          * XXX is followed by a "rmmod sd_mod"?
1218          */
1219
1220         scsi_disk_put(sdkp);
1221 }
1222
1223 static int sd_getgeo(struct block_device *bdev, struct hd_geometry *geo)
1224 {
1225         struct scsi_disk *sdkp = scsi_disk(bdev->bd_disk);
1226         struct scsi_device *sdp = sdkp->device;
1227         struct Scsi_Host *host = sdp->host;
1228         int diskinfo[4];
1229
1230         /* default to most commonly used values */
1231         diskinfo[0] = 0x40;     /* 1 << 6 */
1232         diskinfo[1] = 0x20;     /* 1 << 5 */
1233         diskinfo[2] = sdkp->capacity >> 11;
1234         
1235         /* override with calculated, extended default, or driver values */
1236         if (host->hostt->bios_param)
1237                 host->hostt->bios_param(sdp, bdev, sdkp->capacity, diskinfo);
1238         else
1239                 scsicam_bios_param(bdev, sdkp->capacity, diskinfo);
1240
1241         geo->heads = diskinfo[0];
1242         geo->sectors = diskinfo[1];
1243         geo->cylinders = diskinfo[2];
1244         return 0;
1245 }
1246
1247 /**
1248  *      sd_ioctl - process an ioctl
1249  *      @inode: only i_rdev/i_bdev members may be used
1250  *      @filp: only f_mode and f_flags may be used
1251  *      @cmd: ioctl command number
1252  *      @arg: this is third argument given to ioctl(2) system call.
1253  *      Often contains a pointer.
1254  *
1255  *      Returns 0 if successful (some ioctls return positive numbers on
1256  *      success as well). Returns a negated errno value in case of error.
1257  *
1258  *      Note: most ioctls are forward onto the block subsystem or further
1259  *      down in the scsi subsystem.
1260  **/
1261 static int sd_ioctl(struct block_device *bdev, fmode_t mode,
1262                     unsigned int cmd, unsigned long arg)
1263 {
1264         struct gendisk *disk = bdev->bd_disk;
1265         struct scsi_disk *sdkp = scsi_disk(disk);
1266         struct scsi_device *sdp = sdkp->device;
1267         void __user *p = (void __user *)arg;
1268         int error;
1269     
1270         SCSI_LOG_IOCTL(1, sd_printk(KERN_INFO, sdkp, "sd_ioctl: disk=%s, "
1271                                     "cmd=0x%x\n", disk->disk_name, cmd));
1272
1273         error = scsi_verify_blk_ioctl(bdev, cmd);
1274         if (error < 0)
1275                 return error;
1276
1277         /*
1278          * If we are in the middle of error recovery, don't let anyone
1279          * else try and use this device.  Also, if error recovery fails, it
1280          * may try and take the device offline, in which case all further
1281          * access to the device is prohibited.
1282          */
1283         error = scsi_nonblockable_ioctl(sdp, cmd, p,
1284                                         (mode & FMODE_NDELAY) != 0);
1285         if (!scsi_block_when_processing_errors(sdp) || !error)
1286                 goto out;
1287
1288         /*
1289          * Send SCSI addressing ioctls directly to mid level, send other
1290          * ioctls to block level and then onto mid level if they can't be
1291          * resolved.
1292          */
1293         switch (cmd) {
1294                 case SCSI_IOCTL_GET_IDLUN:
1295                 case SCSI_IOCTL_GET_BUS_NUMBER:
1296                         error = scsi_ioctl(sdp, cmd, p);
1297                         break;
1298                 default:
1299                         error = scsi_cmd_blk_ioctl(bdev, mode, cmd, p);
1300                         if (error != -ENOTTY)
1301                                 break;
1302                         error = scsi_ioctl(sdp, cmd, p);
1303                         break;
1304         }
1305 out:
1306         return error;
1307 }
1308
1309 static void set_media_not_present(struct scsi_disk *sdkp)
1310 {
1311         if (sdkp->media_present)
1312                 sdkp->device->changed = 1;
1313
1314         if (sdkp->device->removable) {
1315                 sdkp->media_present = 0;
1316                 sdkp->capacity = 0;
1317         }
1318 }
1319
1320 static int media_not_present(struct scsi_disk *sdkp,
1321                              struct scsi_sense_hdr *sshdr)
1322 {
1323         if (!scsi_sense_valid(sshdr))
1324                 return 0;
1325
1326         /* not invoked for commands that could return deferred errors */
1327         switch (sshdr->sense_key) {
1328         case UNIT_ATTENTION:
1329         case NOT_READY:
1330                 /* medium not present */
1331                 if (sshdr->asc == 0x3A) {
1332                         set_media_not_present(sdkp);
1333                         return 1;
1334                 }
1335         }
1336         return 0;
1337 }
1338
1339 /**
1340  *      sd_check_events - check media events
1341  *      @disk: kernel device descriptor
1342  *      @clearing: disk events currently being cleared
1343  *
1344  *      Returns mask of DISK_EVENT_*.
1345  *
1346  *      Note: this function is invoked from the block subsystem.
1347  **/
1348 static unsigned int sd_check_events(struct gendisk *disk, unsigned int clearing)
1349 {
1350         struct scsi_disk *sdkp = scsi_disk(disk);
1351         struct scsi_device *sdp = sdkp->device;
1352         struct scsi_sense_hdr *sshdr = NULL;
1353         int retval;
1354
1355         SCSI_LOG_HLQUEUE(3, sd_printk(KERN_INFO, sdkp, "sd_check_events\n"));
1356
1357         /*
1358          * If the device is offline, don't send any commands - just pretend as
1359          * if the command failed.  If the device ever comes back online, we
1360          * can deal with it then.  It is only because of unrecoverable errors
1361          * that we would ever take a device offline in the first place.
1362          */
1363         if (!scsi_device_online(sdp)) {
1364                 set_media_not_present(sdkp);
1365                 goto out;
1366         }
1367
1368         /*
1369          * Using TEST_UNIT_READY enables differentiation between drive with
1370          * no cartridge loaded - NOT READY, drive with changed cartridge -
1371          * UNIT ATTENTION, or with same cartridge - GOOD STATUS.
1372          *
1373          * Drives that auto spin down. eg iomega jaz 1G, will be started
1374          * by sd_spinup_disk() from sd_revalidate_disk(), which happens whenever
1375          * sd_revalidate() is called.
1376          */
1377         retval = -ENODEV;
1378
1379         if (scsi_block_when_processing_errors(sdp)) {
1380                 sshdr  = kzalloc(sizeof(*sshdr), GFP_KERNEL);
1381                 retval = scsi_test_unit_ready(sdp, SD_TIMEOUT, SD_MAX_RETRIES,
1382                                               sshdr);
1383         }
1384
1385         /* failed to execute TUR, assume media not present */
1386         if (host_byte(retval)) {
1387                 set_media_not_present(sdkp);
1388                 goto out;
1389         }
1390
1391         if (media_not_present(sdkp, sshdr))
1392                 goto out;
1393
1394         /*
1395          * For removable scsi disk we have to recognise the presence
1396          * of a disk in the drive.
1397          */
1398         if (!sdkp->media_present)
1399                 sdp->changed = 1;
1400         sdkp->media_present = 1;
1401 out:
1402         /*
1403          * sdp->changed is set under the following conditions:
1404          *
1405          *      Medium present state has changed in either direction.
1406          *      Device has indicated UNIT_ATTENTION.
1407          */
1408         kfree(sshdr);
1409         retval = sdp->changed ? DISK_EVENT_MEDIA_CHANGE : 0;
1410         sdp->changed = 0;
1411         return retval;
1412 }
1413
1414 static int sd_sync_cache(struct scsi_disk *sdkp)
1415 {
1416         int retries, res;
1417         struct scsi_device *sdp = sdkp->device;
1418         struct scsi_sense_hdr sshdr;
1419
1420         if (!scsi_device_online(sdp))
1421                 return -ENODEV;
1422
1423
1424         for (retries = 3; retries > 0; --retries) {
1425                 unsigned char cmd[10] = { 0 };
1426
1427                 cmd[0] = SYNCHRONIZE_CACHE;
1428                 /*
1429                  * Leave the rest of the command zero to indicate
1430                  * flush everything.
1431                  */
1432                 res = scsi_execute_req_flags(sdp, cmd, DMA_NONE, NULL, 0,
1433                                              &sshdr, SD_FLUSH_TIMEOUT,
1434                                              SD_MAX_RETRIES, NULL, REQ_PM);
1435                 if (res == 0)
1436                         break;
1437         }
1438
1439         if (res) {
1440                 sd_print_result(sdkp, res);
1441                 if (driver_byte(res) & DRIVER_SENSE)
1442                         sd_print_sense_hdr(sdkp, &sshdr);
1443         }
1444
1445         if (res)
1446                 return -EIO;
1447         return 0;
1448 }
1449
1450 static void sd_rescan(struct device *dev)
1451 {
1452         struct scsi_disk *sdkp = scsi_disk_get_from_dev(dev);
1453
1454         if (sdkp) {
1455                 revalidate_disk(sdkp->disk);
1456                 scsi_disk_put(sdkp);
1457         }
1458 }
1459
1460
1461 #ifdef CONFIG_COMPAT
1462 /* 
1463  * This gets directly called from VFS. When the ioctl 
1464  * is not recognized we go back to the other translation paths. 
1465  */
1466 static int sd_compat_ioctl(struct block_device *bdev, fmode_t mode,
1467                            unsigned int cmd, unsigned long arg)
1468 {
1469         struct scsi_device *sdev = scsi_disk(bdev->bd_disk)->device;
1470         int ret;
1471
1472         ret = scsi_verify_blk_ioctl(bdev, cmd);
1473         if (ret < 0)
1474                 return ret;
1475
1476         /*
1477          * If we are in the middle of error recovery, don't let anyone
1478          * else try and use this device.  Also, if error recovery fails, it
1479          * may try and take the device offline, in which case all further
1480          * access to the device is prohibited.
1481          */
1482         if (!scsi_block_when_processing_errors(sdev))
1483                 return -ENODEV;
1484                
1485         if (sdev->host->hostt->compat_ioctl) {
1486                 ret = sdev->host->hostt->compat_ioctl(sdev, cmd, (void __user *)arg);
1487
1488                 return ret;
1489         }
1490
1491         /* 
1492          * Let the static ioctl translation table take care of it.
1493          */
1494         return -ENOIOCTLCMD; 
1495 }
1496 #endif
1497
1498 static const struct block_device_operations sd_fops = {
1499         .owner                  = THIS_MODULE,
1500         .open                   = sd_open,
1501         .release                = sd_release,
1502         .ioctl                  = sd_ioctl,
1503         .getgeo                 = sd_getgeo,
1504 #ifdef CONFIG_COMPAT
1505         .compat_ioctl           = sd_compat_ioctl,
1506 #endif
1507         .check_events           = sd_check_events,
1508         .revalidate_disk        = sd_revalidate_disk,
1509         .unlock_native_capacity = sd_unlock_native_capacity,
1510 };
1511
1512 /**
1513  *      sd_eh_action - error handling callback
1514  *      @scmd:          sd-issued command that has failed
1515  *      @eh_cmnd:       The command that was sent during error handling
1516  *      @eh_cmnd_len:   Length of eh_cmnd in bytes
1517  *      @eh_disp:       The recovery disposition suggested by the midlayer
1518  *
1519  *      This function is called by the SCSI midlayer upon completion of
1520  *      an error handling command (TEST UNIT READY, START STOP UNIT,
1521  *      etc.) The command sent to the device by the error handler is
1522  *      stored in eh_cmnd. The result of sending the eh command is
1523  *      passed in eh_disp.
1524  **/
1525 static int sd_eh_action(struct scsi_cmnd *scmd, unsigned char *eh_cmnd,
1526                         int eh_cmnd_len, int eh_disp)
1527 {
1528         struct scsi_disk *sdkp = scsi_disk(scmd->request->rq_disk);
1529
1530         if (!scsi_device_online(scmd->device) ||
1531             !scsi_medium_access_command(scmd))
1532                 return eh_disp;
1533
1534         /*
1535          * The device has timed out executing a medium access command.
1536          * However, the TEST UNIT READY command sent during error
1537          * handling completed successfully. Either the device is in the
1538          * process of recovering or has it suffered an internal failure
1539          * that prevents access to the storage medium.
1540          */
1541         if (host_byte(scmd->result) == DID_TIME_OUT && eh_disp == SUCCESS &&
1542             eh_cmnd_len && eh_cmnd[0] == TEST_UNIT_READY)
1543                 sdkp->medium_access_timed_out++;
1544
1545         /*
1546          * If the device keeps failing read/write commands but TEST UNIT
1547          * READY always completes successfully we assume that medium
1548          * access is no longer possible and take the device offline.
1549          */
1550         if (sdkp->medium_access_timed_out >= sdkp->max_medium_access_timeouts) {
1551                 scmd_printk(KERN_ERR, scmd,
1552                             "Medium access timeout failure. Offlining disk!\n");
1553                 scsi_device_set_state(scmd->device, SDEV_OFFLINE);
1554
1555                 return FAILED;
1556         }
1557
1558         return eh_disp;
1559 }
1560
1561 static unsigned int sd_completed_bytes(struct scsi_cmnd *scmd)
1562 {
1563         u64 start_lba = blk_rq_pos(scmd->request);
1564         u64 end_lba = blk_rq_pos(scmd->request) + (scsi_bufflen(scmd) / 512);
1565         u64 bad_lba;
1566         int info_valid;
1567         /*
1568          * resid is optional but mostly filled in.  When it's unused,
1569          * its value is zero, so we assume the whole buffer transferred
1570          */
1571         unsigned int transferred = scsi_bufflen(scmd) - scsi_get_resid(scmd);
1572         unsigned int good_bytes;
1573
1574         if (scmd->request->cmd_type != REQ_TYPE_FS)
1575                 return 0;
1576
1577         info_valid = scsi_get_sense_info_fld(scmd->sense_buffer,
1578                                              SCSI_SENSE_BUFFERSIZE,
1579                                              &bad_lba);
1580         if (!info_valid)
1581                 return 0;
1582
1583         if (scsi_bufflen(scmd) <= scmd->device->sector_size)
1584                 return 0;
1585
1586         if (scmd->device->sector_size < 512) {
1587                 /* only legitimate sector_size here is 256 */
1588                 start_lba <<= 1;
1589                 end_lba <<= 1;
1590         } else {
1591                 /* be careful ... don't want any overflows */
1592                 u64 factor = scmd->device->sector_size / 512;
1593                 do_div(start_lba, factor);
1594                 do_div(end_lba, factor);
1595         }
1596
1597         /* The bad lba was reported incorrectly, we have no idea where
1598          * the error is.
1599          */
1600         if (bad_lba < start_lba  || bad_lba >= end_lba)
1601                 return 0;
1602
1603         /* This computation should always be done in terms of
1604          * the resolution of the device's medium.
1605          */
1606         good_bytes = (bad_lba - start_lba) * scmd->device->sector_size;
1607         return min(good_bytes, transferred);
1608 }
1609
1610 /**
1611  *      sd_done - bottom half handler: called when the lower level
1612  *      driver has completed (successfully or otherwise) a scsi command.
1613  *      @SCpnt: mid-level's per command structure.
1614  *
1615  *      Note: potentially run from within an ISR. Must not block.
1616  **/
1617 static int sd_done(struct scsi_cmnd *SCpnt)
1618 {
1619         int result = SCpnt->result;
1620         unsigned int good_bytes = result ? 0 : scsi_bufflen(SCpnt);
1621         struct scsi_sense_hdr sshdr;
1622         struct scsi_disk *sdkp = scsi_disk(SCpnt->request->rq_disk);
1623         struct request *req = SCpnt->request;
1624         int sense_valid = 0;
1625         int sense_deferred = 0;
1626         unsigned char op = SCpnt->cmnd[0];
1627         unsigned char unmap = SCpnt->cmnd[1] & 8;
1628
1629         if (req->cmd_flags & REQ_DISCARD || req->cmd_flags & REQ_WRITE_SAME) {
1630                 if (!result) {
1631                         good_bytes = blk_rq_bytes(req);
1632                         scsi_set_resid(SCpnt, 0);
1633                 } else {
1634                         good_bytes = 0;
1635                         scsi_set_resid(SCpnt, blk_rq_bytes(req));
1636                 }
1637         }
1638
1639         if (result) {
1640                 sense_valid = scsi_command_normalize_sense(SCpnt, &sshdr);
1641                 if (sense_valid)
1642                         sense_deferred = scsi_sense_is_deferred(&sshdr);
1643         }
1644 #ifdef CONFIG_SCSI_LOGGING
1645         SCSI_LOG_HLCOMPLETE(1, scsi_print_result(SCpnt));
1646         if (sense_valid) {
1647                 SCSI_LOG_HLCOMPLETE(1, scmd_printk(KERN_INFO, SCpnt,
1648                                                    "sd_done: sb[respc,sk,asc,"
1649                                                    "ascq]=%x,%x,%x,%x\n",
1650                                                    sshdr.response_code,
1651                                                    sshdr.sense_key, sshdr.asc,
1652                                                    sshdr.ascq));
1653         }
1654 #endif
1655         if (driver_byte(result) != DRIVER_SENSE &&
1656             (!sense_valid || sense_deferred))
1657                 goto out;
1658
1659         sdkp->medium_access_timed_out = 0;
1660
1661         switch (sshdr.sense_key) {
1662         case HARDWARE_ERROR:
1663         case MEDIUM_ERROR:
1664                 good_bytes = sd_completed_bytes(SCpnt);
1665                 break;
1666         case RECOVERED_ERROR:
1667                 good_bytes = scsi_bufflen(SCpnt);
1668                 break;
1669         case NO_SENSE:
1670                 /* This indicates a false check condition, so ignore it.  An
1671                  * unknown amount of data was transferred so treat it as an
1672                  * error.
1673                  */
1674                 scsi_print_sense("sd", SCpnt);
1675                 SCpnt->result = 0;
1676                 memset(SCpnt->sense_buffer, 0, SCSI_SENSE_BUFFERSIZE);
1677                 break;
1678         case ABORTED_COMMAND:
1679                 if (sshdr.asc == 0x10)  /* DIF: Target detected corruption */
1680                         good_bytes = sd_completed_bytes(SCpnt);
1681                 break;
1682         case ILLEGAL_REQUEST:
1683                 if (sshdr.asc == 0x10)  /* DIX: Host detected corruption */
1684                         good_bytes = sd_completed_bytes(SCpnt);
1685                 /* INVALID COMMAND OPCODE or INVALID FIELD IN CDB */
1686                 if (sshdr.asc == 0x20 || sshdr.asc == 0x24) {
1687                         switch (op) {
1688                         case UNMAP:
1689                                 sd_config_discard(sdkp, SD_LBP_DISABLE);
1690                                 break;
1691                         case WRITE_SAME_16:
1692                         case WRITE_SAME:
1693                                 if (unmap)
1694                                         sd_config_discard(sdkp, SD_LBP_DISABLE);
1695                                 else {
1696                                         sdkp->device->no_write_same = 1;
1697                                         sd_config_write_same(sdkp);
1698
1699                                         good_bytes = 0;
1700                                         req->__data_len = blk_rq_bytes(req);
1701                                         req->cmd_flags |= REQ_QUIET;
1702                                 }
1703                         }
1704                 }
1705                 break;
1706         default:
1707                 break;
1708         }
1709  out:
1710         if (rq_data_dir(SCpnt->request) == READ && scsi_prot_sg_count(SCpnt))
1711                 sd_dif_complete(SCpnt, good_bytes);
1712
1713         if (scsi_host_dif_capable(sdkp->device->host, sdkp->protection_type)
1714             == SD_DIF_TYPE2_PROTECTION && SCpnt->cmnd != SCpnt->request->cmd) {
1715
1716                 /* We have to print a failed command here as the
1717                  * extended CDB gets freed before scsi_io_completion()
1718                  * is called.
1719                  */
1720                 if (result)
1721                         scsi_print_command(SCpnt);
1722
1723                 mempool_free(SCpnt->cmnd, sd_cdb_pool);
1724                 SCpnt->cmnd = NULL;
1725                 SCpnt->cmd_len = 0;
1726         }
1727
1728         return good_bytes;
1729 }
1730
1731 /*
1732  * spinup disk - called only in sd_revalidate_disk()
1733  */
1734 static void
1735 sd_spinup_disk(struct scsi_disk *sdkp)
1736 {
1737         unsigned char cmd[10];
1738         unsigned long spintime_expire = 0;
1739         int retries, spintime;
1740         unsigned int the_result;
1741         struct scsi_sense_hdr sshdr;
1742         int sense_valid = 0;
1743
1744         spintime = 0;
1745
1746         /* Spin up drives, as required.  Only do this at boot time */
1747         /* Spinup needs to be done for module loads too. */
1748         do {
1749                 retries = 0;
1750
1751                 do {
1752                         cmd[0] = TEST_UNIT_READY;
1753                         memset((void *) &cmd[1], 0, 9);
1754
1755                         the_result = scsi_execute_req(sdkp->device, cmd,
1756                                                       DMA_NONE, NULL, 0,
1757                                                       &sshdr, SD_TIMEOUT,
1758                                                       SD_MAX_RETRIES, NULL);
1759
1760                         /*
1761                          * If the drive has indicated to us that it
1762                          * doesn't have any media in it, don't bother
1763                          * with any more polling.
1764                          */
1765                         if (media_not_present(sdkp, &sshdr))
1766                                 return;
1767
1768                         if (the_result)
1769                                 sense_valid = scsi_sense_valid(&sshdr);
1770                         retries++;
1771                 } while (retries < 3 && 
1772                          (!scsi_status_is_good(the_result) ||
1773                           ((driver_byte(the_result) & DRIVER_SENSE) &&
1774                           sense_valid && sshdr.sense_key == UNIT_ATTENTION)));
1775
1776                 if ((driver_byte(the_result) & DRIVER_SENSE) == 0) {
1777                         /* no sense, TUR either succeeded or failed
1778                          * with a status error */
1779                         if(!spintime && !scsi_status_is_good(the_result)) {
1780                                 sd_printk(KERN_NOTICE, sdkp, "Unit Not Ready\n");
1781                                 sd_print_result(sdkp, the_result);
1782                         }
1783                         break;
1784                 }
1785                                         
1786                 /*
1787                  * The device does not want the automatic start to be issued.
1788                  */
1789                 if (sdkp->device->no_start_on_add)
1790                         break;
1791
1792                 if (sense_valid && sshdr.sense_key == NOT_READY) {
1793                         if (sshdr.asc == 4 && sshdr.ascq == 3)
1794                                 break;  /* manual intervention required */
1795                         if (sshdr.asc == 4 && sshdr.ascq == 0xb)
1796                                 break;  /* standby */
1797                         if (sshdr.asc == 4 && sshdr.ascq == 0xc)
1798                                 break;  /* unavailable */
1799                         /*
1800                          * Issue command to spin up drive when not ready
1801                          */
1802                         if (!spintime) {
1803                                 sd_printk(KERN_NOTICE, sdkp, "Spinning up disk...");
1804                                 cmd[0] = START_STOP;
1805                                 cmd[1] = 1;     /* Return immediately */
1806                                 memset((void *) &cmd[2], 0, 8);
1807                                 cmd[4] = 1;     /* Start spin cycle */
1808                                 if (sdkp->device->start_stop_pwr_cond)
1809                                         cmd[4] |= 1 << 4;
1810                                 scsi_execute_req(sdkp->device, cmd, DMA_NONE,
1811                                                  NULL, 0, &sshdr,
1812                                                  SD_TIMEOUT, SD_MAX_RETRIES,
1813                                                  NULL);
1814                                 spintime_expire = jiffies + 100 * HZ;
1815                                 spintime = 1;
1816                         }
1817                         /* Wait 1 second for next try */
1818                         msleep(1000);
1819                         printk(".");
1820
1821                 /*
1822                  * Wait for USB flash devices with slow firmware.
1823                  * Yes, this sense key/ASC combination shouldn't
1824                  * occur here.  It's characteristic of these devices.
1825                  */
1826                 } else if (sense_valid &&
1827                                 sshdr.sense_key == UNIT_ATTENTION &&
1828                                 sshdr.asc == 0x28) {
1829                         if (!spintime) {
1830                                 spintime_expire = jiffies + 5 * HZ;
1831                                 spintime = 1;
1832                         }
1833                         /* Wait 1 second for next try */
1834                         msleep(1000);
1835                 } else {
1836                         /* we don't understand the sense code, so it's
1837                          * probably pointless to loop */
1838                         if(!spintime) {
1839                                 sd_printk(KERN_NOTICE, sdkp, "Unit Not Ready\n");
1840                                 sd_print_sense_hdr(sdkp, &sshdr);
1841                         }
1842                         break;
1843                 }
1844                                 
1845         } while (spintime && time_before_eq(jiffies, spintime_expire));
1846
1847         if (spintime) {
1848                 if (scsi_status_is_good(the_result))
1849                         printk("ready\n");
1850                 else
1851                         printk("not responding...\n");
1852         }
1853 }
1854
1855
1856 /*
1857  * Determine whether disk supports Data Integrity Field.
1858  */
1859 static int sd_read_protection_type(struct scsi_disk *sdkp, unsigned char *buffer)
1860 {
1861         struct scsi_device *sdp = sdkp->device;
1862         u8 type;
1863         int ret = 0;
1864
1865         if (scsi_device_protection(sdp) == 0 || (buffer[12] & 1) == 0)
1866                 return ret;
1867
1868         type = ((buffer[12] >> 1) & 7) + 1; /* P_TYPE 0 = Type 1 */
1869
1870         if (type > SD_DIF_TYPE3_PROTECTION)
1871                 ret = -ENODEV;
1872         else if (scsi_host_dif_capable(sdp->host, type))
1873                 ret = 1;
1874
1875         if (sdkp->first_scan || type != sdkp->protection_type)
1876                 switch (ret) {
1877                 case -ENODEV:
1878                         sd_printk(KERN_ERR, sdkp, "formatted with unsupported" \
1879                                   " protection type %u. Disabling disk!\n",
1880                                   type);
1881                         break;
1882                 case 1:
1883                         sd_printk(KERN_NOTICE, sdkp,
1884                                   "Enabling DIF Type %u protection\n", type);
1885                         break;
1886                 case 0:
1887                         sd_printk(KERN_NOTICE, sdkp,
1888                                   "Disabling DIF Type %u protection\n", type);
1889                         break;
1890                 }
1891
1892         sdkp->protection_type = type;
1893
1894         return ret;
1895 }
1896
1897 static void read_capacity_error(struct scsi_disk *sdkp, struct scsi_device *sdp,
1898                         struct scsi_sense_hdr *sshdr, int sense_valid,
1899                         int the_result)
1900 {
1901         sd_print_result(sdkp, the_result);
1902         if (driver_byte(the_result) & DRIVER_SENSE)
1903                 sd_print_sense_hdr(sdkp, sshdr);
1904         else
1905                 sd_printk(KERN_NOTICE, sdkp, "Sense not available.\n");
1906
1907         /*
1908          * Set dirty bit for removable devices if not ready -
1909          * sometimes drives will not report this properly.
1910          */
1911         if (sdp->removable &&
1912             sense_valid && sshdr->sense_key == NOT_READY)
1913                 set_media_not_present(sdkp);
1914
1915         /*
1916          * We used to set media_present to 0 here to indicate no media
1917          * in the drive, but some drives fail read capacity even with
1918          * media present, so we can't do that.
1919          */
1920         sdkp->capacity = 0; /* unknown mapped to zero - as usual */
1921 }
1922
1923 #define RC16_LEN 32
1924 #if RC16_LEN > SD_BUF_SIZE
1925 #error RC16_LEN must not be more than SD_BUF_SIZE
1926 #endif
1927
1928 #define READ_CAPACITY_RETRIES_ON_RESET  10
1929
1930 static int read_capacity_16(struct scsi_disk *sdkp, struct scsi_device *sdp,
1931                                                 unsigned char *buffer)
1932 {
1933         unsigned char cmd[16];
1934         struct scsi_sense_hdr sshdr;
1935         int sense_valid = 0;
1936         int the_result;
1937         int retries = 3, reset_retries = READ_CAPACITY_RETRIES_ON_RESET;
1938         unsigned int alignment;
1939         unsigned long long lba;
1940         unsigned sector_size;
1941
1942         if (sdp->no_read_capacity_16)
1943                 return -EINVAL;
1944
1945         do {
1946                 memset(cmd, 0, 16);
1947                 cmd[0] = SERVICE_ACTION_IN;
1948                 cmd[1] = SAI_READ_CAPACITY_16;
1949                 cmd[13] = RC16_LEN;
1950                 memset(buffer, 0, RC16_LEN);
1951
1952                 the_result = scsi_execute_req(sdp, cmd, DMA_FROM_DEVICE,
1953                                         buffer, RC16_LEN, &sshdr,
1954                                         SD_TIMEOUT, SD_MAX_RETRIES, NULL);
1955
1956                 if (media_not_present(sdkp, &sshdr))
1957                         return -ENODEV;
1958
1959                 if (the_result) {
1960                         sense_valid = scsi_sense_valid(&sshdr);
1961                         if (sense_valid &&
1962                             sshdr.sense_key == ILLEGAL_REQUEST &&
1963                             (sshdr.asc == 0x20 || sshdr.asc == 0x24) &&
1964                             sshdr.ascq == 0x00)
1965                                 /* Invalid Command Operation Code or
1966                                  * Invalid Field in CDB, just retry
1967                                  * silently with RC10 */
1968                                 return -EINVAL;
1969                         if (sense_valid &&
1970                             sshdr.sense_key == UNIT_ATTENTION &&
1971                             sshdr.asc == 0x29 && sshdr.ascq == 0x00)
1972                                 /* Device reset might occur several times,
1973                                  * give it one more chance */
1974                                 if (--reset_retries > 0)
1975                                         continue;
1976                 }
1977                 retries--;
1978
1979         } while (the_result && retries);
1980
1981         if (the_result) {
1982                 sd_printk(KERN_NOTICE, sdkp, "READ CAPACITY(16) failed\n");
1983                 read_capacity_error(sdkp, sdp, &sshdr, sense_valid, the_result);
1984                 return -EINVAL;
1985         }
1986
1987         sector_size = get_unaligned_be32(&buffer[8]);
1988         lba = get_unaligned_be64(&buffer[0]);
1989
1990         if (sd_read_protection_type(sdkp, buffer) < 0) {
1991                 sdkp->capacity = 0;
1992                 return -ENODEV;
1993         }
1994
1995         if ((sizeof(sdkp->capacity) == 4) && (lba >= 0xffffffffULL)) {
1996                 sd_printk(KERN_ERR, sdkp, "Too big for this kernel. Use a "
1997                         "kernel compiled with support for large block "
1998                         "devices.\n");
1999                 sdkp->capacity = 0;
2000                 return -EOVERFLOW;
2001         }
2002
2003         /* Logical blocks per physical block exponent */
2004         sdkp->physical_block_size = (1 << (buffer[13] & 0xf)) * sector_size;
2005
2006         /* Lowest aligned logical block */
2007         alignment = ((buffer[14] & 0x3f) << 8 | buffer[15]) * sector_size;
2008         blk_queue_alignment_offset(sdp->request_queue, alignment);
2009         if (alignment && sdkp->first_scan)
2010                 sd_printk(KERN_NOTICE, sdkp,
2011                           "physical block alignment offset: %u\n", alignment);
2012
2013         if (buffer[14] & 0x80) { /* LBPME */
2014                 sdkp->lbpme = 1;
2015
2016                 if (buffer[14] & 0x40) /* LBPRZ */
2017                         sdkp->lbprz = 1;
2018
2019                 sd_config_discard(sdkp, SD_LBP_WS16);
2020         }
2021
2022         sdkp->capacity = lba + 1;
2023         return sector_size;
2024 }
2025
2026 static int read_capacity_10(struct scsi_disk *sdkp, struct scsi_device *sdp,
2027                                                 unsigned char *buffer)
2028 {
2029         unsigned char cmd[16];
2030         struct scsi_sense_hdr sshdr;
2031         int sense_valid = 0;
2032         int the_result;
2033         int retries = 3, reset_retries = READ_CAPACITY_RETRIES_ON_RESET;
2034         sector_t lba;
2035         unsigned sector_size;
2036
2037         do {
2038                 cmd[0] = READ_CAPACITY;
2039                 memset(&cmd[1], 0, 9);
2040                 memset(buffer, 0, 8);
2041
2042                 the_result = scsi_execute_req(sdp, cmd, DMA_FROM_DEVICE,
2043                                         buffer, 8, &sshdr,
2044                                         SD_TIMEOUT, SD_MAX_RETRIES, NULL);
2045
2046                 if (media_not_present(sdkp, &sshdr))
2047                         return -ENODEV;
2048
2049                 if (the_result) {
2050                         sense_valid = scsi_sense_valid(&sshdr);
2051                         if (sense_valid &&
2052                             sshdr.sense_key == UNIT_ATTENTION &&
2053                             sshdr.asc == 0x29 && sshdr.ascq == 0x00)
2054                                 /* Device reset might occur several times,
2055                                  * give it one more chance */
2056                                 if (--reset_retries > 0)
2057                                         continue;
2058                 }
2059                 retries--;
2060
2061         } while (the_result && retries);
2062
2063         if (the_result) {
2064                 sd_printk(KERN_NOTICE, sdkp, "READ CAPACITY failed\n");
2065                 read_capacity_error(sdkp, sdp, &sshdr, sense_valid, the_result);
2066                 return -EINVAL;
2067         }
2068
2069         sector_size = get_unaligned_be32(&buffer[4]);
2070         lba = get_unaligned_be32(&buffer[0]);
2071
2072         if (sdp->no_read_capacity_16 && (lba == 0xffffffff)) {
2073                 /* Some buggy (usb cardreader) devices return an lba of
2074                    0xffffffff when the want to report a size of 0 (with
2075                    which they really mean no media is present) */
2076                 sdkp->capacity = 0;
2077                 sdkp->physical_block_size = sector_size;
2078                 return sector_size;
2079         }
2080
2081         if ((sizeof(sdkp->capacity) == 4) && (lba == 0xffffffff)) {
2082                 sd_printk(KERN_ERR, sdkp, "Too big for this kernel. Use a "
2083                         "kernel compiled with support for large block "
2084                         "devices.\n");
2085                 sdkp->capacity = 0;
2086                 return -EOVERFLOW;
2087         }
2088
2089         sdkp->capacity = lba + 1;
2090         sdkp->physical_block_size = sector_size;
2091         return sector_size;
2092 }
2093
2094 static int sd_try_rc16_first(struct scsi_device *sdp)
2095 {
2096         if (sdp->host->max_cmd_len < 16)
2097                 return 0;
2098         if (sdp->try_rc_10_first)
2099                 return 0;
2100         if (sdp->scsi_level > SCSI_SPC_2)
2101                 return 1;
2102         if (scsi_device_protection(sdp))
2103                 return 1;
2104         return 0;
2105 }
2106
2107 /*
2108  * read disk capacity
2109  */
2110 static void
2111 sd_read_capacity(struct scsi_disk *sdkp, unsigned char *buffer)
2112 {
2113         int sector_size;
2114         struct scsi_device *sdp = sdkp->device;
2115         sector_t old_capacity = sdkp->capacity;
2116
2117         if (sd_try_rc16_first(sdp)) {
2118                 sector_size = read_capacity_16(sdkp, sdp, buffer);
2119                 if (sector_size == -EOVERFLOW)
2120                         goto got_data;
2121                 if (sector_size == -ENODEV)
2122                         return;
2123                 if (sector_size < 0)
2124                         sector_size = read_capacity_10(sdkp, sdp, buffer);
2125                 if (sector_size < 0)
2126                         return;
2127         } else {
2128                 sector_size = read_capacity_10(sdkp, sdp, buffer);
2129                 if (sector_size == -EOVERFLOW)
2130                         goto got_data;
2131                 if (sector_size < 0)
2132                         return;
2133                 if ((sizeof(sdkp->capacity) > 4) &&
2134                     (sdkp->capacity > 0xffffffffULL)) {
2135                         int old_sector_size = sector_size;
2136                         sd_printk(KERN_NOTICE, sdkp, "Very big device. "
2137                                         "Trying to use READ CAPACITY(16).\n");
2138                         sector_size = read_capacity_16(sdkp, sdp, buffer);
2139                         if (sector_size < 0) {
2140                                 sd_printk(KERN_NOTICE, sdkp,
2141                                         "Using 0xffffffff as device size\n");
2142                                 sdkp->capacity = 1 + (sector_t) 0xffffffff;
2143                                 sector_size = old_sector_size;
2144                                 goto got_data;
2145                         }
2146                 }
2147         }
2148
2149         /* Some devices are known to return the total number of blocks,
2150          * not the highest block number.  Some devices have versions
2151          * which do this and others which do not.  Some devices we might
2152          * suspect of doing this but we don't know for certain.
2153          *
2154          * If we know the reported capacity is wrong, decrement it.  If
2155          * we can only guess, then assume the number of blocks is even
2156          * (usually true but not always) and err on the side of lowering
2157          * the capacity.
2158          */
2159         if (sdp->fix_capacity ||
2160             (sdp->guess_capacity && (sdkp->capacity & 0x01))) {
2161                 sd_printk(KERN_INFO, sdkp, "Adjusting the sector count "
2162                                 "from its reported value: %llu\n",
2163                                 (unsigned long long) sdkp->capacity);
2164                 --sdkp->capacity;
2165         }
2166
2167 got_data:
2168         if (sector_size == 0) {
2169                 sector_size = 512;
2170                 sd_printk(KERN_NOTICE, sdkp, "Sector size 0 reported, "
2171                           "assuming 512.\n");
2172         }
2173
2174         if (sector_size != 512 &&
2175             sector_size != 1024 &&
2176             sector_size != 2048 &&
2177             sector_size != 4096 &&
2178             sector_size != 256) {
2179                 sd_printk(KERN_NOTICE, sdkp, "Unsupported sector size %d.\n",
2180                           sector_size);
2181                 /*
2182                  * The user might want to re-format the drive with
2183                  * a supported sectorsize.  Once this happens, it
2184                  * would be relatively trivial to set the thing up.
2185                  * For this reason, we leave the thing in the table.
2186                  */
2187                 sdkp->capacity = 0;
2188                 /*
2189                  * set a bogus sector size so the normal read/write
2190                  * logic in the block layer will eventually refuse any
2191                  * request on this device without tripping over power
2192                  * of two sector size assumptions
2193                  */
2194                 sector_size = 512;
2195         }
2196         blk_queue_logical_block_size(sdp->request_queue, sector_size);
2197
2198         {
2199                 char cap_str_2[10], cap_str_10[10];
2200                 u64 sz = (u64)sdkp->capacity << ilog2(sector_size);
2201
2202                 string_get_size(sz, STRING_UNITS_2, cap_str_2,
2203                                 sizeof(cap_str_2));
2204                 string_get_size(sz, STRING_UNITS_10, cap_str_10,
2205                                 sizeof(cap_str_10));
2206
2207                 if (sdkp->first_scan || old_capacity != sdkp->capacity) {
2208                         sd_printk(KERN_NOTICE, sdkp,
2209                                   "%llu %d-byte logical blocks: (%s/%s)\n",
2210                                   (unsigned long long)sdkp->capacity,
2211                                   sector_size, cap_str_10, cap_str_2);
2212
2213                         if (sdkp->physical_block_size != sector_size)
2214                                 sd_printk(KERN_NOTICE, sdkp,
2215                                           "%u-byte physical blocks\n",
2216                                           sdkp->physical_block_size);
2217                 }
2218         }
2219
2220         sdp->use_16_for_rw = (sdkp->capacity > 0xffffffff);
2221
2222         /* Rescale capacity to 512-byte units */
2223         if (sector_size == 4096)
2224                 sdkp->capacity <<= 3;
2225         else if (sector_size == 2048)
2226                 sdkp->capacity <<= 2;
2227         else if (sector_size == 1024)
2228                 sdkp->capacity <<= 1;
2229         else if (sector_size == 256)
2230                 sdkp->capacity >>= 1;
2231
2232         blk_queue_physical_block_size(sdp->request_queue,
2233                                       sdkp->physical_block_size);
2234         sdkp->device->sector_size = sector_size;
2235 }
2236
2237 /* called with buffer of length 512 */
2238 static inline int
2239 sd_do_mode_sense(struct scsi_device *sdp, int dbd, int modepage,
2240                  unsigned char *buffer, int len, struct scsi_mode_data *data,
2241                  struct scsi_sense_hdr *sshdr)
2242 {
2243         return scsi_mode_sense(sdp, dbd, modepage, buffer, len,
2244                                SD_TIMEOUT, SD_MAX_RETRIES, data,
2245                                sshdr);
2246 }
2247
2248 /*
2249  * read write protect setting, if possible - called only in sd_revalidate_disk()
2250  * called with buffer of length SD_BUF_SIZE
2251  */
2252 static void
2253 sd_read_write_protect_flag(struct scsi_disk *sdkp, unsigned char *buffer)
2254 {
2255         int res;
2256         struct scsi_device *sdp = sdkp->device;
2257         struct scsi_mode_data data;
2258         int old_wp = sdkp->write_prot;
2259
2260         set_disk_ro(sdkp->disk, 0);
2261         if (sdp->skip_ms_page_3f) {
2262                 sd_printk(KERN_NOTICE, sdkp, "Assuming Write Enabled\n");
2263                 return;
2264         }
2265
2266         if (sdp->use_192_bytes_for_3f) {
2267                 res = sd_do_mode_sense(sdp, 0, 0x3F, buffer, 192, &data, NULL);
2268         } else {
2269                 /*
2270                  * First attempt: ask for all pages (0x3F), but only 4 bytes.
2271                  * We have to start carefully: some devices hang if we ask
2272                  * for more than is available.
2273                  */
2274                 res = sd_do_mode_sense(sdp, 0, 0x3F, buffer, 4, &data, NULL);
2275
2276                 /*
2277                  * Second attempt: ask for page 0 When only page 0 is
2278                  * implemented, a request for page 3F may return Sense Key
2279                  * 5: Illegal Request, Sense Code 24: Invalid field in
2280                  * CDB.
2281                  */
2282                 if (!scsi_status_is_good(res))
2283                         res = sd_do_mode_sense(sdp, 0, 0, buffer, 4, &data, NULL);
2284
2285                 /*
2286                  * Third attempt: ask 255 bytes, as we did earlier.
2287                  */
2288                 if (!scsi_status_is_good(res))
2289                         res = sd_do_mode_sense(sdp, 0, 0x3F, buffer, 255,
2290                                                &data, NULL);
2291         }
2292
2293         if (!scsi_status_is_good(res)) {
2294                 sd_printk(KERN_WARNING, sdkp,
2295                           "Test WP failed, assume Write Enabled\n");
2296         } else {
2297                 sdkp->write_prot = ((data.device_specific & 0x80) != 0);
2298                 set_disk_ro(sdkp->disk, sdkp->write_prot);
2299                 if (sdkp->first_scan || old_wp != sdkp->write_prot) {
2300                         sd_printk(KERN_NOTICE, sdkp, "Write Protect is %s\n",
2301                                   sdkp->write_prot ? "on" : "off");
2302                         sd_printk(KERN_DEBUG, sdkp,
2303                                   "Mode Sense: %02x %02x %02x %02x\n",
2304                                   buffer[0], buffer[1], buffer[2], buffer[3]);
2305                 }
2306         }
2307 }
2308
2309 /*
2310  * sd_read_cache_type - called only from sd_revalidate_disk()
2311  * called with buffer of length SD_BUF_SIZE
2312  */
2313 static void
2314 sd_read_cache_type(struct scsi_disk *sdkp, unsigned char *buffer)
2315 {
2316         int len = 0, res;
2317         struct scsi_device *sdp = sdkp->device;
2318
2319         int dbd;
2320         int modepage;
2321         int first_len;
2322         struct scsi_mode_data data;
2323         struct scsi_sense_hdr sshdr;
2324         int old_wce = sdkp->WCE;
2325         int old_rcd = sdkp->RCD;
2326         int old_dpofua = sdkp->DPOFUA;
2327
2328
2329         if (sdkp->cache_override)
2330                 return;
2331
2332         first_len = 4;
2333         if (sdp->skip_ms_page_8) {
2334                 if (sdp->type == TYPE_RBC)
2335                         goto defaults;
2336                 else {
2337                         if (sdp->skip_ms_page_3f)
2338                                 goto defaults;
2339                         modepage = 0x3F;
2340                         if (sdp->use_192_bytes_for_3f)
2341                                 first_len = 192;
2342                         dbd = 0;
2343                 }
2344         } else if (sdp->type == TYPE_RBC) {
2345                 modepage = 6;
2346                 dbd = 8;
2347         } else {
2348                 modepage = 8;
2349                 dbd = 0;
2350         }
2351
2352         /* cautiously ask */
2353         res = sd_do_mode_sense(sdp, dbd, modepage, buffer, first_len,
2354                         &data, &sshdr);
2355
2356         if (!scsi_status_is_good(res))
2357                 goto bad_sense;
2358
2359         if (!data.header_length) {
2360                 modepage = 6;
2361                 first_len = 0;
2362                 sd_printk(KERN_ERR, sdkp, "Missing header in MODE_SENSE response\n");
2363         }
2364
2365         /* that went OK, now ask for the proper length */
2366         len = data.length;
2367
2368         /*
2369          * We're only interested in the first three bytes, actually.
2370          * But the data cache page is defined for the first 20.
2371          */
2372         if (len < 3)
2373                 goto bad_sense;
2374         else if (len > SD_BUF_SIZE) {
2375                 sd_printk(KERN_NOTICE, sdkp, "Truncating mode parameter "
2376                           "data from %d to %d bytes\n", len, SD_BUF_SIZE);
2377                 len = SD_BUF_SIZE;
2378         }
2379         if (modepage == 0x3F && sdp->use_192_bytes_for_3f)
2380                 len = 192;
2381
2382         /* Get the data */
2383         if (len > first_len)
2384                 res = sd_do_mode_sense(sdp, dbd, modepage, buffer, len,
2385                                 &data, &sshdr);
2386
2387         if (scsi_status_is_good(res)) {
2388                 int offset = data.header_length + data.block_descriptor_length;
2389
2390                 while (offset < len) {
2391                         u8 page_code = buffer[offset] & 0x3F;
2392                         u8 spf       = buffer[offset] & 0x40;
2393
2394                         if (page_code == 8 || page_code == 6) {
2395                                 /* We're interested only in the first 3 bytes.
2396                                  */
2397                                 if (len - offset <= 2) {
2398                                         sd_printk(KERN_ERR, sdkp, "Incomplete "
2399                                                   "mode parameter data\n");
2400                                         goto defaults;
2401                                 } else {
2402                                         modepage = page_code;
2403                                         goto Page_found;
2404                                 }
2405                         } else {
2406                                 /* Go to the next page */
2407                                 if (spf && len - offset > 3)
2408                                         offset += 4 + (buffer[offset+2] << 8) +
2409                                                 buffer[offset+3];
2410                                 else if (!spf && len - offset > 1)
2411                                         offset += 2 + buffer[offset+1];
2412                                 else {
2413                                         sd_printk(KERN_ERR, sdkp, "Incomplete "
2414                                                   "mode parameter data\n");
2415                                         goto defaults;
2416                                 }
2417                         }
2418                 }
2419
2420                 if (modepage == 0x3F) {
2421                         sd_printk(KERN_ERR, sdkp, "No Caching mode page "
2422                                   "present\n");
2423                         goto defaults;
2424                 } else if ((buffer[offset] & 0x3f) != modepage) {
2425                         sd_printk(KERN_ERR, sdkp, "Got wrong page\n");
2426                         goto defaults;
2427                 }
2428         Page_found:
2429                 if (modepage == 8) {
2430                         sdkp->WCE = ((buffer[offset + 2] & 0x04) != 0);
2431                         sdkp->RCD = ((buffer[offset + 2] & 0x01) != 0);
2432                 } else {
2433                         sdkp->WCE = ((buffer[offset + 2] & 0x01) == 0);
2434                         sdkp->RCD = 0;
2435                 }
2436
2437                 sdkp->DPOFUA = (data.device_specific & 0x10) != 0;
2438                 if (sdkp->DPOFUA && !sdkp->device->use_10_for_rw) {
2439                         sd_printk(KERN_NOTICE, sdkp,
2440                                   "Uses READ/WRITE(6), disabling FUA\n");
2441                         sdkp->DPOFUA = 0;
2442                 }
2443
2444                 if (sdkp->first_scan || old_wce != sdkp->WCE ||
2445                     old_rcd != sdkp->RCD || old_dpofua != sdkp->DPOFUA)
2446                         sd_printk(KERN_NOTICE, sdkp,
2447                                   "Write cache: %s, read cache: %s, %s\n",
2448                                   sdkp->WCE ? "enabled" : "disabled",
2449                                   sdkp->RCD ? "disabled" : "enabled",
2450                                   sdkp->DPOFUA ? "supports DPO and FUA"
2451                                   : "doesn't support DPO or FUA");
2452
2453                 return;
2454         }
2455
2456 bad_sense:
2457         if (scsi_sense_valid(&sshdr) &&
2458             sshdr.sense_key == ILLEGAL_REQUEST &&
2459             sshdr.asc == 0x24 && sshdr.ascq == 0x0)
2460                 /* Invalid field in CDB */
2461                 sd_printk(KERN_NOTICE, sdkp, "Cache data unavailable\n");
2462         else
2463                 sd_printk(KERN_ERR, sdkp, "Asking for cache data failed\n");
2464
2465 defaults:
2466         if (sdp->wce_default_on) {
2467                 sd_printk(KERN_NOTICE, sdkp, "Assuming drive cache: write back\n");
2468                 sdkp->WCE = 1;
2469         } else {
2470                 sd_printk(KERN_ERR, sdkp, "Assuming drive cache: write through\n");
2471                 sdkp->WCE = 0;
2472         }
2473         sdkp->RCD = 0;
2474         sdkp->DPOFUA = 0;
2475 }
2476
2477 /*
2478  * The ATO bit indicates whether the DIF application tag is available
2479  * for use by the operating system.
2480  */
2481 static void sd_read_app_tag_own(struct scsi_disk *sdkp, unsigned char *buffer)
2482 {
2483         int res, offset;
2484         struct scsi_device *sdp = sdkp->device;
2485         struct scsi_mode_data data;
2486         struct scsi_sense_hdr sshdr;
2487
2488         if (sdp->type != TYPE_DISK)
2489                 return;
2490
2491         if (sdkp->protection_type == 0)
2492                 return;
2493
2494         res = scsi_mode_sense(sdp, 1, 0x0a, buffer, 36, SD_TIMEOUT,
2495                               SD_MAX_RETRIES, &data, &sshdr);
2496
2497         if (!scsi_status_is_good(res) || !data.header_length ||
2498             data.length < 6) {
2499                 sd_printk(KERN_WARNING, sdkp,
2500                           "getting Control mode page failed, assume no ATO\n");
2501
2502                 if (scsi_sense_valid(&sshdr))
2503                         sd_print_sense_hdr(sdkp, &sshdr);
2504
2505                 return;
2506         }
2507
2508         offset = data.header_length + data.block_descriptor_length;
2509
2510         if ((buffer[offset] & 0x3f) != 0x0a) {
2511                 sd_printk(KERN_ERR, sdkp, "ATO Got wrong page\n");
2512                 return;
2513         }
2514
2515         if ((buffer[offset + 5] & 0x80) == 0)
2516                 return;
2517
2518         sdkp->ATO = 1;
2519
2520         return;
2521 }
2522
2523 /**
2524  * sd_read_block_limits - Query disk device for preferred I/O sizes.
2525  * @disk: disk to query
2526  */
2527 static void sd_read_block_limits(struct scsi_disk *sdkp)
2528 {
2529         unsigned int sector_sz = sdkp->device->sector_size;
2530         const int vpd_len = 64;
2531         unsigned char *buffer = kmalloc(vpd_len, GFP_KERNEL);
2532
2533         if (!buffer ||
2534             /* Block Limits VPD */
2535             scsi_get_vpd_page(sdkp->device, 0xb0, buffer, vpd_len))
2536                 goto out;
2537
2538         blk_queue_io_min(sdkp->disk->queue,
2539                          get_unaligned_be16(&buffer[6]) * sector_sz);
2540         blk_queue_io_opt(sdkp->disk->queue,
2541                          get_unaligned_be32(&buffer[12]) * sector_sz);
2542
2543         if (buffer[3] == 0x3c) {
2544                 unsigned int lba_count, desc_count;
2545
2546                 sdkp->max_ws_blocks = (u32)get_unaligned_be64(&buffer[36]);
2547
2548                 if (!sdkp->lbpme)
2549                         goto out;
2550
2551                 lba_count = get_unaligned_be32(&buffer[20]);
2552                 desc_count = get_unaligned_be32(&buffer[24]);
2553
2554                 if (lba_count && desc_count)
2555                         sdkp->max_unmap_blocks = lba_count;
2556
2557                 sdkp->unmap_granularity = get_unaligned_be32(&buffer[28]);
2558
2559                 if (buffer[32] & 0x80)
2560                         sdkp->unmap_alignment =
2561                                 get_unaligned_be32(&buffer[32]) & ~(1 << 31);
2562
2563                 if (!sdkp->lbpvpd) { /* LBP VPD page not provided */
2564
2565                         if (sdkp->max_unmap_blocks)
2566                                 sd_config_discard(sdkp, SD_LBP_UNMAP);
2567                         else
2568                                 sd_config_discard(sdkp, SD_LBP_WS16);
2569
2570                 } else {        /* LBP VPD page tells us what to use */
2571
2572                         if (sdkp->lbpu && sdkp->max_unmap_blocks)
2573                                 sd_config_discard(sdkp, SD_LBP_UNMAP);
2574                         else if (sdkp->lbpws)
2575                                 sd_config_discard(sdkp, SD_LBP_WS16);
2576                         else if (sdkp->lbpws10)
2577                                 sd_config_discard(sdkp, SD_LBP_WS10);
2578                         else
2579                                 sd_config_discard(sdkp, SD_LBP_DISABLE);
2580                 }
2581         }
2582
2583  out:
2584         kfree(buffer);
2585 }
2586
2587 /**
2588  * sd_read_block_characteristics - Query block dev. characteristics
2589  * @disk: disk to query
2590  */
2591 static void sd_read_block_characteristics(struct scsi_disk *sdkp)
2592 {
2593         unsigned char *buffer;
2594         u16 rot;
2595         const int vpd_len = 64;
2596
2597         buffer = kmalloc(vpd_len, GFP_KERNEL);
2598
2599         if (!buffer ||
2600             /* Block Device Characteristics VPD */
2601             scsi_get_vpd_page(sdkp->device, 0xb1, buffer, vpd_len))
2602                 goto out;
2603
2604         rot = get_unaligned_be16(&buffer[4]);
2605
2606         if (rot == 1)
2607                 queue_flag_set_unlocked(QUEUE_FLAG_NONROT, sdkp->disk->queue);
2608
2609  out:
2610         kfree(buffer);
2611 }
2612
2613 /**
2614  * sd_read_block_provisioning - Query provisioning VPD page
2615  * @disk: disk to query
2616  */
2617 static void sd_read_block_provisioning(struct scsi_disk *sdkp)
2618 {
2619         unsigned char *buffer;
2620         const int vpd_len = 8;
2621
2622         if (sdkp->lbpme == 0)
2623                 return;
2624
2625         buffer = kmalloc(vpd_len, GFP_KERNEL);
2626
2627         if (!buffer || scsi_get_vpd_page(sdkp->device, 0xb2, buffer, vpd_len))
2628                 goto out;
2629
2630         sdkp->lbpvpd    = 1;
2631         sdkp->lbpu      = (buffer[5] >> 7) & 1; /* UNMAP */
2632         sdkp->lbpws     = (buffer[5] >> 6) & 1; /* WRITE SAME(16) with UNMAP */
2633         sdkp->lbpws10   = (buffer[5] >> 5) & 1; /* WRITE SAME(10) with UNMAP */
2634
2635  out:
2636         kfree(buffer);
2637 }
2638
2639 static void sd_read_write_same(struct scsi_disk *sdkp, unsigned char *buffer)
2640 {
2641         struct scsi_device *sdev = sdkp->device;
2642
2643         if (scsi_report_opcode(sdev, buffer, SD_BUF_SIZE, INQUIRY) < 0) {
2644                 sdev->no_report_opcodes = 1;
2645
2646                 /* Disable WRITE SAME if REPORT SUPPORTED OPERATION
2647                  * CODES is unsupported and the device has an ATA
2648                  * Information VPD page (SAT).
2649                  */
2650                 if (!scsi_get_vpd_page(sdev, 0x89, buffer, SD_BUF_SIZE))
2651                         sdev->no_write_same = 1;
2652         }
2653
2654         if (scsi_report_opcode(sdev, buffer, SD_BUF_SIZE, WRITE_SAME_16) == 1)
2655                 sdkp->ws16 = 1;
2656
2657         if (scsi_report_opcode(sdev, buffer, SD_BUF_SIZE, WRITE_SAME) == 1)
2658                 sdkp->ws10 = 1;
2659 }
2660
2661 static int sd_try_extended_inquiry(struct scsi_device *sdp)
2662 {
2663         /*
2664          * Although VPD inquiries can go to SCSI-2 type devices,
2665          * some USB ones crash on receiving them, and the pages
2666          * we currently ask for are for SPC-3 and beyond
2667          */
2668         if (sdp->scsi_level > SCSI_SPC_2 && !sdp->skip_vpd_pages)
2669                 return 1;
2670         return 0;
2671 }
2672
2673 /**
2674  *      sd_revalidate_disk - called the first time a new disk is seen,
2675  *      performs disk spin up, read_capacity, etc.
2676  *      @disk: struct gendisk we care about
2677  **/
2678 static int sd_revalidate_disk(struct gendisk *disk)
2679 {
2680         struct scsi_disk *sdkp = scsi_disk(disk);
2681         struct scsi_device *sdp = sdkp->device;
2682         unsigned char *buffer;
2683         unsigned flush = 0;
2684
2685         SCSI_LOG_HLQUEUE(3, sd_printk(KERN_INFO, sdkp,
2686                                       "sd_revalidate_disk\n"));
2687
2688         /*
2689          * If the device is offline, don't try and read capacity or any
2690          * of the other niceties.
2691          */
2692         if (!scsi_device_online(sdp))
2693                 goto out;
2694
2695         buffer = kmalloc(SD_BUF_SIZE, GFP_KERNEL);
2696         if (!buffer) {
2697                 sd_printk(KERN_WARNING, sdkp, "sd_revalidate_disk: Memory "
2698                           "allocation failure.\n");
2699                 goto out;
2700         }
2701
2702         sd_spinup_disk(sdkp);
2703
2704         /*
2705          * Without media there is no reason to ask; moreover, some devices
2706          * react badly if we do.
2707          */
2708         if (sdkp->media_present) {
2709                 sd_read_capacity(sdkp, buffer);
2710
2711                 if (sd_try_extended_inquiry(sdp)) {
2712                         sd_read_block_provisioning(sdkp);
2713                         sd_read_block_limits(sdkp);
2714                         sd_read_block_characteristics(sdkp);
2715                 }
2716
2717                 sd_read_write_protect_flag(sdkp, buffer);
2718                 sd_read_cache_type(sdkp, buffer);
2719                 sd_read_app_tag_own(sdkp, buffer);
2720                 sd_read_write_same(sdkp, buffer);
2721         }
2722
2723         sdkp->first_scan = 0;
2724
2725         /*
2726          * We now have all cache related info, determine how we deal
2727          * with flush requests.
2728          */
2729         if (sdkp->WCE) {
2730                 flush |= REQ_FLUSH;
2731                 if (sdkp->DPOFUA)
2732                         flush |= REQ_FUA;
2733         }
2734
2735         blk_queue_flush(sdkp->disk->queue, flush);
2736
2737         set_capacity(disk, sdkp->capacity);
2738         sd_config_write_same(sdkp);
2739         kfree(buffer);
2740
2741  out:
2742         return 0;
2743 }
2744
2745 /**
2746  *      sd_unlock_native_capacity - unlock native capacity
2747  *      @disk: struct gendisk to set capacity for
2748  *
2749  *      Block layer calls this function if it detects that partitions
2750  *      on @disk reach beyond the end of the device.  If the SCSI host
2751  *      implements ->unlock_native_capacity() method, it's invoked to
2752  *      give it a chance to adjust the device capacity.
2753  *
2754  *      CONTEXT:
2755  *      Defined by block layer.  Might sleep.
2756  */
2757 static void sd_unlock_native_capacity(struct gendisk *disk)
2758 {
2759         struct scsi_device *sdev = scsi_disk(disk)->device;
2760
2761         if (sdev->host->hostt->unlock_native_capacity)
2762                 sdev->host->hostt->unlock_native_capacity(sdev);
2763 }
2764
2765 /**
2766  *      sd_format_disk_name - format disk name
2767  *      @prefix: name prefix - ie. "sd" for SCSI disks
2768  *      @index: index of the disk to format name for
2769  *      @buf: output buffer
2770  *      @buflen: length of the output buffer
2771  *
2772  *      SCSI disk names starts at sda.  The 26th device is sdz and the
2773  *      27th is sdaa.  The last one for two lettered suffix is sdzz
2774  *      which is followed by sdaaa.
2775  *
2776  *      This is basically 26 base counting with one extra 'nil' entry
2777  *      at the beginning from the second digit on and can be
2778  *      determined using similar method as 26 base conversion with the
2779  *      index shifted -1 after each digit is computed.
2780  *
2781  *      CONTEXT:
2782  *      Don't care.
2783  *
2784  *      RETURNS:
2785  *      0 on success, -errno on failure.
2786  */
2787 static int sd_format_disk_name(char *prefix, int index, char *buf, int buflen)
2788 {
2789         const int base = 'z' - 'a' + 1;
2790         char *begin = buf + strlen(prefix);
2791         char *end = buf + buflen;
2792         char *p;
2793         int unit;
2794
2795         p = end - 1;
2796         *p = '\0';
2797         unit = base;
2798         do {
2799                 if (p == begin)
2800                         return -EINVAL;
2801                 *--p = 'a' + (index % unit);
2802                 index = (index / unit) - 1;
2803         } while (index >= 0);
2804
2805         memmove(begin, p, end - p);
2806         memcpy(buf, prefix, strlen(prefix));
2807
2808         return 0;
2809 }
2810
2811 /*
2812  * The asynchronous part of sd_probe
2813  */
2814 static void sd_probe_async(void *data, async_cookie_t cookie)
2815 {
2816         struct scsi_disk *sdkp = data;
2817         struct scsi_device *sdp;
2818         struct gendisk *gd;
2819         u32 index;
2820         struct device *dev;
2821
2822         sdp = sdkp->device;
2823         gd = sdkp->disk;
2824         index = sdkp->index;
2825         dev = &sdp->sdev_gendev;
2826
2827         gd->major = sd_major((index & 0xf0) >> 4);
2828         gd->first_minor = ((index & 0xf) << 4) | (index & 0xfff00);
2829         gd->minors = SD_MINORS;
2830
2831         gd->fops = &sd_fops;
2832         gd->private_data = &sdkp->driver;
2833         gd->queue = sdkp->device->request_queue;
2834
2835         /* defaults, until the device tells us otherwise */
2836         sdp->sector_size = 512;
2837         sdkp->capacity = 0;
2838         sdkp->media_present = 1;
2839         sdkp->write_prot = 0;
2840         sdkp->cache_override = 0;
2841         sdkp->WCE = 0;
2842         sdkp->RCD = 0;
2843         sdkp->ATO = 0;
2844         sdkp->first_scan = 1;
2845         sdkp->max_medium_access_timeouts = SD_MAX_MEDIUM_TIMEOUTS;
2846
2847         sd_revalidate_disk(gd);
2848
2849         blk_queue_prep_rq(sdp->request_queue, sd_prep_fn);
2850         blk_queue_unprep_rq(sdp->request_queue, sd_unprep_fn);
2851
2852         gd->driverfs_dev = &sdp->sdev_gendev;
2853         gd->flags = GENHD_FL_EXT_DEVT;
2854         if (sdp->removable) {
2855                 gd->flags |= GENHD_FL_REMOVABLE;
2856                 gd->events |= DISK_EVENT_MEDIA_CHANGE;
2857         }
2858
2859         add_disk(gd);
2860         if (sdkp->capacity)
2861                 sd_dif_config_host(sdkp);
2862
2863         sd_revalidate_disk(gd);
2864
2865         sd_printk(KERN_NOTICE, sdkp, "Attached SCSI %sdisk\n",
2866                   sdp->removable ? "removable " : "");
2867         blk_pm_runtime_init(sdp->request_queue, dev);
2868         scsi_autopm_put_device(sdp);
2869         put_device(&sdkp->dev);
2870 }
2871
2872 /**
2873  *      sd_probe - called during driver initialization and whenever a
2874  *      new scsi device is attached to the system. It is called once
2875  *      for each scsi device (not just disks) present.
2876  *      @dev: pointer to device object
2877  *
2878  *      Returns 0 if successful (or not interested in this scsi device 
2879  *      (e.g. scanner)); 1 when there is an error.
2880  *
2881  *      Note: this function is invoked from the scsi mid-level.
2882  *      This function sets up the mapping between a given 
2883  *      <host,channel,id,lun> (found in sdp) and new device name 
2884  *      (e.g. /dev/sda). More precisely it is the block device major 
2885  *      and minor number that is chosen here.
2886  *
2887  *      Assume sd_probe is not re-entrant (for time being)
2888  *      Also think about sd_probe() and sd_remove() running coincidentally.
2889  **/
2890 static int sd_probe(struct device *dev)
2891 {
2892         struct scsi_device *sdp = to_scsi_device(dev);
2893         struct scsi_disk *sdkp;
2894         struct gendisk *gd;
2895         int index;
2896         int error;
2897
2898         error = -ENODEV;
2899         if (sdp->type != TYPE_DISK && sdp->type != TYPE_MOD && sdp->type != TYPE_RBC)
2900                 goto out;
2901
2902         SCSI_LOG_HLQUEUE(3, sdev_printk(KERN_INFO, sdp,
2903                                         "sd_probe\n"));
2904
2905         error = -ENOMEM;
2906         sdkp = kzalloc(sizeof(*sdkp), GFP_KERNEL);
2907         if (!sdkp)
2908                 goto out;
2909
2910         gd = alloc_disk(SD_MINORS);
2911         if (!gd)
2912                 goto out_free;
2913
2914         do {
2915                 if (!ida_pre_get(&sd_index_ida, GFP_KERNEL))
2916                         goto out_put;
2917
2918                 spin_lock(&sd_index_lock);
2919                 error = ida_get_new(&sd_index_ida, &index);
2920                 spin_unlock(&sd_index_lock);
2921         } while (error == -EAGAIN);
2922
2923         if (error) {
2924                 sdev_printk(KERN_WARNING, sdp, "sd_probe: memory exhausted.\n");
2925                 goto out_put;
2926         }
2927
2928         error = sd_format_disk_name("sd", index, gd->disk_name, DISK_NAME_LEN);
2929         if (error) {
2930                 sdev_printk(KERN_WARNING, sdp, "SCSI disk (sd) name length exceeded.\n");
2931                 goto out_free_index;
2932         }
2933
2934         sdkp->device = sdp;
2935         sdkp->driver = &sd_template;
2936         sdkp->disk = gd;
2937         sdkp->index = index;
2938         atomic_set(&sdkp->openers, 0);
2939         atomic_set(&sdkp->device->ioerr_cnt, 0);
2940
2941         if (!sdp->request_queue->rq_timeout) {
2942                 if (sdp->type != TYPE_MOD)
2943                         blk_queue_rq_timeout(sdp->request_queue, SD_TIMEOUT);
2944                 else
2945                         blk_queue_rq_timeout(sdp->request_queue,
2946                                              SD_MOD_TIMEOUT);
2947         }
2948
2949         device_initialize(&sdkp->dev);
2950         sdkp->dev.parent = dev;
2951         sdkp->dev.class = &sd_disk_class;
2952         dev_set_name(&sdkp->dev, dev_name(dev));
2953
2954         if (device_add(&sdkp->dev))
2955                 goto out_free_index;
2956
2957         get_device(dev);
2958         dev_set_drvdata(dev, sdkp);
2959
2960         get_device(&sdkp->dev); /* prevent release before async_schedule */
2961         async_schedule_domain(sd_probe_async, sdkp, &scsi_sd_probe_domain);
2962
2963         return 0;
2964
2965  out_free_index:
2966         spin_lock(&sd_index_lock);
2967         ida_remove(&sd_index_ida, index);
2968         spin_unlock(&sd_index_lock);
2969  out_put:
2970         put_disk(gd);
2971  out_free:
2972         kfree(sdkp);
2973  out:
2974         return error;
2975 }
2976
2977 /**
2978  *      sd_remove - called whenever a scsi disk (previously recognized by
2979  *      sd_probe) is detached from the system. It is called (potentially
2980  *      multiple times) during sd module unload.
2981  *      @sdp: pointer to mid level scsi device object
2982  *
2983  *      Note: this function is invoked from the scsi mid-level.
2984  *      This function potentially frees up a device name (e.g. /dev/sdc)
2985  *      that could be re-used by a subsequent sd_probe().
2986  *      This function is not called when the built-in sd driver is "exit-ed".
2987  **/
2988 static int sd_remove(struct device *dev)
2989 {
2990         struct scsi_disk *sdkp;
2991
2992         sdkp = dev_get_drvdata(dev);
2993         scsi_autopm_get_device(sdkp->device);
2994
2995         async_synchronize_full_domain(&scsi_sd_probe_domain);
2996         blk_queue_prep_rq(sdkp->device->request_queue, scsi_prep_fn);
2997         blk_queue_unprep_rq(sdkp->device->request_queue, NULL);
2998         device_del(&sdkp->dev);
2999         del_gendisk(sdkp->disk);
3000         sd_shutdown(dev);
3001
3002         mutex_lock(&sd_ref_mutex);
3003         dev_set_drvdata(dev, NULL);
3004         put_device(&sdkp->dev);
3005         mutex_unlock(&sd_ref_mutex);
3006
3007         return 0;
3008 }
3009
3010 /**
3011  *      scsi_disk_release - Called to free the scsi_disk structure
3012  *      @dev: pointer to embedded class device
3013  *
3014  *      sd_ref_mutex must be held entering this routine.  Because it is
3015  *      called on last put, you should always use the scsi_disk_get()
3016  *      scsi_disk_put() helpers which manipulate the semaphore directly
3017  *      and never do a direct put_device.
3018  **/
3019 static void scsi_disk_release(struct device *dev)
3020 {
3021         struct scsi_disk *sdkp = to_scsi_disk(dev);
3022         struct gendisk *disk = sdkp->disk;
3023         
3024         spin_lock(&sd_index_lock);
3025         ida_remove(&sd_index_ida, sdkp->index);
3026         spin_unlock(&sd_index_lock);
3027
3028         disk->private_data = NULL;
3029         put_disk(disk);
3030         put_device(&sdkp->device->sdev_gendev);
3031
3032         kfree(sdkp);
3033 }
3034
3035 static int sd_start_stop_device(struct scsi_disk *sdkp, int start)
3036 {
3037         unsigned char cmd[6] = { START_STOP };  /* START_VALID */
3038         struct scsi_sense_hdr sshdr;
3039         struct scsi_device *sdp = sdkp->device;
3040         int res;
3041
3042         if (start)
3043                 cmd[4] |= 1;    /* START */
3044
3045         if (sdp->start_stop_pwr_cond)
3046                 cmd[4] |= start ? 1 << 4 : 3 << 4;      /* Active or Standby */
3047
3048         if (!scsi_device_online(sdp))
3049                 return -ENODEV;
3050
3051         res = scsi_execute_req_flags(sdp, cmd, DMA_NONE, NULL, 0, &sshdr,
3052                                SD_TIMEOUT, SD_MAX_RETRIES, NULL, REQ_PM);
3053         if (res) {
3054                 sd_printk(KERN_WARNING, sdkp, "START_STOP FAILED\n");
3055                 sd_print_result(sdkp, res);
3056                 if (driver_byte(res) & DRIVER_SENSE)
3057                         sd_print_sense_hdr(sdkp, &sshdr);
3058         }
3059
3060         return res;
3061 }
3062
3063 /*
3064  * Send a SYNCHRONIZE CACHE instruction down to the device through
3065  * the normal SCSI command structure.  Wait for the command to
3066  * complete.
3067  */
3068 static void sd_shutdown(struct device *dev)
3069 {
3070         struct scsi_disk *sdkp = scsi_disk_get_from_dev(dev);
3071
3072         if (!sdkp)
3073                 return;         /* this can happen */
3074
3075         if (pm_runtime_suspended(dev))
3076                 goto exit;
3077
3078         if (sdkp->WCE) {
3079                 sd_printk(KERN_NOTICE, sdkp, "Synchronizing SCSI cache\n");
3080                 sd_sync_cache(sdkp);
3081         }
3082
3083         if (system_state != SYSTEM_RESTART && sdkp->device->manage_start_stop) {
3084                 sd_printk(KERN_NOTICE, sdkp, "Stopping disk\n");
3085                 sd_start_stop_device(sdkp, 0);
3086         }
3087
3088 exit:
3089         scsi_disk_put(sdkp);
3090 }
3091
3092 static int sd_suspend(struct device *dev)
3093 {
3094         struct scsi_disk *sdkp = scsi_disk_get_from_dev(dev);
3095         int ret = 0;
3096
3097         if (!sdkp)
3098                 return 0;       /* this can happen */
3099
3100         if (sdkp->WCE) {
3101                 sd_printk(KERN_NOTICE, sdkp, "Synchronizing SCSI cache\n");
3102                 ret = sd_sync_cache(sdkp);
3103                 if (ret)
3104                         goto done;
3105         }
3106
3107         if (sdkp->device->manage_start_stop) {
3108                 sd_printk(KERN_NOTICE, sdkp, "Stopping disk\n");
3109                 ret = sd_start_stop_device(sdkp, 0);
3110         }
3111
3112 done:
3113         scsi_disk_put(sdkp);
3114         return ret;
3115 }
3116
3117 static int sd_resume(struct device *dev)
3118 {
3119         struct scsi_disk *sdkp = scsi_disk_get_from_dev(dev);
3120         int ret = 0;
3121
3122         if (!sdkp->device->manage_start_stop)
3123                 goto done;
3124
3125         sd_printk(KERN_NOTICE, sdkp, "Starting disk\n");
3126         ret = sd_start_stop_device(sdkp, 1);
3127
3128 done:
3129         scsi_disk_put(sdkp);
3130         return ret;
3131 }
3132
3133 /**
3134  *      init_sd - entry point for this driver (both when built in or when
3135  *      a module).
3136  *
3137  *      Note: this function registers this driver with the scsi mid-level.
3138  **/
3139 static int __init init_sd(void)
3140 {
3141         int majors = 0, i, err;
3142
3143         SCSI_LOG_HLQUEUE(3, printk("init_sd: sd driver entry point\n"));
3144
3145         for (i = 0; i < SD_MAJORS; i++)
3146                 if (register_blkdev(sd_major(i), "sd") == 0)
3147                         majors++;
3148
3149         if (!majors)
3150                 return -ENODEV;
3151
3152         err = class_register(&sd_disk_class);
3153         if (err)
3154                 goto err_out;
3155
3156         sd_cdb_cache = kmem_cache_create("sd_ext_cdb", SD_EXT_CDB_SIZE,
3157                                          0, 0, NULL);
3158         if (!sd_cdb_cache) {
3159                 printk(KERN_ERR "sd: can't init extended cdb cache\n");
3160                 goto err_out_class;
3161         }
3162
3163         sd_cdb_pool = mempool_create_slab_pool(SD_MEMPOOL_SIZE, sd_cdb_cache);
3164         if (!sd_cdb_pool) {
3165                 printk(KERN_ERR "sd: can't init extended cdb pool\n");
3166                 goto err_out_cache;
3167         }
3168
3169         err = scsi_register_driver(&sd_template.gendrv);
3170         if (err)
3171                 goto err_out_driver;
3172
3173         return 0;
3174
3175 err_out_driver:
3176         mempool_destroy(sd_cdb_pool);
3177
3178 err_out_cache:
3179         kmem_cache_destroy(sd_cdb_cache);
3180
3181 err_out_class:
3182         class_unregister(&sd_disk_class);
3183 err_out:
3184         for (i = 0; i < SD_MAJORS; i++)
3185                 unregister_blkdev(sd_major(i), "sd");
3186         return err;
3187 }
3188
3189 /**
3190  *      exit_sd - exit point for this driver (when it is a module).
3191  *
3192  *      Note: this function unregisters this driver from the scsi mid-level.
3193  **/
3194 static void __exit exit_sd(void)
3195 {
3196         int i;
3197
3198         SCSI_LOG_HLQUEUE(3, printk("exit_sd: exiting sd driver\n"));
3199
3200         scsi_unregister_driver(&sd_template.gendrv);
3201         mempool_destroy(sd_cdb_pool);
3202         kmem_cache_destroy(sd_cdb_cache);
3203
3204         class_unregister(&sd_disk_class);
3205
3206         for (i = 0; i < SD_MAJORS; i++)
3207                 unregister_blkdev(sd_major(i), "sd");
3208 }
3209
3210 module_init(init_sd);
3211 module_exit(exit_sd);
3212
3213 static void sd_print_sense_hdr(struct scsi_disk *sdkp,
3214                                struct scsi_sense_hdr *sshdr)
3215 {
3216         sd_printk(KERN_INFO, sdkp, " ");
3217         scsi_show_sense_hdr(sshdr);
3218         sd_printk(KERN_INFO, sdkp, " ");
3219         scsi_show_extd_sense(sshdr->asc, sshdr->ascq);
3220 }
3221
3222 static void sd_print_result(struct scsi_disk *sdkp, int result)
3223 {
3224         sd_printk(KERN_INFO, sdkp, " ");
3225         scsi_show_result(result);
3226 }
3227