Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/jmorris...
[linux-2.6] / drivers / ide / ide-disk.c
1 /*
2  *  Copyright (C) 1994-1998        Linus Torvalds & authors (see below)
3  *  Copyright (C) 1998-2002        Linux ATA Development
4  *                                    Andre Hedrick <andre@linux-ide.org>
5  *  Copyright (C) 2003             Red Hat <alan@redhat.com>
6  *  Copyright (C) 2003-2005, 2007  Bartlomiej Zolnierkiewicz
7  */
8
9 /*
10  *  Mostly written by Mark Lord <mlord@pobox.com>
11  *                and Gadi Oxman <gadio@netvision.net.il>
12  *                and Andre Hedrick <andre@linux-ide.org>
13  *
14  * This is the IDE/ATA disk driver, as evolved from hd.c and ide.c.
15  */
16
17 #define IDEDISK_VERSION "1.18"
18
19 #include <linux/module.h>
20 #include <linux/types.h>
21 #include <linux/string.h>
22 #include <linux/kernel.h>
23 #include <linux/timer.h>
24 #include <linux/mm.h>
25 #include <linux/interrupt.h>
26 #include <linux/major.h>
27 #include <linux/errno.h>
28 #include <linux/genhd.h>
29 #include <linux/slab.h>
30 #include <linux/delay.h>
31 #include <linux/mutex.h>
32 #include <linux/leds.h>
33
34 #define _IDE_DISK
35
36 #include <linux/ide.h>
37
38 #include <asm/byteorder.h>
39 #include <asm/irq.h>
40 #include <asm/uaccess.h>
41 #include <asm/io.h>
42 #include <asm/div64.h>
43
44 struct ide_disk_obj {
45         ide_drive_t     *drive;
46         ide_driver_t    *driver;
47         struct gendisk  *disk;
48         struct kref     kref;
49         unsigned int    openers;        /* protected by BKL for now */
50 };
51
52 static DEFINE_MUTEX(idedisk_ref_mutex);
53
54 #define to_ide_disk(obj) container_of(obj, struct ide_disk_obj, kref)
55
56 #define ide_disk_g(disk) \
57         container_of((disk)->private_data, struct ide_disk_obj, driver)
58
59 static struct ide_disk_obj *ide_disk_get(struct gendisk *disk)
60 {
61         struct ide_disk_obj *idkp = NULL;
62
63         mutex_lock(&idedisk_ref_mutex);
64         idkp = ide_disk_g(disk);
65         if (idkp)
66                 kref_get(&idkp->kref);
67         mutex_unlock(&idedisk_ref_mutex);
68         return idkp;
69 }
70
71 static void ide_disk_release(struct kref *);
72
73 static void ide_disk_put(struct ide_disk_obj *idkp)
74 {
75         mutex_lock(&idedisk_ref_mutex);
76         kref_put(&idkp->kref, ide_disk_release);
77         mutex_unlock(&idedisk_ref_mutex);
78 }
79
80 /*
81  * lba_capacity_is_ok() performs a sanity check on the claimed "lba_capacity"
82  * value for this drive (from its reported identification information).
83  *
84  * Returns:     1 if lba_capacity looks sensible
85  *              0 otherwise
86  *
87  * It is called only once for each drive.
88  */
89 static int lba_capacity_is_ok(struct hd_driveid *id)
90 {
91         unsigned long lba_sects, chs_sects, head, tail;
92
93         /* No non-LBA info .. so valid! */
94         if (id->cyls == 0)
95                 return 1;
96
97         /*
98          * The ATA spec tells large drives to return
99          * C/H/S = 16383/16/63 independent of their size.
100          * Some drives can be jumpered to use 15 heads instead of 16.
101          * Some drives can be jumpered to use 4092 cyls instead of 16383.
102          */
103         if ((id->cyls == 16383
104              || (id->cyls == 4092 && id->cur_cyls == 16383)) &&
105             id->sectors == 63 &&
106             (id->heads == 15 || id->heads == 16) &&
107             (id->lba_capacity >= 16383*63*id->heads))
108                 return 1;
109
110         lba_sects   = id->lba_capacity;
111         chs_sects   = id->cyls * id->heads * id->sectors;
112
113         /* perform a rough sanity check on lba_sects:  within 10% is OK */
114         if ((lba_sects - chs_sects) < chs_sects/10)
115                 return 1;
116
117         /* some drives have the word order reversed */
118         head = ((lba_sects >> 16) & 0xffff);
119         tail = (lba_sects & 0xffff);
120         lba_sects = (head | (tail << 16));
121         if ((lba_sects - chs_sects) < chs_sects/10) {
122                 id->lba_capacity = lba_sects;
123                 return 1;       /* lba_capacity is (now) good */
124         }
125
126         return 0;       /* lba_capacity value may be bad */
127 }
128
129 static const u8 ide_rw_cmds[] = {
130         WIN_MULTREAD,
131         WIN_MULTWRITE,
132         WIN_MULTREAD_EXT,
133         WIN_MULTWRITE_EXT,
134         WIN_READ,
135         WIN_WRITE,
136         WIN_READ_EXT,
137         WIN_WRITE_EXT,
138         WIN_READDMA,
139         WIN_WRITEDMA,
140         WIN_READDMA_EXT,
141         WIN_WRITEDMA_EXT,
142 };
143
144 static const u8 ide_data_phases[] = {
145         TASKFILE_MULTI_IN,
146         TASKFILE_MULTI_OUT,
147         TASKFILE_IN,
148         TASKFILE_OUT,
149         TASKFILE_IN_DMA,
150         TASKFILE_OUT_DMA,
151 };
152
153 static void ide_tf_set_cmd(ide_drive_t *drive, ide_task_t *task, u8 dma)
154 {
155         u8 index, lba48, write;
156
157         lba48 = (task->tf_flags & IDE_TFLAG_LBA48) ? 2 : 0;
158         write = (task->tf_flags & IDE_TFLAG_WRITE) ? 1 : 0;
159
160         if (dma)
161                 index = drive->vdma ? 4 : 8;
162         else
163                 index = drive->mult_count ? 0 : 4;
164
165         task->tf.command = ide_rw_cmds[index + lba48 + write];
166
167         if (dma)
168                 index = 8; /* fixup index */
169
170         task->data_phase = ide_data_phases[index / 2 + write];
171 }
172
173 /*
174  * __ide_do_rw_disk() issues READ and WRITE commands to a disk,
175  * using LBA if supported, or CHS otherwise, to address sectors.
176  */
177 static ide_startstop_t __ide_do_rw_disk(ide_drive_t *drive, struct request *rq,
178                                         sector_t block)
179 {
180         ide_hwif_t *hwif        = HWIF(drive);
181         unsigned int dma        = drive->using_dma;
182         u16 nsectors            = (u16)rq->nr_sectors;
183         u8 lba48                = (drive->addressing == 1) ? 1 : 0;
184         ide_task_t              task;
185         struct ide_taskfile     *tf = &task.tf;
186         ide_startstop_t         rc;
187
188         if ((hwif->host_flags & IDE_HFLAG_NO_LBA48_DMA) && lba48 && dma) {
189                 if (block + rq->nr_sectors > 1ULL << 28)
190                         dma = 0;
191                 else
192                         lba48 = 0;
193         }
194
195         if (!dma) {
196                 ide_init_sg_cmd(drive, rq);
197                 ide_map_sg(drive, rq);
198         }
199
200         memset(&task, 0, sizeof(task));
201         task.tf_flags = IDE_TFLAG_NO_SELECT_MASK;  /* FIXME? */
202         task.tf_flags |= (IDE_TFLAG_TF | IDE_TFLAG_DEVICE);
203
204         if (drive->select.b.lba) {
205                 if (lba48) {
206                         pr_debug("%s: LBA=0x%012llx\n", drive->name,
207                                         (unsigned long long)block);
208
209                         tf->hob_nsect = (nsectors >> 8) & 0xff;
210                         tf->hob_lbal  = (u8)(block >> 24);
211                         if (sizeof(block) != 4) {
212                                 tf->hob_lbam = (u8)((u64)block >> 32);
213                                 tf->hob_lbah = (u8)((u64)block >> 40);
214                         }
215
216                         tf->nsect  = nsectors & 0xff;
217                         tf->lbal   = (u8) block;
218                         tf->lbam   = (u8)(block >>  8);
219                         tf->lbah   = (u8)(block >> 16);
220
221                         task.tf_flags |= (IDE_TFLAG_LBA48 | IDE_TFLAG_HOB);
222                 } else {
223                         tf->nsect  = nsectors & 0xff;
224                         tf->lbal   = block;
225                         tf->lbam   = block >>= 8;
226                         tf->lbah   = block >>= 8;
227                         tf->device = (block >> 8) & 0xf;
228                 }
229         } else {
230                 unsigned int sect, head, cyl, track;
231
232                 track = (int)block / drive->sect;
233                 sect  = (int)block % drive->sect + 1;
234                 head  = track % drive->head;
235                 cyl   = track / drive->head;
236
237                 pr_debug("%s: CHS=%u/%u/%u\n", drive->name, cyl, head, sect);
238
239                 tf->nsect  = nsectors & 0xff;
240                 tf->lbal   = sect;
241                 tf->lbam   = cyl;
242                 tf->lbah   = cyl >> 8;
243                 tf->device = head;
244         }
245
246         if (rq_data_dir(rq))
247                 task.tf_flags |= IDE_TFLAG_WRITE;
248
249         ide_tf_set_cmd(drive, &task, dma);
250         if (!dma)
251                 hwif->data_phase = task.data_phase;
252         task.rq = rq;
253
254         rc = do_rw_taskfile(drive, &task);
255
256         if (rc == ide_stopped && dma) {
257                 /* fallback to PIO */
258                 task.tf_flags |= IDE_TFLAG_DMA_PIO_FALLBACK;
259                 ide_tf_set_cmd(drive, &task, 0);
260                 hwif->data_phase = task.data_phase;
261                 ide_init_sg_cmd(drive, rq);
262                 rc = do_rw_taskfile(drive, &task);
263         }
264
265         return rc;
266 }
267
268 /*
269  * 268435455  == 137439 MB or 28bit limit
270  * 320173056  == 163929 MB or 48bit addressing
271  * 1073741822 == 549756 MB or 48bit addressing fake drive
272  */
273
274 static ide_startstop_t ide_do_rw_disk(ide_drive_t *drive, struct request *rq,
275                                       sector_t block)
276 {
277         ide_hwif_t *hwif = HWIF(drive);
278
279         BUG_ON(drive->blocked);
280
281         if (!blk_fs_request(rq)) {
282                 blk_dump_rq_flags(rq, "ide_do_rw_disk - bad command");
283                 ide_end_request(drive, 0, 0);
284                 return ide_stopped;
285         }
286
287         ledtrig_ide_activity();
288
289         pr_debug("%s: %sing: block=%llu, sectors=%lu, buffer=0x%08lx\n",
290                  drive->name, rq_data_dir(rq) == READ ? "read" : "writ",
291                  (unsigned long long)block, rq->nr_sectors,
292                  (unsigned long)rq->buffer);
293
294         if (hwif->rw_disk)
295                 hwif->rw_disk(drive, rq);
296
297         return __ide_do_rw_disk(drive, rq, block);
298 }
299
300 /*
301  * Queries for true maximum capacity of the drive.
302  * Returns maximum LBA address (> 0) of the drive, 0 if failed.
303  */
304 static u64 idedisk_read_native_max_address(ide_drive_t *drive, int lba48)
305 {
306         ide_task_t args;
307         struct ide_taskfile *tf = &args.tf;
308         u64 addr = 0;
309
310         /* Create IDE/ATA command request structure */
311         memset(&args, 0, sizeof(ide_task_t));
312         if (lba48)
313                 tf->command = WIN_READ_NATIVE_MAX_EXT;
314         else
315                 tf->command = WIN_READ_NATIVE_MAX;
316         tf->device  = ATA_LBA;
317         args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
318         if (lba48)
319                 args.tf_flags |= (IDE_TFLAG_LBA48 | IDE_TFLAG_HOB);
320         /* submit command request */
321         ide_no_data_taskfile(drive, &args);
322
323         /* if OK, compute maximum address value */
324         if ((tf->status & 0x01) == 0)
325                 addr = ide_get_lba_addr(tf, lba48) + 1;
326
327         return addr;
328 }
329
330 /*
331  * Sets maximum virtual LBA address of the drive.
332  * Returns new maximum virtual LBA address (> 0) or 0 on failure.
333  */
334 static u64 idedisk_set_max_address(ide_drive_t *drive, u64 addr_req, int lba48)
335 {
336         ide_task_t args;
337         struct ide_taskfile *tf = &args.tf;
338         u64 addr_set = 0;
339
340         addr_req--;
341         /* Create IDE/ATA command request structure */
342         memset(&args, 0, sizeof(ide_task_t));
343         tf->lbal     = (addr_req >>  0) & 0xff;
344         tf->lbam     = (addr_req >>= 8) & 0xff;
345         tf->lbah     = (addr_req >>= 8) & 0xff;
346         if (lba48) {
347                 tf->hob_lbal = (addr_req >>= 8) & 0xff;
348                 tf->hob_lbam = (addr_req >>= 8) & 0xff;
349                 tf->hob_lbah = (addr_req >>= 8) & 0xff;
350                 tf->command  = WIN_SET_MAX_EXT;
351         } else {
352                 tf->device   = (addr_req >>= 8) & 0x0f;
353                 tf->command  = WIN_SET_MAX;
354         }
355         tf->device |= ATA_LBA;
356         args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
357         if (lba48)
358                 args.tf_flags |= (IDE_TFLAG_LBA48 | IDE_TFLAG_HOB);
359         /* submit command request */
360         ide_no_data_taskfile(drive, &args);
361         /* if OK, compute maximum address value */
362         if ((tf->status & 0x01) == 0)
363                 addr_set = ide_get_lba_addr(tf, lba48) + 1;
364
365         return addr_set;
366 }
367
368 static unsigned long long sectors_to_MB(unsigned long long n)
369 {
370         n <<= 9;                /* make it bytes */
371         do_div(n, 1000000);     /* make it MB */
372         return n;
373 }
374
375 /*
376  * Bits 10 of command_set_1 and cfs_enable_1 must be equal,
377  * so on non-buggy drives we need test only one.
378  * However, we should also check whether these fields are valid.
379  */
380 static inline int idedisk_supports_hpa(const struct hd_driveid *id)
381 {
382         return (id->command_set_1 & 0x0400) && (id->cfs_enable_1 & 0x0400);
383 }
384
385 /*
386  * The same here.
387  */
388 static inline int idedisk_supports_lba48(const struct hd_driveid *id)
389 {
390         return (id->command_set_2 & 0x0400) && (id->cfs_enable_2 & 0x0400)
391                && id->lba_capacity_2;
392 }
393
394 /*
395  * Some disks report total number of sectors instead of
396  * maximum sector address.  We list them here.
397  */
398 static const struct drive_list_entry hpa_list[] = {
399         { "ST340823A",  NULL },
400         { "ST320413A",  NULL },
401         { "ST310211A",  NULL },
402         { NULL,         NULL }
403 };
404
405 static void idedisk_check_hpa(ide_drive_t *drive)
406 {
407         unsigned long long capacity, set_max;
408         int lba48 = idedisk_supports_lba48(drive->id);
409
410         capacity = drive->capacity64;
411
412         set_max = idedisk_read_native_max_address(drive, lba48);
413
414         if (ide_in_drive_list(drive->id, hpa_list)) {
415                 /*
416                  * Since we are inclusive wrt to firmware revisions do this
417                  * extra check and apply the workaround only when needed.
418                  */
419                 if (set_max == capacity + 1)
420                         set_max--;
421         }
422
423         if (set_max <= capacity)
424                 return;
425
426         printk(KERN_INFO "%s: Host Protected Area detected.\n"
427                          "\tcurrent capacity is %llu sectors (%llu MB)\n"
428                          "\tnative  capacity is %llu sectors (%llu MB)\n",
429                          drive->name,
430                          capacity, sectors_to_MB(capacity),
431                          set_max, sectors_to_MB(set_max));
432
433         set_max = idedisk_set_max_address(drive, set_max, lba48);
434
435         if (set_max) {
436                 drive->capacity64 = set_max;
437                 printk(KERN_INFO "%s: Host Protected Area disabled.\n",
438                                  drive->name);
439         }
440 }
441
442 /*
443  * Compute drive->capacity, the full capacity of the drive
444  * Called with drive->id != NULL.
445  *
446  * To compute capacity, this uses either of
447  *
448  *    1. CHS value set by user       (whatever user sets will be trusted)
449  *    2. LBA value from target drive (require new ATA feature)
450  *    3. LBA value from system BIOS  (new one is OK, old one may break)
451  *    4. CHS value from system BIOS  (traditional style)
452  *
453  * in above order (i.e., if value of higher priority is available,
454  * reset will be ignored).
455  */
456 static void init_idedisk_capacity(ide_drive_t *drive)
457 {
458         struct hd_driveid *id = drive->id;
459         /*
460          * If this drive supports the Host Protected Area feature set,
461          * then we may need to change our opinion about the drive's capacity.
462          */
463         int hpa = idedisk_supports_hpa(id);
464
465         if (idedisk_supports_lba48(id)) {
466                 /* drive speaks 48-bit LBA */
467                 drive->select.b.lba = 1;
468                 drive->capacity64 = id->lba_capacity_2;
469                 if (hpa)
470                         idedisk_check_hpa(drive);
471         } else if ((id->capability & 2) && lba_capacity_is_ok(id)) {
472                 /* drive speaks 28-bit LBA */
473                 drive->select.b.lba = 1;
474                 drive->capacity64 = id->lba_capacity;
475                 if (hpa)
476                         idedisk_check_hpa(drive);
477         } else {
478                 /* drive speaks boring old 28-bit CHS */
479                 drive->capacity64 = drive->cyl * drive->head * drive->sect;
480         }
481 }
482
483 static sector_t idedisk_capacity(ide_drive_t *drive)
484 {
485         return drive->capacity64 - drive->sect0;
486 }
487
488 #ifdef CONFIG_IDE_PROC_FS
489 static int smart_enable(ide_drive_t *drive)
490 {
491         ide_task_t args;
492         struct ide_taskfile *tf = &args.tf;
493
494         memset(&args, 0, sizeof(ide_task_t));
495         tf->feature = SMART_ENABLE;
496         tf->lbam    = SMART_LCYL_PASS;
497         tf->lbah    = SMART_HCYL_PASS;
498         tf->command = WIN_SMART;
499         args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
500         return ide_no_data_taskfile(drive, &args);
501 }
502
503 static int get_smart_data(ide_drive_t *drive, u8 *buf, u8 sub_cmd)
504 {
505         ide_task_t args;
506         struct ide_taskfile *tf = &args.tf;
507
508         memset(&args, 0, sizeof(ide_task_t));
509         tf->feature = sub_cmd;
510         tf->nsect   = 0x01;
511         tf->lbam    = SMART_LCYL_PASS;
512         tf->lbah    = SMART_HCYL_PASS;
513         tf->command = WIN_SMART;
514         args.tf_flags   = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
515         args.data_phase = TASKFILE_IN;
516         (void) smart_enable(drive);
517         return ide_raw_taskfile(drive, &args, buf, 1);
518 }
519
520 static int proc_idedisk_read_cache
521         (char *page, char **start, off_t off, int count, int *eof, void *data)
522 {
523         ide_drive_t     *drive = (ide_drive_t *) data;
524         char            *out = page;
525         int             len;
526
527         if (drive->id_read)
528                 len = sprintf(out, "%i\n", drive->id->buf_size / 2);
529         else
530                 len = sprintf(out, "(none)\n");
531
532         PROC_IDE_READ_RETURN(page, start, off, count, eof, len);
533 }
534
535 static int proc_idedisk_read_capacity
536         (char *page, char **start, off_t off, int count, int *eof, void *data)
537 {
538         ide_drive_t*drive = (ide_drive_t *)data;
539         int len;
540
541         len = sprintf(page, "%llu\n", (long long)idedisk_capacity(drive));
542
543         PROC_IDE_READ_RETURN(page, start, off, count, eof, len);
544 }
545
546 static int proc_idedisk_read_smart(char *page, char **start, off_t off,
547                                    int count, int *eof, void *data, u8 sub_cmd)
548 {
549         ide_drive_t     *drive = (ide_drive_t *)data;
550         int             len = 0, i = 0;
551
552         if (get_smart_data(drive, page, sub_cmd) == 0) {
553                 unsigned short *val = (unsigned short *) page;
554                 char *out = ((char *)val) + (SECTOR_WORDS * 4);
555                 page = out;
556                 do {
557                         out += sprintf(out, "%04x%c", le16_to_cpu(*val),
558                                        (++i & 7) ? ' ' : '\n');
559                         val += 1;
560                 } while (i < (SECTOR_WORDS * 2));
561                 len = out - page;
562         }
563
564         PROC_IDE_READ_RETURN(page, start, off, count, eof, len);
565 }
566
567 static int proc_idedisk_read_sv
568         (char *page, char **start, off_t off, int count, int *eof, void *data)
569 {
570         return proc_idedisk_read_smart(page, start, off, count, eof, data,
571                                        SMART_READ_VALUES);
572 }
573
574 static int proc_idedisk_read_st
575         (char *page, char **start, off_t off, int count, int *eof, void *data)
576 {
577         return proc_idedisk_read_smart(page, start, off, count, eof, data,
578                                        SMART_READ_THRESHOLDS);
579 }
580
581 static ide_proc_entry_t idedisk_proc[] = {
582         { "cache",        S_IFREG|S_IRUGO, proc_idedisk_read_cache,    NULL },
583         { "capacity",     S_IFREG|S_IRUGO, proc_idedisk_read_capacity, NULL },
584         { "geometry",     S_IFREG|S_IRUGO, proc_ide_read_geometry,     NULL },
585         { "smart_values", S_IFREG|S_IRUSR, proc_idedisk_read_sv,       NULL },
586         { "smart_thresholds", S_IFREG|S_IRUSR, proc_idedisk_read_st,   NULL },
587         { NULL, 0, NULL, NULL }
588 };
589 #endif  /* CONFIG_IDE_PROC_FS */
590
591 static void idedisk_prepare_flush(struct request_queue *q, struct request *rq)
592 {
593         ide_drive_t *drive = q->queuedata;
594         ide_task_t *task = kmalloc(sizeof(*task), GFP_ATOMIC);
595
596         /* FIXME: map struct ide_taskfile on rq->cmd[] */
597         BUG_ON(task == NULL);
598
599         memset(task, 0, sizeof(*task));
600         if (ide_id_has_flush_cache_ext(drive->id) &&
601             (drive->capacity64 >= (1UL << 28)))
602                 task->tf.command = WIN_FLUSH_CACHE_EXT;
603         else
604                 task->tf.command = WIN_FLUSH_CACHE;
605         task->tf_flags   = IDE_TFLAG_OUT_TF | IDE_TFLAG_OUT_DEVICE |
606                            IDE_TFLAG_DYN;
607         task->data_phase = TASKFILE_NO_DATA;
608
609         rq->cmd_type = REQ_TYPE_ATA_TASKFILE;
610         rq->cmd_flags |= REQ_SOFTBARRIER;
611         rq->special = task;
612 }
613
614 /*
615  * This is tightly woven into the driver->do_special can not touch.
616  * DON'T do it again until a total personality rewrite is committed.
617  */
618 static int set_multcount(ide_drive_t *drive, int arg)
619 {
620         struct request rq;
621
622         if (arg < 0 || arg > drive->id->max_multsect)
623                 return -EINVAL;
624
625         if (drive->special.b.set_multmode)
626                 return -EBUSY;
627
628         ide_init_drive_cmd(&rq);
629         rq.cmd_type = REQ_TYPE_ATA_TASKFILE;
630
631         drive->mult_req = arg;
632         drive->special.b.set_multmode = 1;
633         (void)ide_do_drive_cmd(drive, &rq, ide_wait);
634
635         return (drive->mult_count == arg) ? 0 : -EIO;
636 }
637
638 static int set_nowerr(ide_drive_t *drive, int arg)
639 {
640         if (arg < 0 || arg > 1)
641                 return -EINVAL;
642
643         if (ide_spin_wait_hwgroup(drive))
644                 return -EBUSY;
645         drive->nowerr = arg;
646         drive->bad_wstat = arg ? BAD_R_STAT : BAD_W_STAT;
647         spin_unlock_irq(&ide_lock);
648         return 0;
649 }
650
651 static void update_ordered(ide_drive_t *drive)
652 {
653         struct hd_driveid *id = drive->id;
654         unsigned ordered = QUEUE_ORDERED_NONE;
655         prepare_flush_fn *prep_fn = NULL;
656
657         if (drive->wcache) {
658                 unsigned long long capacity;
659                 int barrier;
660                 /*
661                  * We must avoid issuing commands a drive does not
662                  * understand or we may crash it. We check flush cache
663                  * is supported. We also check we have the LBA48 flush
664                  * cache if the drive capacity is too large. By this
665                  * time we have trimmed the drive capacity if LBA48 is
666                  * not available so we don't need to recheck that.
667                  */
668                 capacity = idedisk_capacity(drive);
669                 barrier = ide_id_has_flush_cache(id) && !drive->noflush &&
670                         (drive->addressing == 0 || capacity <= (1ULL << 28) ||
671                          ide_id_has_flush_cache_ext(id));
672
673                 printk(KERN_INFO "%s: cache flushes %ssupported\n",
674                        drive->name, barrier ? "" : "not ");
675
676                 if (barrier) {
677                         ordered = QUEUE_ORDERED_DRAIN_FLUSH;
678                         prep_fn = idedisk_prepare_flush;
679                 }
680         } else
681                 ordered = QUEUE_ORDERED_DRAIN;
682
683         blk_queue_ordered(drive->queue, ordered, prep_fn);
684 }
685
686 static int write_cache(ide_drive_t *drive, int arg)
687 {
688         ide_task_t args;
689         int err = 1;
690
691         if (arg < 0 || arg > 1)
692                 return -EINVAL;
693
694         if (ide_id_has_flush_cache(drive->id)) {
695                 memset(&args, 0, sizeof(ide_task_t));
696                 args.tf.feature = arg ?
697                         SETFEATURES_EN_WCACHE : SETFEATURES_DIS_WCACHE;
698                 args.tf.command = WIN_SETFEATURES;
699                 args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
700                 err = ide_no_data_taskfile(drive, &args);
701                 if (err == 0)
702                         drive->wcache = arg;
703         }
704
705         update_ordered(drive);
706
707         return err;
708 }
709
710 static int do_idedisk_flushcache(ide_drive_t *drive)
711 {
712         ide_task_t args;
713
714         memset(&args, 0, sizeof(ide_task_t));
715         if (ide_id_has_flush_cache_ext(drive->id))
716                 args.tf.command = WIN_FLUSH_CACHE_EXT;
717         else
718                 args.tf.command = WIN_FLUSH_CACHE;
719         args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
720         return ide_no_data_taskfile(drive, &args);
721 }
722
723 static int set_acoustic(ide_drive_t *drive, int arg)
724 {
725         ide_task_t args;
726
727         if (arg < 0 || arg > 254)
728                 return -EINVAL;
729
730         memset(&args, 0, sizeof(ide_task_t));
731         args.tf.feature = arg ? SETFEATURES_EN_AAM : SETFEATURES_DIS_AAM;
732         args.tf.nsect   = arg;
733         args.tf.command = WIN_SETFEATURES;
734         args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
735         ide_no_data_taskfile(drive, &args);
736         drive->acoustic = arg;
737         return 0;
738 }
739
740 /*
741  * drive->addressing:
742  *      0: 28-bit
743  *      1: 48-bit
744  *      2: 48-bit capable doing 28-bit
745  */
746 static int set_lba_addressing(ide_drive_t *drive, int arg)
747 {
748         if (arg < 0 || arg > 2)
749                 return -EINVAL;
750
751         drive->addressing =  0;
752
753         if (drive->hwif->host_flags & IDE_HFLAG_NO_LBA48)
754                 return 0;
755
756         if (!idedisk_supports_lba48(drive->id))
757                 return -EIO;
758         drive->addressing = arg;
759         return 0;
760 }
761
762 #ifdef CONFIG_IDE_PROC_FS
763 static void idedisk_add_settings(ide_drive_t *drive)
764 {
765         struct hd_driveid *id = drive->id;
766
767         ide_add_setting(drive, "bios_cyl", SETTING_RW, TYPE_INT, 0, 65535, 1, 1,
768                         &drive->bios_cyl, NULL);
769         ide_add_setting(drive, "bios_head", SETTING_RW, TYPE_BYTE, 0, 255, 1, 1,
770                         &drive->bios_head, NULL);
771         ide_add_setting(drive, "bios_sect", SETTING_RW, TYPE_BYTE, 0, 63, 1, 1,
772                         &drive->bios_sect, NULL);
773         ide_add_setting(drive, "address", SETTING_RW, TYPE_BYTE, 0, 2, 1, 1,
774                         &drive->addressing, set_lba_addressing);
775         ide_add_setting(drive, "multcount", SETTING_RW, TYPE_BYTE, 0,
776                         id->max_multsect, 1, 1, &drive->mult_count,
777                         set_multcount);
778         ide_add_setting(drive, "nowerr", SETTING_RW, TYPE_BYTE, 0, 1, 1, 1,
779                         &drive->nowerr, set_nowerr);
780         ide_add_setting(drive, "lun", SETTING_RW, TYPE_INT, 0, 7, 1, 1,
781                         &drive->lun, NULL);
782         ide_add_setting(drive, "wcache", SETTING_RW, TYPE_BYTE, 0, 1, 1, 1,
783                         &drive->wcache, write_cache);
784         ide_add_setting(drive, "acoustic", SETTING_RW, TYPE_BYTE, 0, 254, 1, 1,
785                         &drive->acoustic, set_acoustic);
786         ide_add_setting(drive, "failures", SETTING_RW, TYPE_INT, 0, 65535, 1, 1,
787                         &drive->failures, NULL);
788         ide_add_setting(drive, "max_failures", SETTING_RW, TYPE_INT, 0, 65535,
789                         1, 1, &drive->max_failures, NULL);
790 }
791 #else
792 static inline void idedisk_add_settings(ide_drive_t *drive) { ; }
793 #endif
794
795 static void idedisk_setup(ide_drive_t *drive)
796 {
797         ide_hwif_t *hwif = drive->hwif;
798         struct hd_driveid *id = drive->id;
799         unsigned long long capacity;
800
801         idedisk_add_settings(drive);
802
803         if (drive->id_read == 0)
804                 return;
805
806         if (drive->removable) {
807                 /*
808                  * Removable disks (eg. SYQUEST); ignore 'WD' drives
809                  */
810                 if (id->model[0] != 'W' || id->model[1] != 'D')
811                         drive->doorlocking = 1;
812         }
813
814         (void)set_lba_addressing(drive, 1);
815
816         if (drive->addressing == 1) {
817                 int max_s = 2048;
818
819                 if (max_s > hwif->rqsize)
820                         max_s = hwif->rqsize;
821
822                 blk_queue_max_sectors(drive->queue, max_s);
823         }
824
825         printk(KERN_INFO "%s: max request size: %dKiB\n", drive->name,
826                          drive->queue->max_sectors / 2);
827
828         /* calculate drive capacity, and select LBA if possible */
829         init_idedisk_capacity(drive);
830
831         /* limit drive capacity to 137GB if LBA48 cannot be used */
832         if (drive->addressing == 0 && drive->capacity64 > 1ULL << 28) {
833                 printk(KERN_WARNING "%s: cannot use LBA48 - full capacity "
834                        "%llu sectors (%llu MB)\n",
835                        drive->name, (unsigned long long)drive->capacity64,
836                        sectors_to_MB(drive->capacity64));
837                 drive->capacity64 = 1ULL << 28;
838         }
839
840         if ((hwif->host_flags & IDE_HFLAG_NO_LBA48_DMA) && drive->addressing) {
841                 if (drive->capacity64 > 1ULL << 28) {
842                         printk(KERN_INFO "%s: cannot use LBA48 DMA - PIO mode"
843                                          " will be used for accessing sectors "
844                                          "> %u\n", drive->name, 1 << 28);
845                 } else
846                         drive->addressing = 0;
847         }
848
849         /*
850          * if possible, give fdisk access to more of the drive,
851          * by correcting bios_cyls:
852          */
853         capacity = idedisk_capacity(drive);
854
855         if (!drive->forced_geom) {
856
857                 if (idedisk_supports_lba48(drive->id)) {
858                         /* compatibility */
859                         drive->bios_sect = 63;
860                         drive->bios_head = 255;
861                 }
862
863                 if (drive->bios_sect && drive->bios_head) {
864                         unsigned int cap0 = capacity; /* truncate to 32 bits */
865                         unsigned int cylsz, cyl;
866
867                         if (cap0 != capacity)
868                                 drive->bios_cyl = 65535;
869                         else {
870                                 cylsz = drive->bios_sect * drive->bios_head;
871                                 cyl = cap0 / cylsz;
872                                 if (cyl > 65535)
873                                         cyl = 65535;
874                                 if (cyl > drive->bios_cyl)
875                                         drive->bios_cyl = cyl;
876                         }
877                 }
878         }
879         printk(KERN_INFO "%s: %llu sectors (%llu MB)",
880                          drive->name, capacity, sectors_to_MB(capacity));
881
882         /* Only print cache size when it was specified */
883         if (id->buf_size)
884                 printk(KERN_CONT " w/%dKiB Cache", id->buf_size / 2);
885
886         printk(KERN_CONT ", CHS=%d/%d/%d\n",
887                          drive->bios_cyl, drive->bios_head, drive->bios_sect);
888
889         /* write cache enabled? */
890         if ((id->csfo & 1) || (id->cfs_enable_1 & (1 << 5)))
891                 drive->wcache = 1;
892
893         write_cache(drive, 1);
894 }
895
896 static void ide_cacheflush_p(ide_drive_t *drive)
897 {
898         if (!drive->wcache || !ide_id_has_flush_cache(drive->id))
899                 return;
900
901         if (do_idedisk_flushcache(drive))
902                 printk(KERN_INFO "%s: wcache flush failed!\n", drive->name);
903 }
904
905 static void ide_disk_remove(ide_drive_t *drive)
906 {
907         struct ide_disk_obj *idkp = drive->driver_data;
908         struct gendisk *g = idkp->disk;
909
910         ide_proc_unregister_driver(drive, idkp->driver);
911
912         del_gendisk(g);
913
914         ide_cacheflush_p(drive);
915
916         ide_disk_put(idkp);
917 }
918
919 static void ide_disk_release(struct kref *kref)
920 {
921         struct ide_disk_obj *idkp = to_ide_disk(kref);
922         ide_drive_t *drive = idkp->drive;
923         struct gendisk *g = idkp->disk;
924
925         drive->driver_data = NULL;
926         g->private_data = NULL;
927         put_disk(g);
928         kfree(idkp);
929 }
930
931 static int ide_disk_probe(ide_drive_t *drive);
932
933 /*
934  * On HPA drives the capacity needs to be
935  * reinitilized on resume otherwise the disk
936  * can not be used and a hard reset is required
937  */
938 static void ide_disk_resume(ide_drive_t *drive)
939 {
940         if (idedisk_supports_hpa(drive->id))
941                 init_idedisk_capacity(drive);
942 }
943
944 static void ide_device_shutdown(ide_drive_t *drive)
945 {
946 #ifdef  CONFIG_ALPHA
947         /* On Alpha, halt(8) doesn't actually turn the machine off,
948            it puts you into the sort of firmware monitor. Typically,
949            it's used to boot another kernel image, so it's not much
950            different from reboot(8). Therefore, we don't need to
951            spin down the disk in this case, especially since Alpha
952            firmware doesn't handle disks in standby mode properly.
953            On the other hand, it's reasonably safe to turn the power
954            off when the shutdown process reaches the firmware prompt,
955            as the firmware initialization takes rather long time -
956            at least 10 seconds, which should be sufficient for
957            the disk to expire its write cache. */
958         if (system_state != SYSTEM_POWER_OFF) {
959 #else
960         if (system_state == SYSTEM_RESTART) {
961 #endif
962                 ide_cacheflush_p(drive);
963                 return;
964         }
965
966         printk(KERN_INFO "Shutdown: %s\n", drive->name);
967
968         drive->gendev.bus->suspend(&drive->gendev, PMSG_SUSPEND);
969 }
970
971 static ide_driver_t idedisk_driver = {
972         .gen_driver = {
973                 .owner          = THIS_MODULE,
974                 .name           = "ide-disk",
975                 .bus            = &ide_bus_type,
976         },
977         .probe                  = ide_disk_probe,
978         .remove                 = ide_disk_remove,
979         .resume                 = ide_disk_resume,
980         .shutdown               = ide_device_shutdown,
981         .version                = IDEDISK_VERSION,
982         .media                  = ide_disk,
983         .supports_dsc_overlap   = 0,
984         .do_request             = ide_do_rw_disk,
985         .end_request            = ide_end_request,
986         .error                  = __ide_error,
987         .abort                  = __ide_abort,
988 #ifdef CONFIG_IDE_PROC_FS
989         .proc                   = idedisk_proc,
990 #endif
991 };
992
993 static int idedisk_set_doorlock(ide_drive_t *drive, int on)
994 {
995         ide_task_t task;
996
997         memset(&task, 0, sizeof(task));
998         task.tf.command = on ? WIN_DOORLOCK : WIN_DOORUNLOCK;
999         task.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
1000
1001         return ide_no_data_taskfile(drive, &task);
1002 }
1003
1004 static int idedisk_open(struct inode *inode, struct file *filp)
1005 {
1006         struct gendisk *disk = inode->i_bdev->bd_disk;
1007         struct ide_disk_obj *idkp;
1008         ide_drive_t *drive;
1009
1010         idkp = ide_disk_get(disk);
1011         if (idkp == NULL)
1012                 return -ENXIO;
1013
1014         drive = idkp->drive;
1015
1016         idkp->openers++;
1017
1018         if (drive->removable && idkp->openers == 1) {
1019                 check_disk_change(inode->i_bdev);
1020                 /*
1021                  * Ignore the return code from door_lock,
1022                  * since the open() has already succeeded,
1023                  * and the door_lock is irrelevant at this point.
1024                  */
1025                 if (drive->doorlocking && idedisk_set_doorlock(drive, 1))
1026                         drive->doorlocking = 0;
1027         }
1028         return 0;
1029 }
1030
1031 static int idedisk_release(struct inode *inode, struct file *filp)
1032 {
1033         struct gendisk *disk = inode->i_bdev->bd_disk;
1034         struct ide_disk_obj *idkp = ide_disk_g(disk);
1035         ide_drive_t *drive = idkp->drive;
1036
1037         if (idkp->openers == 1)
1038                 ide_cacheflush_p(drive);
1039
1040         if (drive->removable && idkp->openers == 1) {
1041                 if (drive->doorlocking && idedisk_set_doorlock(drive, 0))
1042                         drive->doorlocking = 0;
1043         }
1044
1045         idkp->openers--;
1046
1047         ide_disk_put(idkp);
1048
1049         return 0;
1050 }
1051
1052 static int idedisk_getgeo(struct block_device *bdev, struct hd_geometry *geo)
1053 {
1054         struct ide_disk_obj *idkp = ide_disk_g(bdev->bd_disk);
1055         ide_drive_t *drive = idkp->drive;
1056
1057         geo->heads = drive->bios_head;
1058         geo->sectors = drive->bios_sect;
1059         geo->cylinders = (u16)drive->bios_cyl; /* truncate */
1060         return 0;
1061 }
1062
1063 static int idedisk_ioctl(struct inode *inode, struct file *file,
1064                         unsigned int cmd, unsigned long arg)
1065 {
1066         unsigned long flags;
1067         struct block_device *bdev = inode->i_bdev;
1068         struct ide_disk_obj *idkp = ide_disk_g(bdev->bd_disk);
1069         ide_drive_t *drive = idkp->drive;
1070         int err, (*setfunc)(ide_drive_t *, int);
1071         u8 *val;
1072
1073         switch (cmd) {
1074         case HDIO_GET_ADDRESS:   val = &drive->addressing;      goto read_val;
1075         case HDIO_GET_MULTCOUNT: val = &drive->mult_count;      goto read_val;
1076         case HDIO_GET_NOWERR:    val = &drive->nowerr;          goto read_val;
1077         case HDIO_GET_WCACHE:    val = &drive->wcache;          goto read_val;
1078         case HDIO_GET_ACOUSTIC:  val = &drive->acoustic;        goto read_val;
1079         case HDIO_SET_ADDRESS:   setfunc = set_lba_addressing;  goto set_val;
1080         case HDIO_SET_MULTCOUNT: setfunc = set_multcount;       goto set_val;
1081         case HDIO_SET_NOWERR:    setfunc = set_nowerr;          goto set_val;
1082         case HDIO_SET_WCACHE:    setfunc = write_cache;         goto set_val;
1083         case HDIO_SET_ACOUSTIC:  setfunc = set_acoustic;        goto set_val;
1084         }
1085
1086         return generic_ide_ioctl(drive, file, bdev, cmd, arg);
1087
1088 read_val:
1089         mutex_lock(&ide_setting_mtx);
1090         spin_lock_irqsave(&ide_lock, flags);
1091         err = *val;
1092         spin_unlock_irqrestore(&ide_lock, flags);
1093         mutex_unlock(&ide_setting_mtx);
1094         return err >= 0 ? put_user(err, (long __user *)arg) : err;
1095
1096 set_val:
1097         if (bdev != bdev->bd_contains)
1098                 err = -EINVAL;
1099         else {
1100                 if (!capable(CAP_SYS_ADMIN))
1101                         err = -EACCES;
1102                 else {
1103                         mutex_lock(&ide_setting_mtx);
1104                         err = setfunc(drive, arg);
1105                         mutex_unlock(&ide_setting_mtx);
1106                 }
1107         }
1108         return err;
1109 }
1110
1111 static int idedisk_media_changed(struct gendisk *disk)
1112 {
1113         struct ide_disk_obj *idkp = ide_disk_g(disk);
1114         ide_drive_t *drive = idkp->drive;
1115
1116         /* do not scan partitions twice if this is a removable device */
1117         if (drive->attach) {
1118                 drive->attach = 0;
1119                 return 0;
1120         }
1121         /* if removable, always assume it was changed */
1122         return drive->removable;
1123 }
1124
1125 static int idedisk_revalidate_disk(struct gendisk *disk)
1126 {
1127         struct ide_disk_obj *idkp = ide_disk_g(disk);
1128         set_capacity(disk, idedisk_capacity(idkp->drive));
1129         return 0;
1130 }
1131
1132 static struct block_device_operations idedisk_ops = {
1133         .owner                  = THIS_MODULE,
1134         .open                   = idedisk_open,
1135         .release                = idedisk_release,
1136         .ioctl                  = idedisk_ioctl,
1137         .getgeo                 = idedisk_getgeo,
1138         .media_changed          = idedisk_media_changed,
1139         .revalidate_disk        = idedisk_revalidate_disk
1140 };
1141
1142 MODULE_DESCRIPTION("ATA DISK Driver");
1143
1144 static int ide_disk_probe(ide_drive_t *drive)
1145 {
1146         struct ide_disk_obj *idkp;
1147         struct gendisk *g;
1148
1149         /* strstr("foo", "") is non-NULL */
1150         if (!strstr("ide-disk", drive->driver_req))
1151                 goto failed;
1152         if (!drive->present)
1153                 goto failed;
1154         if (drive->media != ide_disk)
1155                 goto failed;
1156
1157         idkp = kzalloc(sizeof(*idkp), GFP_KERNEL);
1158         if (!idkp)
1159                 goto failed;
1160
1161         g = alloc_disk_node(1 << PARTN_BITS,
1162                         hwif_to_node(drive->hwif));
1163         if (!g)
1164                 goto out_free_idkp;
1165
1166         ide_init_disk(g, drive);
1167
1168         ide_proc_register_driver(drive, &idedisk_driver);
1169
1170         kref_init(&idkp->kref);
1171
1172         idkp->drive = drive;
1173         idkp->driver = &idedisk_driver;
1174         idkp->disk = g;
1175
1176         g->private_data = &idkp->driver;
1177
1178         drive->driver_data = idkp;
1179
1180         idedisk_setup(drive);
1181         if ((!drive->head || drive->head > 16) && !drive->select.b.lba) {
1182                 printk(KERN_ERR "%s: INVALID GEOMETRY: %d PHYSICAL HEADS?\n",
1183                         drive->name, drive->head);
1184                 drive->attach = 0;
1185         } else
1186                 drive->attach = 1;
1187
1188         g->minors = 1 << PARTN_BITS;
1189         g->driverfs_dev = &drive->gendev;
1190         g->flags = drive->removable ? GENHD_FL_REMOVABLE : 0;
1191         set_capacity(g, idedisk_capacity(drive));
1192         g->fops = &idedisk_ops;
1193         add_disk(g);
1194         return 0;
1195
1196 out_free_idkp:
1197         kfree(idkp);
1198 failed:
1199         return -ENODEV;
1200 }
1201
1202 static void __exit idedisk_exit(void)
1203 {
1204         driver_unregister(&idedisk_driver.gen_driver);
1205 }
1206
1207 static int __init idedisk_init(void)
1208 {
1209         return driver_register(&idedisk_driver.gen_driver);
1210 }
1211
1212 MODULE_ALIAS("ide:*m-disk*");
1213 module_init(idedisk_init);
1214 module_exit(idedisk_exit);
1215 MODULE_LICENSE("GPL");