ide-disk.c revision 08da591e14cf87247ec09b17c350235157a92fc3
1/*
2 *  Copyright (C) 1994-1998	   Linus Torvalds & authors (see below)
3 *  Copyright (C) 1998-2002	   Linux ATA Development
4 *				      Andre Hedrick <andre@linux-ide.org>
5 *  Copyright (C) 2003		   Red Hat <alan@redhat.com>
6 *  Copyright (C) 2003-2005, 2007  Bartlomiej Zolnierkiewicz
7 */
8
9/*
10 *  Mostly written by Mark Lord <mlord@pobox.com>
11 *                and Gadi Oxman <gadio@netvision.net.il>
12 *                and Andre Hedrick <andre@linux-ide.org>
13 *
14 * This is the IDE/ATA disk driver, as evolved from hd.c and ide.c.
15 */
16
17#define IDEDISK_VERSION	"1.18"
18
19#include <linux/module.h>
20#include <linux/types.h>
21#include <linux/string.h>
22#include <linux/kernel.h>
23#include <linux/timer.h>
24#include <linux/mm.h>
25#include <linux/interrupt.h>
26#include <linux/major.h>
27#include <linux/errno.h>
28#include <linux/genhd.h>
29#include <linux/slab.h>
30#include <linux/delay.h>
31#include <linux/mutex.h>
32#include <linux/leds.h>
33
34#define _IDE_DISK
35
36#include <linux/ide.h>
37
38#include <asm/byteorder.h>
39#include <asm/irq.h>
40#include <asm/uaccess.h>
41#include <asm/io.h>
42#include <asm/div64.h>
43
44struct ide_disk_obj {
45	ide_drive_t	*drive;
46	ide_driver_t	*driver;
47	struct gendisk	*disk;
48	struct kref	kref;
49	unsigned int	openers;	/* protected by BKL for now */
50};
51
52static DEFINE_MUTEX(idedisk_ref_mutex);
53
54#define to_ide_disk(obj) container_of(obj, struct ide_disk_obj, kref)
55
56#define ide_disk_g(disk) \
57	container_of((disk)->private_data, struct ide_disk_obj, driver)
58
59static void ide_disk_release(struct kref *);
60
61static struct ide_disk_obj *ide_disk_get(struct gendisk *disk)
62{
63	struct ide_disk_obj *idkp = NULL;
64
65	mutex_lock(&idedisk_ref_mutex);
66	idkp = ide_disk_g(disk);
67	if (idkp) {
68		kref_get(&idkp->kref);
69		if (ide_device_get(idkp->drive)) {
70			kref_put(&idkp->kref, ide_disk_release);
71			idkp = NULL;
72		}
73	}
74	mutex_unlock(&idedisk_ref_mutex);
75	return idkp;
76}
77
78static void ide_disk_put(struct ide_disk_obj *idkp)
79{
80	mutex_lock(&idedisk_ref_mutex);
81	ide_device_put(idkp->drive);
82	kref_put(&idkp->kref, ide_disk_release);
83	mutex_unlock(&idedisk_ref_mutex);
84}
85
86/*
87 * lba_capacity_is_ok() performs a sanity check on the claimed "lba_capacity"
88 * value for this drive (from its reported identification information).
89 *
90 * Returns:	1 if lba_capacity looks sensible
91 *		0 otherwise
92 *
93 * It is called only once for each drive.
94 */
95static int lba_capacity_is_ok(struct hd_driveid *id)
96{
97	unsigned long lba_sects, chs_sects, head, tail;
98
99	/* No non-LBA info .. so valid! */
100	if (id->cyls == 0)
101		return 1;
102
103	/*
104	 * The ATA spec tells large drives to return
105	 * C/H/S = 16383/16/63 independent of their size.
106	 * Some drives can be jumpered to use 15 heads instead of 16.
107	 * Some drives can be jumpered to use 4092 cyls instead of 16383.
108	 */
109	if ((id->cyls == 16383
110	     || (id->cyls == 4092 && id->cur_cyls == 16383)) &&
111	    id->sectors == 63 &&
112	    (id->heads == 15 || id->heads == 16) &&
113	    (id->lba_capacity >= 16383*63*id->heads))
114		return 1;
115
116	lba_sects   = id->lba_capacity;
117	chs_sects   = id->cyls * id->heads * id->sectors;
118
119	/* perform a rough sanity check on lba_sects:  within 10% is OK */
120	if ((lba_sects - chs_sects) < chs_sects/10)
121		return 1;
122
123	/* some drives have the word order reversed */
124	head = ((lba_sects >> 16) & 0xffff);
125	tail = (lba_sects & 0xffff);
126	lba_sects = (head | (tail << 16));
127	if ((lba_sects - chs_sects) < chs_sects/10) {
128		id->lba_capacity = lba_sects;
129		return 1;	/* lba_capacity is (now) good */
130	}
131
132	return 0;	/* lba_capacity value may be bad */
133}
134
135static const u8 ide_rw_cmds[] = {
136	WIN_MULTREAD,
137	WIN_MULTWRITE,
138	WIN_MULTREAD_EXT,
139	WIN_MULTWRITE_EXT,
140	WIN_READ,
141	WIN_WRITE,
142	WIN_READ_EXT,
143	WIN_WRITE_EXT,
144	WIN_READDMA,
145	WIN_WRITEDMA,
146	WIN_READDMA_EXT,
147	WIN_WRITEDMA_EXT,
148};
149
150static const u8 ide_data_phases[] = {
151	TASKFILE_MULTI_IN,
152	TASKFILE_MULTI_OUT,
153	TASKFILE_IN,
154	TASKFILE_OUT,
155	TASKFILE_IN_DMA,
156	TASKFILE_OUT_DMA,
157};
158
159static void ide_tf_set_cmd(ide_drive_t *drive, ide_task_t *task, u8 dma)
160{
161	u8 index, lba48, write;
162
163	lba48 = (task->tf_flags & IDE_TFLAG_LBA48) ? 2 : 0;
164	write = (task->tf_flags & IDE_TFLAG_WRITE) ? 1 : 0;
165
166	if (dma)
167		index = 8;
168	else
169		index = drive->mult_count ? 0 : 4;
170
171	task->tf.command = ide_rw_cmds[index + lba48 + write];
172
173	if (dma)
174		index = 8; /* fixup index */
175
176	task->data_phase = ide_data_phases[index / 2 + write];
177}
178
179/*
180 * __ide_do_rw_disk() issues READ and WRITE commands to a disk,
181 * using LBA if supported, or CHS otherwise, to address sectors.
182 */
183static ide_startstop_t __ide_do_rw_disk(ide_drive_t *drive, struct request *rq,
184					sector_t block)
185{
186	ide_hwif_t *hwif	= HWIF(drive);
187	unsigned int dma	= drive->using_dma;
188	u16 nsectors		= (u16)rq->nr_sectors;
189	u8 lba48		= (drive->addressing == 1) ? 1 : 0;
190	ide_task_t		task;
191	struct ide_taskfile	*tf = &task.tf;
192	ide_startstop_t		rc;
193
194	if ((hwif->host_flags & IDE_HFLAG_NO_LBA48_DMA) && lba48 && dma) {
195		if (block + rq->nr_sectors > 1ULL << 28)
196			dma = 0;
197		else
198			lba48 = 0;
199	}
200
201	if (!dma) {
202		ide_init_sg_cmd(drive, rq);
203		ide_map_sg(drive, rq);
204	}
205
206	memset(&task, 0, sizeof(task));
207	task.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
208
209	if (drive->select.b.lba) {
210		if (lba48) {
211			pr_debug("%s: LBA=0x%012llx\n", drive->name,
212					(unsigned long long)block);
213
214			tf->hob_nsect = (nsectors >> 8) & 0xff;
215			tf->hob_lbal  = (u8)(block >> 24);
216			if (sizeof(block) != 4) {
217				tf->hob_lbam = (u8)((u64)block >> 32);
218				tf->hob_lbah = (u8)((u64)block >> 40);
219			}
220
221			tf->nsect  = nsectors & 0xff;
222			tf->lbal   = (u8) block;
223			tf->lbam   = (u8)(block >>  8);
224			tf->lbah   = (u8)(block >> 16);
225
226			task.tf_flags |= (IDE_TFLAG_LBA48 | IDE_TFLAG_HOB);
227		} else {
228			tf->nsect  = nsectors & 0xff;
229			tf->lbal   = block;
230			tf->lbam   = block >>= 8;
231			tf->lbah   = block >>= 8;
232			tf->device = (block >> 8) & 0xf;
233		}
234	} else {
235		unsigned int sect, head, cyl, track;
236
237		track = (int)block / drive->sect;
238		sect  = (int)block % drive->sect + 1;
239		head  = track % drive->head;
240		cyl   = track / drive->head;
241
242		pr_debug("%s: CHS=%u/%u/%u\n", drive->name, cyl, head, sect);
243
244		tf->nsect  = nsectors & 0xff;
245		tf->lbal   = sect;
246		tf->lbam   = cyl;
247		tf->lbah   = cyl >> 8;
248		tf->device = head;
249	}
250
251	if (rq_data_dir(rq))
252		task.tf_flags |= IDE_TFLAG_WRITE;
253
254	ide_tf_set_cmd(drive, &task, dma);
255	if (!dma)
256		hwif->data_phase = task.data_phase;
257	task.rq = rq;
258
259	rc = do_rw_taskfile(drive, &task);
260
261	if (rc == ide_stopped && dma) {
262		/* fallback to PIO */
263		task.tf_flags |= IDE_TFLAG_DMA_PIO_FALLBACK;
264		ide_tf_set_cmd(drive, &task, 0);
265		hwif->data_phase = task.data_phase;
266		ide_init_sg_cmd(drive, rq);
267		rc = do_rw_taskfile(drive, &task);
268	}
269
270	return rc;
271}
272
273/*
274 * 268435455  == 137439 MB or 28bit limit
275 * 320173056  == 163929 MB or 48bit addressing
276 * 1073741822 == 549756 MB or 48bit addressing fake drive
277 */
278
279static ide_startstop_t ide_do_rw_disk(ide_drive_t *drive, struct request *rq,
280				      sector_t block)
281{
282	ide_hwif_t *hwif = HWIF(drive);
283
284	BUG_ON(drive->blocked);
285
286	if (!blk_fs_request(rq)) {
287		blk_dump_rq_flags(rq, "ide_do_rw_disk - bad command");
288		ide_end_request(drive, 0, 0);
289		return ide_stopped;
290	}
291
292	ledtrig_ide_activity();
293
294	pr_debug("%s: %sing: block=%llu, sectors=%lu, buffer=0x%08lx\n",
295		 drive->name, rq_data_dir(rq) == READ ? "read" : "writ",
296		 (unsigned long long)block, rq->nr_sectors,
297		 (unsigned long)rq->buffer);
298
299	if (hwif->rw_disk)
300		hwif->rw_disk(drive, rq);
301
302	return __ide_do_rw_disk(drive, rq, block);
303}
304
305/*
306 * Queries for true maximum capacity of the drive.
307 * Returns maximum LBA address (> 0) of the drive, 0 if failed.
308 */
309static u64 idedisk_read_native_max_address(ide_drive_t *drive, int lba48)
310{
311	ide_task_t args;
312	struct ide_taskfile *tf = &args.tf;
313	u64 addr = 0;
314
315	/* Create IDE/ATA command request structure */
316	memset(&args, 0, sizeof(ide_task_t));
317	if (lba48)
318		tf->command = WIN_READ_NATIVE_MAX_EXT;
319	else
320		tf->command = WIN_READ_NATIVE_MAX;
321	tf->device  = ATA_LBA;
322	args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
323	if (lba48)
324		args.tf_flags |= (IDE_TFLAG_LBA48 | IDE_TFLAG_HOB);
325	/* submit command request */
326	ide_no_data_taskfile(drive, &args);
327
328	/* if OK, compute maximum address value */
329	if ((tf->status & 0x01) == 0)
330		addr = ide_get_lba_addr(tf, lba48) + 1;
331
332	return addr;
333}
334
335/*
336 * Sets maximum virtual LBA address of the drive.
337 * Returns new maximum virtual LBA address (> 0) or 0 on failure.
338 */
339static u64 idedisk_set_max_address(ide_drive_t *drive, u64 addr_req, int lba48)
340{
341	ide_task_t args;
342	struct ide_taskfile *tf = &args.tf;
343	u64 addr_set = 0;
344
345	addr_req--;
346	/* Create IDE/ATA command request structure */
347	memset(&args, 0, sizeof(ide_task_t));
348	tf->lbal     = (addr_req >>  0) & 0xff;
349	tf->lbam     = (addr_req >>= 8) & 0xff;
350	tf->lbah     = (addr_req >>= 8) & 0xff;
351	if (lba48) {
352		tf->hob_lbal = (addr_req >>= 8) & 0xff;
353		tf->hob_lbam = (addr_req >>= 8) & 0xff;
354		tf->hob_lbah = (addr_req >>= 8) & 0xff;
355		tf->command  = WIN_SET_MAX_EXT;
356	} else {
357		tf->device   = (addr_req >>= 8) & 0x0f;
358		tf->command  = WIN_SET_MAX;
359	}
360	tf->device |= ATA_LBA;
361	args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
362	if (lba48)
363		args.tf_flags |= (IDE_TFLAG_LBA48 | IDE_TFLAG_HOB);
364	/* submit command request */
365	ide_no_data_taskfile(drive, &args);
366	/* if OK, compute maximum address value */
367	if ((tf->status & 0x01) == 0)
368		addr_set = ide_get_lba_addr(tf, lba48) + 1;
369
370	return addr_set;
371}
372
/* Convert a sector count to megabytes (10^6 bytes), rounding down. */
static unsigned long long sectors_to_MB(unsigned long long n)
{
	unsigned long long bytes = n << 9;	/* sectors -> bytes */

	do_div(bytes, 1000000);			/* bytes -> MB, in place */
	return bytes;
}
379
380/*
381 * Bits 10 of command_set_1 and cfs_enable_1 must be equal,
382 * so on non-buggy drives we need test only one.
383 * However, we should also check whether these fields are valid.
384 */
385static inline int idedisk_supports_hpa(const struct hd_driveid *id)
386{
387	return (id->command_set_1 & 0x0400) && (id->cfs_enable_1 & 0x0400);
388}
389
390/*
391 * The same here.
392 */
393static inline int idedisk_supports_lba48(const struct hd_driveid *id)
394{
395	return (id->command_set_2 & 0x0400) && (id->cfs_enable_2 & 0x0400)
396	       && id->lba_capacity_2;
397}
398
399/*
400 * Some disks report total number of sectors instead of
401 * maximum sector address.  We list them here.
402 */
403static const struct drive_list_entry hpa_list[] = {
404	{ "ST340823A",	NULL },
405	{ "ST320413A",	NULL },
406	{ "ST310211A",	NULL },
407	{ NULL,		NULL }
408};
409
410static void idedisk_check_hpa(ide_drive_t *drive)
411{
412	unsigned long long capacity, set_max;
413	int lba48 = idedisk_supports_lba48(drive->id);
414
415	capacity = drive->capacity64;
416
417	set_max = idedisk_read_native_max_address(drive, lba48);
418
419	if (ide_in_drive_list(drive->id, hpa_list)) {
420		/*
421		 * Since we are inclusive wrt to firmware revisions do this
422		 * extra check and apply the workaround only when needed.
423		 */
424		if (set_max == capacity + 1)
425			set_max--;
426	}
427
428	if (set_max <= capacity)
429		return;
430
431	printk(KERN_INFO "%s: Host Protected Area detected.\n"
432			 "\tcurrent capacity is %llu sectors (%llu MB)\n"
433			 "\tnative  capacity is %llu sectors (%llu MB)\n",
434			 drive->name,
435			 capacity, sectors_to_MB(capacity),
436			 set_max, sectors_to_MB(set_max));
437
438	set_max = idedisk_set_max_address(drive, set_max, lba48);
439
440	if (set_max) {
441		drive->capacity64 = set_max;
442		printk(KERN_INFO "%s: Host Protected Area disabled.\n",
443				 drive->name);
444	}
445}
446
447/*
448 * Compute drive->capacity, the full capacity of the drive
449 * Called with drive->id != NULL.
450 *
451 * To compute capacity, this uses either of
452 *
453 *    1. CHS value set by user       (whatever user sets will be trusted)
454 *    2. LBA value from target drive (require new ATA feature)
455 *    3. LBA value from system BIOS  (new one is OK, old one may break)
456 *    4. CHS value from system BIOS  (traditional style)
457 *
458 * in above order (i.e., if value of higher priority is available,
459 * reset will be ignored).
460 */
461static void init_idedisk_capacity(ide_drive_t *drive)
462{
463	struct hd_driveid *id = drive->id;
464	/*
465	 * If this drive supports the Host Protected Area feature set,
466	 * then we may need to change our opinion about the drive's capacity.
467	 */
468	int hpa = idedisk_supports_hpa(id);
469
470	if (idedisk_supports_lba48(id)) {
471		/* drive speaks 48-bit LBA */
472		drive->select.b.lba = 1;
473		drive->capacity64 = id->lba_capacity_2;
474		if (hpa)
475			idedisk_check_hpa(drive);
476	} else if ((id->capability & 2) && lba_capacity_is_ok(id)) {
477		/* drive speaks 28-bit LBA */
478		drive->select.b.lba = 1;
479		drive->capacity64 = id->lba_capacity;
480		if (hpa)
481			idedisk_check_hpa(drive);
482	} else {
483		/* drive speaks boring old 28-bit CHS */
484		drive->capacity64 = drive->cyl * drive->head * drive->sect;
485	}
486}
487
488static sector_t idedisk_capacity(ide_drive_t *drive)
489{
490	return drive->capacity64 - drive->sect0;
491}
492
493#ifdef CONFIG_IDE_PROC_FS
494static int smart_enable(ide_drive_t *drive)
495{
496	ide_task_t args;
497	struct ide_taskfile *tf = &args.tf;
498
499	memset(&args, 0, sizeof(ide_task_t));
500	tf->feature = SMART_ENABLE;
501	tf->lbam    = SMART_LCYL_PASS;
502	tf->lbah    = SMART_HCYL_PASS;
503	tf->command = WIN_SMART;
504	args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
505	return ide_no_data_taskfile(drive, &args);
506}
507
508static int get_smart_data(ide_drive_t *drive, u8 *buf, u8 sub_cmd)
509{
510	ide_task_t args;
511	struct ide_taskfile *tf = &args.tf;
512
513	memset(&args, 0, sizeof(ide_task_t));
514	tf->feature = sub_cmd;
515	tf->nsect   = 0x01;
516	tf->lbam    = SMART_LCYL_PASS;
517	tf->lbah    = SMART_HCYL_PASS;
518	tf->command = WIN_SMART;
519	args.tf_flags	= IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
520	args.data_phase	= TASKFILE_IN;
521	(void) smart_enable(drive);
522	return ide_raw_taskfile(drive, &args, buf, 1);
523}
524
525static int proc_idedisk_read_cache
526	(char *page, char **start, off_t off, int count, int *eof, void *data)
527{
528	ide_drive_t	*drive = (ide_drive_t *) data;
529	char		*out = page;
530	int		len;
531
532	if (drive->id_read)
533		len = sprintf(out, "%i\n", drive->id->buf_size / 2);
534	else
535		len = sprintf(out, "(none)\n");
536
537	PROC_IDE_READ_RETURN(page, start, off, count, eof, len);
538}
539
540static int proc_idedisk_read_capacity
541	(char *page, char **start, off_t off, int count, int *eof, void *data)
542{
543	ide_drive_t*drive = (ide_drive_t *)data;
544	int len;
545
546	len = sprintf(page, "%llu\n", (long long)idedisk_capacity(drive));
547
548	PROC_IDE_READ_RETURN(page, start, off, count, eof, len);
549}
550
551static int proc_idedisk_read_smart(char *page, char **start, off_t off,
552				   int count, int *eof, void *data, u8 sub_cmd)
553{
554	ide_drive_t	*drive = (ide_drive_t *)data;
555	int		len = 0, i = 0;
556
557	if (get_smart_data(drive, page, sub_cmd) == 0) {
558		unsigned short *val = (unsigned short *) page;
559		char *out = ((char *)val) + (SECTOR_WORDS * 4);
560		page = out;
561		do {
562			out += sprintf(out, "%04x%c", le16_to_cpu(*val),
563				       (++i & 7) ? ' ' : '\n');
564			val += 1;
565		} while (i < (SECTOR_WORDS * 2));
566		len = out - page;
567	}
568
569	PROC_IDE_READ_RETURN(page, start, off, count, eof, len);
570}
571
572static int proc_idedisk_read_sv
573	(char *page, char **start, off_t off, int count, int *eof, void *data)
574{
575	return proc_idedisk_read_smart(page, start, off, count, eof, data,
576				       SMART_READ_VALUES);
577}
578
579static int proc_idedisk_read_st
580	(char *page, char **start, off_t off, int count, int *eof, void *data)
581{
582	return proc_idedisk_read_smart(page, start, off, count, eof, data,
583				       SMART_READ_THRESHOLDS);
584}
585
586static ide_proc_entry_t idedisk_proc[] = {
587	{ "cache",	  S_IFREG|S_IRUGO, proc_idedisk_read_cache,    NULL },
588	{ "capacity",	  S_IFREG|S_IRUGO, proc_idedisk_read_capacity, NULL },
589	{ "geometry",	  S_IFREG|S_IRUGO, proc_ide_read_geometry,     NULL },
590	{ "smart_values", S_IFREG|S_IRUSR, proc_idedisk_read_sv,       NULL },
591	{ "smart_thresholds", S_IFREG|S_IRUSR, proc_idedisk_read_st,   NULL },
592	{ NULL, 0, NULL, NULL }
593};
594#endif	/* CONFIG_IDE_PROC_FS */
595
596static void idedisk_prepare_flush(struct request_queue *q, struct request *rq)
597{
598	ide_drive_t *drive = q->queuedata;
599	ide_task_t *task = kmalloc(sizeof(*task), GFP_ATOMIC);
600
601	/* FIXME: map struct ide_taskfile on rq->cmd[] */
602	BUG_ON(task == NULL);
603
604	memset(task, 0, sizeof(*task));
605	if (ide_id_has_flush_cache_ext(drive->id) &&
606	    (drive->capacity64 >= (1UL << 28)))
607		task->tf.command = WIN_FLUSH_CACHE_EXT;
608	else
609		task->tf.command = WIN_FLUSH_CACHE;
610	task->tf_flags	 = IDE_TFLAG_OUT_TF | IDE_TFLAG_OUT_DEVICE |
611			   IDE_TFLAG_DYN;
612	task->data_phase = TASKFILE_NO_DATA;
613
614	rq->cmd_type = REQ_TYPE_ATA_TASKFILE;
615	rq->cmd_flags |= REQ_SOFTBARRIER;
616	rq->special = task;
617}
618
619/*
620 * This is tightly woven into the driver->do_special can not touch.
621 * DON'T do it again until a total personality rewrite is committed.
622 */
623static int set_multcount(ide_drive_t *drive, int arg)
624{
625	struct request *rq;
626	int error;
627
628	if (arg < 0 || arg > drive->id->max_multsect)
629		return -EINVAL;
630
631	if (drive->special.b.set_multmode)
632		return -EBUSY;
633
634	rq = blk_get_request(drive->queue, READ, __GFP_WAIT);
635	rq->cmd_type = REQ_TYPE_ATA_TASKFILE;
636
637	drive->mult_req = arg;
638	drive->special.b.set_multmode = 1;
639	error = blk_execute_rq(drive->queue, NULL, rq, 0);
640	blk_put_request(rq);
641
642	return (drive->mult_count == arg) ? 0 : -EIO;
643}
644
645static int set_nowerr(ide_drive_t *drive, int arg)
646{
647	if (arg < 0 || arg > 1)
648		return -EINVAL;
649
650	if (ide_spin_wait_hwgroup(drive))
651		return -EBUSY;
652	drive->nowerr = arg;
653	drive->bad_wstat = arg ? BAD_R_STAT : BAD_W_STAT;
654	spin_unlock_irq(&ide_lock);
655	return 0;
656}
657
658static void update_ordered(ide_drive_t *drive)
659{
660	struct hd_driveid *id = drive->id;
661	unsigned ordered = QUEUE_ORDERED_NONE;
662	prepare_flush_fn *prep_fn = NULL;
663
664	if (drive->wcache) {
665		unsigned long long capacity;
666		int barrier;
667		/*
668		 * We must avoid issuing commands a drive does not
669		 * understand or we may crash it. We check flush cache
670		 * is supported. We also check we have the LBA48 flush
671		 * cache if the drive capacity is too large. By this
672		 * time we have trimmed the drive capacity if LBA48 is
673		 * not available so we don't need to recheck that.
674		 */
675		capacity = idedisk_capacity(drive);
676		barrier = ide_id_has_flush_cache(id) && !drive->noflush &&
677			(drive->addressing == 0 || capacity <= (1ULL << 28) ||
678			 ide_id_has_flush_cache_ext(id));
679
680		printk(KERN_INFO "%s: cache flushes %ssupported\n",
681		       drive->name, barrier ? "" : "not ");
682
683		if (barrier) {
684			ordered = QUEUE_ORDERED_DRAIN_FLUSH;
685			prep_fn = idedisk_prepare_flush;
686		}
687	} else
688		ordered = QUEUE_ORDERED_DRAIN;
689
690	blk_queue_ordered(drive->queue, ordered, prep_fn);
691}
692
693static int write_cache(ide_drive_t *drive, int arg)
694{
695	ide_task_t args;
696	int err = 1;
697
698	if (arg < 0 || arg > 1)
699		return -EINVAL;
700
701	if (ide_id_has_flush_cache(drive->id)) {
702		memset(&args, 0, sizeof(ide_task_t));
703		args.tf.feature = arg ?
704			SETFEATURES_EN_WCACHE : SETFEATURES_DIS_WCACHE;
705		args.tf.command = WIN_SETFEATURES;
706		args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
707		err = ide_no_data_taskfile(drive, &args);
708		if (err == 0)
709			drive->wcache = arg;
710	}
711
712	update_ordered(drive);
713
714	return err;
715}
716
717static int do_idedisk_flushcache(ide_drive_t *drive)
718{
719	ide_task_t args;
720
721	memset(&args, 0, sizeof(ide_task_t));
722	if (ide_id_has_flush_cache_ext(drive->id))
723		args.tf.command = WIN_FLUSH_CACHE_EXT;
724	else
725		args.tf.command = WIN_FLUSH_CACHE;
726	args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
727	return ide_no_data_taskfile(drive, &args);
728}
729
730static int set_acoustic(ide_drive_t *drive, int arg)
731{
732	ide_task_t args;
733
734	if (arg < 0 || arg > 254)
735		return -EINVAL;
736
737	memset(&args, 0, sizeof(ide_task_t));
738	args.tf.feature = arg ? SETFEATURES_EN_AAM : SETFEATURES_DIS_AAM;
739	args.tf.nsect   = arg;
740	args.tf.command = WIN_SETFEATURES;
741	args.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
742	ide_no_data_taskfile(drive, &args);
743	drive->acoustic = arg;
744	return 0;
745}
746
747/*
748 * drive->addressing:
749 *	0: 28-bit
750 *	1: 48-bit
751 *	2: 48-bit capable doing 28-bit
752 */
753static int set_lba_addressing(ide_drive_t *drive, int arg)
754{
755	if (arg < 0 || arg > 2)
756		return -EINVAL;
757
758	drive->addressing =  0;
759
760	if (drive->hwif->host_flags & IDE_HFLAG_NO_LBA48)
761		return 0;
762
763	if (!idedisk_supports_lba48(drive->id))
764		return -EIO;
765	drive->addressing = arg;
766	return 0;
767}
768
769#ifdef CONFIG_IDE_PROC_FS
770static void idedisk_add_settings(ide_drive_t *drive)
771{
772	struct hd_driveid *id = drive->id;
773
774	ide_add_setting(drive, "bios_cyl", SETTING_RW, TYPE_INT, 0, 65535, 1, 1,
775			&drive->bios_cyl, NULL);
776	ide_add_setting(drive, "bios_head", SETTING_RW, TYPE_BYTE, 0, 255, 1, 1,
777			&drive->bios_head, NULL);
778	ide_add_setting(drive, "bios_sect", SETTING_RW, TYPE_BYTE, 0, 63, 1, 1,
779			&drive->bios_sect, NULL);
780	ide_add_setting(drive, "address", SETTING_RW, TYPE_BYTE, 0, 2, 1, 1,
781			&drive->addressing, set_lba_addressing);
782	ide_add_setting(drive, "multcount", SETTING_RW, TYPE_BYTE, 0,
783			id->max_multsect, 1, 1, &drive->mult_count,
784			set_multcount);
785	ide_add_setting(drive, "nowerr", SETTING_RW, TYPE_BYTE, 0, 1, 1, 1,
786			&drive->nowerr, set_nowerr);
787	ide_add_setting(drive, "lun", SETTING_RW, TYPE_INT, 0, 7, 1, 1,
788			&drive->lun, NULL);
789	ide_add_setting(drive, "wcache", SETTING_RW, TYPE_BYTE, 0, 1, 1, 1,
790			&drive->wcache, write_cache);
791	ide_add_setting(drive, "acoustic", SETTING_RW, TYPE_BYTE, 0, 254, 1, 1,
792			&drive->acoustic, set_acoustic);
793	ide_add_setting(drive, "failures", SETTING_RW, TYPE_INT, 0, 65535, 1, 1,
794			&drive->failures, NULL);
795	ide_add_setting(drive, "max_failures", SETTING_RW, TYPE_INT, 0, 65535,
796			1, 1, &drive->max_failures, NULL);
797}
798#else
799static inline void idedisk_add_settings(ide_drive_t *drive) { ; }
800#endif
801
802static void idedisk_setup(ide_drive_t *drive)
803{
804	ide_hwif_t *hwif = drive->hwif;
805	struct hd_driveid *id = drive->id;
806	unsigned long long capacity;
807
808	idedisk_add_settings(drive);
809
810	if (drive->id_read == 0)
811		return;
812
813	if (drive->removable) {
814		/*
815		 * Removable disks (eg. SYQUEST); ignore 'WD' drives
816		 */
817		if (id->model[0] != 'W' || id->model[1] != 'D')
818			drive->doorlocking = 1;
819	}
820
821	(void)set_lba_addressing(drive, 1);
822
823	if (drive->addressing == 1) {
824		int max_s = 2048;
825
826		if (max_s > hwif->rqsize)
827			max_s = hwif->rqsize;
828
829		blk_queue_max_sectors(drive->queue, max_s);
830	}
831
832	printk(KERN_INFO "%s: max request size: %dKiB\n", drive->name,
833			 drive->queue->max_sectors / 2);
834
835	/* calculate drive capacity, and select LBA if possible */
836	init_idedisk_capacity(drive);
837
838	/* limit drive capacity to 137GB if LBA48 cannot be used */
839	if (drive->addressing == 0 && drive->capacity64 > 1ULL << 28) {
840		printk(KERN_WARNING "%s: cannot use LBA48 - full capacity "
841		       "%llu sectors (%llu MB)\n",
842		       drive->name, (unsigned long long)drive->capacity64,
843		       sectors_to_MB(drive->capacity64));
844		drive->capacity64 = 1ULL << 28;
845	}
846
847	if ((hwif->host_flags & IDE_HFLAG_NO_LBA48_DMA) && drive->addressing) {
848		if (drive->capacity64 > 1ULL << 28) {
849			printk(KERN_INFO "%s: cannot use LBA48 DMA - PIO mode"
850					 " will be used for accessing sectors "
851					 "> %u\n", drive->name, 1 << 28);
852		} else
853			drive->addressing = 0;
854	}
855
856	/*
857	 * if possible, give fdisk access to more of the drive,
858	 * by correcting bios_cyls:
859	 */
860	capacity = idedisk_capacity(drive);
861
862	if (!drive->forced_geom) {
863
864		if (idedisk_supports_lba48(drive->id)) {
865			/* compatibility */
866			drive->bios_sect = 63;
867			drive->bios_head = 255;
868		}
869
870		if (drive->bios_sect && drive->bios_head) {
871			unsigned int cap0 = capacity; /* truncate to 32 bits */
872			unsigned int cylsz, cyl;
873
874			if (cap0 != capacity)
875				drive->bios_cyl = 65535;
876			else {
877				cylsz = drive->bios_sect * drive->bios_head;
878				cyl = cap0 / cylsz;
879				if (cyl > 65535)
880					cyl = 65535;
881				if (cyl > drive->bios_cyl)
882					drive->bios_cyl = cyl;
883			}
884		}
885	}
886	printk(KERN_INFO "%s: %llu sectors (%llu MB)",
887			 drive->name, capacity, sectors_to_MB(capacity));
888
889	/* Only print cache size when it was specified */
890	if (id->buf_size)
891		printk(KERN_CONT " w/%dKiB Cache", id->buf_size / 2);
892
893	printk(KERN_CONT ", CHS=%d/%d/%d\n",
894			 drive->bios_cyl, drive->bios_head, drive->bios_sect);
895
896	/* write cache enabled? */
897	if ((id->csfo & 1) || (id->cfs_enable_1 & (1 << 5)))
898		drive->wcache = 1;
899
900	write_cache(drive, 1);
901}
902
903static void ide_cacheflush_p(ide_drive_t *drive)
904{
905	if (!drive->wcache || !ide_id_has_flush_cache(drive->id))
906		return;
907
908	if (do_idedisk_flushcache(drive))
909		printk(KERN_INFO "%s: wcache flush failed!\n", drive->name);
910}
911
912static void ide_disk_remove(ide_drive_t *drive)
913{
914	struct ide_disk_obj *idkp = drive->driver_data;
915	struct gendisk *g = idkp->disk;
916
917	ide_proc_unregister_driver(drive, idkp->driver);
918
919	del_gendisk(g);
920
921	ide_cacheflush_p(drive);
922
923	ide_disk_put(idkp);
924}
925
926static void ide_disk_release(struct kref *kref)
927{
928	struct ide_disk_obj *idkp = to_ide_disk(kref);
929	ide_drive_t *drive = idkp->drive;
930	struct gendisk *g = idkp->disk;
931
932	drive->driver_data = NULL;
933	g->private_data = NULL;
934	put_disk(g);
935	kfree(idkp);
936}
937
938static int ide_disk_probe(ide_drive_t *drive);
939
940/*
941 * On HPA drives the capacity needs to be
942 * reinitilized on resume otherwise the disk
943 * can not be used and a hard reset is required
944 */
945static void ide_disk_resume(ide_drive_t *drive)
946{
947	if (idedisk_supports_hpa(drive->id))
948		init_idedisk_capacity(drive);
949}
950
951static void ide_device_shutdown(ide_drive_t *drive)
952{
953#ifdef	CONFIG_ALPHA
954	/* On Alpha, halt(8) doesn't actually turn the machine off,
955	   it puts you into the sort of firmware monitor. Typically,
956	   it's used to boot another kernel image, so it's not much
957	   different from reboot(8). Therefore, we don't need to
958	   spin down the disk in this case, especially since Alpha
959	   firmware doesn't handle disks in standby mode properly.
960	   On the other hand, it's reasonably safe to turn the power
961	   off when the shutdown process reaches the firmware prompt,
962	   as the firmware initialization takes rather long time -
963	   at least 10 seconds, which should be sufficient for
964	   the disk to expire its write cache. */
965	if (system_state != SYSTEM_POWER_OFF) {
966#else
967	if (system_state == SYSTEM_RESTART) {
968#endif
969		ide_cacheflush_p(drive);
970		return;
971	}
972
973	printk(KERN_INFO "Shutdown: %s\n", drive->name);
974
975	drive->gendev.bus->suspend(&drive->gendev, PMSG_SUSPEND);
976}
977
978static ide_driver_t idedisk_driver = {
979	.gen_driver = {
980		.owner		= THIS_MODULE,
981		.name		= "ide-disk",
982		.bus		= &ide_bus_type,
983	},
984	.probe			= ide_disk_probe,
985	.remove			= ide_disk_remove,
986	.resume			= ide_disk_resume,
987	.shutdown		= ide_device_shutdown,
988	.version		= IDEDISK_VERSION,
989	.media			= ide_disk,
990	.supports_dsc_overlap	= 0,
991	.do_request		= ide_do_rw_disk,
992	.end_request		= ide_end_request,
993	.error			= __ide_error,
994#ifdef CONFIG_IDE_PROC_FS
995	.proc			= idedisk_proc,
996#endif
997};
998
999static int idedisk_set_doorlock(ide_drive_t *drive, int on)
1000{
1001	ide_task_t task;
1002
1003	memset(&task, 0, sizeof(task));
1004	task.tf.command = on ? WIN_DOORLOCK : WIN_DOORUNLOCK;
1005	task.tf_flags = IDE_TFLAG_TF | IDE_TFLAG_DEVICE;
1006
1007	return ide_no_data_taskfile(drive, &task);
1008}
1009
1010static int idedisk_open(struct inode *inode, struct file *filp)
1011{
1012	struct gendisk *disk = inode->i_bdev->bd_disk;
1013	struct ide_disk_obj *idkp;
1014	ide_drive_t *drive;
1015
1016	idkp = ide_disk_get(disk);
1017	if (idkp == NULL)
1018		return -ENXIO;
1019
1020	drive = idkp->drive;
1021
1022	idkp->openers++;
1023
1024	if (drive->removable && idkp->openers == 1) {
1025		check_disk_change(inode->i_bdev);
1026		/*
1027		 * Ignore the return code from door_lock,
1028		 * since the open() has already succeeded,
1029		 * and the door_lock is irrelevant at this point.
1030		 */
1031		if (drive->doorlocking && idedisk_set_doorlock(drive, 1))
1032			drive->doorlocking = 0;
1033	}
1034	return 0;
1035}
1036
1037static int idedisk_release(struct inode *inode, struct file *filp)
1038{
1039	struct gendisk *disk = inode->i_bdev->bd_disk;
1040	struct ide_disk_obj *idkp = ide_disk_g(disk);
1041	ide_drive_t *drive = idkp->drive;
1042
1043	if (idkp->openers == 1)
1044		ide_cacheflush_p(drive);
1045
1046	if (drive->removable && idkp->openers == 1) {
1047		if (drive->doorlocking && idedisk_set_doorlock(drive, 0))
1048			drive->doorlocking = 0;
1049	}
1050
1051	idkp->openers--;
1052
1053	ide_disk_put(idkp);
1054
1055	return 0;
1056}
1057
1058static int idedisk_getgeo(struct block_device *bdev, struct hd_geometry *geo)
1059{
1060	struct ide_disk_obj *idkp = ide_disk_g(bdev->bd_disk);
1061	ide_drive_t *drive = idkp->drive;
1062
1063	geo->heads = drive->bios_head;
1064	geo->sectors = drive->bios_sect;
1065	geo->cylinders = (u16)drive->bios_cyl; /* truncate */
1066	return 0;
1067}
1068
1069static int idedisk_ioctl(struct inode *inode, struct file *file,
1070			unsigned int cmd, unsigned long arg)
1071{
1072	unsigned long flags;
1073	struct block_device *bdev = inode->i_bdev;
1074	struct ide_disk_obj *idkp = ide_disk_g(bdev->bd_disk);
1075	ide_drive_t *drive = idkp->drive;
1076	int err, (*setfunc)(ide_drive_t *, int);
1077	u8 *val;
1078
1079	switch (cmd) {
1080	case HDIO_GET_ADDRESS:	 val = &drive->addressing;	goto read_val;
1081	case HDIO_GET_MULTCOUNT: val = &drive->mult_count;	goto read_val;
1082	case HDIO_GET_NOWERR:	 val = &drive->nowerr;		goto read_val;
1083	case HDIO_GET_WCACHE:	 val = &drive->wcache;		goto read_val;
1084	case HDIO_GET_ACOUSTIC:	 val = &drive->acoustic;	goto read_val;
1085	case HDIO_SET_ADDRESS:	 setfunc = set_lba_addressing;	goto set_val;
1086	case HDIO_SET_MULTCOUNT: setfunc = set_multcount;	goto set_val;
1087	case HDIO_SET_NOWERR:	 setfunc = set_nowerr;		goto set_val;
1088	case HDIO_SET_WCACHE:	 setfunc = write_cache;		goto set_val;
1089	case HDIO_SET_ACOUSTIC:	 setfunc = set_acoustic;	goto set_val;
1090	}
1091
1092	return generic_ide_ioctl(drive, file, bdev, cmd, arg);
1093
1094read_val:
1095	mutex_lock(&ide_setting_mtx);
1096	spin_lock_irqsave(&ide_lock, flags);
1097	err = *val;
1098	spin_unlock_irqrestore(&ide_lock, flags);
1099	mutex_unlock(&ide_setting_mtx);
1100	return err >= 0 ? put_user(err, (long __user *)arg) : err;
1101
1102set_val:
1103	if (bdev != bdev->bd_contains)
1104		err = -EINVAL;
1105	else {
1106		if (!capable(CAP_SYS_ADMIN))
1107			err = -EACCES;
1108		else {
1109			mutex_lock(&ide_setting_mtx);
1110			err = setfunc(drive, arg);
1111			mutex_unlock(&ide_setting_mtx);
1112		}
1113	}
1114	return err;
1115}
1116
1117static int idedisk_media_changed(struct gendisk *disk)
1118{
1119	struct ide_disk_obj *idkp = ide_disk_g(disk);
1120	ide_drive_t *drive = idkp->drive;
1121
1122	/* do not scan partitions twice if this is a removable device */
1123	if (drive->attach) {
1124		drive->attach = 0;
1125		return 0;
1126	}
1127	/* if removable, always assume it was changed */
1128	return drive->removable;
1129}
1130
1131static int idedisk_revalidate_disk(struct gendisk *disk)
1132{
1133	struct ide_disk_obj *idkp = ide_disk_g(disk);
1134	set_capacity(disk, idedisk_capacity(idkp->drive));
1135	return 0;
1136}
1137
1138static struct block_device_operations idedisk_ops = {
1139	.owner			= THIS_MODULE,
1140	.open			= idedisk_open,
1141	.release		= idedisk_release,
1142	.ioctl			= idedisk_ioctl,
1143	.getgeo			= idedisk_getgeo,
1144	.media_changed		= idedisk_media_changed,
1145	.revalidate_disk	= idedisk_revalidate_disk
1146};
1147
1148MODULE_DESCRIPTION("ATA DISK Driver");
1149
1150static int ide_disk_probe(ide_drive_t *drive)
1151{
1152	struct ide_disk_obj *idkp;
1153	struct gendisk *g;
1154
1155	/* strstr("foo", "") is non-NULL */
1156	if (!strstr("ide-disk", drive->driver_req))
1157		goto failed;
1158	if (!drive->present)
1159		goto failed;
1160	if (drive->media != ide_disk)
1161		goto failed;
1162
1163	idkp = kzalloc(sizeof(*idkp), GFP_KERNEL);
1164	if (!idkp)
1165		goto failed;
1166
1167	g = alloc_disk_node(1 << PARTN_BITS,
1168			hwif_to_node(drive->hwif));
1169	if (!g)
1170		goto out_free_idkp;
1171
1172	ide_init_disk(g, drive);
1173
1174	ide_proc_register_driver(drive, &idedisk_driver);
1175
1176	kref_init(&idkp->kref);
1177
1178	idkp->drive = drive;
1179	idkp->driver = &idedisk_driver;
1180	idkp->disk = g;
1181
1182	g->private_data = &idkp->driver;
1183
1184	drive->driver_data = idkp;
1185
1186	idedisk_setup(drive);
1187	if ((!drive->head || drive->head > 16) && !drive->select.b.lba) {
1188		printk(KERN_ERR "%s: INVALID GEOMETRY: %d PHYSICAL HEADS?\n",
1189			drive->name, drive->head);
1190		drive->attach = 0;
1191	} else
1192		drive->attach = 1;
1193
1194	g->minors = 1 << PARTN_BITS;
1195	g->driverfs_dev = &drive->gendev;
1196	g->flags = drive->removable ? GENHD_FL_REMOVABLE : 0;
1197	set_capacity(g, idedisk_capacity(drive));
1198	g->fops = &idedisk_ops;
1199	add_disk(g);
1200	return 0;
1201
1202out_free_idkp:
1203	kfree(idkp);
1204failed:
1205	return -ENODEV;
1206}
1207
1208static void __exit idedisk_exit(void)
1209{
1210	driver_unregister(&idedisk_driver.gen_driver);
1211}
1212
1213static int __init idedisk_init(void)
1214{
1215	return driver_register(&idedisk_driver.gen_driver);
1216}
1217
1218MODULE_ALIAS("ide:*m-disk*");
1219module_init(idedisk_init);
1220module_exit(idedisk_exit);
1221MODULE_LICENSE("GPL");
1222